CUDA_VISIBLE_DEVICES=5,6
OUT=eval_results
PORT=25312

# Table 1 - Part 1
datasets="gsm8k math"
gen_length="128 512"

for d in $datasets; do
    for g in $gen_length; do
      s=$((g / 2))
      echo "dataset=$d gen_length=$g diffusion_steps=$s port=$PORT"
      CUDA_VISIBLE_DEVICES=$CUDA_VISIBLE_DEVICES \
      torchrun --nproc_per_node 2 --master_port $PORT eval.py \
        --dataset $d --batch_size 8 --gen_length $g --block_length 32 --diffusion_steps $s \
        --output_dir "$OUT" --model_path "GSAI-ML/LLaDA-8B-Instruct"
      PORT=$((PORT+1))
    done
done

# Table 1 - Part 2
datasets="gsm8k math"
factors="4 8"

for d in $datasets; do
    for f in $factors; do
        s=$((256 / f))
        echo "dataset=$d gen_length=256 diffusion_steps=$s port=$PORT"
        CUDA_VISIBLE_DEVICES=$CUDA_VISIBLE_DEVICES \
        torchrun --nproc_per_node 2 --master_port $PORT eval.py \
            --dataset $d --batch_size 16 --gen_length 256 --block_length 32 --diffusion_steps $s \
            --output_dir "$OUT" --model_path "GSAI-ML/LLaDA-8B-Instruct"
        PORT=$((PORT+1))
    done
done

# Table 2
datasets="gsm8k math"
steps="128 256 512"

for m in $models; do
  for d in $datasets; do
    for s in $steps; do
      echo "dataset=$d steps=$s port=$PORT"
      CUDA_VISIBLE_DEVICES=$CUDA_VISIBLE_DEVICES \
      torchrun --nproc_per_node 2 --master_port $PORT eval.py \
        --dataset $d --batch_size 8 --gen_length $s --block_length 32 --diffusion_steps $s \
        --output_dir "$OUT" --model_path "GSAI-ML/LLaDA-8B-Instruct"
      PORT=$((PORT+1))
    done
  done
done

