
set -e

# D1 Table First for Argmax2 and Random 2 (TopK + Bottom K)
CUDA_VISIBLE_DEVICES=5,6
PORT=25312
OUT=eval_results
ROOT=/mnt/data/shared/shparashar/lift/SFT/sft_output

# models="argmax2 bottomk_topk"
# datasets="gsm8k math"
# gen_length="128 512"

# for m in $models; do
#   for d in $datasets; do
#     for g in $gen_length; do
#       s=$((g / 2))
#       echo "model=$m dataset=$d gen_length=$g diffusion_steps=$s port=$PORT"
#       CUDA_VISIBLE_DEVICES=$CUDA_VISIBLE_DEVICES \
#       torchrun --nproc_per_node 2 --master_port $PORT eval.py \
#         --dataset $d --batch_size 8 --gen_length $g --block_length 32 --diffusion_steps $s \
#         --output_dir "$OUT" --model_path "$ROOT/$m"
#       PORT=$((PORT+1))
#     done
#   done
# done

# Number of Steps Ablations
models="argmax2 bottomk_topk"
datasets="gsm8k math"
factors="4 8"

for m in $models; do
  for d in $datasets; do
    for f in $factors; do
        s=$((256 / f))
        echo "model=$m dataset=$d gen_length=256 diffusion_steps=$s port=$PORT"
        CUDA_VISIBLE_DEVICES=$CUDA_VISIBLE_DEVICES \
        torchrun --nproc_per_node 2 --master_port $PORT eval.py \
            --dataset $d --batch_size 8 --gen_length 256 --block_length 32 --diffusion_steps $s \
            --output_dir "$OUT" --model_path "$ROOT/$m"
        PORT=$((PORT+1))
    done
  done
done

# Number of Steps Ablations
models="mix_less"
datasets="math"
factors="4 8"

for m in $models; do
  for d in $datasets; do
    for f in $factors; do
        s=$((256 / f))
        echo "model=$m dataset=$d gen_length=256 diffusion_steps=$s port=$PORT"
        CUDA_VISIBLE_DEVICES=$CUDA_VISIBLE_DEVICES \
        torchrun --nproc_per_node 2 --master_port $PORT eval.py \
            --dataset $d --batch_size 8 --gen_length 256 --block_length 32 --diffusion_steps $s \
            --output_dir "$OUT" --model_path "$ROOT/$m"
        PORT=$((PORT+1))
    done
  done
done


