#!/bin/bash

# Ablation sweep: launches train.py through DeepSpeed once for every
# (seed, data split, ablation) combination, skipping any combination whose
# checkpoint directory already exists. Failed launches are reported and
# collected so that one bad run does not stop the rest of the sweep.
#
# All paths are relative, so run this script from the directory that
# contains train.py.

# Model identifier handed to train.py via --model.
model_id="meta-llama/Llama-3.2-1B-Instruct"
# Model tag as it appears in checkpoint directory names.
# NOTE(review): presumably train.py derives this tag from the model id when
# naming its output directory -- confirm, and keep the two values in sync.
model="Llama-3-2-1B-Instruct"
loss=digit
# Root directory passed to train.py as --output_dir; the skip check below
# looks for existing checkpoint directories under the same root.
output_dir="../../../data/toycos/ckpt_ablation"

# Checkpoint paths of runs whose deepspeed command exited non-zero.
failed_runs=()

for seed in 1 2 3 4 5; do
  for data_split in 1 2 3 4 5 6 7 8 9 10; do
    for ablation in cont-loss no-split-digit no-place-weighting label-smoothing; do
      output_file="${output_dir}/${seed}_train${data_split}_${model}_${loss}_${ablation}"
      # Integer division: the epoch count shrinks as the split index grows
      # (250 for train1, 125 for train2, 83 for train3, ..., 25 for train10).
      num_epochs=$((250 / data_split))

      if [[ -d "$output_file" ]]; then
        echo "Output file ${output_file} already exists. Skipping."
        continue
      fi

      echo "Running training for ${output_file}."
      if ! deepspeed --include localhost:0,1 --master_port 9501 train.py \
        --model "$model_id" \
        --output_dir "$output_dir" \
        --data_split "train${data_split}" \
        --seed "$seed" \
        --batch_size 16 \
        --grad_acc 1 \
        --num_epochs "$num_epochs" \
        --ablation "$ablation" \
        --loss "$loss" \
        --max_length 2048; then
        # Keep sweeping; the failure is reported again in the summary below.
        echo "Training failed for ${output_file}." >&2
        failed_runs+=("$output_file")
      fi
    done
  done
done

# Summarize failures and make them visible in the exit status.
if ((${#failed_runs[@]} > 0)); then
  printf '%d run(s) failed:\n' "${#failed_runs[@]}" >&2
  printf '  %s\n' "${failed_runs[@]}" >&2
  exit 1
fi
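# Alternative model for the --model argument: "HuggingFaceTB/SmolLM2-135M-Instruct"
# (the model tag used in the checkpoint path must be changed to match).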
