#!/bin/bash

# Training sweep: sequentially launches one DeepSpeed run of train.py for
# every combination of seed (5) x loss (3) x data split (10) = 150 runs.
#
# A failing run does not stop the sweep; each failure is reported on stderr
# as it happens, summarized at the end, and the script then exits with
# status 1 so callers can detect a partially failed sweep.

# Launch configuration shared by every run.
readonly MODEL="meta-llama/Llama-3.2-1B-Instruct"
readonly GPU_INCLUDE="localhost:0,1"
readonly LAUNCH_PORT=9501
# Numerator used to derive the per-split epoch count (see num_epochs below).
readonly EPOCH_BUDGET=250

failed_runs=()
total_runs=0

for seed in {1..5}; do
  for loss in "sft" "digit" "digit_base"; do
    for data_split in {1..10}; do
      # Integer division: the result is truncated (e.g. split 3 -> 83).
      # NOTE(review): presumably higher-numbered splits are larger, so fewer
      # epochs keep the amount of training comparable -- confirm.
      num_epochs=$((EPOCH_BUDGET / data_split))

      # Build the command as an array so every argument stays one word.
      cmd=(
        deepspeed --include "${GPU_INCLUDE}" --master_port "${LAUNCH_PORT}"
        train.py
        --model "${MODEL}"
        --data_split "train${data_split}"
        --seed "${seed}"
        --batch_size 16
        --grad_acc 1
        --num_epochs "${num_epochs}"
        --loss "${loss}"
        --max_length 2048
      )

      total_runs=$((total_runs + 1))
      if ! "${cmd[@]}"; then
        run_id="seed=${seed} loss=${loss} data_split=train${data_split}"
        failed_runs+=("${run_id}")
        printf 'warn: run failed: %s\n' "${run_id}" >&2
      fi
    done
  done
done

# Surface failures instead of letting the last run's status decide the
# script's exit code.
if (( ${#failed_runs[@]} > 0 )); then
  printf '%d of %d run(s) failed:\n' "${#failed_runs[@]}" "${total_runs}" >&2
  printf '  %s\n' "${failed_runs[@]}" >&2
  exit 1
fi
# Alternative model; substitute it for the --model value used above:
#   "HuggingFaceTB/SmolLM2-135M-Instruct"
