#!/bin/bash
#SBATCH --job-name=igb_train
#SBATCH --nodes=1
#SBATCH --ntasks=1
#SBATCH --cpus-per-task=12        
#SBATCH --time=02-00:00:00
#SBATCH --mem=100GB
#SBATCH --mail-type=BEGIN,END,FAIL
#SBATCH --output=igb_train.out
#SBATCH --error=igb_train.err

# Activate the "igb" conda environment.
# Batch jobs run a non-interactive shell that does not source ~/.bashrc, so the
# `conda` shell function that implements `conda activate` is normally not
# defined here. Load conda's bash hook first when the function is missing.
if ! declare -F conda >/dev/null; then
  # Run the hook command separately from `eval` so a missing/broken conda
  # executable is detected (eval of an empty string would report success).
  conda_hook="$(conda shell.bash hook)" || {
    echo "Unable to initialize conda (is the conda executable on PATH?)" >&2
    exit 1
  }
  eval "$conda_hook"
fi
# Stop here rather than train with whatever python happens to be on PATH.
conda activate igb || {
  echo "Failed to activate conda environment 'igb'" >&2
  exit 1
}


# ---- Experiment configuration ----

# Expose only CUDA device index 0 to every process started by this script,
# so all training jobs share the same GPU.
# NOTE(review): the #SBATCH header visible in this file requests no GPU
# resource (no --gres/--gpus line) -- confirm the partition provides one.
export CUDA_VISIBLE_DEVICES=0

# Inclusive range of run indices to launch: init_run .. nruns.
nruns=4
init_run=3

# Directory that is scanned for the spec files to train.
FOLDER="train_spec_largevit_cifar100"

#### Launch runs init_run..nruns (inclusive). Within a run, every spec file
#### in FOLDER is trained concurrently; runs execute one after another.
#### Each run uses seed = run + 1000.

# Fail fast if the configuration this section relies on is missing.
: "${FOLDER:?FOLDER must name the directory containing the spec files}"
: "${init_run:?init_run must be set}"
: "${nruns:?nruns must be set}"

# The set of spec files does not change between runs, so collect it once.
# The -f test also discards the literal pattern left behind by an unmatched glob.
files=()
for FILE in "$FOLDER"/*; do
  if [[ -f "$FILE" ]]; then
    files+=("$FILE")
  fi
done
if (( ${#files[@]} == 0 )); then
  echo "No spec files found in '$FOLDER'" >&2
  exit 1
fi

# The output redirection below fails if the log directory does not exist.
mkdir -p reports || exit 1

failed=0
for ((run = init_run; run <= nruns; run++)); do
  seed=$((run + 1000))
  pids=()
  for FILE in "${files[@]}"; do
    filename="${FILE##*/}"
    # Strip everything from the first dot onward (e.g. "a.b.yaml" -> "a").
    basename="${filename%%.*}"
    # Include the run index in the log name so that a later run does not
    # truncate the log written by an earlier run of the same spec.
    outfile="reports/train_${basename}_run${run}.out"
    python main_train.py --spec_file="$FILE" --seed="$seed" train > "$outfile" &
    pids+=("$!")
  done
  # Barrier: finish the whole run before starting the next one. Waiting on each
  # PID (instead of a bare `wait`) lets us see the exit status of every job.
  for pid in "${pids[@]}"; do
    if ! wait "$pid"; then
      failed=$((failed + 1))
    fi
  done
done

# Report failures through the exit status so the scheduler marks the job failed.
if (( failed > 0 )); then
  echo "$failed training job(s) failed." >&2
  exit 1
fi
echo "All training jobs completed."