#!/bin/bash
#
# Run main.py with a DeiT-3 base or small model and a fixed set of
# hyper-parameters.
#
# Usage: <this-script> [model_size] [distill]
#   model_size  "b" (default) selects deit3_base_patch16_224; any other
#               value selects deit3_small_patch16_224.
#   distill     "distill" (default) appends "--mem-only --kt" to the command;
#               any other value runs without those flags. The raw value is
#               also embedded in the output directory name:
#               ./output/manar_<distill>_<base|small>
#
# The script's exit status is the exit status of the python command.

main() {
  local size_arg=${1:-"b"}
  local distill=${2:-"distill"}
  local base_model size_suffix output_model
  # Optional flags live in an array so they can be expanded quoted: an empty
  # array contributes zero arguments, a filled one contributes one word each.
  local -a distill_flags=()

  # Pick the model and the matching output-directory suffix in one place.
  if [[ "$size_arg" == "b" ]]; then
    echo "Using base model"
    base_model="deit3_base_patch16_224"
    size_suffix="base"
  else
    echo "Using small model"
    base_model="deit3_small_patch16_224"
    size_suffix="small"
  fi

  # The output directory is named after the distill label exactly as given.
  output_model="./output/manar_${distill}_${size_suffix}"

  if [[ "$distill" == "distill" ]]; then
    echo "Using distillation"
    distill_flags=(--mem-only --kt)
  else
    echo "Not using distillation"
  fi

  # NOTE(review): --tmodel is passed without a value of its own; this assumes
  # main.py declares it as a boolean flag -- confirm against main.py.
  #
  # Every expansion is quoted so that a distill label containing spaces or
  # glob characters stays a single --output_dir argument.
  python main.py \
    --model "$base_model" \
    --batch-size 256 \
    --drop-path 0.05 \
    --weight-decay 0.05 \
    --lr 1e-4 \
    --num_workers 8 \
    --data-path /data/shared_data/imagenet/ \
    --output_dir "$output_model" \
    --no_amp \
    --grad-accum-steps 4 \
    --tmodel "${distill_flags[@]}"
}

main "$@"
