#!/bin/bash

# The SBATCH directives must appear before any executable line in this script.

#SBATCH --qos high2         # QOS (priority).
#SBATCH -N 1               # Number of nodes requested.
#SBATCH -n 1               # Number of tasks (i.e. processes).
#SBATCH --cpus-per-task=1  # Number of cores per task.
#SBATCH --gres=gpu:4       # Number of GPUs.
#SBATCH -t 60-00:00          # Time requested (D-HH:MM).
#SBATCH --nodelist=em5    # Pin the job to this machine; comment out (##SBATCH) to let Slurm choose.

# Have Slurm cd to this directory before running the script. Comment the
# directive out (##SBATCH) if you would rather just run the script from the
# directory you want to be in.
#SBATCH -D /home/test_time_training/ttt_mae_v1

# Uncomment to control the output files. By default stdout and stderr go to
# the same place, but if you use both commands below they'll be split up.
# %N is the hostname (if used, will create output(s) per node).
# %j is jobid.
##SBATCH -o slurm.%N.%j.out    # STDOUT
##SBATCH -e slurm.%N.%j.err    # STDERR

# Set up the runtime environment: load the user's shell configuration, activate
# the conda environment, and move into the project directory.
# NOTE(review): many ~/.bashrc files return early in non-interactive shells, in
# which case `conda` may never be initialised -- confirm on the cluster.
source ~/.bashrc
# Abort early instead of running in the wrong environment or directory.
conda activate taming || {
        echo "error: could not activate conda environment 'taming'" >&2
        exit 1
}
cd /home/test_time_training/ttt_mae_v1 || {
        echo "error: could not cd to /home/test_time_training/ttt_mae_v1" >&2
        exit 1
}

# Print GPU info for context.
nvidia-smi
# Python will buffer output of your script unless you set this.
# If you're not using python, figure out how to turn off output
# buffering when stdout is a file, or else when watching your output
# script you'll only get updated every several lines printed.
export PYTHONUNBUFFERED=1

# Dataset root, checkpoint passed to --finetune, and output directory.
DATA_PATH='/shared/group/ilsvrc/'
PRETRAIN_CHKPT='/home/test_time_training/ttt_mae_v1/models/cifar10/mae_visualize_vit_large.pth'
OUTPUT_DIR='/home/test_time_training/ttt_mae_v1/models/imagenet/vit_head/'

# Do all the research.
# Disabled multi-process launch options, kept for reference:
# -m torch.distributed.launch --nproc_per_node=4
# NOTE(review): the job requests 4 GPUs (--gres=gpu:4) but CUDA_VISIBLE_DEVICES=0
# exposes only a single device to this process -- confirm this is intended.
CUDA_VISIBLE_DEVICES=0 python main_prob.py \
        --batch_size 128 \
        --model mae_vit_large_patch16 \
        --finetune "${PRETRAIN_CHKPT}" \
        --epochs 90 \
        --input_size 32 \
        --head_type vit_head \
        --blr 0.1 \
        --weight_decay 0.0 \
        --dist_eval --data_path "${DATA_PATH}" --output_dir "${OUTPUT_DIR}"
# Remember the Python exit status; otherwise the trailing `date` would make the
# job exit 0 (and Slurm report success) even when the run failed.
status=$?

# Print completion time.
date

# Propagate the run's exit status as the job's exit status.
exit "${status}"