# Launch training/train_interleave.py on EleutherAI/pythia-2.8b (revision
# step0) with the cnn_dailymail 3.0.0 dataset configuration.
#
# Environment:
#   SLURM_ARRAY_TASK_ID - appended to the --output_dir path so that each task
#                         writes to its own checkpoint directory. Presumably
#                         supplied by Slurm when run as a job array; if it is
#                         unset the suffix is empty and every run shares the
#                         same directory.
#
# The expansion is quoted so the --output_dir value always reaches the
# script as a single argument, regardless of the variable's contents.
python training/train_interleave.py \
  --model_name_or_path "EleutherAI/pythia-2.8b" \
  --revision step0 \
  --dataset_name "cnn_dailymail" \
  --dataset_config_name 3.0.0 \
  --per_device_train_batch_size 1 \
  --per_device_eval_batch_size 1 \
  --learning_rate 0.001 \
  --output_dir "checkpoints/pythia-2.8b-10grad-25tasks-0122-scratch-new${SLURM_ARRAY_TASK_ID}" \
  --save_prefix batch1_gpu1 \
  --block_size 256 \
  --num_train_epochs 5 \
  --overwrite_cache \
  --save_freq 1 \
  --num-grad-steps 10 \
  --num-data-samples 25
