# Launch training/train_interleave_rev.py with model EleutherAI/pythia-1b
# (revision "main") and dataset cnn_dailymail, config 3.0.0.
#
# One flag/value pair per line; the argument list and its order are exactly
# what gets handed to the Python script. The meaning of each flag is defined
# by that script, which is not part of this file.
#
# NOTE(review): the output directory name mentions "ckpt144k" and "sgd",
# while --revision is "main" and no optimizer flag is passed here -- confirm
# the directory name matches the run that is actually intended.
python training/train_interleave_rev.py \
  --model_name_or_path "EleutherAI/pythia-1b" \
  --revision main \
  --dataset_name "cnn_dailymail" \
  --dataset_config_name 3.0.0 \
  --per_device_train_batch_size 1 \
  --per_device_eval_batch_size 1 \
  --learning_rate 0.001 \
  --output_dir checkpoints/pythia-1b-10grad-50data-ckpt144k-cnn-256-shuffle-rev-sgd-48 \
  --save_prefix batch1_gpu1 \
  --block_size 256 \
  --num_train_epochs 5 \
  --overwrite_cache \
  --checkpointing_steps epoch \
  --save_freq 1 \
  --num-grad-steps 10 \
  --num-data-samples 50 \
  --start-shuffle-data-samples 48

