# Launch script for the ImageNet training run driven by
# baseline_imagenet/2_step2/train.py.
# NOTE(review): the cp below uses a path relative to a sibling of 1_step1
# (../1_step1), while the python3 commands use paths relative to a directory
# that contains baseline_imagenet/ -- confirm the intended working directory.
clear

# -p keeps reruns from failing when the directories already exist.
# imagenet_log_step2 has to exist before `tee -a` can open its log file;
# log is still created because the commented-out 256-epoch command writes there.
mkdir -p models log imagenet_log_step2

# Copy the step-1 checkpoint into ./models under the name checkpoint_ba.pth.tar
# (presumably read by train.py -- verify against the training script).
cp ../1_step1/models/checkpoint.pth.tar ./models/checkpoint_ba.pth.tar

# 128 epoch setting: larger learning rate, similar performance to 256 epoch.
# NOTE(review): the two commands below run one after the other with identical
# hyperparameters and append to the same log file; they differ only in the
# CUDA_VISIBLE_DEVICES restriction. Presumably only one of them is meant to be
# active -- confirm and comment out the other.
python3 -u baseline_imagenet/2_step2/train.py --data=/datasets/imagenet --batch_size=256 --learning_rate=1.25e-3 --epochs=128 --weight_decay=0 | tee -a imagenet_log_step2/training.txt
CUDA_VISIBLE_DEVICES=1,2,3,4,5,6 python3 -u baseline_imagenet/2_step2/train.py --data=/datasets/imagenet --batch_size=256 --learning_rate=1.25e-3 --epochs=128 --weight_decay=0 | tee -a imagenet_log_step2/training.txt
# 256 epoch setting: longer training, similar performance to 128 epoch.
# python3 train.py --data=/datasets/imagenet --batch_size=256 --learning_rate=5e-4 --epochs=256 --weight_decay=0 | tee -a log/training.txt
