# Disabled (commented-out) run: GPU 7, `cifar` scheduler, batch size 128,
# and no --weight-decay / --epochs flags passed on the command line.
#CUDA_VISIBLE_DEVICES=7 python train.py --dataset cifar100 --layers 40 --widen-factor 10 --tensorboard \
#    --loss cross_entropy \
#    --model_seed 1 --data_seed 100 \
#    --lr 0.1 --scheduler cifar \
#    --split_size=45000 --batch-size=128 \
#    --name cifar100/WRN-28-10-modelseed-1-dataseed-100-split-45000-multistep

# Active run: invoke train.py on the cifar100 dataset with weight decay 0.0,
# the `cifar_long` scheduler, 500 epochs and batch size 256.
# CUDA_VISIBLE_DEVICES is set only for this one command, not exported.
# NOTE(review): the run name says "WRN-28-10" but --layers 40 is passed below;
# confirm which of the two is intended.
gpu_id=6
run_name=cifar100/WRN-28-10-modelseed-1-dataseed-100-split-45000-multistep-long-wd-0.0

CUDA_VISIBLE_DEVICES="$gpu_id" python train.py \
    --dataset cifar100 \
    --layers 40 \
    --widen-factor 10 \
    --tensorboard \
    --loss cross_entropy \
    --model_seed 1 \
    --data_seed 100 \
    --lr 0.1 \
    --weight-decay 0.0 \
    --scheduler cifar_long \
    --epochs 500 \
    --split_size=45000 \
    --batch-size=256 \
    --name "$run_name"
