#!/bin/sh
# Runs train.py once with a fixed set of flags (data set IMNET, 1 epoch,
# seed 0) and W&B project "ConservationLaws" / group "IMNET".
#
# Environment applied to the python process only (not exported to the shell):
#   WANDB_MODE=online       - Weights & Biases run mode
#   CUDA_VISIBLE_DEVICES=0  - expose only CUDA device 0 to the process
#
# train.py is referenced by a relative path, so run this script from the
# directory that contains it.
#
# The flag list is accumulated in the positional parameters, one group per
# `set --` line, so that no line-continuation backslashes are needed and each
# group can carry its own comment.

# Start from an empty list; arguments given to this script are not forwarded.
set --

# Data set location / name and the directory passed as --save-dir.
set -- "$@" --data-path ~/datasets/imagenet --data-set IMNET
set -- "$@" --save-dir ~/weights/conservation/imagenet

# Input geometry and number of target classes.
set -- "$@" --input-size 224 --patch-size 16 --num-classes 1000

# Model size (presumably transformer-encoder dimensions; confirm in train.py).
set -- "$@" --hidden-size 192 --num-hidden-layer 12
set -- "$@" --num-attention-heads 3 --intermediate-size 768 --mlp-type mlp

# Optimizer: sgd with momentum 0.0 and weight decay 0.0.
# NOTE(review): --weight_decay is spelled with an underscore while every other
# flag uses hyphens; kept verbatim. Confirm it matches train.py's parser.
set -- "$@" --opt sgd --momentum 0.0
set -- "$@" --epochs 1 --batch-size 1024 --lr 0.003 --weight_decay 0.0

# LR schedule: linear, with warmup-lr equal to lr and zero warmup epochs.
set -- "$@" --lr-scheduler linear --warmup-lr 0.003 --warmup-epochs 0

# Experiment tracking and reproducibility.
set -- "$@" --wandb-project "ConservationLaws" --wandb-group "IMNET" --seed 0

WANDB_MODE=online CUDA_VISIBLE_DEVICES=0 python train.py "$@"
