#!/usr/bin/env bash
#
# Launches train.py under torchrun for the QKFormer_10_768_td model
# (--input_size 288, --time_step 4), starting one worker process per GPU
# listed in gpu_ids.
#
# Usage: run from the directory that contains train.py; every path below is
# relative to the current working directory.
#
# The body deliberately sticks to POSIX sh syntax so that invoking it as
# `sh <script>` keeps working.

# Abort on a failed command or on a reference to an unset variable.
set -eu

# GPUs made visible to the job. The worker count is derived from this list so
# the two can never drift apart when the list is edited.
gpu_ids=0,1,2,3,4,5,6,7

# Count the comma-separated entries: split on ',' inside a subshell (so IFS,
# globbing and the positional parameters of this script stay untouched) and
# report how many fields resulted.
# shellcheck disable=SC2086  # unquoted on purpose: field splitting is the point
num_procs=$(IFS=,; set -f; set -- $gpu_ids; echo "$#")

# Single run directory, passed as both --output_dir and --log_dir.
run_dir=./122Qkformer/output/513_NO6_288

CUDA_VISIBLE_DEVICES="$gpu_ids" torchrun --nproc_per_node="$num_procs" train.py \
    --output_dir "$run_dir" \
    --log_dir "$run_dir" \
    --data_path ./dataset/imagenet \
    --model QKFormer_10_768_td \
    --td \
    --input_size 288 \
    --time_step 4 \
    --batch_size 30 \
    --accum_iter 2 \
    --epochs 15 \
    --blr 6e-6 \
    --warmup_epochs 0

