# CUDA_VISIBLE_DEVICES=0 python mmlu_expert_bak.py \
# --mode "train" \
# --need-lora \
# --main-model Qwen/Qwen-14B

# CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch mmlu_expert_bak.py \
# --mode "test_fewshot" \
# --need-lora \
# --main-model Qwen/Qwen-14B

# Active job: run train_router_mmlu.py as a single process with only CUDA
# device 0 exposed to it. The variable is set for this command alone and is
# not exported into the rest of the script.
env CUDA_VISIBLE_DEVICES=0 python train_router_mmlu.py

# CUDA_VISIBLE_DEVICES=0,1,2,3 accelerate launch test_multi.py