# USE_OPEN_SOURCE_DS='true' TOKEN_NORM='false' BASEMODEL_PATH='./cs_gate_train/models/llama3-8b' MODEL_NAME='llama3-8b' accelerate launch --config_file deepspeed_config.yaml --num_processes=2 gate_train.py
# USE_OPEN_SOURCE_DS='true' TOKEN_NORM='false' BASEMODEL_PATH='./cs_gate_train/models/llama3-8b' MODEL_NAME='llama3-8b' python -m pdb gate_train.py
# USE_OPEN_SOURCE_DS='true' TOKEN_NORM='true' BASEMODEL_PATH='./cs_gate_train/models/gemma3-4b' MODEL_NAME='gemma3-4b' accelerate launch --config_file deepspeed_config.yaml --num_processes=2 gate_train.py
# Launch gate_train.py through `accelerate launch` for one base model.
#
# Arguments:
#   $1 - value passed to the run as BASEMODEL_PATH
#   $2 - value passed to the run as MODEL_NAME
#
# USE_OPEN_SOURCE_DS and TOKEN_NORM are both set to 'true' for every run.
# All four variables are given as command-prefix assignments, so they are
# placed in the environment of the launched command only and are not left
# set in this shell afterwards.
run_gate_train() {
  USE_OPEN_SOURCE_DS='true' \
  TOKEN_NORM='true' \
  BASEMODEL_PATH="$1" \
  MODEL_NAME="$2" \
    accelerate launch \
      --config_file deepspeed_config.yaml \
      --num_processes=2 \
      gate_train.py
}

# Run 1: qwen3-30b, loaded from the global_step_60 actor_hf checkpoint.
run_gate_train \
  '/cpfs01/user/jiawei.lyt/ckpt/verl_checkpoints/lyt-rl-gen/qwen3-tpp-nothink-0721-distilled-data0706-recitex1-bothtrans-mixlangx2-GenRM-32B-sentcs-GSPO-ref-turbopp-LENGTH_FLIP_THRESHOLD1.3-LENGTH_FLIP_PROB0.75-REF_ANSWER_POSITION-A-expert-12k_bs512_minibs128_n8/global_step_60/actor_hf' \
  'qwen3-30b'

# Run 2: gpt-oss-20b from the local models directory. It starts as soon as
# run 1 returns; the exit status of run 1 is not checked here.
run_gate_train \
  './cs_gate_train/models/gpt-oss-20b' \
  'gpt-oss-20b-norm'