#!/usr/bin/env bash
# Runs script/train/oracle_train_kvcache_mse.py under torchrun with
# recipe/oracle.json as its config.
#
# The script and config paths are relative, so invoke this from the directory
# that contains both `script/` and `recipe/`.
#
# The body sticks to POSIX constructs, so `sh <this file>` keeps working too.
set -eu

# Comma-separated list of GPU ids exposed to the launched processes.
export CUDA_VISIBLE_DEVICES=4,5,6,7

# Derive the worker count from the device list instead of hard-coding it a
# second time, so changing the list above cannot leave the count out of sync.
# awk's split() returns the number of comma-separated fields.
nproc_per_node=$(awk -v ids="${CUDA_VISIBLE_DEVICES}" 'BEGIN { print split(ids, parts, ",") }')

torchrun --nproc_per_node="${nproc_per_node}" --master_port=29501 script/train/oracle_train_kvcache_mse.py \
    --config recipe/oracle.json \
    --chosen_target_layer_idx 20