#!/usr/bin/env bash
#
# Launches grouter_ep_optimizer/tools/construct_mapping.py under torchrun with
# 8 processes on one node, feeding it a weighted blend of qwen3-c4 dataset
# shards and writing the resulting mapping to the --output-mapping path.
#
# All Megatron-LM / grouter_ep_optimizer / model_home paths below are relative,
# so run this script from the directory that contains them.
#
# Requires bash: the zero-padded brace expansion {0000..0003} is not POSIX sh.

set -euo pipefail

# Prepend the local checkouts to Python's module search path. ${PYTHONPATH:-}
# keeps the resulting value identical to before while tolerating an unset
# PYTHONPATH under `set -u`.
export PYTHONPATH="Megatron-LM:grouter_ep_optimizer:${PYTHONPATH:-}"

# Must be exported: a plain assignment is not passed on to the torchrun child
# process unless the variable already happened to be exported by the caller.
# NOTE(review): this list skips device 6 and includes device 8 -- confirm that
# matches the host's GPU numbering (an 8-GPU host would need 0,1,2,3,4,5,6,7).
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,7,8

C4_HOME="/workspace/Megatron-LM-router/qwen3_dataset"

# Build the --data-prefix arguments as "<weight> <path>" pairs, one pair per
# shard, each with weight 0.04 (= 1/25). An array keeps every weight and path
# as its own argument without relying on unquoted word splitting.
DATA_BLEND=()
for shard in {0000..0003}; do
    DATA_BLEND+=(0.04 "${C4_HOME}/qwen3-c4-${shard}_text_document")
done

# --nproc-per-node matches the number of entries in CUDA_VISIBLE_DEVICES.
torchrun --nproc-per-node 8 grouter_ep_optimizer/tools/construct_mapping.py \
    --batch-size 16 \
    --max-length 4096 \
    --data-prefix "${DATA_BLEND[@]}" \
    --random-seed 1423 \
    --tokenizer-type HuggingFaceTokenizer \
    --tokenizer-model model_home/qwen3-30b-a3b \
    --total-steps 100 \
    --bf16 \
    --grouter-config-path grouter_ep_optimizer/grouter/qwen3_30b/grouter_config.json \
    --grouter-checkpoint-path grouter_ep_optimizer/grouter/qwen3_30b/grouter_30b.pth \
    --target-num-experts 64 \
    --output-mapping grouter_ep_optimizer/grouter/qwen3_30b/cvt64_map_affinity.json \
    --mapping-strategy affinity \
    --verbose