#!/usr/bin/env bash
#
# Launch mergemoe/merge-moe.py for the "winogrande" task with model type
# "olmoe", writing to results/winogrande/merged-olmoe/.
#
# Usage: run from the repository root. The script path and --output_dir are
# relative, so they resolve against the current working directory.
#
# Environment / assumptions:
#   - CUDA_VISIBLE_DEVICES=0 is set for this one command only; it overrides
#     any value already exported in the calling shell, so the process sees
#     only CUDA device 0.
#   - --checkpoint is an absolute, machine-specific path; edit it to point at
#     the local OLMoE-1B-7B-0125 checkpoint directory.
#   - The meaning of the remaining flags (--num_samples_for_merging,
#     --num_groups, --merging_layers, --merging_strategy) is defined by
#     merge-moe.py and is not visible from this file.
#     NOTE(review): --merging_layers looks like a comma-separated list of
#     layer indices -- confirm against the script's argument parser.
#
# The exit status of this script is the exit status of the python process.
CUDA_VISIBLE_DEVICES=0 \
  python mergemoe/merge-moe.py \
  --task="winogrande" \
  --num_samples_for_merging=64 \
  --num_groups=32 \
  --merging_layers="1,2,3,4,5,6,7,8" \
  --merging_strategy="ours" \
  --model_type="olmoe" \
  --output_dir="results/winogrande/merged-olmoe/" \
  --checkpoint="/root/model/OLMoE-1B-7B-0125"