#! /bin/bash

# Directory that holds learngene_init.py (invoked below). It is also exported
# as the sole PYTHONPATH entry -- presumably so the script can import its
# sibling project modules.
BASE_CODE_PATH='/home/naie/work/minillm'
PYTHONPATH="$BASE_CODE_PATH"
export PYTHONPATH

# Build the six descendant-model initialisations with learngene_init.py.
# Every run uses the same checkpoint tree and the same distillation-run
# sub-path; only the checkpoint pair, the architecture numbers and alpha
# differ, so those are passed as arguments to a single helper.
CKPT_ROOT="/opt/dpcvol/datasets/8625883998351850434/ckpt/minillm/learngene/qwen3-4b"
DISTILL_RUN="bs8-lr5e-06-G2-N8-NN1-lm1-len512/pe4_rs0.5_nr256_ln_sr_tm0.2/5000"
CONFIG_DIR="/home/naie/work/minillm/configs/learngene/gpt2"

#######################################
# Run learngene_init.py once for a single descendant architecture.
# Globals:
#   BASE_CODE_PATH, CKPT_ROOT, DISTILL_RUN, CONFIG_DIR (read)
#   output_dir (written; left set to this run's output directory)
# Arguments:
#   $1 - <tag> of the gpt2_<tag>-best_iter directory used for --big_model_path
#   $2 - <tag> of the gpt2_<tag>-best_iter directory used for --small_model_path
#   $3 - value for --embeding_dim
#   $4 - value for --head_num
#   $5 - value for --layer_num
#   $6 - value for --alpha
#   $7 - optional fallback --model_base_config, used only when the config
#        named after $3/$4/$5 does not exist
# Outputs:
#   A warning on stderr when the fallback config is used.
# Returns:
#   The status of mkdir if it fails, otherwise the status of python.
#######################################
build_descendant() {
  local big_tag=$1 small_tag=$2 n_embed=$3 n_head=$4 n_layer=$5 alpha=$6
  local fallback_config=${7:-}
  local arch="NEmbed_${n_embed}_NHead_${n_head}_NLayer_${n_layer}"
  local train_dir="${CKPT_ROOT}/stepwise_distill/train"
  local base_config="${CONFIG_DIR}/gpt2-${arch}.json"

  if [[ ! -f "$base_config" && -n "$fallback_config" ]]; then
    printf 'warning: %s not found; falling back to %s\n' \
      "$base_config" "$fallback_config" >&2
    base_config=$fallback_config
  fi

  # Trailing slash kept so the argument matches what was passed historically.
  output_dir="${CKPT_ROOT}/Build_descendant_model/${arch}/sque_init/"
  mkdir -p -- "$output_dir" || return

  # "--embeding_dim" (sic) is the flag name this script has always passed.
  python "${BASE_CODE_PATH}/learngene_init.py" \
    --big_model_path "${train_dir}/gpt2_${big_tag}-best_iter/${DISTILL_RUN}/pytorch_model.bin" \
    --small_model_path "${train_dir}/gpt2_${small_tag}-best_iter/${DISTILL_RUN}/pytorch_model.bin" \
    --model_base_config "$base_config" \
    --embeding_dim "$n_embed" --head_num "$n_head" --layer_num "$n_layer" --alpha "$alpha" \
    --output_type huggingface \
    --output_dir "$output_dir"
}

# Numbers of the runs that failed; every run is still attempted.
failed_runs=()

# 1
build_descendant m-l b-m 768 12 14 0.9 || failed_runs+=(1)

# 2
build_descendant m-l b-m 896 14 18 0.9 || failed_runs+=(2)

# 3
# This run used to pass the NLayer_18 base config while requesting 24 layers
# and writing into an NLayer_24 directory. The matching NLayer_24 config is now
# preferred; the previous file is kept as a fallback in case it does not exist.
# NOTE(review): confirm the NLayer_24 config exists and that reusing the
# 18-layer config was not intentional.
build_descendant m-l b-m 896 14 24 0.1 \
  "${CONFIG_DIR}/gpt2-NEmbed_896_NHead_14_NLayer_18.json" || failed_runs+=(3)

# 4
build_descendant l-xl m-l 1024 16 26 0.9 || failed_runs+=(4)

# 5
build_descendant l-xl m-l 1152 18 30 0.9 || failed_runs+=(5)

# 6
build_descendant l-xl m-l 1152 18 34 0.1 || failed_runs+=(6)

# Report failures and leave a non-zero status behind. `false` is used instead
# of `exit` so that anything placed after this section still runs.
if (( ${#failed_runs[@]} > 0 )); then
  printf 'error: descendant build(s) failed: %s\n' "${failed_runs[*]}" >&2
  false
fi