readonly MCORE_PATH='/root/Megatron-LM'
export PYTHONPATH="$PWD:$MCORE_PATH:$PYTHONPATH"

export MASTER_ADDR="127.0.0.1"
export MASTER_PORT=65535
export PX_INSPECET_MODEL=1

source tasks/math_rl_v3/config.sh

readonly HF_HUB_DIR="${DFS_PATH}/models/models--deepseek-ai--DeepSeek-R1-Distill-Llama-8B"

LOG_DIR="$PWD/log/grpo_llama3"
mkdir -p $LOG_DIR

if [ $1 == "hf_to_mlm" ]; then
    HF_INPUT_DIR="${DFS_PATH}/models/models--deepseek-ai--DeepSeek-R1-Distill-Llama-8B"
    MLM_OUTPUT_DIR="${DFS_PATH}/models/models--deepseek-ai--DeepSeek-R1-Distill-Llama-8B/mlm"
    mkdir -p $MLM_OUTPUT_DIR

    ARGS="
        --model_arch llama \
        --convert_way hf_to_mlm \
        --megatron_load_dir xxx \
        --megatron_save_dir ${MLM_OUTPUT_DIR} \
        --hf_load_dir ${HF_INPUT_DIR} \
        --hf_save_dir xxx \
        --hf_py_source_file ${HF_HUB_DIR} \
        --tokenizer_path ${HF_HUB_DIR} \
        --hf_config_json ${HF_HUB_DIR}/config.json \
        --bf16 \
        --dist_ckpt_format torch_dist \
    "
elif [ $1 == "mlm_to_hf" ]; then

    MLM_INPUT_DIR="${DFS_PATH}/models/models--deepseek-ai--DeepSeek-R1-Distill-Llama-8B/mlm_$2/iter_0000$3"
    HF_OUTPUT_DIR="${DFS_PATH}/works/0626ReasoningGen/src/trainedmodels/models--deepseek-ai--DeepSeek-R1-Distill-Llama-8B-$2/checkpoint-$3"
    echo MLM_INPUT_DIR: $MLM_INPUT_DIR
    echo HF_OUTPUT_DIR: $HF_OUTPUT_DIR

    ARGS="
        --model_arch llama \
        --convert_way mlm_to_hf \
        --megatron_load_dir $MLM_INPUT_DIR \
        --megatron_save_dir xxx \
        --hf_load_dir xxx \
        --hf_save_dir $HF_OUTPUT_DIR \
        --hf_py_source_file ${HF_HUB_DIR} \
        --tokenizer_path ${HF_HUB_DIR} \
        --hf_config_json ${HF_HUB_DIR}/config.json \
        --bf16 \
        --dist_ckpt_format torch_dist \
    "
fi
python3 tools/px_ckpt_conv/px_ckpt_conv.py $ARGS > $LOG_DIR/convert_ckpt.log 2>&1
