#! /bin/bash
# pip3 install mpu
# pip3 install accelerate==0.34.2
# pip3 install torchtyping
# pip3 install transformers
# pip3 install deepspeed==0.15.0
# pip3 install tokenizers==0.14.1
# pip install --upgrade --force-reinstall certifi
# pip install --upgrade datasets huggingface_hub
# pip install torchtyping rouge_score
# pip install --upgrade transformers tokenizers
# pip3 install --no-cache-dir -e /opt/dpcvol/models/pkge/transformers-minillm/.
# pip3 install thop
# pip3 install pytorch_model_summary

# pip3 uninstall py-cpuinfo -y
# pip3 install py-cpuinfo

# Launch topology: one node, one worker process on that node.
NNODES=1
NODE_RANK=0
GPUS_PER_NODE=1 # ${3-1}

# Rendezvous endpoint passed to the launcher.
MASTER_ADDR="localhost"
MASTER_PORT=2113 # ${2-2113}

# Launcher flags kept as one whitespace-separated string; consumers are
# expected to split it on whitespace. The backslash-newlines are line
# continuations, so the value contains no newline characters.
DISTRIBUTED_ARGS="--nproc_per_node ${GPUS_PER_NODE} \
                  --nnodes ${NNODES} \
                  --node_rank ${NODE_RANK} \
                  --master_addr ${MASTER_ADDR} \
                  --master_port ${MASTER_PORT}"

# model

# Evaluate each checkpoint listed in CKPT_NAMES on the "dolly" data with one
# torchrun launch of evaluate.py per checkpoint. Any arguments given to this
# script are forwarded unchanged to evaluate.py.
#
# Reads:   DISTRIBUTED_ARGS, GPUS_PER_NODE (set earlier in this script).
# Exports: NCCL_DEBUG, TOKENIZERS_PARALLELISM, PYTHONIOENCODING,
#          HCCL_CONNECT_TIMEOUT, PYTHONPATH.
# Status:  the last command yields non-zero if any checkpoint failed; the
#          remaining checkpoints are still attempted after a failure.

# Checkpoint directory names under RESULTS_ROOT.
CKPT_NAMES=(
    auto_lerangene-DesNet174M-78MToken_bs2
    auto_lerangene-DesNet235M-78MToken_bs16
    auto_lerangene-DesNet297M-78MToken_bs16
    van_lerangene-DesNet178M-78MToken_bs2
    van_lerangene-DesNet235M-78MToken_bs16
    van_lerangene-DesNet297M-78MToken_bs16
)

# Settings that do not depend on the checkpoint are assigned once.
BASE_PATH="/home/naie/work/minillm0807" # ${1-"/home/naie/work/"}
BASE_CODE_PATH="${BASE_PATH}/minillm"
RESULTS_ROOT="/opt/dpcvol/models/LLM_Distillation/results"
# data
DATA_NAMES="dolly"
DATA_DIR="/opt/dpcvol/datasets/8625883998351850434/datasets/llm/minillm/eval_data/dolly/"
# hp
EVAL_BATCH_SIZE=16
# runtime
TYPE="eval_main"

export NCCL_DEBUG=""
export TOKENIZERS_PARALLELISM=false
export PYTHONIOENCODING=utf-8
export HCCL_CONNECT_TIMEOUT=1000
# NOTE(review): this script previously also appended
# /home/naie/.local/lib/python3.9/site-packages to PYTHONPATH, but that value
# was overwritten by this export before any command ran, so it never took
# effect. The effective value is kept; add the directory here if it is needed.
export PYTHONPATH="${BASE_CODE_PATH}"

# Split the launcher flag string into words once, so the command below can be
# assembled as an array and no later expansion relies on word splitting.
read -r -a DIST_ARGS <<< "${DISTRIBUTED_ARGS}"

# Names of checkpoints whose evaluation did not complete successfully.
FAILED_CKPTS=()

for CKPT_NAME in "${CKPT_NAMES[@]}"; do
    CKPT="${RESULTS_ROOT}/${CKPT_NAME}/sft_downstream_tasks/dolly/e10-bs16-lr0.0005-G1-N1-NN1/7141/"
    SAVE_PATH="${RESULTS_ROOT}/${CKPT_NAME}/eval/dolly/"

    OPTS=(
        # model
        --base-path "${BASE_PATH}"
        --model-path "${CKPT}"
        --tokenizer-path "${CKPT}"
        --ckpt-name "${CKPT_NAME}"
        --n-gpu "${GPUS_PER_NODE}"
        --model-type gpt2
        # data
        --data-dir "${DATA_DIR}"
        --data-names "${DATA_NAMES}"
        --num-workers 0
        --dev-num -1
        --data-process-workers -1
        --json-data
        # hp
        --eval-batch-size "${EVAL_BATCH_SIZE}"
        --max-length 512
        --max-prompt-length 256
        # runtime
        --do-eval
        --save "${SAVE_PATH}"
        --seed 10
        # deepspeed
        --deepspeed
        --deepspeed_config "${BASE_CODE_PATH}/configs/deepspeed/ds_config.json"
        --type "${TYPE}"
        # gen
        --do-sample
        --top-k 0
        --top-p 1.0
        --temperature 1.0
    )

    # "$@" keeps each forwarded argument as its own word, even with spaces.
    CMD=(torchrun "${DIST_ARGS[@]}" "${BASE_CODE_PATH}/evaluate.py" "${OPTS[@]}" "$@")

    # Log the command in a form that can be pasted back into a shell.
    printf '%q ' "${CMD[@]}"
    printf '\n'
    printf 'PYTHONPATH=%s\n' "${PYTHONPATH}"

    if ! mkdir -p -- "${SAVE_PATH}"; then
        printf 'error: cannot create %s; skipping %s\n' "${SAVE_PATH}" "${CKPT_NAME}" >&2
        FAILED_CKPTS+=("${CKPT_NAME}")
        continue
    fi

    if ! "${CMD[@]}"; then
        printf 'error: evaluation failed for %s\n' "${CKPT_NAME}" >&2
        FAILED_CKPTS+=("${CKPT_NAME}")
    fi
done

if (( ${#FAILED_CKPTS[@]} > 0 )); then
    printf 'error: %d checkpoint(s) failed:\n' "${#FAILED_CKPTS[@]}" >&2
    printf '  %s\n' "${FAILED_CKPTS[@]}" >&2
fi

# Yield a non-zero status when anything failed, without calling exit.
[[ ${#FAILED_CKPTS[@]} -eq 0 ]]
