#! /bin/bash
# 依赖安装建议提前准备好环境，这里省略

MASTER_ADDR=localhost
MASTER_PORT=${2-2113}
NNODES=1
NODE_RANK=0
GPUS_PER_NODE=${3-1}

DISTRIBUTED_ARGS="--nproc_per_node $GPUS_PER_NODE \
                  --nnodes $NNODES \
                  --node_rank $NODE_RANK \
                  --master_addr $MASTER_ADDR \
                  --master_port $MASTER_PORT"

# 参数接收
BASE_PATH=${1-"/home/naie/work/"}
BASE_CODE_PATH="${BASE_PATH}/minillm"
CKPT_NAME=${4}
DATA_NAMES="boolq"
CKPT="/opt/dpcvol/datasets/8625883998351850434/ckpt/minillm/learngene/des-sft/llama3-8b/various_alpha/boolq/${CKPT_NAME}/e10-bs16-lr0.0005-G1-N8-NN1/621/"   # 如果需要指定模型路径，可在这里补充

DATA_DIR="/opt/dpcvol/datasets/8625883998351850434/datasets/llm/minillm/processed_data_jyc/dataset-JYC/processed_boolq/full/gpt2/"
EVAL_BATCH_SIZE=64
SAVE_PATH="/opt/dpcvol/datasets/8625883998351850434/ckpt/minillm/learngene/llama3-8b/eval/various_alpha/${DATA_NAMES}/${CKPT_NAME}/"
TYPE="eval_main"

PYTHONPATH=$PYTHONPATH:/home/naie/.local/lib/python3.9/site-packages

OPTS=""
# model
OPTS+=" --base-path ${BASE_PATH}"
OPTS+=" --model-path ${CKPT}"
OPTS+=" --tokenizer-path /opt/dpcvol/datasets/8625883998351850434/ckpt/minillm/minillm_official/gpt2/train/minillm/medium-init-xlarge-sft/"
OPTS+=" --ckpt-name ${CKPT_NAME}"
OPTS+=" --n-gpu ${GPUS_PER_NODE}"
OPTS+=" --model-type gpt2"
# data
OPTS+=" --data-dir ${DATA_DIR}"
OPTS+=" --data-names ${DATA_NAMES}"
OPTS+=" --num-workers 0"
OPTS+=" --dev-num -1"
OPTS+=" --data-process-workers -1"
OPTS+=" --json-data"

# hp
OPTS+=" --eval-batch-size ${EVAL_BATCH_SIZE}"
OPTS+=" --max-length 512"
OPTS+=" --max-prompt-length 256"
# runtime
OPTS+=" --do-eval"
OPTS+=" --save ${SAVE_PATH}"
# deepspeed
OPTS+=" --deepspeed"
OPTS+=" --deepspeed_config ${BASE_CODE_PATH}/configs/deepspeed/ds_config.json"
OPTS+=" --type ${TYPE}"
# gen
OPTS+=" --do-sample"
OPTS+=" --top-k 0"
OPTS+=" --top-p 1.0"
OPTS+=" --temperature 1.0"

export NCCL_DEBUG=""
export TOKENIZERS_PARALLELISM=false
export PYTHONIOENCODING=utf-8
export HCCL_CONNECT_TIMEOUT=1000
export PYTHONPATH=${BASE_CODE_PATH}

CMD="torchrun ${DISTRIBUTED_ARGS} ${BASE_CODE_PATH}/evaluate.py ${OPTS} ${@:5}"

echo ${CMD}
echo "PYTHONPATH=${PYTHONPATH}"
mkdir -p ${SAVE_PATH}
${CMD}
