#! /bin/bash

MASTER_ADDR=localhost
MASTER_PORT=2115
NNODES=1
NODE_RANK=0
GPUS_PER_NODE=1

DISTRIBUTED_ARGS="--nproc_per_node $GPUS_PER_NODE \
                  --nnodes $NNODES \
                  --node_rank $NODE_RANK \
                  --master_addr $MASTER_ADDR \
                  --master_port $MASTER_PORT"

# base path
BASE_PATH=${1-"/home/GAKD"}
DATA_NAMES="dolly"
DATA_DIR="${BASE_PATH}/data/dolly"

EVAL_BATCH_SIZE=64
TYPE="eval_main"


CKPT_PATHS=(
    "./checkpoints/Qwen3-0.6B"
)

for i in "${!CKPT_PATHS[@]}"; do
    CKPT_NAME="eval"
    CKPT="${CKPT_PATHS[$i]}"
    SAVE_PATH="${CKPT}/results"
    LOG_PATH="${SAVE_PATH}/${DATA_NAMES}.log"

    OPTS=""
    OPTS+=" --base-path ${BASE_PATH}"
    OPTS+=" --model-path ${CKPT}"
    OPTS+=" --ckpt-name ${CKPT_NAME}"
    OPTS+=" --n-gpu ${GPUS_PER_NODE}"
    OPTS+=" --model-type qwen3"
    OPTS+=" --data-dir ${DATA_DIR}"
    OPTS+=" --data-names ${DATA_NAMES}"
    OPTS+=" --num-workers 0"
    OPTS+=" --dev-num -1"
    OPTS+=" --data-process-workers -1"
    OPTS+=" --json-data"
    OPTS+=" --eval-batch-size ${EVAL_BATCH_SIZE}"
    OPTS+=" --max-length 512"
    OPTS+=" --max-prompt-length 256"
    OPTS+=" --do-eval"
    OPTS+=" --save ${SAVE_PATH}"
    OPTS+=" --seed 10"
    OPTS+=" --deepspeed"
    OPTS+=" --deepspeed_config ${BASE_PATH}/configs/deepspeed/ds_config_zero1_fp16.json"
    OPTS+=" --type ${TYPE}"
    OPTS+=" --do-sample"
    OPTS+=" --top-k 0"
    OPTS+=" --top-p 1.0"
    OPTS+=" --temperature 1.0"

    export NCCL_DEBUG=""
    export TOKENIZERS_PARALLELISM=false
    export PYTHONIOENCODING=utf-8
    export PYTHONPATH=${BASE_PATH}

    CMD="torchrun ${DISTRIBUTED_ARGS} ${BASE_PATH}/evaluate.py ${OPTS}"

    echo "Running: $CKPT"
    echo "$CMD" > "$LOG_PATH"
    echo "PYTHONPATH=${PYTHONPATH}" >> "$LOG_PATH"

    mkdir -p "${SAVE_PATH}"
    eval "$CMD" >> "$LOG_PATH" 2>&1
done
