#!/bin/bash


# Checkpoint name, given as the first positional argument.
CKPT="${1:-}"
# ckpts=("ming1.8b-4x1-topk-openmath01-r32" "ming1.8b-molora-4x1-topk-openmath01")
# CKPT="ming1.8b-4x1-topk-openmath01-r32"

#######################################
# Derive the base-model settings from a checkpoint name.
# Names containing "llama2_7b" / "llama3_8b" select the matching Llama base
# model; every other name selects Qwen1.5-<SIZE>B-Chat, where <SIZE> is the
# number found in the "ming<SIZE>b" part of the name (e.g. 1.8 or 7).
# Globals:
#   SIZE       (written) size parsed from the name, empty when absent
#   MODEL_BASE (written) path of the base model
#   conv_mode  (written) conversation template name
# Arguments:
#   $1 - checkpoint name
# Outputs:
#   A warning on stderr when the Qwen fallback is taken without a size.
#######################################
resolve_model_base() {
    local ckpt=$1
    # Kept in a variable so the regex is not subject to quoting rules in [[ ]].
    local size_re='ming([0-9.]+)b'

    # Pure-bash match: no word-splitting/globbing of the name, no dependency
    # on GNU grep -P, and always at most one (the leftmost) match.
    SIZE=""
    if [[ "$ckpt" =~ $size_re ]]; then
        SIZE=${BASH_REMATCH[1]}
    fi

    if [[ "$ckpt" == *"llama2_7b"* ]]; then
        MODEL_BASE=/mnt/petrelfs/usr/models/llama2_7b_chat
        conv_mode="llama2"
    elif [[ "$ckpt" == *"llama3_8b"* ]]; then
        MODEL_BASE=/mnt/petrelfs/usr/models/Meta-Llama-3-8B-Instruct
        conv_mode="llama3"
    else
        MODEL_BASE=/mnt/petrelfs/usr/models/models--Qwen--Qwen1.5-${SIZE}B-Chat
        conv_mode="qwen"
        if [[ -z "$SIZE" ]]; then
            # Without a size the Qwen path above is missing its size component.
            echo "warning: no 'ming<SIZE>b' pattern in checkpoint name '${ckpt}'; MODEL_BASE=${MODEL_BASE} is likely wrong" >&2
        fi
    fi
}

resolve_model_base "$CKPT"

# Root directory for per-domain logs and answer files.
LOGS_BASE_PATH="./logs/diverse"

# Directory of the checkpoint itself.
MODEL_PATH=/mnt/petrelfs/usr/checkpoints/${CKPT}



# domains=("logiqa_en" "mmlu")
# domains=("mmedbench_en")
# domain="commonsense_qa"
# Domains to evaluate; each one is processed in its own background subshell.
domains=("mmlu")
# Optional suffix appended to the checkpoint name in log/answer file names.
version=""

# Refuse to submit cluster jobs without a checkpoint name: every log and
# answers path below is built from it.
if [[ -z "${CKPT:-}" ]]; then
    echo "Usage: $0 <checkpoint-name>" >&2
    exit 1
fi

# PIDs of the per-domain background subshells, so each status can be checked.
pids=()

for domain in "${domains[@]}"; do
# for CKPT in "${ckpts[@]}"; do
    sleep 1
    (
        echo "Processing $domain"
        log_dir="${LOGS_BASE_PATH}/${domain}"
        run_name="${CKPT}${version}"
        mkdir -p -- "${log_dir}"

        # bbh has its own script; nothing else runs for it.
        if [[ "$domain" == "bbh" ]]; then
            bash scripts/v1/eval/bbh_full.sh "$CKPT"
            # 'continue' cannot reach the outer loop from inside a subshell;
            # leave the subshell explicitly, passing on the script's status.
            exit
        fi
        if [[ "$domain" == "math" ]]; then
            # NOTE(review): unlike bbh, this branch falls through to the
            # generic inference/evaluation below. Kept as in the original;
            # confirm whether an early exit was intended here as well.
            bash scripts/v1/eval/math_full.sh "$CKPT"
        fi

        # Run the inference command.
        # NOTE(review): --model-path is given MODEL_BASE, not the checkpoint
        # directory (MODEL_PATH); confirm this is intended.
        srun -p partition --gres=gpu:1  --quotatype=auto \
            --output="${log_dir}/${run_name}.infer.log" \
            python -m ming.eval.model_diverse_gen \
            --model-path "${MODEL_BASE}" \
            --question-file "s3://bucket/datasets/diverse_domain/test/${domain}.json" \
            --answers-file "${log_dir}/${run_name}.jsonl" \
            --s3-answers-file "s3://bucket/logs/diverse/${domain}/${run_name}.jsonl" \
            --temperature 0 \
            --max-tokens 1024 \
            --keep-local \
            --conv-mode "${conv_mode}" \
            --use-logit-bias \
            --infer-answer || {
                # Do not score a missing or stale answers file.
                echo "Inference failed for $domain; skipping evaluation" >&2
                exit 1
            }

        echo "Evaluating $domain"

        srun -p partition --output="${log_dir}/${run_name}.eval.log" \
            python -m ming.eval.eval_em \
            --input_file "${log_dir}/${run_name}.jsonl"
    ) &
    pids+=("$!")
done

# Wait for every domain individually so a failure is not silently dropped.
failed=0
for pid in "${pids[@]}"; do
    wait "$pid" || failed=1
done

echo "All processes are done."

if (( failed )); then
    echo "One or more domains failed; check the logs under ${LOGS_BASE_PATH}" >&2
    exit 1
fi