#!/usr/bin/env bash
#
# Generate answers for the NL4OPT test split with an OpenAI model, then
# execute the generated outputs.
#
# Usage: <script> SAVE_PATH MODEL_NAME
#   SAVE_PATH   - root directory under which results are stored
#   MODEL_NAME  - value passed to eval.generate_openai as --openai_model;
#                 also used as a sub-directory name under SAVE_PATH
#
# Results go to: SAVE_PATH/MODEL_NAME/eval.NL4OPT.pass1

# Abort on the first failing command or on use of an unset variable, so the
# execution step never runs after a failed generation step.
set -eu

if [ "$#" -lt 2 ]; then
    printf 'Usage: %s SAVE_PATH MODEL_NAME\n' "$0" >&2
    exit 2
fi

SAVE_PATH=$1
MODEL_NAME=$2

TEST_DATASET_NAME="CardinalOperations/NL4OPT"
TEST_DATASET_SPLIT="test"

Q2MC_OUTPUT_DIR="$SAVE_PATH/$MODEL_NAME/eval.NL4OPT.pass1"

# Optional: uncomment to override the Hugging Face endpoint with hf-mirror.com.
# export HF_ENDPOINT=https://hf-mirror.com

# Step 1: generation. All expansions are quoted so that paths or model names
# containing whitespace or glob characters are passed as single arguments.
python -m eval.generate_openai \
    --openai_model "$MODEL_NAME" \
    --dataset_name "$TEST_DATASET_NAME" \
    --dataset_split "$TEST_DATASET_SPLIT" \
    --save_dir "$Q2MC_OUTPUT_DIR" \
    --verbose

# Step 2: execution. Reads generated.jsonl from the output directory
# (presumably written by step 1 -- confirm against eval.generate_openai) and
# writes executed.jsonl next to it.
python -m eval.execute \
    --input_file "$Q2MC_OUTPUT_DIR/generated.jsonl" \
    --output_file "$Q2MC_OUTPUT_DIR/executed.jsonl" \
    --question_field en_question \
    --answer_field en_answer \
    --timeout 600 \
    --max_workers 16 \
    --verbose