#!/usr/bin/env bash
#
# Run a model over the CardinalOperations/BWOR dataset with
# `eval.generate_openai`, then process the resulting file with `eval.execute`.
#
# Usage:
#   <this-script> SAVE_PATH MODEL_NAME
#
# Arguments:
#   SAVE_PATH   Base directory under which results are stored.
#   MODEL_NAME  Value passed to --openai_model; also used as a path component
#               of the output directory.
#
# Output directory: $SAVE_PATH/$MODEL_NAME/eval.BWOR.pass1
#   generated.jsonl  - input to the execute step (presumably written there by
#                      the generate step via --save_dir; confirm).
#   executed.jsonl   - output of the execute step.
#
# NOTE(review): `python -m eval.<module>` presumably requires the `eval`
# package to be importable from the current directory -- confirm.
#
# Only POSIX shell constructs are used so `sh <script>` keeps working.

# Abort on the first failing command (so the execute step never runs on a
# missing/stale generated.jsonl) and on any use of an unset variable.
set -eu

if [ "$#" -lt 2 ]; then
    printf 'Usage: %s SAVE_PATH MODEL_NAME\n' "${0##*/}" >&2
    exit 2
fi

# Reject empty values: an empty SAVE_PATH would silently target "/<model>/...".
SAVE_PATH=${1:?SAVE_PATH must not be empty}
MODEL_NAME=${2:?MODEL_NAME must not be empty}

TEST_DATASET_NAME="CardinalOperations/BWOR"
TEST_DATASET_SPLIT="train"

Q2MC_OUTPUT_DIR="$SAVE_PATH/$MODEL_NAME/eval.BWOR.pass1"

# Step 1: generation. All expansions are quoted so paths or model names that
# contain spaces or glob characters are passed as single arguments.
python -m eval.generate_openai \
    --openai_model "$MODEL_NAME" \
    --dataset_name "$TEST_DATASET_NAME" \
    --dataset_split "$TEST_DATASET_SPLIT" \
    --save_dir "$Q2MC_OUTPUT_DIR" \
    --verbose

# Step 2: execution over the generated file. Reached only if step 1 succeeded.
python -m eval.execute \
    --input_file "$Q2MC_OUTPUT_DIR/generated.jsonl" \
    --output_file "$Q2MC_OUTPUT_DIR/executed.jsonl" \
    --question_field en_question \
    --answer_field en_answer \
    --timeout 600 \
    --max_workers 16 \
    --verbose
