#!/usr/bin/env bash
# Run configuration for src/eval/eval_gpt.py.
# Pick exactly one value per setting by (un)commenting the lines below.

# Strict mode: abort on a failing command, on use of an unset variable
# (catches typos in the names below), and on a failure inside a pipeline.
set -euo pipefail
# Trace each command so the exact invocation is visible in the run log.
set -x

# Model identifier passed to --model_name.
# MODEL_NAME=gpt-4o
# MODEL_NAME=gpt-4o-mini
MODEL_NAME=o1


# Dataset passed to --dataset.
# DATASET=wikitq
# DATASET=tabfact
# DATASET=finqa
# DATASET=hitab
DATASET=multihiertt
# DATASET=aitqa
# DATASET=tablebench


# Task passed to --task.
TASK=formula
# TASK=text

# Passed verbatim as the string value of --with_reasoning.
WITH_REASONING=True



# single eval: run the evaluator once for the model/task/dataset selected above.
# Every expansion is double-quoted so each value reaches the script as exactly
# one argument (no word-splitting or glob expansion).
# NOTE(review): --with_reasoning receives the literal string in
# $WITH_REASONING; confirm eval_gpt.py converts it to a boolean as intended.
python src/eval/eval_gpt.py \
    --model_name "$MODEL_NAME" \
    --task "$TASK" \
    --dataset "$DATASET" \
    --with_reasoning "$WITH_REASONING"



# loop eval (disabled): uncomment the block below to run every dataset/task combination for MODEL_NAME
# DATASET_LIST="wikitq tabfact finqa hitab multihiertt aitqa tablebench"
# TASK_LIST="text formula"


# for DATASET in $DATASET_LIST; do
#     for TASK in $TASK_LIST; do
#         echo ">>> model=${MODEL_NAME}  dataset=${DATASET}  task=${TASK}"
#         python src/eval/eval_gpt.py \
#         --model_name "$MODEL_NAME" \
#         --task "$TASK" \
#         --dataset "$DATASET" \
#         --with_reasoning "$WITH_REASONING"
#     done
# done