#!/bin/bash

# ---------------------------------------------------------------------------
# Experiment configuration
# ---------------------------------------------------------------------------

# Comma-separated list of answer models; forwarded as --answer_models.
ANSWER_MODELS='gpt-4o-2024-08-06,us.anthropic.claude-3-5-sonnet-20240620-v1:0,gemini-1.5-pro-002,gpt-4o-mini'

# Comma-separated temperatures; forwarded as --answer_temperatures.
# Presumably one entry per model in ANSWER_MODELS (verify against the runner);
# the original note indicates a single value such as "0.6" may be used instead.
TEMPERATURE='0.6,0.6,0.6,0.6'

# Forwarded as --num_simulations.
NUM_SIMULATIONS=16

# Dataset split; forwarded as --split to both the run and evaluate scripts.
SPLIT='testmini'

# Forwarded as --mcts_algo.
MCTS_ALGO='mab-ucb'

# Experiment name shared by the run and evaluate steps. It embeds the model
# list, the algorithm name and the simulation count.
printf -v EXPERIMENT_NAME 'debug_%s_%s_nsim%s' \
    "${ANSWER_MODELS}" "${MCTS_ALGO}" "${NUM_SIMULATIONS}"

# ---------------------------------------------------------------------------
# Step 1: run the experiment (scripts/math_vista/run_math_vista.py) and report
# how long it took.
#
# All expansions are quoted so each value reaches python as exactly one
# argument, with no word splitting or globbing. The exit status is captured so
# a failed run is reported and stops the script instead of silently continuing
# to the evaluation step.
# ---------------------------------------------------------------------------
start_time=$(date +%s)
run_status=0
python scripts/math_vista/run_math_vista.py \
    --experiment_name "$EXPERIMENT_NAME" \
    --idx 0 \
    --split "$SPLIT" \
    --answer_models "$ANSWER_MODELS" \
    --answer_temperatures "$TEMPERATURE" \
    --mcts_algo "$MCTS_ALGO" \
    --num_simulations "$NUM_SIMULATIONS" || run_status=$?
end_time=$(date +%s)

# Convert whole seconds to minutes with two decimals (truncated), using only
# shell arithmetic so the script does not depend on `bc` being installed.
elapsed_seconds=$((end_time - start_time))
printf -v elapsed_time '%d.%02d' \
    "$((elapsed_seconds / 60))" "$((elapsed_seconds % 60 * 100 / 60))"
echo "Elapsed time (run): $elapsed_time minutes"

# Do not go on to later steps when the run itself failed.
if ((run_status != 0)); then
    echo "run_math_vista.py failed with exit status $run_status" >&2
    exit "$run_status"
fi

# ---------------------------------------------------------------------------
# Step 2: evaluate the experiment (scripts/math_vista/evaluate_math_vista.py)
# and report how long it took.
#
# Expansions are quoted so each value reaches python as exactly one argument.
# The evaluator's exit status is captured and propagated; otherwise the
# trailing `echo` would make the script report success even when evaluation
# failed.
# ---------------------------------------------------------------------------
start_time=$(date +%s)
eval_status=0
python scripts/math_vista/evaluate_math_vista.py \
    --experiment_name "$EXPERIMENT_NAME" \
    --idx 0 \
    --split "$SPLIT" || eval_status=$?
end_time=$(date +%s)

# Convert whole seconds to minutes with two decimals (truncated), using only
# shell arithmetic so the script does not depend on `bc` being installed.
elapsed_seconds=$((end_time - start_time))
printf -v elapsed_time '%d.%02d' \
    "$((elapsed_seconds / 60))" "$((elapsed_seconds % 60 * 100 / 60))"
echo "Elapsed time (evaluate): $elapsed_time minutes"

# Surface an evaluation failure to the caller.
if ((eval_status != 0)); then
    echo "evaluate_math_vista.py failed with exit status $eval_status" >&2
    exit "$eval_status"
fi
