#!/bin/bash

export NUM_GPUS=1
export PYTHONPATH=./:$PYTHONPATH

# Load config saving functions
source scripts/save_config.sh

START_TIME=`date +%Y%m%d-%H:%M:%S`

if [[ -v PARTITION ]]; then
    echo "Submit to $PARTITION"
fi

TASK_NAME=cook_ramen_noodles__with_rug
SCENE_NAME=Wainscott_0_int
MODEL_NAME=gpt-4o
PROMPT_SETTING=baseline # baseline, baseline_feedback, baseline_safe, baseline_safe_feedback
WORK_DIR=./results/$MODEL_NAME/$PROMPT_SETTING/$TASK_NAME/$SCENE_NAME/$START_TIME

mkdir -p $WORK_DIR/logs
LOG_FILE=$WORK_DIR/logs/exec_$START_TIME.log

GUARDRAIL_MODEL=qwen/qwen3-vl-30b-a3b-instruct # ['gpt-5.1', 'qwen/qwen3-vl-30b-a3b-instruct']
GUARDRAIL_TYPE=openrouter # ['gpt', 'openrouter', 'claude', 'gemini']
ENABLE_GUARDRAIL=false # true or false 

# Save configuration using the reusable function
save_benchmark_config "$WORK_DIR" "$MODEL_NAME" "$PROMPT_SETTING" "$GUARDRAIL_MODEL" "$GUARDRAIL_TYPE" "$ENABLE_GUARDRAIL" "1" "$TASK_NAME" "$START_TIME" "eval_close_one.sh"


python -m og_ego_prim.cli.online_benchmark_once \
    --task $TASK_NAME \
    --scene $SCENE_NAME \
    --work_dir $WORK_DIR \
    --model $MODEL_NAME \
    --prompt_setting $PROMPT_SETTING \
    --guardrail_model $GUARDRAIL_MODEL \
    --guardrail_type $GUARDRAIL_TYPE \
    --enable_guardrail $ENABLE_GUARDRAIL \
    2>&1 | tee -a "$LOG_FILE" > /dev/null &

PYTHON_PID=$!
sleep 0.5s
tail -f $LOG_FILE &
TAIL_PID=$!

# Wait for Python process to complete
wait $PYTHON_PID
PYTHON_EXIT_CODE=$?

# Kill tail process
kill $TAIL_PID 2>/dev/null

exit $PYTHON_EXIT_CODE
