#!/bin/bash

export NUM_GPUS=1
export PYTHONPATH=./:$PYTHONPATH

# Load config saving functions
source scripts/save_config.sh

START_TIME=`date +%Y%m%d-%H:%M:%S`

if [[ -v PARTITION ]]; then
    echo "Submit to $PARTITION"
fi

MODEL_NAME=gpt-4o #google/gemma-3-4b-it, gpt-5.1, google/gemini-2.5-pro
DATA_PARALLEL=2
PROMPT_SETTING=baseline # baseline, baseline_feedback, baseline_safe, baseline_safe_feedback
WORK_DIR=./results/$MODEL_NAME/$PROMPT_SETTING/$START_TIME

mkdir -p $WORK_DIR/logs
LOG_FILE=$WORK_DIR/logs/exec_$START_TIME.log

GUARDRAIL_MODEL=qwen/qwen3-vl-30b-a3b-instruct # ['gpt-5.1', 'qwen/qwen3-vl-30b-a3b-instruct', 'EMBGuard/EMBGuard-4B', 'EMBGuard/EMBGuard-8B']
GUARDRAIL_TYPE=openrouter # ['gpt', 'openrouter', 'claude', 'gemini', 'vllm']
ENABLE_GUARDRAIL=false # true or false (force enable guardrail for baseline/baseline_safe)
# Guardrail is not used if enable_guardrail=false or guardrail_model is not set

# Save configuration using the reusable function
save_benchmark_config "$WORK_DIR" "$MODEL_NAME" "$PROMPT_SETTING" "$GUARDRAIL_MODEL" "$GUARDRAIL_TYPE" "$ENABLE_GUARDRAIL" "$DATA_PARALLEL" "entrypoints/task_list_missing_0812.txt" "$START_TIME" "eval_close.sh"


python -m og_ego_prim.cli.online_benchmark_all \
    --data_parallel $DATA_PARALLEL \
    --task_list entrypoints/task_list.txt \
    --work_dir $WORK_DIR \
    --model $MODEL_NAME \
    --prompt_setting $PROMPT_SETTING \
    --guardrail_model $GUARDRAIL_MODEL \
    --guardrail_type $GUARDRAIL_TYPE \
    --enable_guardrail $ENABLE_GUARDRAIL \
    2>&1 | tee -a "$LOG_FILE" > /dev/null & 

PYTHON_PID=$!
sleep 0.5s
tail -f $LOG_FILE &
TAIL_PID=$!

# Wait for Python process to complete
wait $PYTHON_PID
PYTHON_EXIT_CODE=$?

# Kill tail process
kill $TAIL_PID 2>/dev/null

exit $PYTHON_EXIT_CODE

