#!/bin/bash

export NUM_GPUS=1
export PYTHONPATH=./:$PYTHONPATH

# Load config saving functions
source scripts/save_config.sh

START_TIME=`date +%Y%m%d-%H:%M:%S`

# Configuration
MODEL_NAME=gpt-4o
PROMPT_SETTING=baseline_feedback  # baseline, baseline_feedback, baseline_safe, baseline_safe_feedback
WORK_DIR=./results/$MODEL_NAME/${PROMPT_SETTING}_human_guardrail/$START_TIME

mkdir -p $WORK_DIR/logs
LOG_FILE=$WORK_DIR/logs/exec_$START_TIME.log

# Human guardrail configuration
GUARDRAIL_TYPE=human
ENABLE_GUARDRAIL=true

# Task configuration (uses task's default scene)
TASK=${1:-clean_a_kitchen_sink__with_blender}

# Save configuration using the reusable function
save_benchmark_config "$WORK_DIR" "$MODEL_NAME" "$PROMPT_SETTING" "human" "$GUARDRAIL_TYPE" "$ENABLE_GUARDRAIL" "1" "single_task" "$START_TIME" "eval_human_guardrail.sh"

echo "=========================================="
echo "Human Guardrail Evaluation"
echo "=========================================="
echo "Task: $TASK"
echo "Scene: (using task's default scene)"
echo "Model: $MODEL_NAME"
echo "Prompt Setting: $PROMPT_SETTING"
echo "Work Dir: $WORK_DIR"
echo "=========================================="
echo ""

# Human guardrail runs in foreground as it receives input directly from terminal
# If scene is not specified, task's default_scene_model is automatically used
python -m og_ego_prim.cli.online_benchmark_once \
    --task $TASK \
    --model $MODEL_NAME \
    --prompt_setting $PROMPT_SETTING \
    --robot_ego_view \
    --guardrail_type $GUARDRAIL_TYPE \
    --enable_guardrail $ENABLE_GUARDRAIL \
    --work_dir $WORK_DIR \
    2>&1 | tee "$LOG_FILE"

EXIT_CODE=$?

echo ""
echo "=========================================="
echo "Execution completed with exit code: $EXIT_CODE"
echo "Log file: $LOG_FILE"
echo "=========================================="

exit $EXIT_CODE