#!/bin/bash
set -euo pipefail

# Pilot-study runner: for each TASK(SCENE) run the benchmark with prompt settings v4 and v8

export NUM_GPUS=1
export PYTHONPATH=./:$PYTHONPATH

mkdir -p logs

if [ -f "entrypoints/env.sh" ]; then
    source entrypoints/env.sh
fi

echo "Starting pilot study runs"

# list of TASK::SCENE pairs
TASKS=(
  "boil_water_in_the_microwave__with_water_glass::Pomaria_1_int"
  "clean_a_box_fan__toggled_on::grocery_store_asian"
  "clean_a_coffee_maker::Pomaria_1_int"
  # "cook_a_potato__with_aluminum_foil::Wainscott_0_garden"
  "cook_a_potato__with_bottle__of__alcohol::Wainscott_0_garden"
  "cook_soup_and_put_inside_refrigerator::Wainscott_0_int"
  "moving_electric_fan_on_coffee_table::Rs_int"
  "place_bottle__of__vinegar_inside_cabinet::Wainscott_1_int"
  "pour_tea__with_power_strip::Wainscott_0_int"
  "put_food_in_bowl__with_dirt::Pomaria_1_int"
  "reheat_frozen_or_chilled_food::Benevolence_1_int"
  "remove_hard_water_spots::restaurant_diner"
  "cook_ramen_noodles__with_rug::Wainscott_0_int"
  "store_a_baseball::Rs_int"
  "store_cleaner_in_cabinet__with__bag__of__rice::Beechwood_0_garden"
  "roast_nuts::Benevolence_1_int"
  "removing_lint_from_dryer::Beechwood_0_garden"
)

MODEL_NAME_OR_PATH="gpt-4o"
# retry count and extension-marker timeout
MAX_RETRIES=${PILOT_MAX_RETRIES:-0}
EXT_TIMEOUT_SECS=${PILOT_EXT_TIMEOUT:-60} # when "Extension modules:" appears, wait this long (seconds) then abort

for pair in "${TASKS[@]}"; do
    TASK_NAME="${pair%%::*}"
    SCENE_NAME="${pair##*::}"

    for PROMPT in v4 v8; do
        echo "=============================================="
        echo "Running task=$TASK_NAME scene=$SCENE_NAME prompt=$PROMPT"
        echo "=============================================="

        # reset launcher (launcher.sh defines LAUNCHER=())
        if [ -f "entrypoints/launcher.sh" ]; then
            source entrypoints/launcher.sh
        else
            LAUNCHER=()
        fi

        START_TIME=$(date +%Y%m%d-%H:%M:%S)
        SAFE_TASK_NAME=$(echo "$TASK_NAME" | sed 's/[^a-zA-Z0-9._-]/_/g')
        LOG_FILE=logs/${SAFE_TASK_NAME}__${SCENE_NAME}__${PROMPT}__${START_TIME}.log

        LAUNCHER+=(
            "python" "-m" "og_ego_prim.cli.online_benchmark_once"
            "--task" "$TASK_NAME"
            "--scene" "$SCENE_NAME"
            "--model" "$MODEL_NAME_OR_PATH"
            "--draw_bbox_2d"
            "--prompt_setting" "$PROMPT"
            "--robot_ego_view"
        )

        # run synchronously and capture output to log, with timeout and retries
        echo "Command: ${LAUNCHER[*]}"

        attempt=0
        exit_code=0
        skip_retries=0
        while [ $attempt -le $MAX_RETRIES ]; do
            attempt=$((attempt+1))
            echo "Attempt $attempt/$((MAX_RETRIES+1))"
            # ensure no leftover markers
            rm -f "$LOG_FILE.ext_killed"

            # start the command in background (pipeline) so we can monitor the log
            ( "${LAUNCHER[@]}" 2>&1 | tee -a "$LOG_FILE" ) &
            cmd_pid=$!

            # monitor the log for the 'Extension modules:' marker and start an ext-timeout when seen
            (
                while true; do
                    # if process ended, stop monitoring
                    if ! ps -p "$cmd_pid" > /dev/null 2>&1; then
                        break
                    fi
                    if grep -q "Extension modules:" "$LOG_FILE" 2>/dev/null; then
                        echo "[pilot-study] Detected 'Extension modules:' in log; starting ext-timeout ${EXT_TIMEOUT_SECS}s" | tee -a "$LOG_FILE"
                        sleep ${EXT_TIMEOUT_SECS}
                        # if process still running after ext timeout, kill it and mark
                        if ps -p "$cmd_pid" > /dev/null 2>&1; then
                            echo "[pilot-study] Extension timeout reached; killing run" | tee -a "$LOG_FILE"
                            pkill -f "og_ego_prim.cli.online_benchmark_once" || true
                            pkill -f "og_ego_prim" || true
                            kill "$cmd_pid" 2>/dev/null || true
                            touch "$LOG_FILE.ext_killed"
                        fi
                        break
                    fi
                    sleep 1
                done
            ) &
            monitor_pid=$!

            # wait for command to finish
            wait "$cmd_pid" 2>/dev/null || true
            exit_code=$?

            # stop monitor if still running
            if ps -p "$monitor_pid" > /dev/null 2>&1; then
                kill "$monitor_pid" 2>/dev/null || true
            fi

            # if ext marker exists, mark to skip retries
            if [ -f "$LOG_FILE.ext_killed" ]; then
                skip_retries=1
            fi

            if [ $exit_code -eq 0 ]; then
                echo "Finished task=$TASK_NAME prompt=$PROMPT (log: $LOG_FILE)"
                break
            else
                echo "Run exited with code $exit_code. Cleaning up and retrying..." | tee -a "$LOG_FILE"
                # Try to kill any lingering simulator/python processes spawned by the run
                pkill -f "og_ego_prim.cli.online_benchmark_once" || true
                pkill -f "og_ego_prim" || true
                sleep 5
            fi
        done

        if [ $exit_code -ne 0 ]; then
            echo "Task $TASK_NAME prompt=$PROMPT FAILED after $attempt attempts (exit $exit_code). See $LOG_FILE" | tee -a "$LOG_FILE"
        fi

        # small pause between runs
        sleep 2
    done
done

echo "Pilot study finished"
