#!/bin/bash
# Run all ablation experiments for given agent output(s)
# Supports multiple agent traces - evaluated one by one
#
# Usage:
#   # Single trace
#   ./run_all_ablations.sh --agent_output /path/to/gen_res.json --output_base /path/to/output
#
#   # Multiple traces (comma-separated)
#   ./run_all_ablations.sh --agent_outputs "/path/to/trace1.json,/path/to/trace2.json" --output_base /path/to/output
#
#   # All traces in a directory
#   ./run_all_ablations.sh --agent_output_dir /path/to/evaluation_results --output_base /path/to/output

# Default values
TIMESTAMP=$(date +"%m%d_%H%M%S")
DATA_PATH=""
MODEL_NAME=""
NUM_WORKERS=128
DAFNY_WORKERS=128

# Single trace (backward compatible)
AGENT_OUTPUT=""
# Multiple traces
AGENT_OUTPUTS=""
# Directory containing traces
AGENT_OUTPUT_DIR=""
# Output base directory
OUTPUT_BASE=""

# Which ablations to run (default: all)
RUN_DAFNY=1
RUN_PYTHON=1
RUN_NL=1
RUN_DIRECT_JUDGE=1
RUN_COT=1
RUN_FEWSHOT=1

# Build list of agent outputs to process
TRACE_FILES=(
)

# Change to repo root directory
cd "$(dirname "$0")/../.."
Kill any active Ray processes first
echo "Checking for active Ray processes..."
if command -v ray &> /dev/null; then
    # Try graceful shutdown first
    ray stop --force 2>/dev/null || true
    # Kill any remaining Ray processes
    pkill -f "ray.*gcs_server" 2>/dev/null || true
    pkill -f "ray.*raylet" 2>/dev/null || true
    pkill -f "ray.*dashboard" 2>/dev/null || true
    sleep 1
fi


# Generate unique timestamped cache directory for Ray
RAY_TMPDIR="~/cache/ray_${TIMESTAMP}"
mkdir -p "$RAY_TMPDIR"
export RAY_TMPDIR

echo "========================================"
echo "Running ablation experiments"
echo "Timestamp: $TIMESTAMP"
echo "Model: $MODEL_NAME"
echo "Workers: $NUM_WORKERS (Dafny: $DAFNY_WORKERS)"
echo "Ray cache: $RAY_TMPDIR"
echo "Output base: $OUTPUT_BASE"
echo ""
echo "Traces to process: ${#TRACE_FILES[@]}"
for trace in "${TRACE_FILES[@]}"; do
    echo "  - $trace"
done
echo ""
echo "Ablations enabled:"
[ $RUN_DAFNY -eq 1 ] && echo "  - Dafny"
[ $RUN_PYTHON -eq 1 ] && echo "  - Python"
[ $RUN_NL -eq 1 ] && echo "  - Natural Language"
[ $RUN_DIRECT_JUDGE -eq 1 ] && echo "  - Direct Judge"
echo "========================================"

# Function to get trace name from path
get_trace_name() {
    local path="$1"
    # Extract the parent directory name (e.g., "tot-gpt4o" from ".../tot-gpt4o/gen_res.json")
    local parent_dir=$(dirname "$path")
    local name=$(basename "$parent_dir")
    echo "$name"
}

# Function to run ablations for a single trace
run_ablations_for_trace() {
    local trace_file="$1"
    local trace_name="$2"
    local trace_output_base="${OUTPUT_BASE}/${trace_name}"

    echo ""
    echo "########################################"
    echo "Processing trace: $trace_name"
    echo "Input: $trace_file"
    echo "Output: $trace_output_base"
    echo "########################################"

    Run Dafny verification
    if [ $RUN_DAFNY -eq 1 ]; then
        echo ""
        echo "========== [$trace_name] DAFNY VERIFICATION =========="
        python formal_verification/run_verification.py \
            --data_path "$DATA_PATH" \
            --agent_output "$trace_file" \
            --output_dir "${trace_output_base}_dafny_${TIMESTAMP}" \
            --language dafny \
            --model_name "$MODEL_NAME" \
            --num_workers "$NUM_WORKERS" \
            --dafny_workers "$DAFNY_WORKERS" 
    fi

    if [ $RUN_COT -eq 1 ]; then
        echo ""
        echo "========== [$trace_name] COT VERIFICATION =========="
        python formal_verification/run_verification.py \
            --data_path "$DATA_PATH" \
            --agent_output "$trace_file" \
            --output_dir "${trace_output_base}_llm_cot_${TIMESTAMP}" \
            --language llm_cot \
            --model_name "$MODEL_NAME" \
            --num_workers "$NUM_WORKERS"
    fi

    if [ $RUN_FEWSHOT -eq 1 ]; then
        echo ""
        echo "========== [$trace_name] FEWSHOT VERIFICATION =========="
        python formal_verification/run_verification.py \
            --data_path "$DATA_PATH" \
            --agent_output "$trace_file" \
            --output_dir "${trace_output_base}_llm_fewshot_${TIMESTAMP}" \
            --language llm_fewshot \
            --model_name "$MODEL_NAME" \
            --num_workers "$NUM_WORKERS"
    fi


    # Run Python verification
    if [ $RUN_PYTHON -eq 1 ]; then
        echo ""
        echo "========== [$trace_name] PYTHON VERIFICATION =========="
        python formal_verification/run_verification.py \
            --data_path "$DATA_PATH" \
            --agent_output "$trace_file" \
            --output_dir "${trace_output_base}_python_${TIMESTAMP}" \
            --language python \
            --model_name "$MODEL_NAME" \
            --num_workers "$NUM_WORKERS"
    fi

    # Run Natural Language verification
    if [ $RUN_NL -eq 1 ]; then
        echo ""
        echo "========== [$trace_name] NATURAL LANGUAGE VERIFICATION =========="
        python formal_verification/run_verification.py \
            --data_path "$DATA_PATH" \
            --agent_output "$trace_file" \
            --output_dir "${trace_output_base}_nl_${TIMESTAMP}" \
            --language natural_language \
            --model_name "$MODEL_NAME" \
            --num_workers "$NUM_WORKERS" 
    fi

    # Run Direct Judge
    if [ $RUN_DIRECT_JUDGE -eq 1 ]; then
        echo ""
        echo "========== [$trace_name] DIRECT JUDGE =========="
        python formal_verification/run_direct_judge.py \
            --data_path "$DATA_PATH" \
            --agent_output "$trace_file" \
            --output_path "${trace_output_base}_direct_judge_${TIMESTAMP}" \
            --model_name "$MODEL_NAME" \
            --num_workers "$NUM_WORKERS"
    fi

    echo ""
    echo "Completed ablations for: $trace_name"
    
}

# Process each trace
for trace_file in "${TRACE_FILES[@]}"; do
    if [ ! -f "$trace_file" ]; then
        echo "Warning: Trace file not found: $trace_file (skipping)"
        continue
    fi

    trace_name=$(get_trace_name "$trace_file")
    run_ablations_for_trace "$trace_file" "$trace_name"
done

echo ""
echo "========================================"
echo "All ablation experiments completed!"
echo "Results saved to: $OUTPUT_BASE"
echo "========================================"
