#!/bin/bash

# Extract missing tasks from CSV file
# Usage: 
#   bash entrypoints/extract_missing_tasks.sh
#   bash entrypoints/extract_missing_tasks.sh --work_dir ./results/gpt-4o/baseline/20260111-11:27:54 --mode both

export PYTHONPATH=./:$PYTHONPATH

# Default configuration
WORK_DIR=${WORK_DIR:-"/IS-Bench/results/gpt-4o/baseline_safe_feedback/20260112-08:12:55"}
TASK_LIST=${TASK_LIST:-"entrypoints/task_list.txt"}
OUTPUT_TASK_LIST=${OUTPUT_TASK_LIST:-"entrypoints/task_list_missing_0812.txt"}
MODE=${MODE:-"both"}  # missing, report_missing, or both

# Parse command line arguments
while [[ $# -gt 0 ]]; do
    case $1 in
        --work_dir)
            WORK_DIR="$2"
            shift 2
            ;;
        --task_list)
            TASK_LIST="$2"
            shift 2
            ;;
        --output)
            OUTPUT_TASK_LIST="$2"
            shift 2
            ;;
        --mode)
            MODE="$2"
            shift 2
            ;;
        *)
            echo "Unknown option: $1"
            echo "Usage: $0 [--work_dir DIR] [--task_list FILE] [--output FILE] [--mode MODE]"
            echo "  --work_dir: Work directory containing task_results.csv (default: $WORK_DIR)"
            echo "  --task_list: Original task_list.txt file (default: $TASK_LIST)"
            echo "  --output: Output task_list file (default: $OUTPUT_TASK_LIST)"
            echo "  --mode: Extraction mode - missing, report_missing, or both (default: $MODE)"
            exit 1
            ;;
    esac
done

# Auto-detect CSV file
CSV_FILE=$WORK_DIR/task_results.csv

# Check if CSV file exists
if [ ! -f "$CSV_FILE" ]; then
    echo "Error: CSV file not found: $CSV_FILE"
    echo "Please check WORK_DIR: $WORK_DIR"
    exit 1
fi

# Check if task_list exists
if [ ! -f "$TASK_LIST" ]; then
    echo "Error: Task list file not found: $TASK_LIST"
    exit 1
fi

echo "=== Extract Missing Tasks ==="
echo "Work directory: $WORK_DIR"
echo "CSV file: $CSV_FILE"
echo "Original task list: $TASK_LIST"
echo "Output task list: $OUTPUT_TASK_LIST"
echo "Mode: $MODE"
echo ""

# Run Python script
python extract_missing_tasks.py \
    --task_list "$TASK_LIST" \
    --csv "$CSV_FILE" \
    --output "$OUTPUT_TASK_LIST" \
    --mode "$MODE"

EXIT_CODE=$?

if [ $EXIT_CODE -eq 0 ]; then
    echo ""
    echo "Success! Missing tasks extracted to: $OUTPUT_TASK_LIST"
    
    # Count lines in output file
    if [ -f "$OUTPUT_TASK_LIST" ]; then
        LINE_COUNT=$(wc -l < "$OUTPUT_TASK_LIST" | tr -d ' ')
        echo "Found $LINE_COUNT tasks to re-run"
    fi
    
    echo ""
    echo "To re-run these tasks:"
    echo "  1. Update task_list.txt: cp $OUTPUT_TASK_LIST $TASK_LIST"
    echo "  2. Run benchmark: bash entrypoints/eval_close.sh"
else
    echo ""
    echo "Error: Failed to extract missing tasks (exit code: $EXIT_CODE)"
    exit $EXIT_CODE
fi






