#!/usr/bin/env python3
"""
CSV PID and Prompt Extractor for Judge Agent

This script reads CSV files and extracts PID values and prompts from them.
It can be used to generate a list of PIDs and prompts for further processing.
It can also execute commands with the extracted PIDs and prompts.

Usage:
    python run_judge_agent.py <csv_file> [--filter <filter_expression>]
    python run_judge_agent.py <csv_file> [--custom-prompt "Your custom prompt here"]
    python run_judge_agent.py <csv_file> [--execute] [--workspace-base <workspace_path>]

Examples:
    python run_judge_agent.py /path/to/file.csv
    python run_judge_agent.py /path/to/file.csv --filter "pid > 50 and pid < 100"
    python run_judge_agent.py /path/to/file.csv --custom-prompt "Judge the code quality for X"
    python run_judge_agent.py /path/to/file.csv --execute --workspace-base "responses/GPT_41_Judge/t2c_l1/{pid}"
"""

import argparse
import csv
import os
import sys
import subprocess
import pandas as pd

def extract_pids_and_prompts_from_csv(csv_file, filter_expr=None, custom_prompt=None):
    """
    Extract PIDs and prompts from a CSV file.

    Args:
        csv_file (str): Path to the CSV file
        filter_expr (str, optional): Python expression to filter PIDs
        custom_prompt (str, optional): Custom prompt to use instead of CSV prompts

    Returns:
        tuple: (List of PIDs that match the criteria, Dictionary of PID to prompts)
    """
    try:
        pids = []
        prompts = {}
        try:
            df = pd.read_csv(csv_file)
            if 'pid' not in df.columns:
                print(f"Error: CSV file '{csv_file}' does not contain a 'pid' column.")
                return [], {}
            pids = df['pid'].tolist()
            if not custom_prompt and 'prompt' in df.columns:
                for i, row in df.iterrows():
                    pid_key = str(row['pid'])
                    prompts[pid_key] = row['prompt']
        except ImportError:
            with open(csv_file, 'r') as f:
                reader = csv.DictReader(f)
                if 'pid' not in reader.fieldnames:
                    print(f"Error: CSV file '{csv_file}' does not contain a 'pid' column.")
                    return [], {}
                for row in reader:
                    pid = row['pid']
                    pids.append(pid)
                    if not custom_prompt and 'prompt' in reader.fieldnames:
                        prompts[pid] = row['prompt']
        pids = [int(pid) if str(pid).isdigit() else pid for pid in pids]
        if filter_expr:
            filtered_pids = []
            for pid in pids:
                try:
                    if eval(filter_expr, {"pid": pid}):
                        filtered_pids.append(pid)
                except Exception as e:
                    print(f"Error evaluating filter expression for PID {pid}: {e}")
            pids = filtered_pids
        if custom_prompt:
            prompts = {str(pid): custom_prompt for pid in pids}
        else:
            for pid in pids:
                pid_key = str(pid)
                if pid_key not in prompts:
                    prompts[pid_key] = "No prompt available"
        return pids, prompts
    except Exception as e:
        print(f"Error reading CSV file '{csv_file}': {e}")
        return [], {}

def execute_command_with_pid_prompt(pid, prompt, workspace_base=None, dry_run=False):
    """
    Execute a command with the given PID and prompt.
    """
    env = os.environ.copy()
    if workspace_base:
        workspace_path = workspace_base.format(pid=pid)
        env["WORKSPACE_BASE"] = workspace_path
        print(f"Setting WORKSPACE_BASE to: {workspace_path}")
    command = f'poetry run python ./openhands/core/main.py -t "{prompt}" -n "judge_{pid}" --config-file config_judge.toml -i 1000'
    if dry_run:
        print(f"Would execute: {command}")
        print(f"With environment: WORKSPACE_BASE={env.get('WORKSPACE_BASE', 'Not set')}")
        return 0
    print(f"Executing command for PID {pid}:")
    print(f"  {command}")
    try:
        result = subprocess.run(command, shell=True, env=env, check=False)
        if result.returncode == 0:
            print(f"Command for PID {pid} completed successfully")
        else:
            print(f"Command for PID {pid} failed with return code {result.returncode}")
        return result.returncode
    except Exception as e:
        print(f"Error executing command for PID {pid}: {e}")
        return 1

def generate_bash_array(pids):
    """
    Generate a Bash array declaration with the PIDs.
    """
    pid_strings = [str(pid) for pid in pids]
    return f"SPECIFIC_PIDS=({' '.join(pid_strings)})"

def get_global_custom_prompt(pid):
    """
    Returns the global custom prompt, formatted with the given pid if needed.
    """
    JSON_FILE_NAME = "judge_output.json"
    return (
        f"You are a code judge. Evaluate the code in the workspace. You need to provide verdict and reasoning on **three** aspects. "
        f"Always provide answer in **yes/no/unclear** format, and then provide a reasoning. Finally, update the provided json file {JSON_FILE_NAME} with \"pid\": {pid}, verdict and reasoning. After that, save the json file. "
        f"First, check if the code is parseable. Give a verdict, reasoning, and store them under the key 'parseability' in the JSON file. "
        f"Second, check if the code is executable without any syntax errors. Give a verdict, reasoning, and store them under the key 'syntax_error_free' in the JSON file. "
        f"Third, check if the code is executable without any runtime errors. Give a verdict, reasoning, and store them under the key 'runtime_error_free' in the JSON file. "
        f"If the workspace does not exist, or is empty, respond with 'unclear' verdict and reason that the workspace is missing or empty for all three aspects. "
    )

def main():
    parser = argparse.ArgumentParser(description="Extract PIDs and prompts from a CSV file for Judge Agent")
    parser.add_argument("csv_file", help="Path to the CSV file")
    parser.add_argument("--filter", "-f", help="Python expression to filter PIDs (e.g., 'pid > 50')")
    parser.add_argument("--bash-array", "-b", action="store_true", help="Generate a Bash array declaration")
    parser.add_argument("--custom-prompt", "-c", default=None, help="Custom prompt to use instead of CSV prompts")
    parser.add_argument("--include-prompts", "-p", action="store_true", help="Include prompts in the output")
    parser.add_argument("--execute", "-e", action="store_true", help="Execute command with PID and prompt")
    parser.add_argument("--workspace-base", "-w", help="Base directory for workspace, use {pid} as placeholder")
    parser.add_argument("--dry-run", "-d", action="store_true", help="Print commands without executing them")
    args = parser.parse_args()

    # Use CLI custom prompt if provided, else use global (with pid if available)
    custom_prompt = args.custom_prompt if args.custom_prompt is not None else None

    if not os.path.exists(args.csv_file):
        print(f"Error: CSV file '{args.csv_file}' not found!")
        return 1
    # Extract PIDs first (use a dummy prompt for now)
    pids, _ = extract_pids_and_prompts_from_csv(args.csv_file, args.filter, None)
    if not pids:
        print("No PIDs were extracted or matched the filter criteria.")
        return 1
    # Now, build prompts dict using either CLI or global function per pid
    if custom_prompt is not None:
        prompts = {str(pid): custom_prompt for pid in pids}
    else:
        prompts = {str(pid): get_global_custom_prompt(pid) for pid in pids}
    if args.execute:
        success_count = 0
        fail_count = 0
        print(f"Executing commands for {len(pids)} PIDs...")
        for pid in pids:
            pid_str = str(pid)
            prompt = prompts.get(pid_str, "")
            if not prompt and not args.custom_prompt:
                print(f"Skipping PID {pid}: No prompt available")
                continue
            if args.custom_prompt:
                prompt = args.custom_prompt
            else:
                prompt = get_global_custom_prompt(pid)
            result = execute_command_with_pid_prompt(
                pid,
                prompt,
                workspace_base=args.workspace_base,
                dry_run=args.dry_run
            )
            if result == 0:
                success_count += 1
            else:
                fail_count += 1
        print(f"Command execution summary: {success_count} succeeded, {fail_count} failed")
    elif args.bash_array:
        print(generate_bash_array(pids))
    elif args.include_prompts:
        print(f"Extracted {len(pids)} PIDs with prompts:")
        for pid in pids:
            pid_str = str(pid)
            if args.custom_prompt:
                prompt = args.custom_prompt
            else:
                prompt = get_global_custom_prompt(pid)
            print(f"PID: {pid}")
            print(f"Prompt: {prompt}")
            print("-" * 50)
    else:
        print(f"Extracted {len(pids)} PIDs:")
        for pid in pids:
            print(pid)
    return 0

if __name__ == "__main__":
    sys.exit(main())
