from flask import Flask, render_template, jsonify, request, redirect, url_for
import requests
import json
import sqlite3
from datetime import datetime, timezone, timedelta
import os
import uuid
import subprocess
import threading
import shlex
import requests as req
import sys
from dotenv import load_dotenv
import psutil
import random
import time
import docker

# Load .env file
load_dotenv()

app = Flask(__name__)

# MCP server configuration
MCP_SERVER_URL = "http://127.0.0.1:8000"

# CTF server configuration (from environment variables)
CTFD_BASE_URL = os.getenv('CTFD_BASE_URL', 'http://143.248.159.172:4000')
print(f"[{datetime.now()}] CTF Server URL: {CTFD_BASE_URL}")

# Database configuration
DATABASE = 'problems.db'

# Execution status memory management
RUNNING_STATUS = {}  # (problem_id, key) -> {'seed':..., 'process':..., 'start_time':..., 'stdout':..., 'stderr':...}
COMPLETED_PROCESSES = []  # List of completed processes (keep latest 50)
core_assign_index = 0  # Global index for sequential core assignment
auto_run_lock = threading.Lock()  # Lock for auto-run concurrency control

# Docker container cleanup configuration
DELETE_THRESHOLD = timedelta(minutes=65)
TARGET_IMAGES = {
    "ctfenv:multiagent"
}
CHECK_INTERVAL = 5 * 60  # 5 minutes
docker_cleanup_thread = None
docker_cleanup_running = False

def get_uptime(started_at):
    """Calculate container uptime from started_at timestamp."""
    try:
        if started_at.endswith("Z"):
            started_at = started_at[:-1]

        if "." in started_at:
            dt_part, micro = started_at.split(".")
            micro = micro[:6]
            started_at = f"{dt_part}.{micro}"
        else:
            started_at += ".000000"

        start_time = datetime.strptime(started_at, "%Y-%m-%dT%H:%M:%S.%f")
        start_time = start_time.replace(tzinfo=timezone.utc)
        now = datetime.now(timezone.utc)
        return now - start_time
    except Exception as e:
        print(f"[{datetime.now()}] Time parsing error: {e}")
        return timedelta(seconds=0)


def remove_old_containers():
    """Remove containers that have been running for more than DELETE_THRESHOLD minutes."""
    global docker_cleanup_running
    if not docker_cleanup_running:
        return []
    
    try:
        client = docker.from_env()
        containers = client.containers.list()
        removed = []

        for container in containers:
            try:
                attrs = container.attrs
                started_at = attrs["State"]["StartedAt"]
                uptime = get_uptime(started_at)

                image_tags = container.image.tags
                image = image_tags[0] if image_tags else "None"

                if image in TARGET_IMAGES:
                    if uptime > DELETE_THRESHOLD:
                        print(f"[{datetime.now()}] [Delete Target] {container.name} ({image}) (uptime: {uptime})")
                        try:
                            container.stop()
                            container.remove()
                            removed.append((container.name, image, str(uptime)))
                            print(f"[{datetime.now()}] ✅ Deleted: {container.name}")
                        except Exception as e:
                            err_msg = str(e)
                            if "removal of container" in err_msg and "is already in progress" in err_msg:
                                removed.append((container.name, image, str(uptime)))
                                print(f"[{datetime.now()}] ✅ Deleting... : {container.name}")
                            else:
                                print(f"[{datetime.now()}] ❌ Delete Fail ({container.name}): {e}")
                    else:
                        print(f"[{datetime.now()}] [ignore] {container.name} ({image}) (uptime: {uptime})")
                else:
                    print(f"[{datetime.now()}] [] {container.name} (image: {image})")

            except Exception as e:
                print(f"[{datetime.now()}] ❌ Error occur ({container.name}): {e}")

        return removed
    except Exception as e:
        print(f"[{datetime.now()}] Docker client error: {e}")
        return []


def docker_cleanup_scheduler():
    """Background thread function for docker container cleanup."""
    global docker_cleanup_running
    print(f"[{datetime.now()}] ⏳ Start running: Check and delete old target image containers every 5 minutes")
    try:
        while docker_cleanup_running:
            print(f"[{datetime.now()}] Executing docker cleanup...")
            removed = remove_old_containers()
            if removed:
                print(f"[{datetime.now()}] 🗑️ List of deleted containers:")
                for name, image, uptime in removed:
                    print(f"[{datetime.now()}]  - {name} ({image}) (uptime: {uptime})")
            else:
                print(f"[{datetime.now()}] No deleted containers.")
            time.sleep(CHECK_INTERVAL)
    except Exception as e:
        print(f"[{datetime.now()}] Docker cleanup scheduler error: {e}")
    finally:
        print(f"[{datetime.now()}] 🛑 Docker cleanup scheduler stopped")


def start_docker_cleanup():
    """Start the docker cleanup background thread."""
    global docker_cleanup_thread, docker_cleanup_running
    if docker_cleanup_thread is None or not docker_cleanup_thread.is_alive():
        docker_cleanup_running = True
        docker_cleanup_thread = threading.Thread(target=docker_cleanup_scheduler, daemon=True)
        docker_cleanup_thread.start()
        print(f"[{datetime.now()}] Docker cleanup thread started")


def stop_docker_cleanup():
    """Stop the docker cleanup background thread."""
    global docker_cleanup_running
    docker_cleanup_running = False
    print(f"[{datetime.now()}] Docker cleanup thread stop requested")


def init_db():
    """Initialize the database."""
    conn = sqlite3.connect(DATABASE)
    cursor = conn.cursor()
    cursor.execute('''
        CREATE TABLE IF NOT EXISTS problems (
            id INTEGER PRIMARY KEY,
            name TEXT NOT NULL,
            solved_by_name TEXT,
            solves INTEGER DEFAULT 0,
            value INTEGER DEFAULT 0,
            dcipher_gpt_count INTEGER DEFAULT 0,
            dcipher_claude_count INTEGER DEFAULT 0,
            dcipher_gemini_count INTEGER DEFAULT 0,
            dcipher_gpt_solved INTEGER DEFAULT 0,
            dcipher_claude_solved INTEGER DEFAULT 0,
            dcipher_gemini_solved INTEGER DEFAULT 0,
            hidden INTEGER DEFAULT 0,
            created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
            updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
        )
    ''')
    # Migration: Add solves, value columns if they don't exist
    try:
        cursor.execute('ALTER TABLE problems ADD COLUMN solves INTEGER DEFAULT 0')
    except Exception:
        pass
    try:
        cursor.execute('ALTER TABLE problems ADD COLUMN value INTEGER DEFAULT 0')
    except Exception:
        pass
    # Add hidden column if it doesn't exist
    try:
        cursor.execute('ALTER TABLE problems ADD COLUMN hidden INTEGER DEFAULT 0')
    except Exception:
        pass
    # Detailed information cache table
    cursor.execute('''
        CREATE TABLE IF NOT EXISTS problem_details (
            id INTEGER PRIMARY KEY,
            category TEXT,
            description TEXT,
            files TEXT,
            connection_info TEXT,
            hints TEXT,
            updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
        )
    ''')
    # CTF flag storage table
    cursor.execute('''
        CREATE TABLE IF NOT EXISTS ctf_flags (
            id INTEGER PRIMARY KEY AUTOINCREMENT,
            challenge_id INTEGER NOT NULL,
            flag TEXT NOT NULL,
            status TEXT NOT NULL,
            model_key TEXT,
            cost REAL,
            submitted_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
            UNIQUE(challenge_id, flag)
        )
    ''')
    # Add cost column if it doesn't exist
    try:
        cursor.execute('ALTER TABLE ctf_flags ADD COLUMN cost REAL')
    except Exception:
        pass
    # Run attempt cost recording table
    cursor.execute('''
        CREATE TABLE IF NOT EXISTS run_attempts (
            id INTEGER PRIMARY KEY AUTOINCREMENT,
            challenge_id INTEGER NOT NULL,
            model_key TEXT NOT NULL,
            seed TEXT,
            start_time TIMESTAMP,
            end_time TIMESTAMP,
            cost REAL,
            status TEXT,
            UNIQUE(challenge_id, model_key, seed)
        )
    ''')
    conn.commit()
    conn.close()

def get_db_connection():
    """Returns a database connection."""
    conn = sqlite3.connect(DATABASE)
    conn.row_factory = sqlite3.Row
    return conn

def save_problems_to_db(problems):
    """Save problem list to database."""
    conn = get_db_connection()
    cursor = conn.cursor()
    for problem in problems:
        # Check if already exists
        cursor.execute('SELECT id FROM problems WHERE id = ?', (problem['id'],))
        exists = cursor.fetchone()
        # Extract score, solves values (support various field names)
        value = problem.get('value')
        solves = problem.get('solves')
        if exists:
            cursor.execute('''
                UPDATE problems SET name = ?, solved_by_name = ?, solves = ?, value = ?, updated_at = CURRENT_TIMESTAMP WHERE id = ?
            ''', (problem['name'], problem['solved_by_name'], solves, value, problem['id']))
        else:
            cursor.execute('''
                INSERT INTO problems (
                    id, name, solved_by_name, solves, value,
                    dcipher_gpt_count, dcipher_claude_count, dcipher_gemini_count,
                    dcipher_gpt_solved, dcipher_claude_solved, dcipher_gemini_solved,
                    updated_at
                ) VALUES (?, ?, ?, ?, ?, 0, 0, 0, 0, 0, 0, CURRENT_TIMESTAMP)
            ''', (problem['id'], problem['name'], problem['solved_by_name'], solves, value))
    conn.commit()
    conn.close()

def get_problems_from_db():
    """Get problem list from database (sorted by ID)."""
    conn = get_db_connection()
    cursor = conn.cursor()
    cursor.execute('SELECT id, name, solved_by_name, solves, value, dcipher_gpt_count, dcipher_claude_count, dcipher_gemini_count, dcipher_gpt_solved, dcipher_claude_solved, dcipher_gemini_solved, hidden FROM problems ORDER BY id')
    problems = []
    for row in cursor.fetchall():
        problems.append({
            'id': row['id'],
            'name': row['name'],
            'solved_by_name': row['solved_by_name'],
            'solves': row['solves'],
            'value': row['value'],
            'dcipher_gpt_count': row['dcipher_gpt_count'],
            'dcipher_claude_count': row['dcipher_claude_count'],
            'dcipher_gemini_count': row['dcipher_gemini_count'],
            'dcipher_gpt_solved': row['dcipher_gpt_solved'],
            'dcipher_claude_solved': row['dcipher_claude_solved'],
            'dcipher_gemini_solved': row['dcipher_gemini_solved'],
            'hidden': row['hidden'],
        })
    conn.close()
    return problems

def extract_category(problem_name, category=None):
    categories = ['crypto', 'forensics', 'misc', 'pwn', 'rev', 'web']
    name_upper = (problem_name or '').upper()
    category_upper = (category or '').upper()
    for cat in categories:
        if cat.upper() in name_upper or cat.upper() in category_upper:
            return cat
    return 'base'

@app.route('/')
def index():
    """Main page - displays the list of problems."""
    return render_template('index.html', CTFD_BASE_URL=CTFD_BASE_URL)

@app.route('/api/problems')
def get_problems():
    """Gets the list of problems from the database."""
    try:
        problems = get_problems_from_db()
        return jsonify({'success': True, 'problems': problems})
    except Exception as e:
        print(f"Database error: {e}")
        return jsonify({'success': False, 'message': 'Failed to load problem list.'}), 500

@app.route('/api/problems/load', methods=['POST'])
def load_problems_from_server():
    try:
        # Request to MCP server - use /challenges endpoint
        response = requests.get(f"{MCP_SERVER_URL}/challenges", timeout=10)
        response.raise_for_status()
        problems_data = response.json()
        problems = []
        for problem in problems_data:
            problem_id = problem.get('id') or problem.get('problem_id') or problem.get('challenge_id')
            problem_name = problem.get('name') or problem.get('title') or problem.get('problem_name')
            solved_by = problem.get('solved_by_name') or problem.get('solved_by') or problem.get('solvedBy')
            if problem_id and problem_name:
                problems.append({
                    'id': problem_id,
                    'name': problem_name,
                    'solved_by_name': solved_by,
                    'dcipher_gpt_count': 0,
                    'dcipher_claude_count': 0,
                    'dcipher_gemini_count': 0,
                    'dcipher_gpt_solved': 0,
                    'dcipher_claude_solved': 0,
                    'dcipher_gemini_solved': 0,
                    'solves': problem.get('solves'),
                    'value': problem.get('value')
                })
        # Save to DB
        save_problems_to_db(problems)
        # Get detailed information for all problems from external source and save to DB
        conn = get_db_connection()
        cursor = conn.cursor()
        import json as _json
        for p in problems:
            pid = p['id']
            # Skip if detailed information already exists
            cursor.execute('SELECT id FROM problem_details WHERE id = ?', (pid,))
            if cursor.fetchone():
                continue
            try:
                detail_resp = requests.get(f'{MCP_SERVER_URL}/challenge/{pid}', timeout=10)
                detail_data = detail_resp.json()
                if detail_data.get('success') and 'data' in detail_data:
                    detail = detail_data['data']
                else:
                    detail = detail_data
                cursor.execute('''
                    INSERT OR REPLACE INTO problem_details (id, category, description, files, connection_info, hints, updated_at)
                    VALUES (?, ?, ?, ?, ?, ?, CURRENT_TIMESTAMP)
                ''', (
                    detail.get('id'),
                    detail.get('category'),
                    detail.get('description'),
                    _json.dumps(detail.get('files', [])),
                    detail.get('connection_info'),
                    _json.dumps(detail.get('hints', []))
                ))
                conn.commit()
            except Exception as e:
                print(f'Failed to save detailed information: {pid}, {e}')
        conn.close()
        return jsonify({
            'success': True, 
            'message': f'Successfully loaded {len(problems)} problems.',
            'problems': problems
        })
    except requests.RequestException as e:
        print(f"MCP server connection failed: {e}")
        # Sample data for when actual server is not available
        sample_problems = [
            {'id': 1, 'name': 'Sum of Two Numbers', 'solved_by_name': 'user1'},
            {'id': 2, 'name': 'Find Maximum in Array', 'solved_by_name': None},
            {'id': 3, 'name': 'String Reverse', 'solved_by_name': 'user2'},
            {'id': 4, 'name': 'Fibonacci Sequence', 'solved_by_name': None},
            {'id': 5, 'name': 'Prime Number Check', 'solved_by_name': 'user3'},
        ]
        
        # Save sample data to DB as well
        save_problems_to_db(sample_problems)
        
        return jsonify({
            'success': True, 
            'message': f'Loaded {len(sample_problems)} sample problems.',
            'problems': sample_problems
        })
    
    except Exception as e:
        print(f"Error loading problems: {e}")
        return jsonify({'success': False, 'message': 'Failed to load problems.'}), 500

@app.route('/api/problem/<int:problem_id>/increment', methods=['POST'])
def increment_problem_count(problem_id):
    data = request.get_json()
    key = data.get('key')  # e.g., 'enigma_gpt', 'dcipher_gemini', etc.
    count_column = f'{key}_count'
    # Validation
    valid_keys = [
        'dcipher_gpt', 'dcipher_claude', 'dcipher_gemini'
    ]
    if key not in valid_keys:
        return jsonify({'success': False, 'message': 'Invalid item name.'}), 400
    conn = get_db_connection()
    cursor = conn.cursor()
    # Get current value
    cursor.execute(f'SELECT {count_column} FROM problems WHERE id = ?', (problem_id,))
    row = cursor.fetchone()
    if not row:
        conn.close()
        return jsonify({'success': False, 'message': 'Problem not found.'}), 404
    current_count = row[0] or 0
    new_count = min(current_count + 1, 3)  # Maximum increase to 3
    cursor.execute(f'UPDATE problems SET {count_column} = ?, updated_at = CURRENT_TIMESTAMP WHERE id = ?', (new_count, problem_id))
    conn.commit()
    conn.close()
    return jsonify({'success': True, 'new_count': new_count})

@app.route('/edit-attempts')
def edit_attempts_page():
    problems = get_problems_from_db()
    return render_template('edit_attempts.html', problems=problems)

@app.route('/status')
def status_page():
    """Execution status monitoring page"""
    return render_template('status.html')


@app.route('/api/problem/<int:problem_id>/set_attempts', methods=['POST'])
def set_problem_attempts(problem_id):
    data = request.get_json()
    keys = [
        'dcipher_gpt_count', 'dcipher_claude_count', 'dcipher_gemini_count'
    ]
    values = []
    for key in keys:
        v = data.get(key)
        try:
            v = int(v)
        except:
            v = 0
        v = max(0, min(3, v))
        values.append(v)
    conn = get_db_connection()
    cursor = conn.cursor()
    cursor.execute(f'''
        UPDATE problems SET
            dcipher_gpt_count=?, dcipher_claude_count=?, dcipher_gemini_count=?,
            updated_at=CURRENT_TIMESTAMP
        WHERE id=?
    ''', (*values, problem_id))
    conn.commit()
    conn.close()
    return jsonify({'success': True})

@app.route('/api/problem/<int:problem_id>/toggle_hidden', methods=['POST'])
def toggle_problem_hidden(problem_id):
    """Toggle the hidden status of a problem."""
    try:
        conn = get_db_connection()
        cursor = conn.cursor()
        
        # Check current hidden status
        cursor.execute('SELECT hidden, name FROM problems WHERE id = ?', (problem_id,))
        row = cursor.fetchone()
        
        if not row:
            conn.close()
            return jsonify({'success': False, 'message': 'Problem not found.'}), 404
        
        current_hidden = row[0]
        problem_name = row[1]
        new_hidden = 1 if current_hidden == 0 else 0
        
        # Update hidden status
        cursor.execute('UPDATE problems SET hidden = ?, updated_at = CURRENT_TIMESTAMP WHERE id = ?', (new_hidden, problem_id))
        conn.commit()
        conn.close()
        
        action = "hidden" if new_hidden == 1 else "visible"
        return jsonify({
            'success': True, 
            'message': f'Problem "{problem_name}" has been changed to {action} status.',
            'hidden': new_hidden
        })
        
    except Exception as e:
        print(f"[{datetime.now()}] Failed to toggle problem hidden status: {e}")
        return jsonify({'success': False, 'message': 'Failed to change problem hidden status.'}), 500

@app.route('/challenge/<int:challenge_id>')
def proxy_challenge_info(challenge_id):
    # 1. First query from DB
    conn = get_db_connection()
    cursor = conn.cursor()
    cursor.execute('SELECT category, description, files, connection_info, hints FROM problem_details WHERE id = ?', (challenge_id,))
    row = cursor.fetchone()
    if row:
        import json
        # Add model-specific cost information
        model_costs = get_model_costs(challenge_id)
        
        # Add correct flag information
        correct_flag = get_correct_flag(challenge_id)
        
        result = {
            'id': challenge_id,
            'category': row['category'],
            'description': row['description'],
            'files': json.loads(row['files']) if row['files'] else [],
            'connection_info': row['connection_info'],
            'hints': json.loads(row['hints']) if row['hints'] else [],
            'model_costs': model_costs,  # Add model-specific cost information
            'correct_flag': correct_flag  # Add correct flag information
        }
        conn.close()
        return jsonify(result)
    # 2. If not found, get from external source and save to DB
    try:
        response = requests.get(f'{MCP_SERVER_URL}/challenge/{challenge_id}', timeout=10)
        data = response.json()
        # Handle success: true, data: {...} structure
        if data.get('success') and 'data' in data:
            detail = data['data']
        else:
            detail = data
        # Save to DB
        import json as _json
        cursor.execute('''
            INSERT OR REPLACE INTO problem_details (id, category, description, files, connection_info, hints, updated_at)
            VALUES (?, ?, ?, ?, ?, ?, CURRENT_TIMESTAMP)
        ''', (
            detail.get('id'),
            detail.get('category'),
            detail.get('description'),
            _json.dumps(detail.get('files', [])),
            detail.get('connection_info'),
            _json.dumps(detail.get('hints', []))
        ))
        conn.commit()
        conn.close()
        
        # Add correct flag information
        correct_flag = get_correct_flag(challenge_id)
        if correct_flag:
            detail['correct_flag'] = correct_flag
        
        return jsonify(detail)
    except Exception as e:
        conn.close()
        return jsonify({'error': str(e)}), 500

@app.route('/api/problem/<int:problem_id>/run', methods=['POST'])
def run_problem_command(problem_id):
    data = request.get_json()
    key = data.get('key')  # e.g., 'enigma_gpt', 'dcipher_gemini', etc.
    problem_name = data.get('problem_name')
    category = data.get('category')
    if not problem_name:
        return jsonify({'success': False, 'message': 'Problem name is required.'}), 400
    # Reject if already running
    if (problem_id, key) in RUNNING_STATUS:
        return jsonify({'success': False, 'message': 'Already running.'}), 409
    
    # Auto-run concurrency control - protect entire process execution with lock
    with auto_run_lock:
        # Check again if already running (inside lock)
        if (problem_id, key) in RUNNING_STATUS:
            return jsonify({'success': False, 'message': 'Already running.'}), 409
        
        # Check if problem is already solved
        conn = get_db_connection()
        cursor = conn.cursor()
        solved_column = f"{key}_solved"
        cursor.execute(f"SELECT {solved_column} FROM problems WHERE id = ?", (problem_id,))
        row = cursor.fetchone()
        if row and row[0] == 1:
            conn.close()
            return jsonify({'success': False, 'message': 'Problem is already solved.'}), 409
        
        # Check current attempt count
        count_column = f"{key}_count"
        cursor.execute(f"SELECT {count_column} FROM problems WHERE id = ?", (problem_id,))
        count_row = cursor.fetchone()
        current_count = count_row[0] if count_row else 0
        
        if current_count >= 3:
            conn.close()
            return jsonify({'success': False, 'message': 'Maximum attempt count (3) reached.'}), 409
        
        conn.close()
        
        # Generate seed value
        seed = str(uuid.uuid4())
        
        # Extract category
        auto_category = extract_category(problem_name, category)
        
        # Generate command
        if key == 'dcipher_gpt':
            cmd = f'python3 run_dcipher.py --split test --challenge_ids {problem_id} --category {auto_category} --enable-autoprompt --planner-model gpt-4.1-2025-04-14 --executor-model gpt-4.1-2025-04-14 --autoprompter-model gpt-4.1-2025-04-14 --seed {seed}'
        elif key == 'dcipher_claude':
            cmd = f'python3 run_dcipher.py --split test --challenge_ids {problem_id} --category {auto_category} --enable-autoprompt --planner-model claude-3-5-sonnet-20240620 --executor-model claude-3-5-sonnet-20240620 --autoprompter-model claude-3-5-sonnet-20240620 --seed {seed}'
        elif key == 'dcipher_gemini':
            cmd = f'python3 run_dcipher.py --split test --challenge_ids {problem_id} --category {auto_category} --enable-autoprompt --planner-model gemini-2.5-flash --executor-model gemini-2.5-flash --autoprompter-model gemini-2.5-flash --seed {seed}'
        else:
            return jsonify({'success': False, 'message': 'Unknown item.'}), 400
        
        # Create process internally (without new terminal)
        try:
            # Convert command to list (seed is recorded internally only)
            if key == 'dcipher_gpt':
                cmd_list = ['python3', 'run_dcipher.py', '--split', 'test', '--challenge_ids', str(problem_id), '--category', auto_category, '--enable-autoprompt', '--planner-model', 'gpt-4.1-2025-04-14', '--executor-model', 'gpt-4.1-2025-04-14', '--autoprompter-model', 'gpt-4.1-2025-04-14']
            elif key == 'dcipher_claude':
                cmd_list = ['python3', 'run_dcipher.py', '--split', 'test', '--challenge_ids', str(problem_id), '--category', auto_category, '--enable-autoprompt', '--planner-model', 'claude-3-5-sonnet-20240620', '--executor-model', 'claude-3-5-sonnet-20240620', '--autoprompter-model', 'claude-3-5-sonnet-20240620']
            elif key == 'dcipher_gemini':
                cmd_list = ['python3', 'run_dcipher.py', '--split', 'test', '--challenge_ids', str(problem_id), '--category', auto_category, '--enable-autoprompt', '--planner-model', 'gemini-2.5-flash', '--executor-model', 'gemini-2.5-flash', '--autoprompter-model', 'gemini-2.5-flash']
            
            # Execute in background, connect stdout/stderr with pipes
            # Set working directory explicitly so log files are created in the correct location
            working_dir = './EVAL-D-CIPHER'
            
            # Set environment variables (same environment as terminal)
            env = os.environ.copy()
            env['PYTHONUNBUFFERED'] = '1'  # Disable Python output buffering
            env['MODEL_KEY'] = key  # Pass model information as environment variable
            env['PROBLEM_ID'] = str(problem_id)  # Pass problem ID as environment variable
            
            # Set environment variables for performance optimization
            env['OMP_NUM_THREADS'] = '4'  # Limit OpenMP thread count
            env['MKL_NUM_THREADS'] = '4'  # Limit MKL thread count
            env['NUMEXPR_NUM_THREADS'] = '4'  # Limit NumExpr thread count
            env['OPENBLAS_NUM_THREADS'] = '4'  # Limit OpenBLAS thread count
            env['VECLIB_MAXIMUM_THREADS'] = '4'  # Limit macOS Accelerate framework thread count
            env['BLAS_NUM_THREADS'] = '4'  # Limit BLAS thread count
            env['LAPACK_NUM_THREADS'] = '4'  # Limit LAPACK thread count
            
            # Check and set virtual environment path
            venv_path = '../venv'
            env, python_path = get_venv_environment(venv_path)
            
            # Use virtual environment Python
            if python_path:
                # Change python3 to virtual environment's python in command
                cmd_list = [python_path] + cmd_list[1:]
                print(f"[{datetime.now()}] Using virtual environment Python: {python_path}")
                print(f"[{datetime.now()}] Environment variable VIRTUAL_ENV: {env.get('VIRTUAL_ENV', 'Not set')}")
                print(f"[{datetime.now()}] Environment variable PATH start: {env.get('PATH', 'Not set')[:100]}...")
                
                # Check if Python executable exists
                if not os.path.exists(python_path):
                    print(f"[{datetime.now()}] Warning: Python executable does not exist: {python_path}")
                    # Fallback to system Python
                    cmd_list = ['python3'] + cmd_list[1:]
                    print(f"[{datetime.now()}] Fallback to system Python: python3")
            else:
                print(f"[{datetime.now()}] Using system Python (no virtual environment)")
            
            # Check if working directory exists
            if not os.path.exists(working_dir):
                print(f"[{datetime.now()}] Warning: Working directory does not exist: {working_dir}")
                # Fallback to current directory
                working_dir = os.getcwd()
                print(f"[{datetime.now()}] Fallback to current directory: {working_dir}")
            
            # Check if command executable exists
            script_name = cmd_list[1] if len(cmd_list) > 1 else None
            if script_name:
                script_path = os.path.join(working_dir, script_name)
                if not os.path.exists(script_path):
                    print(f"[{datetime.now()}] Warning: Script file does not exist: {script_path}")
                    # Search in full path
                    import shutil
                    if shutil.which(script_name):
                        print(f"[{datetime.now()}] Script found in PATH: {script_name}")
                    else:
                        print(f"[{datetime.now()}] Warning: Script not found: {script_name}")
            
            print(f"[{datetime.now()}] Final command: {' '.join(cmd_list)}")
            print(f"[{datetime.now()}] Working directory: {working_dir}")
            print(f"[{datetime.now()}] Environment variable count: {len(env)}")
            
            # Use different settings for Windows and Unix/Linux
            if sys.platform.startswith('win'):
                # preexec_fn not available on Windows
                proc = subprocess.Popen(
                    cmd_list,
                    stdout=subprocess.PIPE,
                    stderr=subprocess.PIPE,
                    text=True,
                    bufsize=0,  # Disable buffering
                    universal_newlines=True,
                    cwd=working_dir,  # Set working directory
                    env=env,  # Pass environment variables
                    creationflags=subprocess.CREATE_NEW_PROCESS_GROUP  # Create new process group on Windows
                )
            else:
                # Create new process group and performance optimization on Unix/Linux
                proc = subprocess.Popen(
                    cmd_list,
                    stdout=subprocess.PIPE,
                    stderr=subprocess.PIPE,
                    text=True,
                    bufsize=0,  # Disable buffering
                    universal_newlines=True,
                    cwd=working_dir,  # Set working directory
                    env=env,  # Pass environment variables
                    start_new_session=True  # Create new session (use instead of preexec_fn)
                )
                
                # Resource allocation settings after process creation (optional)
                try:
                    # Wait briefly for process to actually start
                    import time
                    time.sleep(0.5)  # Increased from 0.1 to 0.5 seconds
                    
                    # Check if process is still running
                    if proc.poll() is None:  # Process is running
                        process = psutil.Process(proc.pid)
                        
                        # Check process status and log
                        print(f"[{datetime.now()}] Process status check: PID {proc.pid}, status: {process.status()}")
                        
                        # Set CPU affinity (sequentially assign 2 cores)
                        try:
                            global core_assign_index
                            cpu_count = psutil.cpu_count()
                            if cpu_count > 1:
                                base = core_assign_index % cpu_count
                                cpu_cores = [(base + i) % cpu_count for i in range(1)]
                                process.cpu_affinity(cpu_cores)
                                print(f"[{datetime.now()}] CPU affinity sequential distribution setting: PID {proc.pid}, cores {cpu_cores}")
                                core_assign_index += 1
                        except Exception as e:
                            print(f"[{datetime.now()}] CPU affinity setting failed (ignored): {e}")
                        
                        # Memory monitoring setup
                        try:
                            memory_info = process.memory_info()
                            print(f"[{datetime.now()}] Memory monitoring activated: PID {proc.pid}, initial memory: {memory_info.rss / 1024 / 1024:.2f} MB")
                        except Exception as e:
                            print(f"[{datetime.now()}] Memory monitoring setup failed (ignored): {e}")
                            
                    else:
                        print(f"[{datetime.now()}] Process already terminated: PID {proc.pid}, return code: {proc.returncode}")
                        # Check stderr if process terminated immediately
                        try:
                            stderr_output = proc.stderr.read()
                            if stderr_output:
                                print(f"[{datetime.now()}] Process stderr: {stderr_output.decode('utf-8', errors='ignore')}")
                        except Exception as e:
                            print(f"[{datetime.now()}] stderr read failed: {e}")
                except Exception as e:
                    print(f"[{datetime.now()}] Process resource allocation setup failed (ignored): {e}")
            
            # Start log output
            print(f"[{datetime.now()}] Process started: {problem_id}/{key}")
            print(f"[{datetime.now()}] Command: {' '.join(cmd_list)}")
            print(f"[{datetime.now()}] Working directory: {working_dir}")
            print(f"[{datetime.now()}] Process PID: {proc.pid}")
            
            # Check if process terminated immediately
            time.sleep(1)  # Wait 1 second
            if proc.poll() is not None:
                # Process terminated immediately
                return_code = proc.returncode
                print(f"[{datetime.now()}] Process terminated immediately: {problem_id}/{key}, return code: {return_code}")
                
                # Check error messages in stderr
                try:
                    stderr_output = proc.stderr.read()
                    if stderr_output:
                        stderr_text = stderr_output.decode('utf-8', errors='ignore')
                        print(f"[{datetime.now()}] Process stderr: {stderr_text}")
                except Exception as e:
                    print(f"[{datetime.now()}] stderr read failed: {e}")
                
                # Check output in stdout
                try:
                    stdout_output = proc.stdout.read()
                    if stdout_output:
                        stdout_text = stdout_output.decode('utf-8', errors='ignore')
                        print(f"[{datetime.now()}] Process stdout: {stdout_text}")
                except Exception as e:
                    print(f"[{datetime.now()}] stdout read failed: {e}")
                
                # Return error response for immediate termination
                error_message = f"Process terminated immediately. (Return code: {return_code})"
                if return_code == -9:
                    error_message = "Process was forcefully terminated with SIGKILL. This may be due to memory shortage or system resource issues."
                elif return_code == -11:
                    error_message = "Process terminated with SIGSEGV. Memory access error occurred."
                elif return_code == -6:
                    error_message = "Process terminated with SIGABRT. Fatal error occurred in the program."
                
                return jsonify({'success': False, 'message': error_message}), 500
        
        except Exception as e:
            print(f"[{datetime.now()}] Process start failed: {e}")
            return jsonify({'success': False, 'message': f'Execution failed: {e}'}), 500
        
        # Record execution status
        RUNNING_STATUS[(problem_id, key)] = {
            'seed': seed, 
            'process': proc, 
            'start_time': datetime.now(),
            'cmd': ' '.join(cmd_list),
            'stdout': [],
            'stderr': [],
            'total_cost': None,  # Cost information
            'cost_updates': []  # Cost update history
        }
        
        # Record execution attempt (run_attempts)
        try:
            conn = get_db_connection()
            cursor = conn.cursor()
            
            # First increment count (atomic operation)
            count_column = f"{key}_count"
            cursor.execute(f"UPDATE problems SET {count_column} = {count_column} + 1, updated_at = CURRENT_TIMESTAMP WHERE id = ? AND {count_column} < 3", (problem_id,))
            
            if cursor.rowcount == 0:
                # Failed to increment count (already 3 or more attempts, or problem not found)
                conn.close()
                return jsonify({'success': False, 'message': 'Maximum attempt count reached or problem not found.'}), 409
            
            # Record execution attempt
            cursor.execute('''
                INSERT OR IGNORE INTO run_attempts (challenge_id, model_key, seed, start_time, status)
                VALUES (?, ?, ?, ?, ?)
            ''', (problem_id, key, seed, datetime.now().isoformat(), 'running'))
            conn.commit()
            conn.close()
        except Exception as e:
            print(f"[Execution attempt recording failed] {e}")
            # Terminate process if failed
            try:
                proc.kill()
            except:
                pass
            return jsonify({'success': False, 'message': 'Execution failed due to database error.'}), 500
    
    # Cost parsing function
    def parse_cost(line):
        import re
        # D-CIPHER: "$0.003 / $3.000" or "Total cost: $0.003 / $3.000"
        dcipher_pattern = r'(?:Total cost:\s*)?\$(\d+\.\d+)\s*/\s*\$(\d+\.\d+)'
        dcipher_match = re.search(dcipher_pattern, line)
        if dcipher_match:
            return float(dcipher_match.group(1))
        # ENIGMA format: "Total cost: $0.151162"
        enigma_pattern = r'Total cost:\s*\$(\d+\.\d+)'
        enigma_match = re.search(enigma_pattern, line)
        if enigma_match:
            return float(enigma_match.group(1))
        return None
    
    # Run attempt cost update function
    def update_run_attempt_cost(challenge_id, model_key, seed, cost, end_time=None, status=None):
        try:
            conn = get_db_connection()
            cursor = conn.cursor()
            sql = 'UPDATE run_attempts SET cost=?, end_time=?, status=? WHERE challenge_id=? AND model_key=? AND seed=?'
            cursor.execute(sql, (cost, end_time, status, challenge_id, model_key, seed))
            conn.commit()
            conn.close()
        except Exception as e:
            print(f"[Run attempt cost update failed] {e}")
    
    # Log collection function
    def collect_logs():
        try:
            print(f"[{datetime.now()}] Log collection started: {problem_id}/{key}")
            
            import select
            import sys
            import re
            
            # Success message pattern (enigma only)
            success_pattern = r'Found the answer! Exit the program.'
            # Cost exit pattern
            exitcost_pattern = r'Exit command detected: exit_cost'
            exitforfeit_pattern = r'Exit command detected: exit_forfeit'

            
            # Windows has limited select functionality, so use different approach
            if sys.platform.startswith('win'):
                # Use simple polling approach on Windows
                while proc.poll() is None:
                    # Read stdout
                    try:
                        stdout_line = proc.stdout.readline()
                        if stdout_line:
                            line = stdout_line.strip()
                            RUNNING_STATUS[(problem_id, key)]['stdout'].append(line)
                            # Don't output to main log
                            
                            # Parse success message (dcipher models only)
                            if key.startswith('dcipher') and re.search(r'Challenge Solved!', line):
                                print(f"[{datetime.now()}] [{problem_id}/{key}] Success message found! Requesting process termination via API...")
                                try:
                                    # 1. Update solved status for the model in DB (prevent duplicates)
                                    conn = get_db_connection()
                                    cursor = conn.cursor()
                                    solved_column = f"{key}_solved"
                                    cursor.execute(f"UPDATE problems SET {solved_column} = 1, updated_at = CURRENT_TIMESTAMP WHERE id = ? AND {solved_column} = 0", (problem_id,))
                                    if cursor.rowcount > 0:
                                        print(f"[{datetime.now()}] [{problem_id}/{key}] Solution status update completed")
                                    else:
                                        print(f"[{datetime.now()}] [{problem_id}/{key}] Already solved")
                                    conn.commit()
                                    conn.close()
                                    # 2. Call process termination API
                                    url = f"http://127.0.0.1:5000/api/process/{problem_id}/terminate?key={key}"
                                    resp = requests.post(url, timeout=5)
                                    print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API response: {resp.status_code} {resp.text}")
                                except Exception as e:
                                    print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API request failed: {e}")
                            
                            # Parse cost exit pattern (all models)
                            if re.search(exitcost_pattern, line) or re.search(exitforfeit_pattern, line):
                                print(f"[{datetime.now()}] [{problem_id}/{key}] Exit pattern found! Requesting process termination via API...")
                                try:
                                    # Call process termination API (without changing solved status)
                                    url = f"http://127.0.0.1:5000/api/process/{problem_id}/terminate?key={key}"
                                    resp = requests.post(url, timeout=5)
                                    print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API response: {resp.status_code} {resp.text}")
                                except Exception as e:
                                    print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API request failed: {e}")
                            
                            # Parse cost information
                            cost = parse_cost(line)
                            if cost is not None:
                                RUNNING_STATUS[(problem_id, key)]['total_cost'] = cost
                                RUNNING_STATUS[(problem_id, key)]['cost_updates'].append({
                                    'cost': cost,
                                    'timestamp': datetime.now().isoformat()
                                })
                                # Update run attempt cost
                                update_run_attempt_cost(problem_id, key, seed, cost)
                                print(f"[{datetime.now()}] [{problem_id}/{key}] Cost updated: ${cost}")
                                
                                # Also update cost in CTF flags table
                                try:
                                    update_ctf_cost_internal(problem_id, key, cost)
                                except Exception as e:
                                    print(f"[{datetime.now()}] CTF cost update failed: {e}")
                    except:
                        pass
                    
                    # Read stderr
                    try:
                        stderr_line = proc.stderr.readline()
                        if stderr_line:
                            line = stderr_line.strip()
                            RUNNING_STATUS[(problem_id, key)]['stderr'].append(line)
                            # Don't output to main log
                    except:
                        pass
                    
                    import time
                    time.sleep(0.1)  # Wait 0.1 seconds
            else:
                # Use select on Unix/Linux
                import fcntl
                import os
                
                # Set stdout, stderr to non-blocking
                for pipe in [proc.stdout, proc.stderr]:
                    if pipe:
                        fd = pipe.fileno()
                        fl = fcntl.fcntl(fd, fcntl.F_GETFL)
                        fcntl.fcntl(fd, fcntl.F_SETFL, fl | os.O_NONBLOCK)
                
                while proc.poll() is None:  # While process is running
                    # Use select to check if there's readable data
                    readable, _, _ = select.select([proc.stdout, proc.stderr], [], [], 0.1)
                    
                    for pipe in readable:
                        try:
                            line = pipe.readline()
                            if line:
                                line = line.strip()
                                if pipe == proc.stdout:
                                    RUNNING_STATUS[(problem_id, key)]['stdout'].append(line)
                                    # Don't output to main log
                                    
                                    # Parse success message (dcipher models only)
                                    if key.startswith('dcipher') and re.search(r'Challenge Solved!', line):
                                        print(f"[{datetime.now()}] [{problem_id}/{key}] Success message found! Requesting process termination via API...")
                                        try:
                                            # 1. Update solved status for the model in DB (prevent duplicates)
                                            conn = get_db_connection()
                                            cursor = conn.cursor()
                                            solved_column = f"{key}_solved"
                                            cursor.execute(f"UPDATE problems SET {solved_column} = 1, updated_at = CURRENT_TIMESTAMP WHERE id = ? AND {solved_column} = 0", (problem_id,))
                                            if cursor.rowcount > 0:
                                                print(f"[{datetime.now()}] [{problem_id}/{key}] Solution status update completed")
                                            else:
                                                print(f"[{datetime.now()}] [{problem_id}/{key}] Already solved")
                                            conn.commit()
                                            conn.close()
                                            # 2. Call process termination API
                                            url = f"http://127.0.0.1:5000/api/process/{problem_id}/terminate?key={key}"
                                            resp = requests.post(url, timeout=5)
                                            print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API response: {resp.status_code} {resp.text}")
                                        except Exception as e:
                                            print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API request failed: {e}")
                                    
                                    # Parse cost exit pattern (all models)
                                    if re.search(exitcost_pattern, line) or re.search(exitforfeit_pattern, line):
                                        print(f"[{datetime.now()}] [{problem_id}/{key}] Exit pattern found! Requesting process termination via API...")
                                        try:
                                            # Call process termination API (without changing solved status)
                                            url = f"http://127.0.0.1:5000/api/process/{problem_id}/terminate?key={key}"
                                            resp = requests.post(url, timeout=5)
                                            print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API response: {resp.status_code} {resp.text}")
                                        except Exception as e:
                                            print(f"[{datetime.now()}] [{problem_id}/{key}] Termination API request failed: {e}")
                                    
                                    # Parse cost information
                                    cost = parse_cost(line)
                                    if cost is not None:
                                        RUNNING_STATUS[(problem_id, key)]['total_cost'] = cost
                                        RUNNING_STATUS[(problem_id, key)]['cost_updates'].append({
                                            'cost': cost,
                                            'timestamp': datetime.now().isoformat()
                                        })
                                        # Update run attempt cost
                                        update_run_attempt_cost(problem_id, key, seed, cost)
                                        print(f"[{datetime.now()}] [{problem_id}/{key}] Cost updated: ${cost}")
                                        
                                        # Also update cost in CTF flags table
                                        try:
                                            update_ctf_cost_internal(problem_id, key, cost)
                                        except Exception as e:
                                            print(f"[{datetime.now()}] CTF cost update failed: {e}")
                                else:
                                    RUNNING_STATUS[(problem_id, key)]['stderr'].append(line)
                                    # Don't output to main log
                        except (IOError, OSError):
                            # Ignore read errors and continue
                            pass
            
            # Read remaining output after process termination
            remaining_stdout, remaining_stderr = proc.communicate()
            if remaining_stdout:
                for line in remaining_stdout.strip().split('\n'):
                    if line:
                        RUNNING_STATUS[(problem_id, key)]['stdout'].append(line)
                        # Don't output to main log
                        
                        # Parse cost information
                        cost = parse_cost(line)
                        if cost is not None:
                            RUNNING_STATUS[(problem_id, key)]['total_cost'] = cost
                            RUNNING_STATUS[(problem_id, key)]['cost_updates'].append({
                                'cost': cost,
                                'timestamp': datetime.now().isoformat()
                            })
                            # Update run attempt cost
                            update_run_attempt_cost(problem_id, key, seed, cost)
                            print(f"[{datetime.now()}] [{problem_id}/{key}] Final cost: ${cost}")
                            
                            # Also update cost in CTF flags table
                            try:
                                update_ctf_cost_internal(problem_id, key, cost)
                            except Exception as e:
                                print(f"[{datetime.now()}] CTF cost update failed: {e}")
            if remaining_stderr:
                for line in remaining_stderr.strip().split('\n'):
                    if line:
                        RUNNING_STATUS[(problem_id, key)]['stderr'].append(line)
                        # Don't output to main log
                        
            print(f"[{datetime.now()}] Log collection completed: {problem_id}/{key} (return code: {proc.returncode})")
        except Exception as e:
            print(f"[{datetime.now()}] Log collection error: {e}")
            import traceback
            traceback.print_exc()
    
    # Start log collection thread
    threading.Thread(target=collect_logs, daemon=True).start()
    
    # Clear status after 20 minutes (timeout)
    def clear_status_later():
        try:
            # Wait with 1 hour (3600 seconds) timeout
            print(f"[{datetime.now()}] Process timeout wait started: {problem_id}/{key} (3600 seconds)")
            proc.wait(timeout=3600)
            print(f"[{datetime.now()}] Process completed: {problem_id}/{key}")
        except subprocess.TimeoutExpired:
            # Terminate process on timeout
            print(f"[{datetime.now()}] Process timeout: {problem_id}/{key}")
            try:
                print(f"[{datetime.now()}] Attempting process termination (SIGTERM): {problem_id}/{key}")
                proc.terminate()
                proc.wait(timeout=30)  # Increased from 10 to 30 seconds
                print(f"[{datetime.now()}] Process termination completed: {problem_id}/{key}")
            except subprocess.TimeoutExpired:
                print(f"[{datetime.now()}] Attempting force process termination (SIGKILL): {problem_id}/{key}")
                proc.kill()
                print(f"[{datetime.now()}] Force process termination completed: {problem_id}/{key}")
        except Exception as e:
            print(f"[{datetime.now()}] Exception during process wait: {problem_id}/{key}, error: {e}")
        finally:
            # Collect completed process information
            try:
                # Get problem name and category
                conn = get_db_connection()
                cursor = conn.cursor()
                cursor.execute('SELECT name FROM problems WHERE id = ?', (problem_id,))
                row = cursor.fetchone()
                problem_name = row['name'] if row else f'Problem #{problem_id}'
                
                # Get category
                cursor.execute('SELECT category FROM problem_details WHERE id = ?', (problem_id,))
                cat_row = cursor.fetchone()
                category = cat_row['category'] if cat_row and cat_row['category'] else 'BASE'
                conn.close()
                
                # Model name mapping
                model_names = {
                    'dcipher_gpt': 'DCIPHER-GPT',
                    'dcipher_claude': 'DCIPHER-CLAUDE',
                    'dcipher_gemini': 'DCIPHER-GEMINI'
                }
                model_name = model_names.get(key, key)
                
                # Create completed process information
                total_cost = RUNNING_STATUS[(problem_id, key)]['total_cost']
                cost_updates_count = len(RUNNING_STATUS[(problem_id, key)]['cost_updates'])
                
                print(f"[{datetime.now()}] Completed process cost info: problem_id={problem_id}, key={key}, total_cost={total_cost}, cost_updates_count={cost_updates_count}")
                
                completed_process = {
                    'problem_id': problem_id,
                    'problem_name': problem_name,
                    'category': category,
                    'key': key,
                    'model_name': model_name,
                    'seed': seed,
                    'start_time': RUNNING_STATUS[(problem_id, key)]['start_time'].isoformat(),
                    'end_time': datetime.now().isoformat(),
                    'cmd': RUNNING_STATUS[(problem_id, key)]['cmd'],
                    'return_code': proc.returncode,
                    'stdout_lines': len(RUNNING_STATUS[(problem_id, key)]['stdout']),
                    'stderr_lines': len(RUNNING_STATUS[(problem_id, key)]['stderr']),
                    'total_cost': total_cost,
                    'cost_updates_count': cost_updates_count
                }
                
                # Add to completed processes list (keep latest 50)
                COMPLETED_PROCESSES.append(completed_process)
                if len(COMPLETED_PROCESSES) > 50:
                    COMPLETED_PROCESSES.pop(0)
                
                print(f"[{datetime.now()}] Completed process added: {problem_id}/{key}")
                
            except Exception as e:
                print(f"[{datetime.now()}] Failed to collect completed process information: {e}")
            
            # Remove from status
            RUNNING_STATUS.pop((problem_id, key), None)
            print(f"[{datetime.now()}] Status cleanup completed: {problem_id}/{key}")
            # Update run attempt on completion
            try:
                update_run_attempt_cost(problem_id, key, seed, RUNNING_STATUS[(problem_id, key)]['total_cost'], datetime.now().isoformat(), 'finished')
            except Exception as e:
                print(f"[Run attempt completion update failed] {e}")
    
    threading.Thread(target=clear_status_later, daemon=True).start()
    return jsonify({'success': True, 'seed': seed})

@app.route('/api/problem/<int:problem_id>/run_status', methods=['GET'])
def get_run_status(problem_id):
    key = request.args.get('key')
    if (problem_id, key) in RUNNING_STATUS:
        status = RUNNING_STATUS[(problem_id, key)]
        return jsonify({
            'running': True,
            'seed': status['seed'],
            'start_time': status['start_time'].isoformat(),
            'cmd': status['cmd'],
            'stdout': status['stdout'][-10:],  # Latest 10 lines only
            'stderr': status['stderr'][-10:],  # Latest 10 lines only
            'return_code': status['process'].poll(),  # None if running, number if terminated
            'total_cost': status['total_cost'],  # Cost information
            'cost_updates': status['cost_updates'][-5:]  # Latest 5 cost updates
        })
    else:
        return jsonify({'running': False})

@app.route('/api/running_processes', methods=['GET'])
def get_all_running_processes():
    """Returns the status of all running processes."""
    processes = []
    # DB connection to get problem names
    conn = get_db_connection()
    cursor = conn.cursor()
    
    for (problem_id, key), status in RUNNING_STATUS.items():
        # Get problem name and category
        cursor.execute('SELECT name FROM problems WHERE id = ?', (problem_id,))
        row = cursor.fetchone()
        problem_name = row['name'] if row else f'Problem #{problem_id}'
        
        # Get category
        cursor.execute('SELECT category FROM problem_details WHERE id = ?', (problem_id,))
        cat_row = cursor.fetchone()
        category = cat_row['category'] if cat_row and cat_row['category'] else 'BASE'
        
        # Model name mapping
        model_names = {
            'dcipher_gpt': 'DCIPHER-GPT',
            'dcipher_claude': 'DCIPHER-CLAUDE',
            'dcipher_gemini': 'DCIPHER-GEMINI'
        }
        model_name = model_names.get(key, key)
        
        processes.append({
            'problem_id': problem_id,
            'problem_name': problem_name,
            'category': category,
            'key': key,
            'model_name': model_name,
            'seed': status['seed'],
            'start_time': status['start_time'].isoformat(),
            'cmd': status['cmd'],
            'return_code': status['process'].poll(),
            'stdout_lines': len(status['stdout']),
            'stderr_lines': len(status['stderr']),
            'total_cost': status['total_cost'],  # Cost information
            'cost_updates_count': len(status['cost_updates'])  # Cost update count
        })
    
    conn.close()
    return jsonify({'processes': processes})

@app.route('/api/debug/process/<int:problem_id>', methods=['GET'])
def debug_process(problem_id):
    """Returns process debugging information."""
    key = request.args.get('key')
    if not key:
        return jsonify({'error': 'key parameter is required'}), 400
    
    if (problem_id, key) not in RUNNING_STATUS:
        return jsonify({'error': 'Process is not running'}), 404
    
    status = RUNNING_STATUS[(problem_id, key)]
    process = status['process']
    
    import os
    import psutil
    
    debug_info = {
        'problem_id': problem_id,
        'key': key,
        'pid': process.pid,
        'return_code': process.poll(),
        'cmd': status['cmd'],
        'start_time': status['start_time'].isoformat(),
        'stdout_lines': len(status['stdout']),
        'stderr_lines': len(status['stderr']),
        'working_dir': '../EVAL-D-CIPHER',
                    'total_cost': status['total_cost'],  # Cost information
            'cost_updates': status['cost_updates']  # Cost update history
    }
    
    try:
        # Detailed information using psutil
        if process.pid:
            proc_info = psutil.Process(process.pid)
            debug_info.update({
                'cpu_percent': proc_info.cpu_percent(),
                'memory_info': proc_info.memory_info()._asdict(),
                'status': proc_info.status(),
                'create_time': datetime.fromtimestamp(proc_info.create_time()).isoformat(),
                'num_threads': proc_info.num_threads(),
                'open_files': len(proc_info.open_files()),
                'connections': len(proc_info.connections())
            })
    except Exception as e:
        debug_info['psutil_error'] = str(e)
    
    return jsonify(debug_info)

@app.route('/api/logs/<int:problem_id>', methods=['GET'])
def get_log_files(problem_id):
    """Returns the list of log files for a specific problem."""
    key = request.args.get('key')
    if not key:
        return jsonify({'error': 'key parameter is required'}), 400
    
    # Set working directory
    working_dir = '../EVAL-D-CIPHER'
    
    import os
    import glob
    
    log_files = []
    try:
        # Log file patterns (common log file extensions)
        log_patterns = ['*.log', '*.txt', 'logs/*.log', 'logs/*.txt', 'output/*.log', 'output/*.txt']
        
        for pattern in log_patterns:
            files = glob.glob(os.path.join(working_dir, pattern))
            for file_path in files:
                # File size and modification time information
                stat = os.stat(file_path)
                log_files.append({
                    'path': file_path,
                    'name': os.path.basename(file_path),
                    'size': stat.st_size,
                    'modified': datetime.fromtimestamp(stat.st_mtime).isoformat(),
                    'relative_path': os.path.relpath(file_path, working_dir)
                })
        
        # Sort by recent modification time
        log_files.sort(key=lambda x: x['modified'], reverse=True)
        
    except Exception as e:
        return jsonify({'error': f'Log file search failed: {str(e)}'}), 500
    
    return jsonify({
        'working_dir': working_dir,
        'log_files': log_files
    })

@app.route('/api/stream_logs/<int:problem_id>', methods=['GET'])
def stream_logs(problem_id):
    """Streams real-time logs of the running process."""
    from flask import Response, stream_with_context
    import time
    
    key = request.args.get('key')
    if not key:
        return jsonify({'error': 'key parameter is required'}), 400
    
    if (problem_id, key) not in RUNNING_STATUS:
        return jsonify({'error': 'Process is not running'}), 404
    
    status = RUNNING_STATUS[(problem_id, key)]
    process = status['process']
    
    def generate():
        """Generator for real-time logs."""
        last_stdout_len = len(status['stdout'])
        last_stderr_len = len(status['stderr'])
        
        while process.poll() is None:  # While process is running
            # Check for new stdout logs
            if len(status['stdout']) > last_stdout_len:
                new_lines = status['stdout'][last_stdout_len:]
                for line in new_lines:
                    yield f"data: {json.dumps({'type': 'stdout', 'line': line, 'timestamp': datetime.now().isoformat()})}\n\n"
                last_stdout_len = len(status['stdout'])
            
            # Check for new stderr logs
            if len(status['stderr']) > last_stderr_len:
                new_lines = status['stderr'][last_stderr_len:]
                for line in new_lines:
                    yield f"data: {json.dumps({'type': 'stderr', 'line': line, 'timestamp': datetime.now().isoformat()})}\n\n"
                last_stderr_len = len(status['stderr'])
            
            time.sleep(0.5)  # Check every 0.5 seconds
        
        # Send final status when process ends
        yield f"data: {json.dumps({'type': 'finished', 'return_code': process.returncode, 'timestamp': datetime.now().isoformat()})}\n\n"
    
    return Response(
        stream_with_context(generate()),
        mimetype='text/event-stream',
        headers={
            'Cache-Control': 'no-cache',
            'Connection': 'keep-alive',
            'Access-Control-Allow-Origin': '*',
            'Access-Control-Allow-Headers': 'Cache-Control'
        }
    )

@app.route('/api/download_all', methods=['POST'])
def download_all_problems():
    base_dir = os.path.join(os.getcwd(), 'downloads')
    os.makedirs(base_dir, exist_ok=True)
    # Get all problems and detailed information from DB
    problems = get_problems_from_db()
    conn = get_db_connection()
    cursor = conn.cursor()
    for p in problems:
        pid = p['id']
        # Detailed information
        cursor.execute('SELECT category, description, files FROM problem_details WHERE id = ?', (pid,))
        row = cursor.fetchone()
        print(row)
        if not row:
            continue
        category = row['category'] or 'BASE'
        description = row['description'] or ''
        import json
        files = json.loads(row['files']) if row['files'] else []
        # Create folders
        cat_dir = os.path.join(base_dir, category.upper())
        prob_dir = os.path.join(cat_dir, p['name'])
        os.makedirs(prob_dir, exist_ok=True)
        # Save Description.txt
        desc_path = os.path.join(prob_dir, 'Description.txt')
        with open(desc_path, 'w', encoding='utf-8') as f:
            f.write(description)
        # Download files
        for f_url in files:
            try:
                # Create full URL
                if f_url.startswith('/'):
                    f_url_full = f"{MCP_SERVER_URL}{f_url}"
                else:
                    f_url_full = f_url
                fname = f_url.split('/')[-1].split('?')[0]
                file_path = os.path.join(prob_dir, fname)
                if not os.path.exists(file_path):
                    r = req.get(f_url_full, timeout=30)
                    if r.status_code == 200:
                        with open(file_path, 'wb') as out:
                            out.write(r.content)
            except Exception as e:
                print(f'File download failed: {f_url}, {e}')
    conn.close()
    return jsonify({'success': True, 'message': f'All problem files have been saved to {base_dir}.'})

@app.route('/api/completed_processes', methods=['GET'])
def get_completed_processes():
    """Returns the list of completed processes."""
    try:
        # Add problem names to completed processes if not already present
        conn = get_db_connection()
        cursor = conn.cursor()
        
        for process in COMPLETED_PROCESSES:
            if 'problem_name' not in process:
                cursor.execute('SELECT name FROM problems WHERE id = ?', (process['problem_id'],))
                row = cursor.fetchone()
                process['problem_name'] = row['name'] if row else f'Problem #{process["problem_id"]}'
        
        conn.close()
        
        return jsonify({
            'success': True,
            'processes': COMPLETED_PROCESSES
        })
    except Exception as e:
        return jsonify({
            'success': False,
            'error': str(e)
        }), 500

@app.route('/api/v1/challenges/attempt', methods=['POST'])
def ctf_proxy_attempt():
    """CTF problem solving proxy API"""
    try:
        # Parse request data
        data = request.get_json()
        challenge_id = data.get('challenge_id')
        submission = data.get('submission')
        model_key = data.get('model_key')  # Add model information
        auth_token = request.headers.get('Authorization')
        
        if not challenge_id or not submission:
            return jsonify({
                'success': False,
                'message': 'Missing challenge_id or submission'
            }), 400
        
        if not auth_token:
            return jsonify({
                'success': False,
                'message': 'Missing Authorization header'
            }), 401
        
        print(f"[{datetime.now()}] CTF proxy request: challenge_id={challenge_id}, submission={submission}, model={model_key}")
        
        # Check for previously successful flags from server in DB
        conn = get_db_connection()
        cursor = conn.cursor()
        cursor.execute('''
            SELECT flag, status FROM ctf_flags 
            WHERE challenge_id = ? AND status = 'correct'
            ORDER BY submitted_at DESC LIMIT 1
        ''', (challenge_id,))
        correct_flag = cursor.fetchone()
        
        if correct_flag:
            # If problem was already judged successful by server, compare with stored correct flag
            stored_flag = correct_flag[0]
            if submission == stored_flag:
                print(f"[{datetime.now()}] Already solved problem - correct flag verification: challenge_id={challenge_id}")
                conn.close()
                return jsonify({
                    'success': True,
                    'data': {
                        'status': 'correct',
                        'message': 'Correct'
                    }
                })
            else:
                print(f"[{datetime.now()}] Already solved problem - incorrect flag: challenge_id={challenge_id}")
                conn.close()
                return jsonify({
                    'success': True,
                    'data': {
                        'status': 'incorrect',
                        'message': 'Incorrect'
                    }
                })
        
        # Check if currently submitted flag was previously submitted
        cursor.execute('''
            SELECT status FROM ctf_flags 
            WHERE challenge_id = ? AND flag = ?
        ''', (challenge_id, submission))
        existing_submission = cursor.fetchone()
        
        if existing_submission:
            # If flag was previously submitted, return the result from server as-is
            status = existing_submission[0]
            print(f"[{datetime.now()}] Previously submitted flag: challenge_id={challenge_id}, status={status}")
            conn.close()
            
            if status == 'correct':
                return jsonify({
                    'success': True,
                    'data': {
                        'status': 'correct',
                        'message': 'Correct'
                    }
                })
            else:
                return jsonify({
                    'success': True,
                    'data': {
                        'status': 'incorrect',
                        'message': 'Incorrect'
                    }
                })
        
        # Send request to actual server
        target_url = f"{CTFD_BASE_URL}/api/v1/challenges/attempt"
        headers = {
            'Content-Type': 'application/json',
            'Authorization': auth_token
        }
        
        print(f"[{datetime.now()}] Sending request to actual server: {target_url}")
        print(f"[{datetime.now()}] Request data: {data}")
        response = requests.post(target_url, json=data, headers=headers, timeout=10)
        response_data = response.json()
        
        print(f"[{datetime.now()}] Server response: {response_data}")
        
        # Check response status
        if response_data.get('success') and 'data' in response_data:
            status = response_data['data'].get('status')
            
            # Save flag to DB (including model information)
            try:
                # Cost information is not currently provided by CTF server, so save as None
                # In practice, cost information parsed from execution logs should be used
                cursor.execute('''
                    INSERT INTO ctf_flags (challenge_id, flag, status, model_key, cost)
                    VALUES (?, ?, ?, ?, ?)
                ''', (challenge_id, submission, status, model_key, None))
                conn.commit()
                print(f"[{datetime.now()}] Flag saved successfully: challenge_id={challenge_id}, status={status}, model={model_key}")
                
                # If flag is correct and this is the first time this model got it right, update solution status
                if status == 'correct' and model_key:
                    # Check if this model previously got it right
                    cursor.execute('''
                        SELECT COUNT(*) FROM ctf_flags 
                        WHERE challenge_id = ? AND model_key = ? AND status = 'correct' AND id != last_insert_rowid()
                    ''', (challenge_id, model_key))
                    previous_correct = cursor.fetchone()[0]
                    
                    if previous_correct == 0:
                        # If this is the first time this model got it right, update only this model's solution status
                        update_problem_solved_status(challenge_id, model_key)
                        print(f"[{datetime.now()}] Model solution status updated: challenge_id={challenge_id}, model={model_key}")
                
            except Exception as e:
                print(f"[{datetime.now()}] Flag save failed: {e}")
        
        conn.close()
        
        # Return original response as-is
        return jsonify(response_data)
        
    except requests.RequestException as e:
        print(f"[{datetime.now()}] Server connection failed: {e}")
        return jsonify({
            'success': False,
            'message': 'Failed to connect to CTF server'
        }), 500
        
    except Exception as e:
        print(f"[{datetime.now()}] CTF proxy error: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({
            'success': False,
            'message': 'Internal server error'
        }), 500

@app.route('/api/ctf/flags', methods=['GET'])
def get_ctf_flags():
    """Retrieves the list of CTF flags."""
    try:
        challenge_id = request.args.get('challenge_id', type=int)
        
        conn = get_db_connection()
        cursor = conn.cursor()
        
        if challenge_id:
            # Query flags for specific problem only
            cursor.execute('''
                SELECT challenge_id, flag, status, model_key, cost, submitted_at 
                FROM ctf_flags 
                WHERE challenge_id = ?
                ORDER BY submitted_at DESC
            ''', (challenge_id,))
        else:
            # Query all flags
            cursor.execute('''
                SELECT challenge_id, flag, status, model_key, cost, submitted_at 
                FROM ctf_flags 
                ORDER BY submitted_at DESC
            ''')
        
        flags = []
        for row in cursor.fetchall():
            flags.append({
                'challenge_id': row['challenge_id'],
                'flag': row['flag'],
                'status': row['status'],
                'model_key': row['model_key'],
                'cost': row['cost'],
                'submitted_at': row['submitted_at']
            })
        
        conn.close()
        
        return jsonify({
            'success': True,
            'flags': flags
        })
        
    except Exception as e:
        print(f"[{datetime.now()}] CTF flag query error: {e}")
        return jsonify({
            'success': False,
            'message': 'Failed to retrieve flags'
        }), 500

@app.route('/api/ctf/update_cost', methods=['POST'])
def update_ctf_cost():
    """Updates the cost information for CTF flag submissions."""
    try:
        data = request.get_json()
        challenge_id = data.get('challenge_id')
        model_key = data.get('model_key')
        cost = data.get('cost')
        
        if not challenge_id or not model_key or cost is None:
            return jsonify({
                'success': False,
                'message': 'Missing required parameters'
            }), 400
        
        conn = get_db_connection()
        cursor = conn.cursor()
        
        # Update cost for the most recent flag submission record for the model
        cursor.execute('''
            UPDATE ctf_flags 
            SET cost = ? 
            WHERE challenge_id = ? AND model_key = ? 
            ORDER BY submitted_at DESC 
            LIMIT 1
        ''', (cost, challenge_id, model_key))
        
        conn.commit()
        conn.close()
        
        print(f"[{datetime.now()}] CTF cost updated: challenge_id={challenge_id}, model={model_key}, cost=${cost}")
        
        return jsonify({
            'success': True,
            'message': 'Cost updated successfully'
        })
        
    except Exception as e:
        print(f"[{datetime.now()}] CTF cost update error: {e}")
        return jsonify({
            'success': False,
            'message': 'Failed to update cost'
        }), 500

def update_ctf_cost_internal(challenge_id, model_key, cost):
    """Internally updates the cost information for CTF flag submissions."""
    try:
        conn = get_db_connection()
        cursor = conn.cursor()
        
        # Update cost for the most recent flag submission record for the model
        cursor.execute('''
            UPDATE ctf_flags 
            SET cost = ? 
            WHERE challenge_id = ? AND model_key = ? 
            ORDER BY submitted_at DESC 
            LIMIT 1
        ''', (cost, challenge_id, model_key))
        
        conn.commit()
        conn.close()
        
        print(f"[{datetime.now()}] Internal CTF cost update: challenge_id={challenge_id}, model={model_key}, cost=${cost}")
        
    except Exception as e:
        print(f"[{datetime.now()}] Internal CTF cost update failed: {e}")

def update_problem_solved_status(challenge_id, model_key):
    """Updates the problem solution status when CTF flag is correct."""
    try:
        conn = get_db_connection()
        cursor = conn.cursor()
        
        # Set the solution status for the model to 1
        solved_column = f'{model_key}_solved'
        cursor.execute(f'''
            UPDATE problems 
            SET {solved_column} = 1, updated_at = CURRENT_TIMESTAMP 
            WHERE id = ?
        ''', (challenge_id,))
        
        # Check if all models have solved it
        cursor.execute('''
            SELECT dcipher_gpt_solved, dcipher_claude_solved, dcipher_gemini_solved
            FROM problems WHERE id = ?
        ''', (challenge_id,))
        row = cursor.fetchone()
        
        if row and all(row):  # If all models have solved it
            # Update solved_by_name (e.g., "All Models")
            cursor.execute('''
                UPDATE problems 
                SET solved_by_name = 'All Models', updated_at = CURRENT_TIMESTAMP 
                WHERE id = ?
            ''', (challenge_id,))
            print(f"[{datetime.now()}] All models solved: challenge_id={challenge_id}")
        
        conn.commit()
        conn.close()
        
        print(f"[{datetime.now()}] Problem solution status updated: challenge_id={challenge_id}, model={model_key}")
        
    except Exception as e:
        print(f"[{datetime.now()}] Problem solution status update failed: {e}")

def get_model_costs(problem_id):
    """Gets cost information for each model for a specific problem."""
    try:
        conn = get_db_connection()
        cursor = conn.cursor()
        models = ['dcipher_gpt', 'dcipher_claude', 'dcipher_gemini']
        costs_data = {}
        for model in models:
            cursor.execute('''
                SELECT seed, start_time, end_time, cost, status
                FROM run_attempts
                WHERE challenge_id = ? AND model_key = ?
                ORDER BY start_time ASC
            ''', (problem_id, model))
            runs = cursor.fetchall()
            costs_data[model] = []
            for i, run in enumerate(runs, 1):
                costs_data[model].append({
                    'attempt': i,
                    'seed': run[0],
                    'start_time': run[1],
                    'end_time': run[2],
                    'cost': run[3],
                    'status': run[4]
                })
        conn.close()
        return costs_data
    except Exception as e:
        print(f"[{datetime.now()}] Model cost query failed: {e}")
        return {}

def get_correct_flag(problem_id):
    """Gets the correct flag for a specific problem."""
    try:
        conn = get_db_connection()
        cursor = conn.cursor()
        
        cursor.execute('''
            SELECT flag, model_key, submitted_at
            FROM ctf_flags 
            WHERE challenge_id = ? AND status = 'correct'
            ORDER BY submitted_at DESC LIMIT 1
        ''', (problem_id,))
        
        result = cursor.fetchone()
        conn.close()
        
        if result:
            return {
                'flag': result[0],
                'model_key': result[1],
                'submitted_at': result[2]
            }
        return None
        
    except Exception as e:
        print(f"[{datetime.now()}] Correct flag query failed: {e}")
        return None

def get_venv_environment(venv_path):
    """Sets up environment variables for virtual environment."""
    env = os.environ.copy()
    env['PYTHONUNBUFFERED'] = '1'
    
    if not os.path.exists(venv_path):
        return env, None
    
    # Set virtual environment Python path
    if sys.platform.startswith('win'):
        python_path = os.path.join(venv_path, 'Scripts', 'python.exe')
    else:
        python_path = os.path.join(venv_path, 'bin', 'python')
    
    if os.path.exists(python_path):
        # Set basic virtual environment environment variables
        env['VIRTUAL_ENV'] = os.path.abspath(venv_path)
        if sys.platform.startswith('win'):
            env['PATH'] = os.path.join(venv_path, 'Scripts') + os.pathsep + env.get('PATH', '')
        else:
            env['PATH'] = os.path.join(venv_path, 'bin') + os.pathsep + env.get('PATH', '')
        
        print(f"[{datetime.now()}] Virtual environment setup completed: {venv_path}")
        return env, python_path
    else:
        print(f"[{datetime.now()}] Virtual environment Python not found: {python_path}")
        return env, None

@app.route('/api/process/<int:problem_id>/terminate', methods=['POST'])
def terminate_process_api(problem_id):
    key = request.args.get('key')
    if not key:
        return jsonify({'success': False, 'message': 'key parameter is required'}), 400
    proc_info = RUNNING_STATUS.get((problem_id, key))
    if not proc_info:
        return jsonify({'success': False, 'message': 'No running process found.'}), 404
    proc = proc_info['process']
    try:
        proc.kill()
        return jsonify({'success': True})
    except Exception as e:
        return jsonify({'success': False, 'message': str(e)}), 500


@app.route('/api/docker/cleanup/start', methods=['POST'])
def start_docker_cleanup_api():
    """Start docker cleanup thread via API."""
    try:
        start_docker_cleanup()
        return jsonify({'success': True, 'message': 'Docker cleanup started'})
    except Exception as e:
        return jsonify({'success': False, 'message': str(e)}), 500


@app.route('/api/docker/cleanup/stop', methods=['POST'])
def stop_docker_cleanup_api():
    """Stop docker cleanup thread via API."""
    try:
        stop_docker_cleanup()
        return jsonify({'success': True, 'message': 'Docker cleanup stop requested'})
    except Exception as e:
        return jsonify({'success': False, 'message': str(e)}), 500


@app.route('/api/docker/cleanup/status', methods=['GET'])
def get_docker_cleanup_status():
    """Get docker cleanup thread status."""
    global docker_cleanup_thread, docker_cleanup_running
    return jsonify({
        'running': docker_cleanup_running,
        'thread_alive': docker_cleanup_thread.is_alive() if docker_cleanup_thread else False,
        'check_interval_minutes': CHECK_INTERVAL // 60,
        'delete_threshold_minutes': DELETE_THRESHOLD.total_seconds() // 60,
        'target_images': list(TARGET_IMAGES)
    })


@app.route('/api/docker/cleanup/run-now', methods=['POST'])
def run_docker_cleanup_now():
    """Run docker cleanup immediately."""
    try:
        removed = remove_old_containers()
        return jsonify({
            'success': True,
            'removed_containers': len(removed),
            'details': [{'name': name, 'image': image, 'uptime': uptime} for name, image, uptime in removed]
        })
    except Exception as e:
        return jsonify({'success': False, 'message': str(e)}), 500

if __name__ == '__main__':
    # Initialize database
    init_db()
    
    # Start docker cleanup thread
    start_docker_cleanup()
    
    # Run Flask app
    app.run(debug=False, host='0.0.0.0', port=5000) 