"""
Task list utility functions.
List and export task type information.
"""

import json
import csv
from collections import defaultdict


def list_task_types(examine_sites, num_tasks_to_explore, tasks=None):
    """
    List task types and write a CSV file.
    
    Args:
        examine_sites: List of sites to include
        num_tasks_to_explore: Minimum number of task instances per task type
        tasks: Task type list; if None, list all types that meet the criteria
    
    Returns:
        None (prints output and writes CSV)
    """
    # Load task data
    ALL_TASKS = defaultdict(list)
    with open("config_files/test.raw.json", "r") as f:
        data = json.load(f)
    
    # Filter tasks
    for instance in data:
        task_id = instance["task_id"]
        task_template = instance["intent_template"]
        # If examine_sites is set, keep only tasks whose sites are all in examine_sites
        if examine_sites is None or all([(site in examine_sites) for site in instance["sites"]]):
            ALL_TASKS[task_template].append(task_id)
    
    # Keep only task types with enough instances
    ALL_TASKS = {
        task_type: task_list
        for task_type, task_list in ALL_TASKS.items()
        if len(task_list) >= num_tasks_to_explore + 1
    }
    
    # Determine which task types to show
    if tasks is None:
        task_types = list(ALL_TASKS.keys())
    else:
        task_types = tasks
        # Check that all requested task types exist
        missing_tasks = [task for task in task_types if task not in ALL_TASKS]
        if missing_tasks:
            print('⚠️  Warning: The following task types do not exist or do not meet criteria:')
            for task in missing_tasks:
                print(f'   - {task}')
            print()
            # Show available task types
            print('💡 Available task types:')
            for task_template in sorted(ALL_TASKS.keys()):
                print(f'   - {task_template}')
            print()
            # Keep only existing task types
            task_types = [task for task in task_types if task in ALL_TASKS]
            if not task_types:
                print('❌ Error: No matching task types found!')
                return
    
    # Print task type list
    print('=' * 80)
    sites_str = ','.join(examine_sites) if examine_sites else 'None'
    print(f'Task type list (examine_sites={sites_str}, num_tasks_to_explore={num_tasks_to_explore})')
    print('=' * 80)
    print(f'Total task types meeting criteria: {len(task_types)}')
    print(f'Total task instances: {sum(len(tasks) for tasks in ALL_TASKS.values())}')
    print()
    
    for i, task_type in enumerate(sorted(task_types), 1):
        task_count = len(ALL_TASKS[task_type])
        print(f'{i}. {task_type}')
        print(f'   Instance count: {task_count} (task_ids: {ALL_TASKS[task_type][:5]}{"..." if task_count > 5 else ""})')
        print()
    
    # Generate CSV
    # Re-read data to get details per task
    csv_rows = []
    
    for instance in data:
        task_id = instance["task_id"]
        task_template = instance["intent_template"]
        intent = instance.get("intent", "")  # Actual task name after filling params
        sites = instance.get("sites", [])
        all_sites_str = ','.join(sorted(sites))  # All sites, comma-separated
        is_multi_site = 'Yes' if len(sites) > 1 else 'No'  # Multi-site or not
        
        # Include only tasks that pass examine_sites filter
        if examine_sites is None or all([(site in examine_sites) for site in sites]):
            if task_template in ALL_TASKS:
                for site in sites:
                    if examine_sites is None or site in examine_sites:
                        csv_rows.append([site, task_template, task_id, intent, all_sites_str, is_multi_site])
    
    # Sort by site, task type, task ID
    csv_rows.sort(key=lambda x: (x[0], x[1], x[2]))
    
    # Write CSV in project root
    csv_filename = 'task_types.csv'
    
    with open(csv_filename, 'w', newline='', encoding='utf-8') as csvfile:
        writer = csv.writer(csvfile)
        writer.writerow(['Site Type', 'Task Type', 'Task ID', 'Task Name', 'All Sites', 'Multi-Site'])
        writer.writerows(csv_rows)
    
    print(f'\nCSV file written: {csv_filename}')
    print(f'Total {len(set(row[0] for row in csv_rows))} sites, {len(csv_rows)} task instances')
