import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import seaborn as sns
from pathlib import Path
import re
import json

plt.style.use('seaborn-v0_8-whitegrid')
sns.set_palette("husl")

plt.rcParams['font.family'] = 'Times New Roman'

plt.rcParams['font.size'] = 5
plt.rcParams['axes.titlesize'] = 10
plt.rcParams['axes.labelsize'] = 8
plt.rcParams['legend.fontsize'] = 7
plt.rcParams['xtick.labelsize'] = 7
plt.rcParams['ytick.labelsize'] = 7

def size_to_numeric(size_str):
    """Converts model size string to a sortable numeric value (in billions)."""
    size_str = str(size_str).upper()
    if 'MINI' in size_str:
        return 0.1
    if 'M' in size_str:
        return float(size_str.replace('M', '')) / 1000
    if 'B' in size_str:
        return float(size_str.replace('B', ''))
    return 999

def parse__info(csv_name):
    """Extract name, size, type, and contamination level from CSV filename."""
    clean_csv_name = csv_name.replace(' ', '')
    
    parts = clean_csv_name.split('_')
    
    contamination = None
    for i, part in enumerate(parts):
        if part.isdigit() and int(part) in [25, 50, 75, 100]:
            contamination = int(part)
            break
    
    is_instruct = 'Instruct' in clean_csv_name
    _type = 'Instruct' if is_instruct else 'Base'
    
    family = 'Unknown'
    size = 'Unknown'
    
    # Extract family (with version) and size using the clean name
    if 'Gemma3' in clean_csv_name:
        family = 'Gemma-3'
        if '_270M_' in clean_csv_name: size = '270M'
        elif '_1B_' in clean_csv_name: size = '1B'
        elif '_4B_' in clean_csv_name: size = '4B'
    elif 'Llama3_2' in clean_csv_name:
        family = 'Llama-3.2'
        if '_3B_' in clean_csv_name: size = '3B'
        elif '_1B_' in clean_csv_name: size = '1B'
    elif 'Qwen2-5' in clean_csv_name:
        family = 'Qwen-2.5'
        if '_3B_' in clean_csv_name: size = '3B'
        elif '_1_5B_' in clean_csv_name: size = '1.5B'
        elif '_0_5B_' in clean_csv_name: size = '0.5B'
    elif 'Phi4' in clean_csv_name:
        family = 'Phi-4'
        size = 'Mini'
    elif 'Olmo2' in clean_csv_name:
        family = 'OLMo-2'
        size = '1B'
    elif 'SmolLM2' in clean_csv_name:
        family = 'SmolLM-2'
        if '_1_7B_' in clean_csv_name: size = '1.7B'
        elif '_360M_' in clean_csv_name: size = '360M'
            
    _name = f"{family}_{size}"
    
    return {
        '_name': _name, 'family': family, 'size': size,
        'numerical_size': size_to_numeric(size),
        'type': _type, 'contamination': contamination,
        'full_name': f"{family}-{size}"
    }

def load_and_process_data(char_file, word_file):
    """Load and process both CSV files for syntactic tasks."""
    char_df = pd.read_csv(char_file)
    word_df = pd.read_csv(word_file)
    
    processed_data = []
    
    for df, task_name in [(char_df, 'Character Reversal'), (word_df, 'Word Reversal')]:
        for _, row in df.iterrows():
            if row['Question'] == 'AVERAGE_METRICS':
                _info = parse__info(row['csv_name'])
                _info.update({
                    'task': task_name,
                    'semantic_similarity': float(row['semantic_similarity']*100),
                    'grammatical_correctness': float(row['grammatical_correctness'].rstrip('%'))
                })
                processed_data.append(_info)
    
    return pd.DataFrame(processed_data)

def create_combined_heatmap(all_data, save_path='./'):
    """Creates heatmaps for adherence and accuracy, and saves the data to JSON."""
    print("Generating combined heatmap for syntactic tasks...")

    # Sort data by family, then numerical size, then type (Base before IT)
    all_data = all_data.sort_values(by=['family', 'numerical_size', 'type'])

    adherence_pivot = all_data.pivot_table(
        values='semantic_similarity', index=['full_name', 'type'], columns=['task', 'contamination'], aggfunc='mean', sort=False
    )
    
    accuracy_pivot = all_data.pivot_table(
        values='grammatical_correctness', index=['full_name', 'type'], columns=['task', 'contamination'], aggfunc='mean', sort=False
    )

    adherence_for_json = adherence_pivot.copy()
    accuracy_for_json = accuracy_pivot.copy()

    adherence_for_json.columns = [f"{col[0]} - {col[1]}%" for col in adherence_for_json.columns]
    accuracy_for_json.columns = [f"{col[0]} - {col[1]}%" for col in accuracy_for_json.columns]

    # Combine into a single dictionary
    json_output_data = {
        'semantic_similarity': adherence_for_json.reset_index().to_dict(orient='records'),
        'grammatical_correctnes': accuracy_for_json.reset_index().to_dict(orient='records')
    }
    
    json_path = Path(save_path) / 'Plot2_Part2_Combined_Syntactic_Heatmap_Data.json'
    with open(json_path, 'w') as f:
        json.dump(json_output_data, f, indent=4)
    print(f"Heatmap data successfully saved to: {json_path}")

    # Y-label logic for both Base and IT models
    y_labels = []
    for name, type_ in accuracy_pivot.index:
        processed_name = name.replace('-', '', 1).replace('-', '_')
        if type_ == 'Instruct':
            y_labels.append(f"{processed_name}_IT")
        else:
            y_labels.append(processed_name)

    fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(5.5, 4), sharey=True)

    # Semantic Similarity
    sns.heatmap(adherence_pivot, annot=True, fmt='.1f', cmap='RdYlGn', 
                cbar_kws={'label': 'Semantic Similarity (%)'}, ax=ax1,
                yticklabels=y_labels)
    ax1.set_title('Semantic Similarity', fontweight='bold', fontsize=8, pad=8)
    ax1.set_ylabel('')

    # Grammatical Correctness
    sns.heatmap(accuracy_pivot, annot=True, fmt='.1f', cmap='RdYlGn', 
                cbar_kws={'label': 'Grammatical Correctness(%)'}, ax=ax2,
                yticklabels=y_labels)
    ax2.set_title('Grammatical Correctness', fontweight='bold', fontsize=8, pad=8)
    ax2.set_ylabel('')

    x_tick_labels = adherence_pivot.columns.get_level_values('contamination')
    num_cont_levels = len(all_data['contamination'].unique())
    pos1 = (num_cont_levels / 2.0)
    pos2 = pos1 + num_cont_levels

    for ax in [ax1, ax2]:
        ax.set_xticklabels(x_tick_labels, rotation=0)
        ax.tick_params(axis='x', length=0)
        ax.set_xlabel('')
        
        ax.axvline(x=num_cont_levels, color='white', linewidth=4)

        ax.text(pos1, -0.05, 'Character Reversal', ha='center', va='top',
                fontweight='bold', transform=ax.get_xaxis_transform(), fontsize=6)
        ax.text(pos2, -0.05, 'Word Reversal', ha='center', va='top',
                fontweight='bold', transform=ax.get_xaxis_transform(), fontsize=6)

    plt.tight_layout(rect=[0, 0, 1, 1])
    plt.savefig(f'{save_path}/Plot2_Part2_Combined_Syntactic_Heatmap.png', dpi=300)
    plt.savefig(f'{save_path}/Plot2_Part2_Combined_Syntactic_Heatmap.pdf')
    plt.show()

def main():
    """Main execution function."""
    char_file = 'CharFlipped.csv'
    word_file = 'WordFlipped.csv'
    
    print("Loading and processing data for syntactic tasks...")
    all_data = load_and_process_data(char_file, word_file)
    
    create_combined_heatmap(all_data)
    
    print("\nCombined syntactic heatmap saved as PNG and PDF formats.")
    print("Analysis complete!")

if __name__ == "__main__":
    main()