
import os
import math
import sys
import scipy.stats as stats

from scores_v2 import scores

data = {}
target_methods = ['Fixed-Grad0', 'Fixed-Grad0.0001', 'Fixed-Grad0.1']

for key, val in scores.items():
    parts = key.split('/')
    if len(parts) != 4: continue
    env, type_, method, beta = parts
    
    if not method.startswith('Fixed'): continue
    
    if env not in data: data[env] = {}
    if type_ not in data[env]: data[env][type_] = {}
    if method not in data[env][type_]: data[env][type_][method] = {}
    
    data[env][type_][method][beta] = val

print(f"{'Group (Env/Type/Grad)':<50} | {'H-Statistic':<12} | {'P-Value':<12} | {'Significance':<15}")
print("-" * 100)

for env in sorted(data.keys()):
    for dtype in sorted(data[env].keys()):
        for method in target_methods:
            if method not in data[env][dtype]: continue
            
            betas = sorted(data[env][dtype][method].keys())
            groups = [data[env][dtype][method][b] for b in betas]

            filter_groups = []
            for g in groups:
                params = [x for x in g if not math.isnan(x)]
                if params:
                    filter_groups.append(params)
            
            if len(filter_groups) < 2:
                print(f"{f'{env}/{dtype}/{method}':<50} | {'N/A':<12} | {'N/A':<12} | {'Not Enough Data':<15}")
                continue
            
            H, p_value = stats.kruskal(*filter_groups)
            sig_str = "SIGNIFICANT" if p_value < 0.05 else "Not Significant"
            
            if p_value < 0.001:
                p_str = "< 0.001"
            else:
                p_str = f"{p_value:.4f}"
            
            print(f"{f'{env}/{dtype}/{method}':<50} | {H:<12.4f} | {p_str:<12} | {sig_str:<15}")
