import pandas as pd
import argparse
import json
import os

parser = argparse.ArgumentParser()
parser.add_argument("--csv", required=True, help="Path to CSV file")
parser.add_argument("--filter", required=True, help="Dataset or dataset group")
parser.add_argument("--groups", default="dataset_groups.json", help="Dataset group JSON file")
args = parser.parse_args()

# Load CSV
df = pd.read_csv(args.csv)

# Ensure column exists
if "Dataset" not in df.columns:
    raise ValueError("CSV must contain a 'Dataset' column.")

# Load dataset groups
if os.path.exists(args.groups):
    with open(args.groups) as f:
        groups = json.load(f)
else:
    groups = {}

# Determine which datasets to filter on
if args.filter in groups:
    target_datasets = groups[args.filter]
else:
    target_datasets = [args.filter]

# Filter rows belonging to these datasets
filtered = df[df["Dataset"].isin(target_datasets)]

if filtered.empty:
    print(f"\nNo rows found in CSV for dataset/group: {args.filter}")
    exit(0)

# Select best row by Test Accuracy
best_idx = filtered["Test Accuracy (%)"].idxmax()
best = filtered.loc[best_idx]

print("\n======================================")
print(f" BEST RESULT FOR: {args.filter}")
print("======================================\n")

print(f"Dataset: {best['Dataset']}")
print(f"Best Test Accuracy: {best['Test Accuracy (%)']:.4f}")
print(f"Validation F1: {best['Val F1 (%)']:.4f}")
print(f"Test F1: {best['Test F1 (%)']:.4f}\n")

print("Optimal parameters:")
for col in filtered.columns:
    if col not in ["Timestamp", "Dataset", "Test Accuracy (%)", "Test Accuracy Std (%)",
                   "Test F1 (%)", "Test F1 Std (%)", "Val F1 (%)", "Val F1 Std (%)",
                   "Val Loss"]:
        print(f"  - {col}: {best[col]}")

print("\nDone.")
