# eval_test.py
# EDIT ME: either auto-pick best from alpha_tuning_summary.csv or define selections manually.
import _pathfix
import torch
from tgm.scripts.eval_utils import evaluate_on_test, score_fn, evaluate_single_on_test



if __name__ == "__main__":
    parent_dir = None      # source folder
    output_dir = None
    dataset = "BlackScholes1d"          # EDIT

    model_a_name = "DriftDiffusionModel"           # EDIT
    model_b_name = "JumpModel"          # EDIT
    jump_api = "jump"

    # TODO: provide your actual test set here
    test_x   = torch.load("../data/stock/test_data.pt",   map_location="cuda", weights_only=True)
    test_t   = torch.load("../data/stock/test_times.pt",  map_location="cuda", weights_only=True)
    test_set = {"x": test_x, "t": test_t.unsqueeze(0).expand(test_x.shape[0], -1)}

    # Seeds to evaluate (intersection of available seeds on both sides is used)
    seeds = [0, 1, 2, 3, 4]             # EDIT

    # Manual selections
    selections = [
        {"variant_a": "mmd", "variant_b": "mmd", "sigma": 0.03, "rho": 0.0001, "t_sub": 50, "alpha": 0.7}
    ]

    lr = 1e-5
    map_location = "cuda"

    raw_df, summary_df = evaluate_on_test(
        parent_dir=parent_dir,
        dataset=dataset,
        model_a_name=model_a_name,
        model_b_name=model_b_name,
        selections=selections,
        test_set=test_set,
        seeds=seeds,
        lr=lr,
        map_location=map_location,
        output_dir=output_dir,
        score_fn=score_fn,
        summary_name="test_results_MS_50_summary.csv",
        raw_name="test_results_MS_50_raw.csv",
        jump_api = jump_api
    )
    print(summary_df.head())