from collections import OrderedDict
import re
import os

import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns
import torch
from tqdm.notebook import tqdm
import numpy as np
import json
import pickle
import sys

sys.path.append('/root/weiminwu/in-context-learning-fork/in-context-learning/src/')

from eval import get_run_metrics, read_run_dir, get_model_from_run
from plot_utils import basic_plot, collect_results, relevant_model_names
from models import get_relevant_baselines, GDModel, DecisionTreeModel
from base_models import NeuralNetwork, ParallelNetworks

from samplers import get_data_sampler
from tasks import get_task_sampler


run_dir = "../models"
task = "relu_2nn_regression"
run_id = "b98285ff-feda-4a04-8914-3810a4bec3f3"
run_path = os.path.join(run_dir, task, run_id)

save_path = '/root/weiminwu/in-context-learning-fork/in-context-learning/src/evaluation/results/NN/exp_3'

def Square_Error(ys, pred):
    y_mean = torch.mean(ys)
    SS_tot = torch.sum((ys - y_mean) ** 2)
    SS_res = torch.sum((ys - pred) ** 2)
    R_square = 1 - SS_res / SS_tot
    return R_square

# compute similarity
def similarity(x, x_test):
    cos = torch.nn.CosineSimilarity(dim=1, eps=1e-6)
    x = x.unsqueeze(0)
    x_test = x_test.unsqueeze(0)
    return cos(x, x_test)

model, conf = get_model_from_run(run_path)

n_dims = conf.model.n_dims
batch_size = conf.training.batch_size
data_sampler = get_data_sampler(conf.training.data, n_dims)
task_sampler = get_task_sampler(
    conf.training.task,
    n_dims,
    batch_size,
    **conf.training.task_kwargs
)

task = task_sampler()

# Part1: 100% accurate
n_batches = 3
prompt_length = 76
n_pairs = 1000
n_dims = 20
batch_size = 64
        
# Baseline
baselines = {
        "relu_2nn_regression": [
            (
                GDModel,
                {
                    "model_class": NeuralNetwork,
                    "model_class_args": {
                        "in_size": 20,
                        "hidden_size": 100,
                        "out_size": 1,
                    },
                    "opt_alg": "adam",
                    "batch_size": 64,
                    "lr": 5e-3,
                    "num_steps": 100,
                },
            ),
        ],
        "decision_tree": [
            (DecisionTreeModel, {"max_depth": 4}),
            # (DecisionTreeModel, {"max_depth": None}),
        ],
    }

baseline = [model_cls(**kwargs) for model_cls, kwargs in baselines[conf.training.task]]

actual_points_base = [[] for _ in range(prompt_length)]
predicted_points_base = [[] for _ in range(prompt_length)]
all_errors_base = []

with open(save_path+'/data.pkl', 'rb') as file:
    data = pickle.load(file)
xs_list = data['x']
ys_list = data['y']
for time_idx in tqdm(range(n_batches)):
    xs_list[time_idx] = torch.from_numpy(xs_list[time_idx])
    ys_list[time_idx] = torch.from_numpy(ys_list[time_idx])

for time_idx in tqdm(range(n_batches)):
    xs = xs_list[time_idx][:,n_pairs:,:]
    ys = ys_list[time_idx][:,n_pairs:]
    pred = baseline[0](xs, ys)
    
    for j in range(prompt_length):
        actual_points_base[j].extend(ys[:, j])
        predicted_points_base[j].extend(pred[:, j])
        
base_error = []

for point_idx in range(prompt_length):
    actual = torch.tensor(actual_points_base[point_idx])
    predicted = torch.tensor(predicted_points_base[point_idx])
    R_square = Square_Error(actual, predicted)
    base_error.append(R_square)
    
with open(save_path+'/baseline.txt', 'w') as f:
    for value in base_error:
        f.write(f"{value}\n")
