

import json
import os
import random

import editdistance
import torch

import pandas as pd
import fire
import numpy as np
from sklearn.metrics import roc_auc_score, roc_curve
from sentence_transformers import SentenceTransformer

def sample(arr: np.array, n: int, k: int):
    arr = arr.tolist()
    new_arr = []
    for _ in range(k):
        new_arr.append(np.mean(np.array(random.sample(arr, n))))
    return np.array(new_arr)

def aggregate(arr: np.array, n: int):
    arr = arr.tolist()
    new_arr = []
    for i in range(0, len(arr), n):
        new_arr.append(np.mean(np.array(arr[i:i+n])))
    return np.array(new_arr)

def tpr_target(labels, scores, target_fpr):
    fpr, tpr, _ = roc_curve(labels, scores)
    
    indices = None
    for i in range(len(fpr)):
        if fpr[i] >= target_fpr:
            if i == 0:
                indices = [i]
            else:
                indices = [i-1, i]
            break

    if indices is None:
        return tpr[-1]
    else:
        tpr_values = [tpr[i] for i in indices]
        return np.mean(tpr_values)

def main(
    debug: bool = False,
):
    dirname = "./data"
    filenames = [
        "MTD_reddit_12000_Mistral-7B-Instruct-v0.3_N=5.jsonl.iter=1",
        "MTD_reddit_12000_Mistral-7B-Instruct-v0.3_N=5.jsonl.iter=2",
        "MTD_reddit_12000_Mistral-7B-Instruct-v0.3_N=5.jsonl.iter=3",
    ]
    df1 = pd.read_json(os.path.join(dirname, filenames[0]), lines=True)
    df2 = pd.read_json(os.path.join(dirname, filenames[1]), lines=True)
    df3 = pd.read_json(os.path.join(dirname, filenames[2]), lines=True)

    model = SentenceTransformer("all-mpnet-base-v2")
    model.cuda()
    machine_text = df1.generation.tolist()
    para_machine_text = df1.paraphrase_generation.apply(lambda x: x[0]).tolist()
    iter1 = df1.transfer_pick.apply(lambda x: x[-1]).tolist()
    iter2 = df2.transfer_pick.apply(lambda x: x[-1]).tolist()
    iter3 = df3.transfer_pick.apply(lambda x: x[-1]).tolist()

    if debug:
        machine_text = machine_text[:10]
        para_machine_text = para_machine_text[:10]
        iter1 = iter1[:10]
        iter2 = iter2[:10]
        iter3 = iter3[:10]

    # calculate similarity to generation
    machine_text_embeddings = model.encode(machine_text, show_progress_bar=True)
    para_machine_text_embeddings = model.encode(para_machine_text, show_progress_bar=True)
    iter1_embeddings = model.encode(iter1, show_progress_bar=True)
    iter2_embeddings = model.encode(iter2, show_progress_bar=True)
    iter3_embeddings = model.encode(iter3, show_progress_bar=True)
    
    cossim = torch.nn.CosineSimilarity(dim=-1)
    print("Machine Text to Iter1", cossim(torch.tensor(machine_text_embeddings), torch.tensor(iter1_embeddings)).mean().item())
    print("Machine Text to Iter2", cossim(torch.tensor(machine_text_embeddings), torch.tensor(iter2_embeddings)).mean().item())
    print("Machine Text to Iter3", cossim(torch.tensor(machine_text_embeddings), torch.tensor(iter3_embeddings)).mean().item())
    print("Para to Machine Text", cossim(torch.tensor(para_machine_text_embeddings), torch.tensor(machine_text_embeddings)).mean().item())

    # same as above but with edit distance
    print("Machine Text to Iter1", np.mean([editdistance.eval(a, b) for a, b in zip(machine_text, iter1)]))
    print("Machine Text to Iter2", np.mean([editdistance.eval(a, b) for a, b in zip(machine_text, iter2)]))
    print("Machine Text to Iter3", np.mean([editdistance.eval(a, b) for a, b in zip(machine_text, iter3)]))
    print("Para to Machine Text", np.mean([editdistance.eval(a, b) for a, b in zip(para_machine_text, machine_text)]))

    return 0

if __name__ == "__main__":
    random.seed(43)
    fire.Fire(main)
