import os
import pandas as pd

from argparse import ArgumentParser
from utils import parse_filename, add_step_column


# Aggregations computed per configuration for every reported metric.
_AGG_SPEC = {
    "avg_accepted_tokens": ["mean", "std", "count"],
    "avg_time_per_call": ["mean", "std", "count"],
    "tokens_per_second": ["mean", "std", "count"],
}

# Number of decimal places used when rendering each metric (same key order
# as _AGG_SPEC so the intermediate column order is stable).
_METRIC_DECIMALS = {
    "avg_accepted_tokens": 2,
    "avg_time_per_call": 4,
    "tokens_per_second": 1,
}

# Metrics that are formatted for the baseline row and carried into the table;
# the baseline's accepted-token cell is left missing and rendered as "---".
_BASELINE_METRICS = ("avg_time_per_call", "tokens_per_second")
_BASELINE_COLUMNS = [
    "circuit",
    "ntoken",
    "adaptor",
    "ncomponent",
    "avg_time_per_call",
    "tokens_per_second",
    "speedup",
]

# Upper-cased circuit name -> LaTeX reference, applied in this order.
_CIRCUIT_REFS = {
    "FF": r"\ref{eq:n-indep-prob}",
    "CP": r"\ref{eq:r-cp}",
    "BTREE": r"\ref{eq:btree}",
    "HMM": r"\ref{eq:r-hmm}",
}

# DataFrame column -> LaTeX header.
_COLUMN_LABELS = {
    "ncomponent": "$r$",
    "ntoken": "$n$",
    "adaptor": "\\# LoRA",
    "avg_accepted_tokens": "\\meanacc~\\incfield",
    "avg_time_per_call": "\\meanlat~\\decfield",
    "tokens_per_second": "\\meantoks~\\incfield",
    "tokens_per_second_no_spec": "\\maxtoks",
    "speedup": "\\speedup",
}
_INDEX_COLUMNS = ["$n$", "circuit", "\\# LoRA"]
_VALUE_COLUMNS = [
    "\\meanlat~\\decfield",
    "\\meanacc~\\incfield",
    "\\meantoks~\\incfield",
    "\\speedup",
]


def _load_baseline(raw_throughput_file: str) -> pd.DataFrame:
    """Return the single ``SingleTokenLM`` row of the raw-throughput file.

    The row is tagged as circuit ``"STP"`` with one component, the ``"NaN"``
    adaptor placeholder and a speed-up of 1 so it can be appended to the
    speculative results.

    Raises:
        ValueError: if the file does not contain exactly one matching row.
    """
    df_raw = pd.read_json(raw_throughput_file, lines=True)
    stp_field = df_raw[df_raw["model"].str.contains("SingleTokenLM")].copy()
    stp_field = stp_field.reset_index(drop=True)
    # Explicit check instead of `assert`, which is stripped under `python -O`.
    if len(stp_field) != 1:
        raise ValueError(
            f"expected exactly one SingleTokenLM row in {raw_throughput_file!r}, "
            f"found {len(stp_field)}"
        )
    stp_field.loc[0, "circuit"] = "STP"
    stp_field.loc[0, "ncomponent"] = 1
    stp_field.loc[0, "adaptor"] = "NaN"
    stp_field["speedup"] = [1]
    return stp_field


def _aggregate_spec(spec_throughput_file: str, step: int) -> pd.DataFrame:
    """Load speculative runs, keep the selected rows and aggregate the metrics.

    Rows are kept when ``step`` equals *step*, ``ncomponent`` is 32 or 1 and
    ``ntoken`` is 1, 8 or 16. The result has one row per
    (ntoken, circuit, ncomponent, adaptor) with mean/std/count of each metric.
    """
    df_spec = pd.read_json(spec_throughput_file, lines=True)
    # NOTE(review): add_step_column presumably derives `step` from the
    # `checkpoint` column -- confirm against utils.
    df_spec = add_step_column(df_spec, "checkpoint")
    keep = (
        (df_spec["step"] == step)
        & df_spec["ncomponent"].isin([32, 1])
        & df_spec["ntoken"].isin([1, 8, 16])
    )
    # Copy so the assignment below does not write into a slice of df_spec
    # (avoids SettingWithCopyWarning).
    df_best = df_spec[keep].copy()
    df_best["circuit"] = df_best["circuit"].str.replace(
        "fully_factorized", "ff", regex=False
    )
    grouped = df_best.groupby(["ntoken", "circuit", "ncomponent", "adaptor"])
    return grouped.agg(_AGG_SPEC).reset_index()


def _format_mean_std(mean: pd.Series, std: pd.Series, decimals: int) -> pd.Series:
    """Render element-wise ``mean{\\scriptsize$\\pm$std}`` strings with fixed decimals."""
    return (
        mean.map(lambda x: f"{x:.{decimals}f}")
        + "{\\scriptsize$\\pm$"
        + std.map(lambda x: f"{x:.{decimals}f}")
        + "}"
    )


def _circuits_to_refs(circuit: pd.Series) -> pd.Series:
    """Replace upper-cased circuit names with their LaTeX ``\\ref`` commands.

    Done on the column rather than on the rendered table so the table label
    (built from the input file name) can never be rewritten by accident.
    """
    for name, ref in _CIRCUIT_REFS.items():
        # regex=False: the replacement contains backslashes and must be literal.
        circuit = circuit.str.replace(name, ref, regex=False)
    return circuit


def _build_result(df_agg: pd.DataFrame, stp_field: pd.DataFrame) -> pd.DataFrame:
    """Combine aggregated speculative rows with the baseline row.

    Returns a frame indexed by ($n$, circuit, # LoRA) whose columns are the
    formatted latency, accepted-token and throughput cells plus the speed-up.
    """
    baseline = stp_field.copy()
    # Read the numeric baseline throughput before it is formatted to a string.
    baseline_tps = baseline.loc[0, "tokens_per_second"]

    collapsed = pd.DataFrame()
    collapsed["ntoken"] = df_agg["ntoken"]
    # "none" becomes "-0" so the trailing "-<digits>" pattern yields 0 for it.
    adaptor = df_agg["adaptor"].str.replace("none", "-0", regex=False)
    collapsed["adaptor"] = adaptor.str.extract(r"-(\d+)$", expand=False).astype(int)
    collapsed["ncomponent"] = df_agg["ncomponent"]
    collapsed["circuit"] = df_agg["circuit"]
    collapsed["speedup"] = df_agg[("tokens_per_second", "mean")] / baseline_tps

    for metric, decimals in _METRIC_DECIMALS.items():
        collapsed[metric] = _format_mean_std(
            df_agg[(metric, "mean")], df_agg[(metric, "std")], decimals
        )
        if metric in _BASELINE_METRICS:
            baseline[metric] = baseline[metric].map(
                lambda x, d=decimals: f"{x:.{d}f}"
            )

    result = pd.concat([collapsed, baseline[_BASELINE_COLUMNS]])
    result = result.sort_values(
        ["ntoken", "circuit", "adaptor", "speedup"],
        ascending=[True, False, True, True],
    )
    result["circuit"] = _circuits_to_refs(result["circuit"].str.upper())
    result = result.rename(columns=_COLUMN_LABELS)
    result = result[_INDEX_COLUMNS + _VALUE_COLUMNS]
    return result.set_index(_INDEX_COLUMNS)


def _postprocess_latex(latex_table: str) -> str:
    """Apply the textual tweaks that ``to_latex`` cannot express.

    Centers multirow cells and the table, shows missing values as ``---``,
    adds a gray ``\\rowcolor`` after every ``\\midrule`` and drops the
    ``\\cline`` pair directly before ``\\bottomrule``. The ``NaN`` replacement
    is applied to the whole string.
    """
    latex_table = latex_table.replace(r"\multirow[t]{", r"\multirow[c]{")
    latex_table = latex_table.replace(
        "\\begin{table}\n", "\\begin{table}\n\\centering\n"
    )
    latex_table = latex_table.replace("NaN", "---")
    latex_table = latex_table.replace(
        "\\midrule\n", "\\midrule\n\\rowcolor{gray!15}"
    )
    latex_table = latex_table.replace(
        "\\cline{1-7} \\cline{2-7}\n\\bottomrule", "\\bottomrule"
    )
    return latex_table


def _render_latex(result: pd.DataFrame, label: str) -> str:
    """Render *result* as a LaTeX table carrying *label* and post-process it."""
    latex_table = result.to_latex(
        column_format="llclllr",
        float_format="%4.2f",
        # NOTE(review): these keys name index levels / a column that is not in
        # the table, so they appear to have no effect -- confirm before removing.
        formatters={
            ("$r$"): lambda x: f"{x:<4d}",
            ("$n$"): lambda x: f"{x:<4d}",
            ("circuit"): lambda x: f"{x:<5s}",
        },
        multirow=True,
        index_names=False,
        label=label,
    )
    return _postprocess_latex(latex_table)


def main() -> None:
    """Parse the command line and print the throughput LaTeX table to stdout."""
    parser = ArgumentParser(
        description="Build a LaTeX throughput table from raw and speculative JSONL logs."
    )
    parser.add_argument(
        "--raw-throughput-file",
        type=str,
        required=True,
        help="Path to jsonl file with raw throughput",
    )
    parser.add_argument(
        "--spec-throughput-file",
        type=str,
        required=True,
        help="Path to jsonl file with speculative throughput",
    )
    parser.add_argument(
        "--step",
        type=int,
        default=900,
        help="Value of the step column to report (default: 900)",
    )
    args = parser.parse_args()

    parts = parse_filename(args.spec_throughput_file)
    stp_field = _load_baseline(args.raw_throughput_file)
    df_agg = _aggregate_spec(args.spec_throughput_file, args.step)
    result = _build_result(df_agg, stp_field)

    label = f"tab:throughput-{parts['subset']}-{parts['gpu']}-{parts['mode']}-{parts['model']}"
    print(_render_latex(result, label))


if __name__ == "__main__":
    main()
