"""
Contains utilities for extracting token representations and indices
from string templates. Used in computing the left and right vectors for ROME.
"""

import logging
from copy import deepcopy
from typing import List

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

from src import models
from src.functional import find_token_range
from src.models import ModelandTokenizer
from src.rome_utils import nethook

logger = logging.getLogger(__name__)


def get_reprs_at_word_tokens(
    mt: ModelandTokenizer,
    context_templates: List[str],
    words: List[str],
    layer: int,
    module_template: str,
    subtoken: str,
    track: str = "in",
) -> torch.Tensor:
    """
    Retrieves the last token representation of `word` in `context_template`
    when `word` is substituted into `context_template`. See `get_last_word_idx_in_template`
    for more details.
    """
    idxs = get_words_idxs_in_templates(mt.tokenizer, context_templates, words, subtoken)
    return get_reprs_at_idxs(
        mt,
        [context_templates[i].format(words[i]) for i in range(len(words))],
        idxs,
        layer,
        module_template,
        track,
    )


def get_words_idxs_in_templates(
    tok: AutoTokenizer, context_templates: str, words: str, subtoken: str
):
    """
    Given list of template strings, each with *one* format specifier
    (e.g. "{} plays basketball"), and words to be substituted into the
    template, computes the post-tokenization index of their last tokens.
    """

    assert all(
        tmp.count("{}") == 1 for tmp in context_templates
    ), "We currently do not support multiple fill-ins for context"

    if "llama" in type(tok).__name__.lower() or "mistral" in type(tok).__name__.lower():
        idxs = []
        tokenized_contexts = tok(
            [context_templates[i].format(words[i]) for i in range(len(words))],
            padding=True,
            return_tensors="pt",
            return_offsets_mapping=True,
        )
        offset_mappings = tokenized_contexts.pop("offset_mapping")
        for template, subject, offset_maps in zip(
            context_templates, words, offset_mappings
        ):
            subject_start, subject_end = find_token_range(
                string=template.format(subject),
                substring=subject,
                tokenizer=tok,
                offset_mapping=offset_maps,
            )
            idxs.append([subject_end - 1])

        print(
            f"{[(idx, tok.decode(tokenized[idx])) for idx, tokenized in zip(idxs, tokenized_contexts['input_ids'])]}"
        )
        return idxs

    # Compute prefixes and suffixes of the tokenized context
    fill_idxs = [tmp.index("{}") for tmp in context_templates]
    prefixes, suffixes = [
        tmp[: fill_idxs[i]] for i, tmp in enumerate(context_templates)
    ], [tmp[fill_idxs[i] + 2 :] for i, tmp in enumerate(context_templates)]
    words = deepcopy(words)

    # Pre-process tokens
    for i, prefix in enumerate(prefixes):
        if len(prefix) > 0:
            assert prefix[-1] == " "
            prefix = prefix[:-1]

            prefixes[i] = prefix
            words[i] = f" {words[i].strip()}"

    # Tokenize to determine lengths
    assert len(prefixes) == len(words) == len(suffixes)
    n = len(prefixes)
    batch_tok = tok([*prefixes, *words, *suffixes])
    prefixes_tok, words_tok, suffixes_tok = [
        batch_tok[i : i + n] for i in range(0, n * 3, n)
    ]
    prefixes_len, words_len, suffixes_len = [
        [len(el) for el in tok_list]
        for tok_list in [prefixes_tok, words_tok, suffixes_tok]
    ]

    # Compute indices of last tokens
    if subtoken == "last" or subtoken == "first_after_last":
        return [
            [
                prefixes_len[i]
                + words_len[i]
                - (1 if subtoken == "last" or suffixes_len[i] == 0 else 0)
            ]
            # If suffix is empty, there is no "first token after the last".
            # So, just return the last token of the word.
            for i in range(n)
        ]
    elif subtoken == "first":
        return [[prefixes_len[i]] for i in range(n)]
    else:
        raise ValueError(f"Unknown subtoken type: {subtoken}")


def get_reprs_at_idxs(
    mt: ModelandTokenizer,
    contexts: List[str],
    idxs: List[List[int]],
    layer: int,
    module_template: str,
    track: str = "in",
) -> torch.Tensor:
    """
    Runs input through model and returns averaged representations of the tokens
    at each index in `idxs`.
    """

    def _batch(n):
        for i in range(0, len(contexts), n):
            yield contexts[i : i + n], idxs[i : i + n]

    assert track in {"in", "out", "both"}
    both = track == "both"
    tin, tout = (
        (track == "in" or both),
        (track == "out" or both),
    )
    module_name = module_template.format(layer)
    to_return = {"in": [], "out": []}

    def _process(cur_repr, batch_idxs, key):
        nonlocal to_return
        cur_repr = cur_repr[0] if type(cur_repr) is tuple else cur_repr
        for i, idx_list in enumerate(batch_idxs):
            to_return[key].append(cur_repr[i][idx_list].mean(0))

    for batch_contexts, batch_idxs in _batch(n=128):
        contexts_tok = mt.tokenizer(
            batch_contexts, padding=True, return_tensors="pt"
        ).to(models.determine_device(mt.model))
        # print(f"{contexts_tok=}")
        # print(f"{batch_idxs=}")
        logger.debug(
            f"==> {[(idx, mt.tokenizer.decode(tokenized[idx[0]])) for idx, tokenized in zip(batch_idxs, contexts_tok['input_ids'])]}"
        )

        with torch.no_grad():
            with nethook.Trace(
                module=mt.model,
                layer=module_name,
                retain_input=tin,
                retain_output=tout,
            ) as tr:
                mt(**contexts_tok)

        if tin:
            # print("calling from input", module_name, tin, tout)
            # print("input_kw:", tr.input_kw)
            # print("input:", tr.input)
            if "gpt-j" in mt.name:
                inp = (
                    tr.input_kw["hidden_states"]
                    if ".mlp.fc_out" not in module_name
                    else tr.input
                )
            else:
                inp = tr.input
            _process(inp, batch_idxs, "in")
        if tout:
            _process(tr.output, batch_idxs, "out")

    to_return = {k: torch.stack(v, 0) for k, v in to_return.items() if len(v) > 0}

    if len(to_return) == 1:
        return to_return["in"] if tin else to_return["out"]
    else:
        return to_return["in"], to_return["out"]
