"""Human evaluation latex generation for YAT."""
import abc
import dataclasses
import re
from typing import Optional, List, Sequence, Tuple

import numpy as np
from transformers import PreTrainedTokenizer

from npeff_torch.examination.top_examples import top_examples_common
from npeff_torch.examination.top_examples.human_evals import humev_top_examples_same_theme_latex
from npeff_torch.examination.top_examples.human_evals import humev_top_examples_theme_latex
from npeff_torch.examination.top_examples import top_examples_latex
from npeff_torch.util import latex_utils

###############################################################################
_DEFAULT_INTRO = R"""
This document contains groupings of examples from Yahoo Answers Topics (YAT). YAT is a
topic identification task where the goal is to assign a question from Yahoo answers to
one of 10 topics. These topics are Society \& Culture, Science \& Mathematics, Health, Education
\& Reference, Computers \& Internet, Sports, Business \& Finance, Entertainment \&
Music, Family \& Relationships, and Politics \& Government

For each group of examples, please determine if there is some common theme among the examples
in the group. In the second column of the CSV, please write \texttt{yes}, \texttt{maybe}, or \texttt{no}
(and only those three options) depending whether you detected the presence of a theme. In you put
\texttt{yes} or \texttt{maybe}, please put a brief description of the theme in the third column of
the CSV.

\section{Sample Annotated Groups}

\subsection{Sample Group 1}
\begin{footnotesize}
\noindent\texttt{Where can I find coca-cola car seat covers?\vspace{2mm} \\
}
\noindent\texttt{Where do I buy the best plane tickets online?\vspace{2mm} \\
}
\noindent\texttt{Where do I buy the best football tickets online?\vspace{2mm} \\
}
\noindent\texttt{Where can I get a free or cheap fixed-gear bicycle?\vspace{2mm} \\
}
\noindent\texttt{Where to get free crochet patterns for tops and sweaters online?\vspace{2mm} \\
}
\end{footnotesize}

\paragraph{Annotation} \texttt{yes} -- Looking to buy or get things.

\subsection{Sample Group 2}
\begin{footnotesize}
\noindent\texttt{Kindly provide me the full operational details of JVC Vidoecamera model GR-AX 11E.?\vspace{2mm} \\
}
\noindent\texttt{What is the differnce between a project and product?\vspace{2mm} \\
}
\noindent\texttt{The inner and outer cores are probley composed mostly of...what?\vspace{2mm} \\
}
\noindent\texttt{what was the weather on may 24, 1951 in chicago?\vspace{2mm} \\
}
\noindent\texttt{Describe the fossil record of humans?\vspace{2mm} \\
}
\end{footnotesize}
\paragraph{Annotation} \texttt{no}
"""
###############################################################################




@dataclasses.dataclass
class YatHumevTopExamplesThemeLatexGeneratorForLm(humev_top_examples_theme_latex.HumevTopExamplesThemeLatexGeneratorAbc):
    tokenizer: PreTrainedTokenizer
    
    components_fontsize: Optional[str] = 'footnotesize'

    #######################################################

    def _parse_sentence(self, example_info: 'top_examples_common.TopExampleInfo') -> str:
        input_ids = example_info.example['input_ids']
        attention_mask = example_info.example['attention_mask']

        context = self.tokenizer.decode(input_ids[attention_mask != 0])

        match = re.search(
            r'^Question: (.+)\nWhat broad topic is this question about\? Choose from:\n',
            context)

        if match:
            sentence = match.group(1)
            sentence = latex_utils.escape(sentence)
        else:
            sentence = 'ERROR'

        return sentence

    #######################################################

    def make_example_latex_string(self, example_info: 'top_examples_common.TopExampleInfo') -> str:
        s = self._parse_sentence(example_info)
        s = R'\noindent\texttt{' + s + R'\vspace{2mm} \\' + '\n}'
        return s

    def make_latex_intro(self) -> str:
        # Should contain information to help reviewers about the task.
        return _DEFAULT_INTRO

