"""Human evaluation latex generation for trivia-qa."""
import abc
import dataclasses
import re
from typing import Optional, List, Sequence, Tuple

import numpy as np
from transformers import PreTrainedTokenizer

from npeff_torch.examination.top_examples import top_examples_common
from npeff_torch.examination.top_examples.human_evals import humev_top_examples_same_theme_latex
from npeff_torch.examination.top_examples.human_evals import humev_top_examples_theme_latex
from npeff_torch.examination.top_examples import top_examples_latex
from npeff_torch.util import latex_utils

###############################################################################
_DEFAULT_INTRO = R"""
This document contains groupings of examples from TriviaQA. TriviaQA is a task where the
goal is to answer trivia-style questions. In the examples below, only the question is provided.

For each group of examples, please determine if there is some common theme among the examples
in the group. In the second column of the CSV, please write \texttt{yes}, \texttt{maybe}, or \texttt{no}
(and only those three options) depending whether you detected the presence of a theme. In you put
\texttt{yes} or \texttt{maybe}, please put a brief description of the theme in the third column of
the CSV.

\section{Sample Annotated Groups}


\subsection{Sample Group 1}
\begin{footnotesize}
\noindent\texttt{Which sign of the zodiac comes between Scorpio and Capricorn?\vspace{2mm} \\
}
\noindent\texttt{Which letter of the Greek alphabet comes between Tau and Phi?\vspace{2mm} \\
}
\noindent\texttt{Which planet lies between Jupiter and Uranus?\vspace{2mm} \\
}
\noindent\texttt{Which sign of the zodiac comes between Leo and Libra?\vspace{2mm} \\
}
\noindent\texttt{Which letter of the Greek alphabet comes between Tau and Phi?\vspace{2mm} \\
}
\end{footnotesize}

\paragraph{Annotation} \texttt{yes} -- Each question asks which something lies between two other things.

\subsection{Sample Group 2}
\begin{footnotesize}
\noindent\texttt{In food, E330 is better known by what name?\vspace{2mm} \\
}
\noindent\texttt{Who directed the 1963 film The Birds?\vspace{2mm} \\
}
\noindent\texttt{"Who released the album ""Tissues and Issues"" in 2005?"\vspace{2mm} \\
}
\noindent\texttt{Which US actress won the Oscar for best Actress for her screen debut in a musical in 1968?\vspace{2mm} \\
}
\noindent\texttt{In the UK, General Elections are usually held on what day of the week?\vspace{2mm} \\
}
\end{footnotesize}
\paragraph{Annotation} \texttt{no}

"""
###############################################################################
_DEFAULT_SAME_THEME_LATEX_INTRO = R"""
This document contains groupings of examples from TriviaQA. TriviaQA is a task where the
goal is to answer trivia-style questions. In the examples below, only the question is provided.

This document contains pairs of groups of examples. For each pairing, please determine whether each group
individually contains a common theme among its examples. If both groups do contain a theme, then determine
whether the themes of the two groups are very similar. In the second column of the CSV, please write
\texttt{yes}, \texttt{maybe}, or \texttt{no} (and only those three options) depending on whether both groups
contain very similar themes. To be clear, write \texttt{yes} only if both groups contain a theme that is very
similar; write \texttt{no} if both groups contain different themes or if both groups do not contain a detectable
theme. If put \texttt{yes} or \texttt{maybe}, please put a brief description of the theme in the third column of
the CSV.

\section{Sample Annotated Pairs}

\subsection{Sample Pair 1}

\paragraph{Group A}

\begin{footnotesize}
\noindent\texttt{Torquay United and which other team were promoted from the Conference to the Football League Division Two at the end of the 2008/9 season?\vspace{2mm} \\
}
\noindent\texttt{Mexico and which country are separated by the Yucatan Channel?\vspace{2mm} \\
}
\noindent\texttt{President Anwar Sadat of Egypt and which prime minister were jointly awarded the Nobel Peace Prize in 1978?\vspace{2mm} \\
}
\noindent\texttt{Zen, Slave and Orac, are the 3 computers used by the protagonists in which TV series of the 1970's and 80's?\vspace{2mm} \\
}
\noindent\texttt{Venus and which other planet in our solar system has no moon?\vspace{2mm} \\
}
\end{footnotesize}

\paragraph{Group B}

\begin{footnotesize}
\noindent\texttt{Which football league club play home games at the Crown Ground?\vspace{2mm} \\
}
\noindent\texttt{Which English football league club play their home games at Boundary Park?\vspace{2mm} \\
}
\noindent\texttt{Which English football club play their home games at Ewood park?\vspace{2mm} \\
}
\noindent\texttt{Which English football club play their home games at the Reebok Stadium?\vspace{2mm} \\
}
\noindent\texttt{Which English football club play their home games at Proact Stadium?\vspace{2mm} \\
}
\end{footnotesize}

\paragraph{Annotation} \texttt{no}

\subsection{Sample Pair 2}

\paragraph{Group A}

\begin{footnotesize}
\noindent\texttt{At which event, in 2010, was Francesca Schiavone the first Italian woman to win a tennis Grand Slam event in singles?\vspace{2mm} \\
}
\noindent\texttt{At which event has Steve Backley won Olympic Bronze and Silver medals?\vspace{2mm} \\
}
\noindent\texttt{In which event did Amy Williams win a gold medal for Britain at the 2010 Winter Olympics?\vspace{2mm} \\
}
\noindent\texttt{In which event did Nero participate in the ancient Olympics, circa AD 60?\vspace{2mm} \\
}
\noindent\texttt{For which event did Greg Rutherford win gold for GB in 2012?\vspace{2mm} \\
}
\end{footnotesize}

\paragraph{Group B}

\begin{footnotesize}
\noindent\texttt{In which cycling event did Rebecca Romero win the Gold medal at the 2008 Olympics?\vspace{2mm} \\
}
\noindent\texttt{In which event did Chris Hoy win a Gold Medal at the recent World Track Cycling Championships?\vspace{2mm} \\
}
\noindent\texttt{In which event did Amy Williams win a gold medal for Britain at the 2010 Winter Olympics?\vspace{2mm} \\
}
\noindent\texttt{At which stroke did David Wilkie, Duncan Goodhew and Adrian Moorhouse win Olympic Gold medals?\vspace{2mm} \\
}
\noindent\texttt{Emil Zatopek won the Olympic gold medal in the marathon in 1952. In which event at the same games did his wife Dana also win gold?\vspace{2mm} \\
}
\end{footnotesize}

\paragraph{Annotation} \texttt{yes} -- Each question asks about events in the Olympics.


"""
###############################################################################


class _HumevThemeMixin:

    def _parse_sentence(self, example_info: 'top_examples_common.TopExampleInfo') -> str:
        input_ids = example_info.example['input_ids']
        attention_mask = example_info.example['attention_mask']

        context = self.tokenizer.decode(input_ids[attention_mask != 0])

        match = re.search(
            r'^Question: (.+)\nAnswer:$',
            context)

        if match:
            sentence = match.group(1)
            sentence = latex_utils.escape(sentence)
        else:
            sentence = 'ERROR'

        return sentence

    #######################################################

    def make_example_latex_string(self, example_info: 'top_examples_common.TopExampleInfo') -> str:
        s = self._parse_sentence(example_info)
        s = R'\noindent\texttt{' + s + R'\vspace{2mm} \\' + '\n}'
        return s


###############################################################################


@dataclasses.dataclass
class TriviaQaHumevTopExamplesThemeLatexGeneratorForLm(_HumevThemeMixin, humev_top_examples_theme_latex.HumevTopExamplesThemeLatexGeneratorAbc):
    tokenizer: PreTrainedTokenizer
    
    components_fontsize: Optional[str] = 'footnotesize'

    #######################################################

    def make_latex_intro(self) -> str:
        # Should contain information to help reviewers about the task.
        return _DEFAULT_INTRO


@dataclasses.dataclass
class TriviaQaHumevTopExamplesSameThemeLatexGeneratorForLm(_HumevThemeMixin, humev_top_examples_same_theme_latex.HumevTopExamplesSameThemeLatexGeneratorAbc):
    tokenizer: PreTrainedTokenizer
    
    components_fontsize: Optional[str] = 'footnotesize'

    #######################################################

    def make_latex_intro(self) -> str:
        # Should contain information to help reviewers about the task.
        return _DEFAULT_SAME_THEME_LATEX_INTRO
