"""Evaluation of whether two groups of examples have the same/similar theme."""
import abc
from typing import List, Optional, Tuple

from transformers import PreTrainedTokenizer

from npeff_torch.examination.top_examples import top_examples_common
from npeff_torch.examination.top_examples import top_examples_latex


###############################################################################

_DEFAULT_LATEX_FILE_HEADER = R"""% Please use XeLaTex to handle unicode properly.
\documentclass[11pt]{article}

\usepackage[margin=1in]{geometry} 
\usepackage[dvipsnames]{xcolor}
\usepackage{bold-extra}

"""

###############################################################################


class HumevTopExamplesSameThemeLatexGeneratorAbc(abc.ABC):

    #######################################################
    # Equivalent of "protected" methods.

    def make_latex_file_header(self) -> str:
        return _DEFAULT_LATEX_FILE_HEADER

    #######################################################

    @abc.abstractmethod
    def make_latex_intro(self) -> str:
        # Should contain information to help reviewers about the task.
        raise NotImplementedError

    @abc.abstractmethod
    def make_example_latex_string(self, example_info: 'top_examples_common.TopExampleInfo') -> str:
        # Typically should just be the example text.
        # NOTE: Not all of the information will be present in the example_info.
        raise NotImplementedError

    #######################################################

    def generate_latex(
        self,
        example_group_pairs: List[Tuple[List['top_examples_common.TopExampleInfo'], List['top_examples_common.TopExampleInfo']]],
    ) -> str:
        ret = [
            self.make_latex_file_header(),
            '',
            R"\begin{document}",
            '',
            self.make_latex_intro(),
            '',
            R'\section{Groups}',
            '',
        ]

        for i, (group_a, group_b) in enumerate(example_group_pairs):
            # To match the latex section headers, we use a 1-based index here.
            ret.append(R'\subsection{Pair ' + str(i + 1) + R'}')
            
            for label, example_group in (('A', group_a), ('B', group_b)):
                ret.append(R'\paragraph{Group ' + label + R'}')
                ret.append('')

                if self.components_fontsize is not None:
                    ret.append(R'\begin{' + self.components_fontsize + R'}')

                for example_info in example_group:
                    ret.append(self.make_example_latex_string(example_info))

                if self.components_fontsize is not None:
                    ret.append(R'\end{' + self.components_fontsize + R'}')

                ret.append('')

        ret.append(R"\end{document}")

        return "\n".join(ret)

    #######################################################

    @classmethod
    def create(
        cls,
        tokenizer: PreTrainedTokenizer,
        components_fontsize: Optional[str] = 'footnotesize',
        **kwargs,
    ):
        return cls(
            tokenizer=tokenizer,
            components_fontsize=components_fontsize,
            **kwargs,
        )
