"""Generation of top examples for components."""
import abc
import dataclasses
from typing import Optional, Sequence, Union

from transformers import PreTrainedTokenizer

from npeff_torch.examination.top_examples import component_filtering
from npeff_torch.examination.top_examples import top_examples_common


###############################################################################

_DEFAULT_LATEX_FILE_HEADER = R"""% Please use XeLaTex to handle unicode properly.
\documentclass[11pt]{article}

\usepackage[margin=1in]{geometry} 
\usepackage[dvipsnames]{xcolor}
\usepackage{bold-extra}

"""

_DEFAULT_LATEX_INTRO = R"""

\section{Component Top Examples}
\textit{All indices used here are 0-based unless stated otherwise.}

"""

###############################################################################


@dataclasses.dataclass
class ComponentInfo:
    component_index: int

    header_suffix: Optional[str] = None


###############################################################################


class LatexGeneratorAbc(abc.ABC):
    """Should be subclassed to generate latex for particular cases.
    
    Contains some methods with defaults that can be overriden in subclasses.
    """
    
    #######################################################
    # Equivalent of "protected" methods.

    def make_latex_file_header(self) -> str:
        return _DEFAULT_LATEX_FILE_HEADER

    def make_latex_intro(self) -> str:
        return _DEFAULT_LATEX_INTRO

    def make_header_for_component(self, component_info: ComponentInfo) -> str:
        component_index = component_info.component_index
        if component_info.header_suffix is None:
            return R'\subsection{Component ' + str(component_index) + R'}'
        else:
            return R'\subsection{Component ' + str(component_index) + R' ' + str(component_info.header_suffix) + R'}'

    #######################################################

    @abc.abstractmethod
    def make_example_for_component_latex_string(self, component_index: int, example_info: 'top_examples_common.TopExampleInfo') -> str:
        raise NotImplementedError

    #######################################################

    def generate_components_latex(self, component_infos: Sequence[Union[int, ComponentInfo]]) -> str:
        ret = [
            self.make_latex_file_header(),
            '',
            R"\begin{document}",
            '',
            self.make_latex_intro(),
            '',
        ]

        for component_info in component_infos:
            if not isinstance(component_info, ComponentInfo):
                # Assume that component_info was the component index.
                component_info = ComponentInfo(component_index=component_info)

            component_index = component_info.component_index
            top_examples = self.top_examples_reader.get_top_examples_for_component(component_index, self.n_top_examples)

            # Skip components with no examples.
            if len(top_examples) == 0:
                continue

            # Skip components that get filtered out.
            if (
                self.component_filter is not None
                and not self.component_filter.does_component_pass(self.tokenizer, component_index, top_examples)
            ):
                continue

            ret.append(self.make_header_for_component(component_info))

            if self.components_fontsize is not None:
                ret.append(R'\begin{' + self.components_fontsize + R'}')

            for example_info in top_examples:
                ret.append(self.make_example_for_component_latex_string(component_index, example_info))

            if self.components_fontsize is not None:
                ret.append(R'\end{' + self.components_fontsize + R'}')

            ret.append('')

        ret.append(R"\end{document}")

        return "\n".join(ret)

    #######################################################

    @classmethod
    def create(
        cls,
        top_examples_reader: 'top_examples_common.TopExamplesReaderAbc',
        tokenizer: PreTrainedTokenizer,
        n_top_examples: int,
        components_fontsize: Optional[str] = 'footnotesize',
        component_filter: Optional['component_filtering.ComponentFilterAbc'] = None,
        **kwargs,
    ):
        return cls(
            top_examples_reader=top_examples_reader,
            tokenizer=tokenizer,
            n_top_examples=n_top_examples,
            components_fontsize=components_fontsize,
            component_filter=component_filter,
            **kwargs,
        )
