from abc import ABC, abstractmethod

from rewards import DockerTestReward


class CompletionProcessingBase(ABC):
    def __init__(self, **kwargs):
        self.kwargs = kwargs

    @abstractmethod
    def __call__(self, completions_text: list[str], inputs: list[dict]) -> list[str]:
        pass


def get_completion_processing_function(name: str | None = None,
                                       kwargs: dict[str, float] = None) -> CompletionProcessingBase:
    if kwargs is None:
        kwargs = {}
    if name is None or name == 'default':
        return DefaultCompletionProcessing(**kwargs)
    else:
        raise ValueError(f"Completion processing function {name} not found")


class DefaultCompletionProcessing(CompletionProcessingBase):
    def __call__(self, completions_text: list[str], inputs: list[dict]) -> list[str]:
        """
            Does nothing. This results in normal GRPO training.
        """
        return {'completions_text': completions_text}