import abc
import dataclasses
from typing import Any


@dataclasses.dataclass
class ProbResult:
    metric: float
    sample_detail: dict[str, Any]


class Task(abc.ABC):
    @abc.abstractmethod
    def evaluate(self, sample_id: int, answer: str) -> ProbResult:
        raise NotImplementedError()

    @abc.abstractmethod
    def parse_answer(self, sample_id: int, lm_response: str) -> str:
        raise NotImplementedError()

    @abc.abstractmethod
    def submit(self, sample_id: int, answer: str) -> ProbResult:
        raise NotImplementedError()
