import dataclasses
from dataclasses import dataclass, field
from typing import Optional, Literal, List, Dict, Any

from roll.pipeline.rlvr.rlvr_config import RLVRConfig, WorkerConfig, RewardConfig

@dataclass
class ValConfig(WorkerConfig):
    output_dir: str = field(
        default_factory=str,
        metadata={"help": "Save dir for val files."}
    )
    save_columns: List[str] = field(
        default_factory=list,
        metadata={"help": "Save columns for val files."}
    )
    save_input_seq: bool = field(
        default=False,
        metadata={"help": "Save input_seq for val files."}
    )


@dataclass
class BargainRewardConfig(RewardConfig):
    judge_bot_id: str = field(
        default=None,
        metadata={"help": "judge_bot_id."}
    )

@dataclass
class LHRLConfig(RLVRConfig):
    validation: ValConfig = field(
        default_factory=ValConfig,
        metadata={"help": "Configuration for the validation."}
    )
    rewards: Optional[Dict[str, BargainRewardConfig]] = field(
        default_factory=dict,
        metadata={"help": "Configuration for the multi domain rewards."}
    )
    def __post_init__(self):
        super().__post_init__()
