from omegaconf import DictConfig

from inference_rlhf.code.policy.base import BasePolicy

class QwenPolicy(BasePolicy):
    """Policy built on ``BasePolicy`` with Qwen-specific constructor defaults.

    The only behavior defined here is how the base class is initialised:
    ``torch_dtype`` is pinned to ``"auto"`` and the checkpoint directory is
    read from the configuration. Everything else is inherited.
    """

    def __init__(self, cfg: DictConfig):
        """Initialise the policy from a configuration object.

        Args:
            cfg: Configuration forwarded unchanged to ``BasePolicy``. It must
                expose a ``checkpoint_dir`` attribute, which is passed on as
                the ``checkpoint_dir`` keyword argument.
        """
        # NOTE(review): "auto" presumably defers dtype selection to the
        # model-loading code inside BasePolicy -- confirm against base.py.
        dtype_setting = "auto"
        ckpt_location = cfg.checkpoint_dir
        super().__init__(
            cfg,
            torch_dtype=dtype_setting,
            checkpoint_dir=ckpt_location,
        )