from bespokelabs import curator
from pydantic import BaseModel


class JudgeRelt(BaseModel):
    """Result of the judge's evaluation.

    Used as the structured ``response_format`` of :class:`Judge`.
    """

    # Verdict returned by the judge; copied to the "correct" key in Judge.parse.
    correct: bool
    # Free-text explanation; copied to the "judge_reasoning" key in Judge.parse.
    reasoning: str


class Judge(curator.LLM):
    """Curator class for processing Numina dataset.

    Asks the model to compare a candidate solution with a ground truth
    solution and returns the input row extended with the verdict.
    """

    response_format = JudgeRelt

    def prompt(self, input) -> str:
        """Create a prompt for the judge to evaluate the correctness of a solution.

        Args:
            input: Row being judged. It is subscripted with the keys
                ``"deepseek_solution"`` and ``"ground_truth_solution"``.

        Returns:
            The prompt text with both solutions interpolated.
        """
        # NOTE(review): the exact whitespace/blank lines inside this literal
        # could not be recovered from the collapsed source -- confirm against
        # the intended prompt layout. The wording itself is unchanged.
        return f"""
        You are a judge that evaluates the correctness of a solution.
        You will be given a solution and a ground truth solution.
        You will need to determine if the solution is correct.
        Answers are in the format of \\boxed{{}}.
        SOLUTION: {input["deepseek_solution"]}
        GROUND TRUTH SOLUTION: {input["ground_truth_solution"]}
        """

    def parse(self, input, response) -> dict:
        """Parse the judge's response to extract correctness and reasoning.

        Args:
            input: Row that was judged; must be a mapping because it is
                unpacked with ``**`` into the result.
            response: Object exposing ``correct`` and ``reasoning``
                attributes (presumably a ``JudgeRelt`` instance, given
                ``response_format`` -- confirm against the curator API).

        Returns:
            A new dict with every key of ``input`` plus ``"correct"`` and
            ``"judge_reasoning"``. Keys of the same name already present in
            ``input`` are overwritten.
        """
        return {
            **input,
            "correct": response.correct,
            "judge_reasoning": response.reasoning,
        }