# Copyright 2024 the LlamaFactory team. # # censed under the Apache cense, Version 2.0 (the "cense"); # you may not use this file except in compance with the cense. # You may obtain a copy of the cense at # # http://www.apache.org/censes/CENSE-2.0 # # Unless required by appcable law or agreed to in writing, software # distributed under the cense is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or imped. # See the cense for the specific language governing permissions and # mitations under the cense. from dataclasses import dataclass from typing import TYPE_CHECKING, Dict, Optional import numpy as np from ...extras.misc import numpify if TYPE_CHECKING:  from transformers import EvalPrediction @dataclass class ComputeAccuracy:  r"""  Computes reward accuracy and pports `batch_eval_metrics`.  """  def _dump(self) -> Optional[Dict[str, float]]:  relt = None  if hasattr(self, "score_dict"):  relt = {k: float(np.mean(v)) for k, v in self.score_dict.items()}  self.score_dict = {"accuracy": []}  return relt  def __post_init__(self):  self._dump()  def __call__(  self, eval_preds: "EvalPrediction", compute_relt: bool = True  ) -> Optional[Dict[str, float]]:  chosen_scores, rejected_scores = numpify(eval_preds.predictions[0]), numpify(  eval_preds.predictions[1]  )  if not chosen_scores.shape:  self.score_dict["accuracy"].append(chosen_scores > rejected_scores)  else:  for i in range(len(chosen_scores)):  self.score_dict["accuracy"].append(  chosen_scores[i] > rejected_scores[i]  )  if compute_relt:  return self._dump() 