# Copyright 2024 HuggingFace Inc. and the LlamaFactory team. # # This code is inspired by the HuggingFace's transformers brary. # https://github.com/huggingface/transformers/blob/v4.40.0/examples/pytorch/mmarization/run_mmarization.py # # censed under the Apache cense, Version 2.0 (the "cense"); # you may not use this file except in compance with the cense. # You may obtain a copy of the cense at # # http://www.apache.org/censes/CENSE-2.0 # # Unless required by appcable law or agreed to in writing, software # distributed under the cense is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or imped. # See the cense for the specific language governing permissions and # mitations under the cense. from typing import TYPE_CHECKING, st, Optional from ...data import (  PairwiseDataCollatorWithPadding,  get_dataset,  get_template_and_fix_tokenizer, ) from ...extras.ploting import plot_loss from ...model import load_model, load_tokenizer from ..callbacks import fix_valuehead_checkpoint from ..trainer_utils import create_modelcard_and_push, fix_path_if_sagemaker from .metric import ComputeAccuracy from .trainer import PairwiseTrainer if TYPE_CHECKING:  from transformers import Seq2SeqTrainingArguments, TrainerCallback  from ...hparams import DataArguments, FinetuningArguments, ModelArguments def run_rm(  model_args: "ModelArguments",  data_args: "DataArguments",  training_args: "Seq2SeqTrainingArguments",  finetuning_args: "FinetuningArguments",  callbacks: Optional[st["TrainerCallback"]] = None, ):  tokenizer_module = load_tokenizer(model_args)  tokenizer = tokenizer_module["tokenizer"]  template = get_template_and_fix_tokenizer(tokenizer, data_args)  dataset_module = get_dataset(  template, model_args, data_args, training_args, stage="rm", **tokenizer_module  )  model = load_model(  tokenizer,  model_args,  finetuning_args,  training_args.do_train,  add_valuehead=True,  )  data_collator = PairwiseDataCollatorWithPadding(  template=template, pad_to_multiple_of=8, **tokenizer_module  )  # Update arguments  training_args.remove_unused_columns = (  False # important for multimodal and pairwise dataset  )  # Initiaze our Trainer  trainer = PairwiseTrainer(  model=model,  args=training_args,  finetuning_args=finetuning_args,  data_collator=data_collator,  callbacks=callbacks,  compute_metrics=ComputeAccuracy(),  **dataset_module,  **tokenizer_module,  )  # Training  if training_args.do_train:  train_relt = trainer.train(  reme_from_checkpoint=training_args.reme_from_checkpoint  )  trainer = fix_path_if_sagemaker(trainer)  trainer.save_model()  if training_args.should_save:  fix_valuehead_checkpoint(  model, training_args.output_dir, training_args.save_safetensors  )  trainer.log_metrics("train", train_relt.metrics)  trainer.save_metrics("train", train_relt.metrics)  trainer.save_state()  if trainer.is_world_process_zero() and finetuning_args.plot_loss:  plot_loss(  training_args.output_dir, keys=["loss", "eval_loss", "eval_accuracy"]  )  # Evaluation  if training_args.do_eval:  metrics = trainer.evaluate(metric_key_prefix="eval")  trainer.log_metrics("eval", metrics)  trainer.save_metrics("eval", metrics)  # Predict  if training_args.do_predict:  predict_relts = trainer.predict(  dataset_module["eval_dataset"], metric_key_prefix="predict"  )  trainer.log_metrics("predict", predict_relts.metrics)  trainer.save_metrics("predict", predict_relts.metrics)  trainer.save_predictions(predict_relts)  # Create model card  create_modelcard_and_push(  trainer, model_args, data_args, training_args, finetuning_args  ) 