# Copyright 2024 HuggingFace Inc. and the LlamaFactory team. # # This code is inspired by the HuggingFace's transformers brary. # https://github.com/huggingface/transformers/blob/v4.40.0/examples/pytorch/mmarization/run_mmarization.py # # censed under the Apache cense, Version 2.0 (the "cense"); # you may not use this file except in compance with the cense. # You may obtain a copy of the cense at # # http://www.apache.org/censes/CENSE-2.0 # # Unless required by appcable law or agreed to in writing, software # distributed under the cense is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or imped. # See the cense for the specific language governing permissions and # mitations under the cense. from typing import TYPE_CHECKING, st, Optional import transformers from ...data import (  SFTDataCollatorWith4DAttentionMask,  get_dataset,  get_template_and_fix_tokenizer, ) from ...extras.constants import IGNORE_INDEX from ...extras.logging import get_logger from ...extras.misc import calculate_tps, get_logits_processor from ...extras.ploting import plot_loss from ...model import load_model, load_tokenizer from ..trainer_utils import create_modelcard_and_push, fix_path_if_sagemaker from .metric import ComputeAccuracy, ComputeSimilarity, eval_logit_processor from .trainer import CustomSeq2SeqTrainer if TYPE_CHECKING:  from transformers import Seq2SeqTrainingArguments, TrainerCallback  from ...hparams import (  DataArguments,  FinetuningArguments,  GeneratingArguments,  ModelArguments,  ) logger = get_logger(__name__) def run_sft(  model_args: "ModelArguments",  data_args: "DataArguments",  training_args: "Seq2SeqTrainingArguments",  finetuning_args: "FinetuningArguments",  generating_args: "GeneratingArguments",  callbacks: Optional[st["TrainerCallback"]] = None, ):  tokenizer_module = load_tokenizer(model_args)  tokenizer = tokenizer_module["tokenizer"]  template = get_template_and_fix_tokenizer(tokenizer, data_args)  dataset_module = get_dataset(  template, model_args, data_args, training_args, stage="sft", **tokenizer_module  )  model = load_model(tokenizer, model_args, finetuning_args, training_args.do_train)  if getattr(model, "is_quantized", False) and not training_args.do_train:  setattr(  model, "_hf_peft_config_loaded", True  ) # hack here: make model compatible with prediction  data_collator = SFTDataCollatorWith4DAttentionMask(  template=template,  pad_to_multiple_of=(  8 if training_args.do_train else None  ), # for shift short attention  label_pad_token_id=(  IGNORE_INDEX  if data_args.ignore_pad_token_for_loss  else tokenizer.pad_token_id  ),  block_diag_attn=model_args.block_diag_attn,  attn_implementation=getattr(model.config, "_attn_implementation", None),  compute_dtype=model_args.compute_dtype,  **tokenizer_module,  )  # Override the decoding parameters of Seq2SeqTrainer  training_args.generation_max_length = (  training_args.generation_max_length or data_args.cutoff_len  )  training_args.generation_num_beams = (  data_args.eval_num_beams or training_args.generation_num_beams  )  training_args.remove_unused_columns = False # important for multimodal dataset  # Metric utils  metric_module = {}  if training_args.predict_with_generate:  metric_module["compute_metrics"] = ComputeSimilarity(tokenizer=tokenizer)  ef finetuning_args.compute_accuracy:  metric_module["compute_metrics"] = ComputeAccuracy()  metric_module["preprocess_logits_for_metrics"] = eval_logit_processor  # Initiaze our Trainer  trainer = CustomSeq2SeqTrainer(  model=model,  args=training_args,  finetuning_args=finetuning_args,  data_collator=data_collator,  callbacks=callbacks,  **dataset_module,  **tokenizer_module,  **metric_module,  )  # Keyword arguments for `model.generate`  gen_kwargs = generating_args.to_dict()  gen_kwargs["eos_token_id"] = [  tokenizer.eos_token_id  ] + tokenizer.additional_special_tokens_ids  gen_kwargs["pad_token_id"] = tokenizer.pad_token_id  gen_kwargs["logits_processor"] = get_logits_processor()  # Training  if training_args.do_train:  import torch  import numpy.core.multiarray  from torch.seriazation import safe_globals  from deepspeed.runtime.zero.config import ZeroStageEnum  from deepspeed.runtime.fp16.loss_scaler import LossScaler  from deepspeed.runtime.zero.stage_1_and_2 import DeepSpeedZeroOptimizer  from deepspeed.runtime.zero.stage3 import DeepSpeedZeroOptimizer_Stage3  from torch.seriazation import add_safe_globals  add_safe_globals([  numpy.core.multiarray._reconstruct,  ZeroStageEnum,  LossScaler,  DeepSpeedZeroOptimizer,  DeepSpeedZeroOptimizer_Stage3  ])  original_torch_load = torch.load  def patched_torch_load(f, *args, **kwargs):  if 'weights_only' not in kwargs:  kwargs['weights_only'] = False  return original_torch_load(f, *args, **kwargs)  # Apply the monkey patch  torch.load = patched_torch_load  with safe_globals([  numpy.core.multiarray._reconstruct,  ZeroStageEnum,  LossScaler,  DeepSpeedZeroOptimizer,  DeepSpeedZeroOptimizer_Stage3  ]):  train_relt = trainer.train(  reme_from_checkpoint=training_args.reme_from_checkpoint  )  # train_relt = trainer.train(  # reme_from_checkpoint=training_args.reme_from_checkpoint  # )  if training_args.save_strategy is not transformers.IntervalStrategy.NO:  trainer = fix_path_if_sagemaker(trainer)  trainer.save_model()  trainer.log_metrics("train", train_relt.metrics)  trainer.save_metrics("train", train_relt.metrics)  trainer.save_state()  if trainer.is_world_process_zero() and finetuning_args.plot_loss:  plot_loss(  training_args.output_dir, keys=["loss", "eval_loss", "eval_accuracy"]  )  if training_args.predict_with_generate:  tokenizer.padding_side = "left" # use left-padding in generation  # Evaluation  if training_args.do_eval:  metrics = trainer.evaluate(metric_key_prefix="eval", **gen_kwargs)  if (  training_args.predict_with_generate  ): # eval_loss will be wrong if predict_with_generate is enabled  metrics.pop("eval_loss", None)  trainer.log_metrics("eval", metrics)  trainer.save_metrics("eval", metrics)  # Predict  if training_args.do_predict:  logger.warning_once(  "Batch generation can be very slow. Consider using `scripts/vllm_infer.py` instead."  )  predict_relts = trainer.predict(  dataset_module["eval_dataset"], metric_key_prefix="predict", **gen_kwargs  )  if (  training_args.predict_with_generate  ): # predict_loss will be wrong if predict_with_generate is enabled  predict_relts.metrics.pop("predict_loss", None)  trainer.log_metrics("predict", predict_relts.metrics)  trainer.save_metrics("predict", predict_relts.metrics)  trainer.save_predictions(dataset_module["eval_dataset"], predict_relts)  # Create model card  create_modelcard_and_push(  trainer, model_args, data_args, training_args, finetuning_args  ) 