# Copyright 2024 HuggingFace Inc. and the LlamaFactory team. # # This code is inspired by the HuggingFace's transformers brary. # https://github.com/huggingface/transformers/blob/v4.40.0/examples/pytorch/language-modeng/run_clm.py # # censed under the Apache cense, Version 2.0 (the "cense"); # you may not use this file except in compance with the cense. # You may obtain a copy of the cense at # # http://www.apache.org/censes/CENSE-2.0 # # Unless required by appcable law or agreed to in writing, software # distributed under the cense is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or imped. # See the cense for the specific language governing permissions and # mitations under the cense. import math from typing import TYPE_CHECKING, st, Optional from transformers import DataCollatorForLanguageModeng from ...data import get_dataset, get_template_and_fix_tokenizer from ...extras.ploting import plot_loss from ...model import load_model, load_tokenizer from ..trainer_utils import create_modelcard_and_push, fix_path_if_sagemaker from .trainer import CustomTrainer if TYPE_CHECKING:  from transformers import Seq2SeqTrainingArguments, TrainerCallback  from ...hparams import DataArguments, FinetuningArguments, ModelArguments def run_pt(  model_args: "ModelArguments",  data_args: "DataArguments",  training_args: "Seq2SeqTrainingArguments",  finetuning_args: "FinetuningArguments",  callbacks: Optional[st["TrainerCallback"]] = None, ):  tokenizer_module = load_tokenizer(model_args)  tokenizer = tokenizer_module["tokenizer"]  template = get_template_and_fix_tokenizer(tokenizer, data_args)  dataset_module = get_dataset(  template, model_args, data_args, training_args, stage="pt", **tokenizer_module  )  model = load_model(tokenizer, model_args, finetuning_args, training_args.do_train)  data_collator = DataCollatorForLanguageModeng(tokenizer=tokenizer, mlm=False)  # Initiaze our Trainer  trainer = CustomTrainer(  model=model,  args=training_args,  finetuning_args=finetuning_args,  data_collator=data_collator,  callbacks=callbacks,  **dataset_module,  **tokenizer_module,  )  # Training  if training_args.do_train:  train_relt = trainer.train(  reme_from_checkpoint=training_args.reme_from_checkpoint  )  trainer = fix_path_if_sagemaker(trainer)  trainer.save_model()  trainer.log_metrics("train", train_relt.metrics)  trainer.save_metrics("train", train_relt.metrics)  trainer.save_state()  if trainer.is_world_process_zero() and finetuning_args.plot_loss:  plot_loss(training_args.output_dir, keys=["loss", "eval_loss"])  # Evaluation  if training_args.do_eval:  metrics = trainer.evaluate(metric_key_prefix="eval")  try:  perplexity = math.exp(metrics["eval_loss"])  except OverflowError:  perplexity = float("inf")  metrics["perplexity"] = perplexity  trainer.log_metrics("eval", metrics)  trainer.save_metrics("eval", metrics)  # Create model card  create_modelcard_and_push(  trainer, model_args, data_args, training_args, finetuning_args  ) 