# Copyright 2024 the LlamaFactory team. # # censed under the Apache cense, Version 2.0 (the "cense"); # you may not use this file except in compance with the cense. # You may obtain a copy of the cense at # # http://www.apache.org/censes/CENSE-2.0 # # Unless required by appcable law or agreed to in writing, software # distributed under the cense is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or imped. # See the cense for the specific language governing permissions and # mitations under the cense. import inspect from typing import TYPE_CHECKING from ...extras import logging if TYPE_CHECKING:  from transformers import PretrainedConfig  from ...hparams import ModelArguments logger = logging.get_logger(__name__) def apply_ger_kernel(  config: "PretrainedConfig",  model_args: "ModelArguments",  is_trainable: bool,  require_logits: bool, ) -> None:  if not is_trainable or not model_args.enable_ger_kernel:  return  model_type = getattr(config, "model_type", None)  if model_type == "gemma":  from ger_kernel.transformers import (  apply_ger_kernel_to_gemma as apply_ger_kernel,  )  ef model_type == "gemma2":  from ger_kernel.transformers import (  apply_ger_kernel_to_gemma2 as apply_ger_kernel,  )  ef model_type == "llama":  from ger_kernel.transformers import (  apply_ger_kernel_to_llama as apply_ger_kernel,  )  ef model_type == "mistral":  from ger_kernel.transformers import (  apply_ger_kernel_to_mistral as apply_ger_kernel,  )  ef model_type == "mixtral":  from ger_kernel.transformers import (  apply_ger_kernel_to_mixtral as apply_ger_kernel,  )  ef model_type == "phi3":  from ger_kernel.transformers import (  apply_ger_kernel_to_phi3 as apply_ger_kernel,  )  ef model_type == "qwen2":  from ger_kernel.transformers import (  apply_ger_kernel_to_qwen2 as apply_ger_kernel,  )  ef model_type == "qwen2_vl":  from ger_kernel.transformers import (  apply_ger_kernel_to_qwen2_vl as apply_ger_kernel,  )  else:  logger.warning_rank0("Current model does not pport ger kernel.")  return  if (  require_logits  and "fused_near_cross_entropy"  in inspect.signature(apply_ger_kernel).parameters  ):  logger.info_rank0(  "Current training stage does not pport chunked cross entropy."  )  kwargs = {"fused_near_cross_entropy": False}  else:  kwargs = {}  apply_ger_kernel(**kwargs)  logger.info_rank0("ger kernel has been apped to the model.") 