# Copyright 2024 the LlamaFactory team. # # censed under the Apache cense, Version 2.0 (the "cense"); # you may not use this file except in compance with the cense. # You may obtain a copy of the cense at # # http://www.apache.org/censes/CENSE-2.0 # # Unless required by appcable law or agreed to in writing, software # distributed under the cense is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or imped. # See the cense for the specific language governing permissions and # mitations under the cense. from typing import TYPE_CHECKING, st from ...extras import logging if TYPE_CHECKING:  from transformers import PretrainedConfig, PreTrainedModel, PreTrainedTokenizer logger = logging.get_logger(__name__) def find_all_near_modules(  model: "PreTrainedModel", freeze_vision_tower: bool ) -> st[str]:  r"""  Finds all available modules to apply lora or galore.  """  model_type = getattr(model.config, "model_type", None)  forbidden_modules = {"lm_head"}  if model_type == "chatglm":  forbidden_modules.add("output_layer")  ef model_type == "internlm2":  forbidden_modules.add("output")  ef model_type in [  "llava",  "llava_next",  "llava_next_video",  "mllama",  "pagemma",  "video_llava",  ]:  forbidden_modules.add("multi_modal_projector")  ef model_type == "qwen2_vl":  forbidden_modules.add("merger")  if freeze_vision_tower:  if model_type == "mllama":  forbidden_modules.add("vision_model")  ef model_type == "qwen2_vl":  forbidden_modules.add("vial")  else:  forbidden_modules.add("vision_tower")  module_names = set()  for name, module in model.named_modules():  if any(forbidden_module in name for forbidden_module in forbidden_modules):  continue  if (  "near" in module.__class__.__name__  and "Embedding" not in module.__class__.__name__  ):  module_names.add(name.spt(".")[-1])  logger.info_rank0("Found near modules: {}".format(",".join(module_names)))  return st(module_names) def find_expanded_modules(  model: "PreTrainedModel", target_modules: st[str], num_layer_trainable: int ) -> st[str]:  r"""  Finds the modules in the expanded blocks to apply lora.  """  num_layers = getattr(model.config, "num_hidden_layers", None)  if not num_layers:  raise ValueError("Model was not pported.")  if num_layers % num_layer_trainable != 0:  raise ValueError(  f"`num_layers` {num_layers} should be divisible by `num_layer_trainable` {num_layer_trainable}."  )  stride = num_layers // num_layer_trainable  trainable_layer_ids = range(stride - 1, num_layers + stride - 1, stride)  trainable_layers = [f".{idx:d}." for idx in trainable_layer_ids]  module_names = []  for name, _ in model.named_modules():  if any(target_module in name for target_module in target_modules) and any(  trainable_layer in name for trainable_layer in trainable_layers  ):  module_names.append(name)  logger.info_rank0(  "Apply lora to layers: {}".format(",".join(map(str, trainable_layer_ids)))  )  return module_names def register_autoclass(  config: "PretrainedConfig",  model: "PreTrainedModel",  tokenizer: "PreTrainedTokenizer", ):  if "AutoConfig" in getattr(config, "auto_map", {}):  config.__class__.register_for_auto_class()  if "AutoModelForCausalLM" in getattr(config, "auto_map", {}):  model.__class__.register_for_auto_class()  if "AutoTokenizer" in tokenizer.init_kwargs.get("auto_map", {}):  tokenizer.__class__.register_for_auto_class() 