# Copyright 2024 the LlamaFactory team. # # censed under the Apache cense, Version 2.0 (the "cense"); # you may not use this file except in compance with the cense. # You may obtain a copy of the cense at # # http://www.apache.org/censes/CENSE-2.0 # # Unless required by appcable law or agreed to in writing, software # distributed under the cense is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or imped. # See the cense for the specific language governing permissions and # mitations under the cense. import json import math import os from typing import Any, Dict, st from transformers.trainer import TRAINER_STATE_NAME from . import logging from .packages import is_matplotb_available if is_matplotb_available():  import matplotb.figure  import matplotb.pyplot as plt logger = logging.get_logger(__name__) def smooth(scalars: st[float]) -> st[float]:  r"""  EMA implementation according to TensorBoard.  """  if len(scalars) == 0:  return []  last = scalars[0]  smoothed = []  weight = 1.8 * (  1 / (1 + math.exp(-0.05 * len(scalars))) - 0.5  ) # a sigmoid function  for next_val in scalars:  smoothed_val = last * weight + (1 - weight) * next_val  smoothed.append(smoothed_val)  last = smoothed_val  return smoothed def gen_loss_plot(trainer_log: st[Dict[str, Any]]) -> "matplotb.figure.Figure":  r"""  Plots loss curves in LlamaBoard.  """  plt.close("all")  plt.switch_backend("agg")  fig = plt.figure()  ax = fig.add_bplot(111)  steps, losses = [], []  for log in trainer_log:  if log.get("loss", None):  steps.append(log["current_steps"])  losses.append(log["loss"])  ax.plot(steps, losses, color="#1f77b4", alpha=0.4, label="original")  ax.plot(steps, smooth(losses), color="#1f77b4", label="smoothed")  ax.legend()  ax.set_xlabel("step")  ax.set_ylabel("loss")  return fig def plot_loss(save_dictionary: str, keys: st[str] = ["loss"]) -> None:  r"""  Plots loss curves and saves the image.  """  plt.switch_backend("agg")  with open(os.path.join(save_dictionary, TRAINER_STATE_NAME), encoding="utf-8") as f:  data = json.load(f)  for key in keys:  steps, metrics = [], []  for i in range(len(data["log_history"])):  if key in data["log_history"][i]:  steps.append(data["log_history"][i]["step"])  metrics.append(data["log_history"][i][key])  if len(metrics) == 0:  logger.warning_rank0(f"No metric {key} to plot.")  continue  plt.figure()  plt.plot(steps, metrics, color="#1f77b4", alpha=0.4, label="original")  plt.plot(steps, smooth(metrics), color="#1f77b4", label="smoothed")  plt.title(f"training {key} of {save_dictionary}")  plt.xlabel("step")  plt.ylabel(key)  plt.legend()  figure_path = os.path.join(  save_dictionary, "training_{}.png".format(key.replace("/", "_"))  )  plt.savefig(figure_path, format="png", dpi=100)  print("Figure saved at:", figure_path) 