---
# Training-run configuration. The meaning of each key is defined by the
# consuming training code, which is not visible from this file; remarks
# tagged NOTE(review) are assumptions to confirm, not established facts.

# --- Run identity ---------------------------------------------------------
# NOTE(review): the "lrp_60" / "rlrp_12" fragments of the tag presumably
# mirror `patience: 60` and `scheduler.patience: 12` below - keep in sync.
model_tag: 'ViT_tiny_patch16_224_gaussian_lrp_60_rlrp_12_q0_emphasis'
backbone: 'vit_gaussian'

# --- Optimisation ---------------------------------------------------------
batch_size: 32
epochs: 2
learning_rate: 0.0001
# NOTE(review): if this patience is counted in epochs, it can never be
# reached with `epochs: 2` - confirm that this short run is intentional.
patience: 60

# --- Input data -----------------------------------------------------------
input_shape: [1, 32, 32]
# NOTE(review): presumably a normalisation constant for the inputs - verify
# against the data-loading code before changing.
global_max: 121.79151153564453
group_size: 500
# NOTE(review): the directory name below advertises "size_7200000" while
# dataset_size is 1008 - confirm which of the two the loader honours.
dataset_size: 1008
dataset_subdir: 'jet_ml_benchmark_config_01_to_09_alpha_0.2_0.3_0.4_q0_1.5_2.0_2.5_MMAT_MLBT_size_7200000_balanced_unshuffled'

# --- Filesystem locations -------------------------------------------------
output_dir: 'experiments/exp_adding_loss_weights_for_q0_emphasis/training_output/'
# Checkpoint file referenced for preloading.
preload_model_path: 'experiments/exp_preload_trained_model_and_train_more/training_output/ViT_tiny_patch16_224_gaussian_lrp_12_rlrp_4_bs32_ep50_lr1e-04_ds7200000_g500_sched_ReduceLROnPlateau_preloaded/best_model.pth'

# --- Learning-rate scheduler ----------------------------------------------
# NOTE(review): if these keys are forwarded to
# torch.optim.lr_scheduler.ReduceLROnPlateau, `mode: max` means the
# monitored quantity is expected to increase, and `verbose` is deprecated
# in recent PyTorch releases - confirm against the installed version.
scheduler:
  type: 'ReduceLROnPlateau'
  mode: 'max'
  factor: 0.5
  patience: 12
  verbose: true

# --- Loss weighting -------------------------------------------------------
# One weight per output head (λ₁, λ₂, λ₃ in declaration order); the q0
# weight is raised above the other two to emphasise Q₀.
loss:
  weights:
    energy_loss_output: 1.0  # λ₁
    alpha_output: 1.0  # λ₂
    q0_output: 3.0  # λ₃ (raised to emphasise Q₀)
