# @package _global_

defaults:
  - override /dataset: cyclone_small
  - override /training: muon
  - override /autoencoder: peft

# PEFT stage configuration
stage: peft
ae_checkpoint: null

training:
  n_epochs: 10
  batch_size: 16
  exclude_from_wd: ["cond"]
  gradnorm_balancer: "none"  # "none", "full", "pseudo"
  loss_type: complex_mse
  integral_loss_type: int_norm_l1
  spectral_loss_type: log_relative_l1
  ds: 0.01
  learning_rate: 5e-3
  weight_decay: 1e-5
  
  # EMA Loss Normalization Configuration
  ema_normalization_loss: ["kyspec", "kxspec", "qspec", "phi_zf", "mass"]
  ema_beta: 0.99
  
  eval_loss_type: mse
  eval_integral_loss_type: mse
  eval_spectral_loss_type: l1

logging:
  tags: ["peft", "v6", "lora"]
  name_suffix: "peft_ep10_ema_norm_v2_logrl1"

autoencoder:
  loss_scheduler:
    flux_int: null
    phi_int: null
    kyspec: null
  
  loss_weights:
    df: 1.0
  
  extra_loss_weights:
    flux_int: 1.0
    phi_int: 1.0
    kxspec: 1.0
    kyspec: 1.0
    qspec: 1.0
    phi_zf: 1.0
    mass: 1.0

    qspec_monotonicity: 0.0
    kyspec_monotonicity: 0.0

  peft:
    method: "eva" # "lora", "eva"
    eva:
      r: 32
      lora_alpha: 1
      lora_dropout: 0.0
      bias: "none"
      strategy: "attention_mlp"
      # EVA parameters
      rho: 2.0
      tau: 0.99
      num_batches: 30
      # use_label_mask: true
      # whiten: false
      # adjust_scaling_factors: true
    lora:
      r: 64
      lora_alpha: 1
      lora_dropout: 0.0
      # strategy: "comprehensive"
      strategy: "attention_mlp"
    save:
      save_lora_only: true
      save_full_model: false
