defaults:
  - default
  - scheduler@_here_: linear_warmup_cosine_annealing
  - override /model/loss_function@_here_: mse_loss # dummy
  - override /model/act@_here_: relu # dummy
  - _self_

_target_: src.models.gns_f.GNSfLitModule
num_classes: ${vars.num_classes}

model:
  _target_: src.models.gns_f.GNSf
  particle_dimension: ${vars.dim}
  node_in: ${vars.input_dim}
  edge_in: ${vars.edge_input_dim}
  latent_dim: 128
  num_message_passing_steps: 10
  mlp_num_layers: 2
  mlp_hidden_dim: 128
  noise_std: 6.7e-4
  dataset_path: ${data.global_root}/${data.dataset_rel_path}

optimizer:
  _target_: torch.optim.AdamW # LION  # we need "full" single precision
  _partial_: True
  lr: 0.0001
  weight_decay: 0.05 # linear warmup + cosine decay; 1e-6...1e-4, 10% of epochs; look at a PyTLightning example "per step" scheduling

scheduler:
  _target_: src.modules.schedulers.LinearWarmupCosineAnnealingLR
  _partial_: true
  warmup_epochs: 2
  max_epochs: ${trainer.max_epochs}
  min_lr: 1.e-6
  last_epoch: -1
