defaults:
  - scheduler@_here_: linear_warmup_cosine_annealing
  - _self_

_target_: src.models.occupancy_physics_particle.OccupancyPhysicsParticleLitModule
num_classes: ${vars.num_classes}

latent_model:
  _target_: src.models.components.latent.upt_transformer.TransformerModel
  _partial_: True
  latent_dim: ${vars.latent_dim}
  dim: 192
  depth: 12
  num_attn_heads: 3
  condition_dim: 768
  input_ln: True
  full_residual: True
  output_ln: True

optimizer:
  _target_: torch.optim.AdamW # LION  # we need "full" single precision
  _partial_: True
  lr: 0.0001
  weight_decay: 0.05 # linear warmup + cosine decay; 1e-6...1e-4, 10% of epochs; look at a PyTLightning example "per step" scheduling

scheduler:
  _target_: src.modules.schedulers.LinearWarmupCosineAnnealingLR
  _partial_: true
  warmup_epochs: 2
  max_epochs: ${trainer.max_epochs}
  min_lr: 1e-6
  last_epoch: -1

loss_function:
  _target_: torch.nn.MSELoss

first_stage_model_ckpt: add_chkpt_path
first_stage_model_wandb_id: 'pmtrv0ea'
first_stage_model_wandb_project: 'dam3d'