wandb: disabled
name: lagrangian_minp_1500_sn_256_latent_256_lr_1e-3
stage_name: stage1
vars:
  lr: 1.0e-3
  batch_size: 8
  max_batch_size: 8
  epochs: 50

  dataset:
    kind: lagrangian_dataset
    name: tgv2d
    n_input_timesteps: 3
    n_pushforward_timesteps: 9
    graph_mode: radius_graph
    radius_graph_r: 0.1
    radius_graph_max_num_neighbors: 4

  optim:
    kind: adamw
    lr: ${vars.lr}
    weight_decay: 0.05
    schedule:
      template: ${yaml:schedules/wupcos_epoch}
      template.vars.end_epoch: 10

datasets:
  train:
    kind: ${vars.dataset.kind}
    name: ${vars.dataset.name}
    split: train
    n_input_timesteps: ${vars.dataset.n_input_timesteps}
    n_pushforward_timesteps: ${vars.dataset.n_pushforward_timesteps}
    graph_mode: ${vars.dataset.graph_mode}
    radius_graph_r: ${vars.dataset.radius_graph_r}
    radius_graph_max_num_neighbors: ${vars.dataset.radius_graph_max_num_neighbors}
    num_points_range: [ 1500, 2500 ]
    collators:
      - kind: lagrangian_simformer_collator
  valid_rollout:
    kind: ${vars.dataset.kind}
    name: ${vars.dataset.name}
    split: valid
    test_mode: full_traj
    n_input_timesteps: ${vars.dataset.n_input_timesteps}
    graph_mode: ${vars.dataset.graph_mode}
    radius_graph_r: ${vars.dataset.radius_graph_r}
    radius_graph_max_num_neighbors: ${vars.dataset.radius_graph_max_num_neighbors}
    seed: 2702
    collators:
      - kind: lagrangian_simformer_collator
  test_rollout:
    kind: ${vars.dataset.kind}
    name: ${vars.dataset.name}
    split: test
    test_mode: full_traj
    n_input_timesteps: ${vars.dataset.n_input_timesteps}
    graph_mode: ${vars.dataset.graph_mode}
    radius_graph_r: ${vars.dataset.radius_graph_r}
    radius_graph_max_num_neighbors: ${vars.dataset.radius_graph_max_num_neighbors}
    seed: 2702
    collators:
      - kind: lagrangian_simformer_collator

model:
  kind: lagrangian_gns_model
  encode_process_decode:
    kind: encoders.gns_encode_process_decode
    nnode_in_features: 10
    nnode_out_features: 2
    nedge_in_features: 3
    latent_dim: 128
    nmessage_passing_steps: 10
    nmlp_layers: 2
    mlp_hidden_dim: 128
    optim: ${vars.optim}
  

trainer:
  kind: gns_trainer
  precision: float16
  backup_precision: float16
  max_epochs: 0
  effective_batch_size: 1
  max_batch_size: ${vars.max_batch_size}
  loss_function:
    kind: elementwise_loss
    loss_function:
      kind: mse_loss
  log_every_n_epochs: 1
  forward_kwargs:
    reconstruct_prev_a: true
  callbacks:
    # warmup
    - kind: offline_lagrangian_rollout_speed_callback
      every_n_epochs: 1
      dataset_key: test_rollout
    # benchmark
    - kind: offline_lagrangian_rollout_speed_callback
      every_n_epochs: 1
      dataset_key: test_rollout