# @package _global_

# Hydra defaults list: for each config group, replace the option already
# selected by the base configuration with the one named here.
defaults:
  # Model config group -> am.yaml
  - override /model: am.yaml
  # Environment config group -> mdpp.yaml
  - override /env: mdpp.yaml
  - override /callbacks: default.yaml
  - override /trainer: default.yaml
  # Logger config group -> wandb.yaml (customized under `logger.wandb` in
  # this file).
  - override /logger: wandb.yaml

# Settings for the wandb logger selected in the defaults list.
# Tags, group and run name all embed the environment name through the
# `${env.name}` interpolation.
logger:
  wandb:
    project: "rl4co"
    tags:
      - "am"
      - "${env.name}"
    group: "${env.name}"
    name: "am-a2c-${env.name}"


# Model settings for this experiment; the model config group itself is set
# to am.yaml in the defaults list.
model:
  # Hydra instantiation target for the model object.
  _target_: rl4co.models.A2C
  policy:
    # Instantiation target for the policy; it receives the environment name
    # through the `${env.name}` interpolation.
    _target_: rl4co.models.AttentionModelPolicy
    env_name: "${env.name}"
  # Keyword arguments for the actor's optimizer.
  # NOTE(review): `1e-4` / `1e-3` carry no decimal point, so a strict
  # YAML 1.1 loader would read them as strings. This relies on the config
  # loader resolving them as floats -- confirm before using another parser.
  actor_optimizer_kwargs:
    lr: 1e-4
    weight_decay: 1e-3
  # null: the critic optimizer defaults to actor_optimizer_kwargs.
  critic_optimizer_kwargs: null
  batch_size: 64
  # Sizes of the train / validation / test datasets (presumably counted in
  # problem instances -- TODO confirm).
  # NOTE(review): these are small; presumably intended for a quick run.
  train_data_size: 500
  val_data_size: 100
  test_data_size: 100

# Trainer settings for this experiment; the trainer config group is set to
# default.yaml in the defaults list.
trainer:
  # Upper bound on the number of training epochs.
  max_epochs: 10

# Fixed seed value for the run. How it is consumed is not visible in this
# file -- presumably used to seed the random number generators; confirm
# against the training entry point.
seed: 1234