# @package _global_

defaults:
  - override /env: gridworld/4rooms-dynamics
  - override /agent: dynamics_fb

train_steps: 400_000

log_interval: 10_000
eval_interval: 50_000

tags: [dynamics-fb, doors, discrete]

agent:
  lr: 3e-4
  batch_size: 1024

  # FB Specific
  z_dim: 100
  z_mix_ratio: 0.5
  boltzmann: True
  one_hot_dim: 3

  # F Network
  f_hidden_dims: [1024, 512, 512]  # Value network hidden dimensions.
  f_layer_norm: True  # Whether to use layer normalization.

  # B Network
  b_hidden_dims: [512, 512, 512]  # Value network hidden dimensions.
  b_layer_norm: True  # Whether to use layer normalization.

  # Whether Dynamics-Adaptive
  use_context: False
  number_of_meta_envs: 4
  
  # MISC
  discount: 0.99
  tau: 0.01  # Target network update rate.
  
