# @package _global_

# Algorithm component. `_target_` names the class to build (Hydra-style
# instantiation); the remaining keys are passed alongside it.
algorithm:
  _target_: 'gfn_maxent_rl.algos.trajectory_balance.TrajectoryBalance'

  # Interpolated from the `policy_network` key, which is defined outside
  # this file.
  network: ${policy_network}

  # Explicitly null in this config.
  # NOTE(review): presumably means no separate target network -- confirm.
  target: null

# Replay buffer component, built from the class named in `_target_`.
# No further arguments are set in this file.
replay:
  _target_: 'gfn_maxent_rl.data.EpisodicReplayBuffer'

# Optimizer bundle: a `GFNParameters` target holding one `optax.adam`
# config per entry (`network` and `log_Z`).
optimizer:
  _target_: 'gfn_maxent_rl.algos.base.GFNParameters'

  # Adam for the `network` entry; its learning rate is interpolated from
  # the `lr` key, which is defined outside this file.
  network:
    _target_: 'optax.adam'
    learning_rate: ${lr}

  # Adam for the `log_Z` entry, with a learning rate fixed in this file.
  # NOTE(review): presumably the learned log-partition term of trajectory
  # balance -- confirm.
  log_Z:
    _target_: 'optax.adam'
    # Written as 0.01 instead of 1e-2: YAML 1.1 loaders (e.g. PyYAML)
    # require a '.' to resolve a float and would load `1e-2` as a string.
    learning_rate: 0.01

# Short tag for this algorithm config.
# NOTE(review): presumably used when composing the experiment name -- confirm.
exp_name_algorithm: 'tb'
