# Settings for the agent object named by `_target_`.
# `???` marks a value with no default in this file (it must be supplied from
# elsewhere); `${...}` is an interpolation of another config key.
agent:
  _target_: agent.incremental_agent.IncrementalAgent

  # Environment-dependent values, left unset here.
  obs_dim: ???  # to be specified later
  t_obs_dim: ???  # to be specified later
  action_dim: ???  # to be specified later
  action_range: ???  # to be specified later

  # Resolved from a top-level `device` key that is not defined in this section.
  device: ${device}

  # Sub-configs pulled in from the `double_q_critic` and
  # `diag_gaussian_actor` sections of this file.
  critic_cfg: ${double_q_critic}
  actor_cfg: ${diag_gaussian_actor}

  discount: 0.99
  init_temperature: 0.1

  # Learning rates are written with an explicit mantissa dot (`3.0e-4`):
  # YAML 1.1 loaders such as PyYAML resolve a bare `3e-4` as a string, so the
  # dotted form keeps these values floats regardless of the loader used.
  alpha_lr: 3.0e-4
  alpha_betas: [0.9, 0.999]
  actor_lr: 3.0e-4
  actor_betas: [0.9, 0.999]
  actor_update_frequency: 1
  critic_lr: 3.0e-4
  critic_betas: [0.9, 0.999]
  critic_tau: 0.005
  critic_target_update_frequency: 2

  batch_size: 256
  learnable_temperature: true

  # Feature switches. Within this file only `policy_use_t_vel` is referenced
  # by other sections (both the critic and the actor interpolate it).
  use_t_vel: true
  use_t_obs: false
  policy_use_t_vel: false
  use_timesteps: false

# Critic settings; the agent section pulls this mapping in through
# `critic_cfg: ${double_q_critic}`.
double_q_critic:
  _target_: agent.critic.DoubleQCritic

  # Dimensions are taken from the agent section via interpolation, so they
  # are only set in one place.
  action_dim: ${agent.action_dim}
  obs_dim: ${agent.obs_dim}
  t_obs_dim: ${agent.t_obs_dim}

  # Hidden-layer hyperparameters.
  hidden_depth: 2
  hidden_dim: 256

  # NOTE(review): `use_t_vel` follows `agent.policy_use_t_vel`, not
  # `agent.use_t_vel`, and `use_t_obs` is a fixed literal rather than
  # `${agent.use_t_obs}` - confirm both are intended for the critic.
  use_t_vel: ${agent.policy_use_t_vel}
  use_t_obs: false
    
# Actor settings; the agent section pulls this mapping in through
# `actor_cfg: ${diag_gaussian_actor}`.
diag_gaussian_actor:
  _target_: agent.actor.DiagGaussianActor

  # Dimensions are taken from the agent section via interpolation, so they
  # are only set in one place.
  action_dim: ${agent.action_dim}
  obs_dim: ${agent.obs_dim}
  t_obs_dim: ${agent.t_obs_dim}

  # Hidden-layer hyperparameters.
  hidden_dim: 256
  hidden_depth: 2

  # Two-element [lower, upper] pair - presumably clamps the log standard
  # deviation; verify against the actor implementation.
  log_std_bounds: [-5, 2]

  # `use_t_vel` follows the agent's `policy_use_t_vel` switch.
  # NOTE(review): `use_t_obs` is a fixed literal rather than
  # `${agent.use_t_obs}` - confirm that is intended.
  use_t_vel: ${agent.policy_use_t_vel}
  use_t_obs: false
