# Hydra-style defaults list. `_self_` is the only entry, so no other
# config files are composed in from here.
defaults:
  - _self_


# Name of the algorithm this configuration describes.
algo_name: 'sac_boxd2'
# Tags attached to this algorithm configuration.
algo_tags:
  - 'sac'
  - 'boxd'


# Arguments for building the agent. `_target_` is the dotted path of the
# class to construct (Hydra-style instantiation); the remaining keys are
# passed through as its parameters. `${...}` values are interpolations of
# keys that are not defined in this section.
agent:
  _target_: src.agents.sac_boxd2.sac_boxd2_learner.SACBoxd2Learner
  seed: ${seed}
  # `???` marks a mandatory value: it has no default here and must be
  # supplied before the config is used.
  state_dim: ???
  action_dim: ???
  # Exponent-form floats carry an explicit decimal point. A bare `3e-4` is
  # read as a string by YAML 1.1 resolvers (e.g. PyYAML's default loader);
  # `3.0e-4` is the same value and is a float under every loader.
  actor_lr: 3.0e-4
  critic_lr: 3.0e-4
  temp_lr: 3.0e-4
  hidden_dims: ${hidden_dims}
  discount: ${discount}
  tau: ${tau}
  init_temperature: 1.0
  policy_update_freq: 1
  num_parallel_seeds: ${num_parallel_seeds}
  dropout_rate: 0.001
  actor_k_samples: 1
  critic_k_samples: 2
  set_explore_type: 'annealing'
