# Hydra defaults list. `_self_` is the only entry, so this file pulls in no
# other config groups; it only marks where this file's own keys sit in the
# composition order.
defaults:
  - _self_


# Short identifier for this algorithm configuration.
# NOTE(review): presumably read by run naming / logging code - confirm.
algo_name: sac_oac
# Tags attached to this algorithm configuration (list of strings).
algo_tags:
  - sac
  - oac


# Settings for the SAC/OAC learner. The keys below `_target_` are presumably
# passed as keyword arguments to the target class when it is instantiated
# (Hydra `_target_` convention) - confirm against the code that builds it.
agent:
  # Dotted import path of the class to construct.
  _target_: src.agents.sac_oac.sac_oac_learner.SACOACLearner
  # `${...}` values are interpolations of top-level keys that are not defined
  # in this file; they must be supplied by the config this one is composed into.
  seed: ${seed}
  # `???` marks a mandatory value with no default here: it must be filled in
  # (e.g. from the environment's dimensions) before the config is used.
  state_dim: ???
  action_dim: ???
  # Learning rates are written with an explicit decimal point so that every
  # YAML loader resolves them as floats. A bare `3e-4` is read as the *string*
  # '3e-4' by PyYAML's default YAML 1.1 resolver.
  actor_lr: 3.0e-4
  critic_lr: 3.0e-4
  temp_lr: 3.0e-4
  hidden_dims: ${hidden_dims}
  discount: ${discount}
  tau: ${tau}
  # NOTE(review): presumably the initial SAC entropy temperature - confirm.
  init_temperature: 1.0
  # NOTE(review): presumably "update the policy every N critic updates" -
  # confirm against the learner.
  policy_update_freq: 1
  num_parallel_seeds: ${num_parallel_seeds}
  # NOTE(review): these look like the OAC exploration hyperparameters (upper
  # confidence bound coefficient and exploration-policy shift budget) - verify
  # the meaning and units against the learner implementation.
  beta_ub: 4.66
  delta: 23.53
