# Hydra defaults list. `_self_` is the only entry, so this file pulls in no
# other config groups; `_self_` marks where this file's own values sit in the
# composition order.
defaults:
  - _self_

# Experiment identifier. It matches the module name used in `agent._target_`.
# NOTE(review): how this value is consumed is not visible in this file.
experiment: drqacstate

# Agent configuration. `_target_` names the class to build
# (drqacstate.DrQAcstateAgent). Presumably the remaining keys are passed to
# its constructor as keyword arguments via Hydra's instantiate mechanism;
# confirm against the code that loads this config.
agent:
  _target_: drqacstate.DrQAcstateAgent
  # `???` is OmegaConf's mandatory-value marker: the next three keys have no
  # default here and must be set by the caller before they are read.
  obs_shape: ??? # to be specified later
  action_shape: ??? # to be specified later
  max_action: ??? # to be specified later
  # Literal values fixed by this file.
  num_protos: 256
  groups: 16
  # `${name}` is an OmegaConf interpolation that resolves to the top-level key
  # `name`. None of the referenced keys (device, lr, use_tb, feature_dim,
  # stddev_schedule, offline, bc_weight, use_bc) are defined in this file, so
  # they must be supplied by the config this file is composed into.
  device: ${device}
  lr: ${lr}
  critic_target_tau: 0.01
  update_every_steps: 2
  use_tb: ${use_tb}
  num_expl_steps: 2000
  hidden_dim: 1024
  feature_dim: ${feature_dim}
  stddev_schedule: ${stddev_schedule}
  stddev_clip: 0.3
  # NOTE(review): offline / bc_weight / use_bc look like offline-training and
  # behavior-cloning switches, judging by name only; verify in the agent class.
  offline: ${offline}
  bc_weight: ${bc_weight}
  use_bc: ${use_bc}