# @package _global_
# Hydra-style defaults list: each entry picks one option for a config group
# (`/<group>: <option>`). Several groups are further customized by the
# same-named top-level sections later in this file.
# NOTE(review): the leading `/` presumably addresses each group from the config
# root - confirm against the config search path.
# NOTE(review): there is no explicit `_self_` entry, so whether this file's own
# sections win over the selected options depends on the Hydra version's
# default placement of `_self_` - confirm before relying on the overrides.
# Entry order is left as written because composition order can affect merging.
defaults:
  - /env: async/hopper
  - /loss: rnn-sac
  - /collector: rollout
  - /buffer: seq
  - /updater: soft
  - /trainer: default
  - /optimizer: adam
  - /noise_control: random_mask

# Values for the `env` group (option `async/hopper` in the defaults list).
# The train and eval kwargs carry the same two flags; they are written inline
# so that any divergence between the two is easy to spot.
# NOTE(review): presumably both must stay identical so that evaluation sees the
# same observation layout as training - confirm.
env:
  train_make_kwargs: {action_history: true, flatten_obs: true}
  eval_make_kwargs: {action_history: true, flatten_obs: true}

# Values for the `collector` group (option `rollout` in the defaults list).
# Integers are written without `_` digit separators: that form is only an
# integer for YAML 1.1 loaders and is read as a string under the YAML 1.2 core
# schema, so plain decimals keep the type stable across loaders and linters.
collector:
  total_rollouts: 1536
  max_frames_per_traj: 1024
  init_random_rollouts: 16

# Values for the `trainer` group (option `default` in the defaults list).
trainer:
  optim_steps_per_batch: 128
  # Plain decimal (no `_` digit separator) so the value stays an integer under
  # YAML 1.2 loaders as well as YAML 1.1 ones.
  log_interval: 1024
  num_eval_rollouts: 16
  # Each name is listed together with its `next.`-prefixed counterpart.
  # NOTE(review): the four body-part names match `loss.signals_keys` in this
  # file; presumably the two lists must be kept in sync - confirm.
  include_additional_keys:
    - torso
    - thigh
    - leg
    - foot
    - next.torso
    - next.thigh
    - next.leg
    - next.foot
    - action_history
    - next.action_history
  # Each entry is an interpolation that calls the `as_tuple` resolver with two
  # quoted arguments. The resolver is not defined in this file.
  # NOTE(review): it must be registered by the application before this config
  # is resolved - confirm where that happens.
  # Kept in block style: the braces and commas inside the interpolation would
  # be parsed as flow-collection syntax inside `[...]`.
  eval_metrics:
    - ${as_tuple:"reward","mean"}
    - ${as_tuple:"reward","sum"}

# Values for the `buffer` group (option `seq` in the defaults list).
buffer:
  sampler:
    slice_len: 64
  # Plain decimal (no `_` digit separator) so the value stays an integer under
  # YAML 1.2 loaders as well as YAML 1.1 ones.
  # NOTE(review): how batch_size relates to sampler.slice_len (e.g. whether it
  # should be a multiple of it) is not visible here - confirm with the sampler.
  batch_size: 2048

# Values for the `loss` group (option `rnn-sac` in the defaults list).
loss:
  rnn_type: gru
  pred_signals: false
  # Two parallel four-element lists, written inline so the pairing between a
  # name and its integer is visible at a glance.
  # NOTE(review): presumably signals_dims[i] is the size of signals_keys[i],
  # so both lists must keep the same length and order - confirm.
  signals_keys: [torso, thigh, leg, foot]
  signals_dims: [5, 2, 2, 2]

# Values for the `optimizer` group (option `adam` in the defaults list).
optimizer:
  # Presumably the learning rate. Kept in plain decimal notation because
  # exponent forms are typed differently by different YAML loaders.
  lr: 0.0003