# @package _global_
# Config-group selections composed into this configuration. Each entry maps a
# group path (e.g. `/env`) to the option picked from that group (e.g.
# `async/ant`). The top-level sections further down in this file set values
# under several of the same names (env, loss, collector, buffer, trainer,
# optimizer).
# NOTE(review): entry order presumably affects how the groups are merged;
# confirm before reordering.
defaults:
  - /env: async/ant
  - /loss: rnn-sac
  - /collector: rollout
  - /buffer: seq
  - /updater: soft
  - /trainer: default
  - /optimizer: adam
  - /noise_control: random_mask

# Environment construction kwargs. The training and evaluation variants are
# given the same two flags, both enabled.
env:
  train_make_kwargs: {action_history: true, remember: true}
  eval_make_kwargs: {action_history: true, remember: true}

# Data-collection settings.
# Integers use plain digits (no `_` separators) so they resolve to ints under
# both YAML 1.1 and YAML 1.2 loaders.
collector:
  total_rollouts: 1536
  max_frames_per_traj: 1024
  init_random_rollouts: 16

# Trainer settings.
# Integers use plain digits (no `_` separators) so they resolve to ints under
# both YAML 1.1 and YAML 1.2 loaders.
trainer:
  optim_steps_per_batch: 128
  log_interval: 1024
  num_eval_rollouts: 16
  # Extra keys for the trainer: the five per-part keys (the same names listed
  # under `loss.signals_keys`), the action history, and the `next.`-prefixed
  # counterpart of each.
  include_additional_keys:
    - torso
    - front_left_leg
    - front_right_leg
    - back_left_leg
    - back_right_leg
    - next.torso
    - next.front_left_leg
    - next.front_right_leg
    - next.back_left_leg
    - next.back_right_leg
    - action_history
    - next.action_history

# Buffer settings (the `seq` buffer option is selected in `defaults`).
# Integers use plain digits (no `_` separators) so they resolve to ints under
# both YAML 1.1 and YAML 1.2 loaders.
buffer:
  sampler:
    slice_len: 64
  batch_size: 2048

# Loss settings (the `rnn-sac` loss option is selected in `defaults`).
loss:
  rnn_type: gru
  pred_signals: false
  # Names of the per-part signals.
  signals_keys:
    - torso
    - front_left_leg
    - front_right_leg
    - back_left_leg
    - back_right_leg
  # One entry per `signals_keys` entry, in the same order.
  # NOTE(review): presumably the size of each corresponding signal; confirm.
  signals_dims: [11, 4, 4, 4, 4]

# Optimizer settings (the `adam` optimizer option is selected in `defaults`).
optimizer:
  # Learning rate, written in plain decimal form (equals 3e-4).
  lr: 0.0003