# @package _global_
# Hydra defaults list: selects one option for each config group
# (env, loss, collector, buffer, updater, trainer, optimizer, noise_control).
# NOTE(review): there is no explicit `_self_` entry, so where this file's own
# sections fall in the composition order depends on the Hydra version's
# default — confirm that the values set below actually take precedence.
defaults:
  - /env: async/reacher
  - /loss: rnn-sac
  - /collector: rollout
  - /buffer: seq
  - /updater: soft
  - /trainer: default
  - /optimizer: adam
  - /noise_control: random_mask

# Training and evaluation environments receive the same two flags.
# Presumably these mappings are forwarded as keyword arguments when each
# environment is built — confirm against the env factory.
env:
  train_make_kwargs: {action_history: true, remember: true}
  eval_make_kwargs: {action_history: true, remember: true}

# Settings for the `collector` node (the defaults list selects `rollout`).
# The `_` inside the numbers is a digit separator: YAML 1.1 loaders such as
# PyYAML read `1_536` as the integer 1536, whereas a strict YAML 1.2 loader
# would read it as a string.
collector:
  total_rollouts: 1_536
  max_frames_per_traj: 1_024
  # presumably the number of initial rollouts collected with random actions — confirm
  init_random_rollouts: 16

# Settings for the `trainer` node (the defaults list selects `default`).
trainer:
  optim_steps_per_batch: 128
  log_interval: 1_024  # integer 1024 under YAML 1.1 loaders (`_` is a digit separator)
  num_eval_rollouts: 16
  # Extra keys listed for the trainer; how they are consumed is defined by the
  # trainer implementation, which is not visible in this file.
  include_additional_keys:
    # Same four names as `loss.signals_keys` in this file.
    - first_arm
    - second_arm
    - target
    - diff
    # `next.`-prefixed counterparts of the four keys above.
    - next.first_arm
    - next.second_arm
    - next.target
    - next.diff
    # Action history and its `next.` counterpart (`action_history: true` is
    # set for both environments under `env`).
    - action_history
    - next.action_history

# Settings for the `buffer` node (the defaults list selects `seq`).
buffer:
  sampler:
    slice_len: 64
  # 2_048 is the integer 2048 under YAML 1.1 loaders (`_` is a digit separator).
  # NOTE(review): 2048 = 32 * 64; if batch_size counts frames, each batch holds
  # 32 slices of length `slice_len` — confirm against the sampler used.
  batch_size: 2_048

# Settings for the `loss` node (the defaults list selects `rnn-sac`).
loss:
  rnn_type: gru
  pred_signals: false
  # The two lists below have the same length; presumably signals_dims[i] is the
  # dimensionality of signals_keys[i] — confirm against the loss module.
  # Keep both in the same order.
  signals_keys: [first_arm, second_arm, target, diff]
  signals_dims: [3, 3, 2, 2]

# Settings for the `optimizer` node (the defaults list selects `adam`).
optimizer:
  lr: 0.0003  # i.e. 3e-4; written in decimal form so every YAML loader reads a float