---
# Settings grouped under `architecture`. The notes below are inferred from the
# key names only — TODO confirm against the code that loads this file.
architecture:
  n_layers: 2  # presumably the number of hidden layers — confirm
  n_neurons: 256  # presumably the width of each hidden layer — confirm
  # Integer code; the mapping from code to activation function is defined by
  # the consumer and is not visible in this file.
  activation_type: 0
  # NOTE(review): `learn_var` is also set under `ppo` (same value, true);
  # confirm which of the two the consumer actually reads.
  learn_var: true
# Settings grouped under `ppo`. The key names suggest Proximal Policy
# Optimization hyperparameters; every note below is an assumption drawn from
# the names — TODO confirm against the code that loads this file.
ppo:
  gamma: 0.99  # presumably the reward discount factor
  lambda: 0.95  # presumably the GAE lambda — confirm
  # NOTE(review): `K_epochs` and `update_epochs` (further down) are both 1;
  # this file does not show how the consumer distinguishes them.
  K_epochs: 1
  norm_A: true  # presumably toggles advantage normalization — confirm
  eps_clip: 0.2  # presumably the clipping range of the surrogate objective
  c1: 0.5  # presumably the value-loss coefficient — confirm
  c2: 0.01  # presumably the entropy-bonus coefficient — confirm
  c2_schedule: 0.999  # presumably a multiplicative decay for c2 — confirm
  clip_grads: true
  # NOTE(review): duplicates `architecture.learn_var` (same value, true).
  learn_var: true
  # Negative value, so presumably stored on a log scale rather than as a raw
  # variance — confirm with the consumer.
  init_var: -0.5
  min_memory: 100  # presumably samples required before training starts
  lr_actor: 0.0001
  lr_critic: 0.0001
  batch_size: 64
  update_epochs: 1
  frq_actor_update: 1
  frq_training: 1000  # unit (steps vs. episodes) not visible here — confirm
# Settings grouped under `sac`. The key names suggest Soft Actor-Critic
# hyperparameters; every note below is an assumption drawn from the names —
# TODO confirm against the code that loads this file.
sac:
  gamma: 0.99  # presumably the reward discount factor
  tau: 0.005  # presumably the soft target-update coefficient — confirm
  min_memory: 10000  # presumably samples required before training starts
  lr_actor: 0.0003  # note: differs from lr_critic below
  lr_critic: 0.0001
  lr_alpha: 0.0001  # presumably the learning rate for the entropy temperature
  size_buffer: 100000  # presumably the replay-buffer capacity — confirm
  batch_size: 256
  init_alpha: 0.1  # presumably the initial entropy temperature — confirm
  update_epochs: 1
  frq_actor_update: 1
  reward_scaling: false
  # NOTE(review): -1 looks like a sentinel, presumably "clipping disabled";
  # confirm how the consumer treats non-positive values.
  gradient_clipping_max: -1
  n_ensemble_critics: 2
  frq_training: 1  # unit (steps vs. episodes) not visible here — confirm
# Top-level setting, not nested under `architecture`, `ppo`, or `sac`.
# Presumably the number of parallel workers — TODO confirm with the consumer.
n_workers: 8
...