# @package _group_
# Environment identifier selected for this configuration.
env: "humanoid_truncated_obs"
# term_fn is set automatically by mbrl.util.env.EnvHandler.make_env

# Run-length settings.
# NOTE(review): units (presumably environment steps) are inferred from the
# key names only -- confirm against the training loop that reads them.
num_steps: 300000
epoch_length: 1000
# Dynamics-model training settings (elite count, early-stopping patience and
# improvement threshold, optimizer, network size, validation split).
# NOTE(review): grouping is based on key names; exact semantics are defined by
# the consuming code, which is not visible here.
num_elites: 7
patience: 7
improvement_threshold: 0.01
model_lr: 0.001
model_wd: 0.0001
model_batch_size: 256
model_hidden_size: 400
model_num_layers: 4
validation_ratio: 0.2
# Model retraining frequency and model-rollout scheduling.
freq_train_model: 250
effective_model_rollouts_per_step: 400
# NOTE(review): presumably [min_epoch, max_epoch, min_length, max_length]; if
# so, the last two entries being equal means a constant rollout length of
# 100 -- confirm against the schedule's consumer.
rollout_schedule: [1, 150, 100, 100]
# SAC update cadence and SAC buffer retention.
num_sac_updates_per_step: 10
sac_updates_every_steps: 1
num_epochs_to_retain_sac_buffer: 4

# SAC agent hyperparameters.
sac_gamma: 0.99
sac_tau: 0.005
# NOTE(review): with automatic entropy tuning enabled below, this is presumably
# only the initial temperature -- confirm against the SAC implementation.
sac_alpha: 0.2
sac_policy: "Gaussian"
sac_target_update_interval: 8
sac_automatic_entropy_tuning: true
sac_target_entropy: -17  # in effect, since automatic entropy tuning is enabled
sac_hidden_size: 2048
sac_lr: 0.00004
sac_batch_size: 256
