# @package _group_
# Hyperparameter overrides for the Pendulum-v0 environment.
# The key names suggest a model-based setup (a learned dynamics model plus a
# SAC agent); the exact meaning of every value is defined by the code that
# consumes this file -- TODO confirm against the training script.
env: 'gym___Pendulum-v0'
# Name of the termination function; presumably looked up by the consumer.
term_fn: 'no_termination'

# --- Training loop, dynamics model and rollout settings ---
num_steps: 10000
epoch_length: 100
num_elites: 5
patience: 1
model_lr: 0.001
model_wd: 0.00002
model_batch_size: 256
validation_ratio: 0.2
freq_train_model: 50
effective_model_rollouts_per_step: 400
# Four-element schedule; element semantics are set by the consumer.
# NOTE(review): num_steps / epoch_length = 100, while the second entry is
# 150 -- if that entry is an epoch index, the schedule never reaches its
# end point. Confirm this is intended.
rollout_schedule:
  - 20
  - 150
  - 1
  - 1
num_sac_updates_per_step: 40
sac_updates_every_steps: 1
num_epochs_to_retain_sac_buffer: 1
num_epochs_train_model: 50

# --- SAC agent settings ---
sac_alpha_lr: 0.0003
sac_actor_lr: 0.0003
sac_actor_update_frequency: 4
# NOTE(review): one tenth of the actor/alpha learning rate (0.0003) --
# confirm this is deliberate and not a misplaced decimal.
sac_critic_lr: 0.00003
sac_critic_target_update_frequency: 4
# NOTE(review): presumably the entropy target for automatic temperature
# tuning; verify the value against the environment's action dimensionality.
sac_target_entropy: -3
sac_hidden_depth: 2
