# @package _group_
# Environment and expert-data settings.
# NOTE(review): the meaning of each key is inferred from its name; confirm
# against the code that consumes this config.
env: 'gym___Hopper-v2'
term_fn: 'hopper'

# Path to the expert data (presumably resolved relative to the working
# directory -- confirm).
expert_dir: 'expert/hopper'

# Both expert ratios are zero in this config.
# NOTE(review): policy_exp_ratio is written as the integer 0 while
# model_exp_ratio is the float 0.0 -- confirm the consumer accepts both types.
model_exp_ratio: 0.0
policy_exp_ratio: 0

expert_size: 10000


# Training-loop and model-training settings.
# num_steps / epoch_length = 150000 / 1000 = 150, which equals the second
# entry of rollout_schedule below (presumably an epoch index -- confirm).
num_steps: 150000
epoch_length: 1000

# Model training hyperparameters.
# NOTE(review): model_wd is presumably weight decay -- confirm.
num_elites: 5
patience: 5
model_lr: 0.001
model_wd: 0.00001
model_batch_size: 256
validation_ratio: 0.2
freq_train_model: 250

# Rollout settings.
# Alternative value previously noted for this key: 400.
effective_model_rollouts_per_step: 100
# NOTE(review): presumably
# [start_epoch, end_epoch, min_rollout_length, max_rollout_length];
# verify against the code that reads this list.
# Alternative schedule kept for reference: [20, 150, 1, 1]
rollout_schedule: [20, 150, 1, 15]

# Policy update cadence and buffer retention.
num_policy_updates_per_step: 20
policy_updates_every_steps: 1
num_epochs_to_retain_sac_buffer: 1

# SAC agent settings (all keys share the sac_ prefix).
# NOTE(review): per-key meanings are inferred from names; confirm against the
# agent implementation that reads them.
sac_gamma: 0.99
sac_tau: 0.005
sac_alpha: 0.2
sac_policy: 'Gaussian'
sac_target_update_interval: 4

# Entropy tuning is disabled; per the original note, sac_target_entropy is
# ignored while sac_automatic_entropy_tuning is false.
sac_automatic_entropy_tuning: false
sac_target_entropy: 1

# Network size and optimisation settings.
sac_hidden_size: 512
sac_lr: 0.0003
sac_batch_size: 256