---
# Flat mapping of experiment settings; keys are kept in alphabetical order.
#
# Every string value is single-quoted so its type is explicit. In particular,
# 'None' below is the four-character string, which is a different value from
# the YAML null used by epoch_steps, min_model_epochs, target_entropy and uuid.
# NOTE(review): confirm the consumer really expects the string 'None' (rather
# than null) for is_done_func, load_model_dir and population_model_dirs.
ac_dim: 3  # same value as action_space
action_space: 3  # same value as ac_dim
adapt: 0
augment_offline_data: false
augment_sac: false
comment: 'population_big'
context_type: 'rad_augmentation'
d4rl: true
deterministic_rollouts: false
dir: 'data'
env_name: 'Hopper-v2'
epoch_steps: null  # YAML null
espi: false
filename: 'ModelBased'
fix_std: false
gamma: 0.99
init_collect: 5000
is_done_func: 'None'  # string, not null
l2_reg_multiplier: 1.0
lam: 0
learning_rate: 0.1
load_model_dir: 'None'  # string, not null
log_interval: 100
logvar_head: true
max_timesteps: 10000000
min_model_epochs: null  # YAML null
model_epochs: 2000
model_free: false
model_lr: 0.001
model_retain_epochs: 5
model_train_freq: 1000
mopo: true
mopo_lam: 1.0
mopo_penalty_type: 'mopo_default'
mopo_uncertainty_target: 1.5
n_eval_rollouts: 10
num_elites: 5  # presumably a subset of num_models (7) - TODO confirm
num_models: 7
num_rollouts_per_step: 50
oac: false
ob_dim: 11  # same value as observation_space
observation_space: 11  # same value as ob_dim
offline_epochs: 5000
outer_steps: 3000
pca: 0
policy_iters: 1000
policy_update_steps: 1000
population_model_dirs: 'None'  # string, not null
rad_rollout: false
real_sample_ratio: 0.05
reward_head: true
rollout_model_freq: 250
save_model: false
save_policy: true
seed: 1
sigma: 0.01
states: 'uniform'
steps_k: 10
target_entropy: null  # YAML null
train_memory: 2000000
train_policy_every: 100
train_val_ratio: 0.2
tune_mopo_lam: false
update_timestep: 50000
uuid: null  # YAML null
val_memory: 500000
var_max: false
var_thresh: 100
var_type: 'reward'
zeros: false
