# Flat mapping of scalar settings. Every value is an integer except
# `auto_alpha` (boolean) and `alpha` (float).
# NOTE(review): the per-key notes below are inferred from key names only;
# confirm each one against the code that consumes this file.

# NOTE(review): meaning of "adm" is not visible here -- TODO confirm.
max_adm_step: 2
# presumably the hidden-layer width of a learned model -- verify.
model_hidden_dim: 400
# NOTE(review): unclear what is being started twice -- TODO confirm.
n_starts: 2
# presumably the number of rollouts generated per batch -- verify.
rollout_batch_size: 5000
# presumably the weight applied to a penalty term -- verify.
penalty_coef: 5

# Booleans are written in canonical lowercase (`true` / `false`) so that
# YAML 1.1 and YAML 1.2 loaders agree on the type.
auto_alpha: false
# presumably the fixed value used while `auto_alpha` is false -- verify.
alpha: 0.2

# presumably the number of training epochs -- verify.
n_epochs: 5000