# Flat mapping of scalar settings, one key per line, keys in alphabetical order.
# NOTE(review): the key names suggest hyperparameters for a reinforcement-
# learning run (actor/critic learning rates, a buffer, epsilon-greedy
# exploration). The code that loads this file is not visible here, so every
# per-key note below is an assumption to confirm against that consumer.
activation: ReLU  # plain string; presumably names an activation function/class - confirm
actor_lr: 0.001  # float; presumably the actor's learning rate - confirm
add_interval: 1  # integer; unit (steps vs. episodes) not visible here - TODO confirm
approx: nn  # plain string; presumably selects the function approximator - confirm
buffer_size: 100000  # integer; presumably replay-buffer capacity - confirm
critic_lr: 0.001  # float; presumably the critic's learning rate - confirm
depth: 2  # integer; presumably number of hidden layers - confirm
device: cpu  # plain string; presumably the compute device identifier - confirm
discount: 0.99  # float; presumably the return discount factor - confirm
# NOTE(review): `1` resolves to an integer, unlike the float-valued keys
# (e.g. `max_tmp: 1.0`); confirm the consumer accepts an int here.
eps_decay: 1
eps_end: 0.1  # float; presumably the final epsilon value - confirm
eps_warmup: 0  # integer; unit not visible here - TODO confirm
er_coef: 0.001  # float; meaning of "er" not visible here - TODO confirm
eval_interval: 10  # integer; unit (epochs vs. steps) not visible here - TODO confirm
eval_trials: 10  # integer; presumably evaluation runs per evaluation - confirm
exploit: greedy  # plain string; presumably the evaluation-time policy name - confirm
explore: eps_greedy  # plain string; presumably the training-time policy name - confirm
hidden: 128  # integer; presumably hidden-layer width - confirm
loss_fn: mse_loss  # plain string; presumably looked up by name in the consumer - confirm
max_tmp: 1.0  # float; "tmp" may mean temperature - TODO confirm
minibatch_size: 32  # integer; presumably samples per update - confirm
noise_scale: 0.0  # float; 0.0 presumably disables added noise - confirm
num_samples: 4  # integer; what is being sampled is not visible here - TODO confirm
optimizer: Adam  # plain string; presumably names an optimizer class - confirm
seed: 0  # integer; presumably the random seed - confirm
steps_per_epoch: 10000  # integer
target_update_interval: 100  # integer; presumably steps between target-network syncs - confirm
