; Run-level settings for the experiment.
[GENERAL]
; NOTE(review): presumably the number of training samples (environment steps)
; collected per task -- confirm against the code that loads this file.
n_samples=200000
; NOTE(review): presumably the number of independent repetitions of the whole
; experiment -- confirm.
n_trials=1

; Task definition: 2-D target coordinates plus failure and noise parameters.
[TASK]
; Four points on the coordinate axes, each 0.14 from the origin.
train_targets=[(0.14, 0.0), (0.0, 0.14), (-0.14, 0.0), (0.0, -0.14)]
; Eight points: four on the axes at 0.22 from the origin, and the four
; diagonal points (+/-0.1, +/-0.1).
test_targets=[(0.22, 0.0), (0.0, 0.22), (-0.22, 0.0), (0.0, -0.22), (0.1, 0.1), (-0.1, 0.1), (-0.1, -0.1), (0.1, -0.1)]
; Six points, each of which also appears in train_targets or test_targets.
; NOTE(review): presumably the subset of targets to which the failure
; settings below apply -- confirm.
risky_targets=[(0.14, 0.0), (-0.14, 0.0), (0.22, 0.0), (-0.22, 0.0), (0.1, 0.1), (-0.1, -0.1)]
; NOTE(review): presumably the cost charged when a failure occurs; whether it
; is applied as a negative reward is not visible here.
repair_cost=3.0
; NOTE(review): looks like a baseline failure probability; how it combines
; with the two radii below is not visible here.
fail_prob_base=0.035
; NOTE(review): presumably distances in the same coordinate units as the
; target lists above -- confirm.
fail_radius_large=0.06
fail_radius_small=0.005
; NOTE(review): presumably the scale of random noise added to actions; the
; noise distribution is not visible here.
action_noise=0.03

; Settings that appear to be shared by every agent type.
[AGENT]
; NOTE(review): presumably the reward discount factor -- confirm.
gamma=0.9
; NOTE(review): presumably exploration rates used during training (epsilon)
; and during evaluation (test_epsilon) -- confirm.
epsilon=0.1
test_epsilon=0.03
; NOTE(review): presumably the maximum number of steps per episode -- confirm.
T=500
; NOTE(review): presumably "every N steps" intervals for printing progress
; and saving results; both are set to the same value.
print_ev=1000
save_ev=1000
; The value includes the double quotes. NOTE(review): this suggests the
; loader evaluates values as Python literals; if it reads raw strings instead,
; the quotes become part of the value -- confirm.
encoding="task"
; NOTE(review): presumably evaluation runs every test_frequency samples and
; uses test_rollouts rollouts per evaluation -- confirm.
test_frequency=5000
test_rollouts=5

; Settings for the C51DQN agent.
[C51DQN]
; NOTE(review): presumably the number of atoms in the categorical return
; distribution, with v_min/v_max as the scalar bounds of its support -- confirm.
n_atoms=51
v_min=-30.0
v_max=10.0
; NOTE(review): presumably the interval, in update steps, between target
; network synchronisations -- confirm.
target_update_ev=1000
; Network settings: two entries in "n_neurons" and two in "activations".
; NOTE(review): presumably one entry per hidden layer -- confirm.
; Same values as keras_params in [SFC51DQN] and [SFDQN].
keras_params={
   "n_neurons" : [256, 256],
   "activations" : ["tanh", "tanh"],
   "learning_rate" : 0.001}
; NOTE(review): presumably replay buffer capacity ("n_samples") and minibatch
; size ("n_batch") -- confirm. 800000 is 4x the n_samples value in [GENERAL].
buffer_params={
   "n_samples" : 800000,
   "n_batch" : 32}

; Settings for the SFC51DQN agent.
[SFC51DQN]
; NOTE(review): presumably the number of atoms in each categorical
; distribution -- confirm.
n_atoms=51
; v_min and v_max each have 13 entries; the first 12 are -10.0 / 10.0 and the
; last is 0.0 / 10.0.
; NOTE(review): 12 matches the total of train_targets (4) plus test_targets (8)
; in [TASK], so these look like per-feature support bounds with one extra
; final feature -- confirm against the feature encoding.
v_min=[-10.0, -10.0, -10.0, -10.0, -10.0, -10.0, -10.0, -10.0, -10.0, -10.0, -10.0, -10.0, 0.0]
v_max=[10.0, 10.0, 10.0, 10.0, 10.0, 10.0, 10.0, 10.0, 10.0, 10.0, 10.0, 10.0, 10.0]
; NOTE(review): presumably enables generalized policy improvement -- confirm.
use_gpi=True
; This value (2000000) is larger than n_samples in [GENERAL] (200000).
; NOTE(review): if it is a step interval, plotting may never trigger during a
; run -- confirm that this is intended.
plot_cov_frequency=2000000
; NOTE(review): presumably the interval, in update steps, between target
; network synchronisations -- confirm.
target_update_ev=1000
; Network settings: two entries in "n_neurons" and two in "activations".
; NOTE(review): presumably one entry per hidden layer -- confirm.
; Same values as keras_params in [C51DQN] and [SFDQN].
keras_params={
   "n_neurons" : [256, 256],
   "activations" : ["tanh", "tanh"],
   "learning_rate" : 0.001}
; NOTE(review): presumably replay buffer capacity ("n_samples") and minibatch
; size ("n_batch") -- confirm. 800000 is 4x the n_samples value in [GENERAL].
buffer_params={
   "n_samples" : 800000,
   "n_batch" : 32}

; Settings for the SFDQN agent.
[SFDQN]
; NOTE(review): presumably enables generalized policy improvement -- confirm.
use_gpi=True
; This value (2000000) is larger than n_samples in [GENERAL] (200000).
; NOTE(review): if it is a step interval, plotting may never trigger during a
; run -- confirm that this is intended.
plot_cov_frequency=2000000
; NOTE(review): presumably the interval, in update steps, between target
; network synchronisations -- confirm.
target_update_ev=1000
; NOTE(review): presumably toggles updating of a covariance ("sigma")
; estimate; what exactly is updated is not visible here -- confirm.
update_sigma=True
; Network settings: two entries in "n_neurons" and two in "activations".
; NOTE(review): presumably one entry per hidden layer -- confirm.
; Same values as keras_params in [C51DQN] and [SFC51DQN].
keras_params={
   "n_neurons" : [256, 256],
   "activations" : ["tanh", "tanh"],
   "learning_rate" : 0.001}
; NOTE(review): presumably replay buffer capacity ("n_samples") and minibatch
; size ("n_batch") -- confirm. 800000 is 4x the n_samples value in [GENERAL].
buffer_params={
   "n_samples" : 800000,
   "n_batch" : 32}
