; Run-wide settings.
[GENERAL]
; Presumably the number of training samples/steps per task -- confirm against the loader.
; Note: this is 10x smaller than buffer_params "n_samples" in [DQN] and [SFDQN].
n_samples=100000

; Target definitions. Values are written as Python-style lists of 2-tuples;
; presumably the consumer evaluates them as Python literals -- confirm.
[TASK]
; Four targets, one on each axis direction at distance 0.14 from the origin.
train_targets=[(0.14, 0.0), (-0.14, 0.0), (0.0, 0.14), (0.0, -0.14)]
; Eight targets: four on the axes at distance 0.22, plus the four diagonal
; points (+/-0.1, +/-0.1). None of them coincide with a train target.
test_targets=[(0.22, 0.0), (-0.22, 0.0), (0.0, 0.22), (0.0, -0.22), (0.1, 0.1), (0.1, -0.1), (-0.1, 0.1), (-0.1, -0.1)]

; Settings placed under the generic agent section (as opposed to the
; algorithm-specific [DQN] / [SFDQN] sections).
; NOTE(review): meanings below are inferred from key names -- confirm against the consumer.
[AGENT]
; Presumably the discount factor.
gamma=0.9
; Presumably the exploration rate used during training.
epsilon=0.1
; Presumably the exploration rate used during testing (lower than epsilon).
test_epsilon=0.03
; Presumably the maximum number of steps per episode.
T=500
; The *_ev keys look like "every N" intervals (print / save / test) -- units not shown here.
print_ev=1000
save_ev=200
n_test_ev=1000
; The double quotes are part of the raw value; this only yields the plain
; string task if the consumer strips or evaluates them -- confirm.
encoding="task"

; Settings for the DQN agent.
[DQN]
; Presumably the interval between target-network updates -- confirm units.
target_update_ev=1000
; Dict literal spread over indented continuation lines. This relies on the
; parser supporting indented continuations (e.g. Python configparser); keep
; the continuation lines indented. "n_neurons" and "activations" each have
; two entries (256/relu, 256/relu).
keras_params={
   "n_neurons" : [256, 256],
   "activations" : ["relu", "relu"],
   "learning_rate" : 0.001}
; Dict literal, also continued over indented lines. Presumably "n_samples" is
; the replay-buffer capacity and "n_batch" the minibatch size -- confirm.
buffer_params={
   "n_samples" : 1000000,
   "n_batch" : 32}

; Settings for the SFDQN agent. keras_params and buffer_params carry the same
; values as the ones in [DQN].
[SFDQN]
; Presumably the learning rate for the reward weights w -- confirm.
learning_rate_w=0.5
; Booleans use Python-style capitalisation (True), consistent with the other
; Python-literal values in this file.
; NOTE(review): semantics of these two flags are not visible here -- confirm.
use_true_reward=True
use_gpi=True
; Presumably the interval between target-network updates -- confirm units.
target_update_ev=1000
; Dict literal spread over indented continuation lines. This relies on the
; parser supporting indented continuations (e.g. Python configparser); keep
; the continuation lines indented. "n_neurons" and "activations" each have
; two entries (256/relu, 256/relu).
keras_params={
   "n_neurons" : [256, 256],
   "activations" : ["relu", "relu"],
   "learning_rate" : 0.001}
; Dict literal, also continued over indented lines. Presumably "n_samples" is
; the replay-buffer capacity and "n_batch" the minibatch size -- confirm.
buffer_params={
   "n_samples" : 1000000,
   "n_batch" : 32}