{
    "agent" : "REINFORCE",
    "env_name" : "Maze_badreward",
    "optim" : ["rmsprop"],
    "max_episodes" : 2000,
    "gamma" : 0.99,
    "actor_reg" : [0.25],
    "actor_lr" : [0.005, 0.001],
    "state_lr" : 0.001,
    "critic_lr" : 0.005,
    "batch_size" : 1,
    "buffer_size" : [15, 100, 1000],
    "raw_basis" : false,
    "NN_basis_dim" : "16",
    "delta" : 3,
    "seed" : [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40]
}
