{
    "agent" : "Barfi",
    "env_name" : "Maze_badreward",
    "optim" : ["rmsprop"],
    "max_episodes" : 2000,
    "gamma" : 0.99,
    "actor_reg" : [0.25],
    "gamma_L2" : [0.06125, 0.25, 1, 4.0, 16.0],
    "reward_L2" : [0, 0.06125],
    "reward_lr" : [0.005],
    "gamma_lr" : [0.005],
    "actor_lr" : [0.005, 0.001],
    "state_lr" : 0.001,
    "critic_lr" : 0.005,
    "batch_size" : 1,
    "buffer_size" : [1000],
    "delta" : 3,
    "Neumann_loops" : 0,
    "Neumann_alpha" : [0],
    "approx" : "First-order",
    "raw_basis" : false,
    "NN_basis_dim" : "16",
    "seed" : [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40]
}
