{
    "agent" : "Frodo",
    "env_name" : "MCSenseSparseBangAux",
    "env_param" : [1],
    "optim" : ["rmsprop"],
    "max_episodes" : [500],
    "gamma" : 0.99,
    "actor_reg" : [0, 0.25, 1],
    "actor_lr" : [0.03125, 0.0625, 0.125],
    "gamma_L2" : [0],
    "reward_L2" : [0, 0.25],
    "reward_lr" : [0.015625, 0.0625, 0.125],
    "gamma_lr" : [0.0],
    "state_lr" : 0.0,
    "critic_lr" : 0.0,
    "batch_size" : [1, 4, 8],
    "buffer_size" : [10, 50, 100],
    "delta" : [3],
    "Neumann_loops" : 0,
    "approx" : "First-order",
    "raw_basis" : false,
    "basis" : "tilecoding",
    "tiles" : 4,
    "inner_mul" : [1, 2, 5],
    "tilings" : 5,
    "NN_basis_dim" : "16",
    "seed" : [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]
}