[
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": ""},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": ""},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "atari consts"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 32, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "atari consts, smaller bat"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "atari consts, smaller bat, fewer actors"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 4, "batch_size": 4, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "atari consts, smaller bat, fewer actors"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 3, "num_train_meta": 2, "num_train_long_term": 4, "num_train_short_term": 4, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "comment": "common net, 500/750/1M"},
  {"policy": "sane", "experiment":"recall_minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [10, 4], "batch_size": 4096, "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "comment": "common net, 500/750/1M"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "epsilon": 0.02, "comment": "atari consts, smaller bat, fewer actors, more eps"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "epsilon": 0.02, "comment": "atari consts, smaller bat, fewer actors, more eps"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.003, "epsilon": 0.02, "comment": "atari consts, smaller bat, fewer actors, more eps, no force eval rolling"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "epsilon": 0.02, "comment": "atari consts, smaller bat, fewer actors, more eps, no force eval rolling"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 4, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "epsilon": 0.02, "comment": "atari consts, smaller bat, fewer actors, more eps, no force eval rolling"},
  {"policy": "impala", "experiment":"recall_minigrid_empty8x8_2room_unlock", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "epsilon": 0.02, "comment": "atari consts, smaller bat, fewer actors, more eps, no force eval rolling"}
]