[
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 4], "batch_size": 1024, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 4], "batch_size": 1024, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 4], "batch_size": 1024, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 4], "batch_size": 1024, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 4], "batch_size": 1024, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},

  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix"},

  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},

  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "comment": "meta: demotion, nd=0"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_4room_unlock_longer", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},

  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_empty8x8_2room_unlock", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"}
]