[
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.90625, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.9375, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},
  {"policy": "impala", "experiment":"minigrid_empty8x8_2room_unlock_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, shorter"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_4room", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_4room", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_4room", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_4room", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_4room", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridor", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridor", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridor", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridor", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridor", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},

  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "comment": "meta: demotion, nd=0"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.90625, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.90625, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.90625, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.90625, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.90625, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.9375, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.9375, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.9375, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.9375, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.9375, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},

  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 4, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},

  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly shorter"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly shorter"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_pseudo_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 2"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},

  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, early stop fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix, CL 3"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix, CL 3"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10"},

  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, early stop fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},

  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, early stop fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},

  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, early stop fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},

  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, early stop fix v2"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},

  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0, tree viz"},
  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0, tree viz"},

  {"policy": "sane", "experiment":"mnist_sequential_full", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0, "max_hypotheses_per_layer": [20, 4], "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "batch_size": 1024, "random_action_rate": 0.04, "comment": "train viz"},

  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0, tree viz"},
  {"policy": "sane", "experiment":"mnist_sequential_full", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0, "max_hypotheses_per_layer": [20, 4], "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "batch_size": 1024, "random_action_rate": 0.04, "comment": "train viz"},

  {"policy": "sane", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0.99, "max_hypotheses_per_layer": [20, 8], "batch_size": 4096, "max_processes": 32, "timesteps_per_collection": 250, "num_parallel_envs": 8, "merge_ratio": 1, "num_train_long_term": 1, "num_train_short_term": 1, "num_train_meta": 1, "allowed_error_scale": 0.5, "random_action_rate": 0.04, "comment": "meta: demotion, nd=0, tree viz, timestep label"},
  {"policy": "sane", "experiment":"mnist_sequential_full", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0, "max_hypotheses_per_layer": [20, 4], "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "batch_size": 1024, "random_action_rate": 0.04, "comment": "train viz, timestep label"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3"},

  {"policy": "sane", "experiment":"mnist_sequential_full", "use_cuda": false, "filter_learning_rate": 1e-3, "reward_decay_rate":0, "max_hypotheses_per_layer": [20, 4], "max_processes": 100, "timesteps_per_collection": 1000, "num_parallel_envs": 1, "batch_size": 1024, "random_action_rate": 0.04, "comment": "train viz, timestep label, NO new hypo nd=0"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},

  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.001, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},

  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},
  {"policy": "impala", "experiment":"mnist_sequential_full", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 1, "batch_size": 128, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.001, "discounting":0, "replay_ratio": 0.96875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "CL freq=2, reward fix, post counting fix, clone loss fix v2, CL every 10, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 1, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "epsilon": 0.04, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "epsilon": 0.04, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "epsilon": 0.04, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.01, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": ""},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.01, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.01, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},

  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.005, "learning_rate": 0.001, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},

  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 10, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 80, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 80, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 32, "batch_size": 32, "unroll_length": 10, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 32, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 32, "batch_size": 8, "unroll_length": 80, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 16, "batch_size": 8, "unroll_length": 160, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 16, "batch_size": 4, "unroll_length": 160, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 4, "unroll_length": 160, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 4, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 16, "batch_size": 8, "unroll_length": 80, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 4, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 16, "unroll_length": 80, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 4, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 16, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.006, "num_learner_threads": 4, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 16, "unroll_length": 20, "entropy_cost": 0.001, "learning_rate": 0.006, "num_learner_threads": 4, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 16, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 4, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 16, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},

  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1_stop_early", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.875, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},
  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.5, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"},

  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.00005, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 8, "batch_size": 16, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 40, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.01, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.001, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 16, "unroll_length": 20, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 80, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},
  {"policy": "impala", "experiment":"minigrid_keycorridorS3R1", "use_clear": false, "net_flavor": "default", "num_actors": 4, "batch_size": 16, "unroll_length": 80, "entropy_cost": 0.0001, "learning_rate": 0.006, "num_learner_threads": 1, "large_file_path": "/scratch/<redacted>/tmp", "comment": "Minor IMPALA fixes"},

  {"policy": "impala", "experiment":"minigrid_2room_unlock_keycorridorS3R1", "use_clear": true, "replay_buffer_frames": 409600, "net_flavor": "default", "num_actors": 4, "batch_size": 8, "unroll_length": 20, "entropy_cost": 0.005, "learning_rate": 0.006, "num_learner_threads": 1, "replay_ratio": 0.75, "large_file_path": "/scratch/<redacted>/tmp", "comment": "post reward fix, post counting fix, clone loss fix v2, slightly longer, early stop fix v2, CL 3, load fix"}
]