[
  {"policy": "impala", "experiment": "atari_cycle", "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "IMPALA atari consts"},
  {"policy": "impala", "experiment": "atari_cycle", "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "IMPALA atari consts, non-temp"},
  {"policy": "impala", "experiment": "atari_simple", "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "IMPALA atari consts, non-temp"},
  {"policy": "impala", "experiment": "atari_simple", "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "IMPALA atari consts, non-temp, common net"},
  {"policy": "impala", "experiment": "atari_cycle", "use_clear": true, "replay_buffer_frames": 5e6, "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "CLEAR, no behavior cloning"},
  {"policy": "impala", "experiment": "atari_simple", "use_clear": true, "replay_buffer_frames": 5e6, "num_actors": 32, "batch_size": 32, "unroll_length": 20, "entropy_cost": 0.01, "learning_rate": 0.0006, "comment": "CLEAR, no behavior cloning"}
]