run_name,shield,punish_unsafe_orig_action,punish_unsafe_orig_action_modifier,randomize_starts,map_type,grid_world_map_name,grid_world_obs_type,learner_type,learner_anneal_eps_start,learner_anneal_eps_finish,max_total_steps,seed
IndivQLearningReproTest/0_0_0,centralized,False,0,True,GridWorld,Pentagon,PartialObsDiscrete,Individual_Q,0.2,0.2,1000000,0
IndivQLearningReproTest/1_0_1,centralized,False,0,True,GridWorld,Pentagon,PartialObsDiscrete,Individual_Q,0.2,0.2,1000000,0
IndivQLearningReproTest/2_0_2,centralized,False,0,True,GridWorld,Pentagon,PartialObsDiscrete,Individual_Q,0.2,0.2,1000000,0
