(MDP)
	gridworld_h-10_w-10
(Agents)
	Q-learning,0
	Random,1
	Q-learning-abstr,2
(Params)
	instances : 5
	episodes : 100
	steps : 150
	track_disc_reward : False
