(MDP)
	gym-test
(Agents)
	Q-learning,0
(Params)
	instances : 1
	episodes : 10000
	steps : 200
	track_disc_reward : False
