(MDP)
	gym-MidMaze
(Agents)
	RLang-Dyna-Q-plan,0
	Dyna-Q,1
(Params)
	instances : 1
	episodes : 20
	steps : 1000
	track_disc_reward : False
