(MDP)
	gym-nl2rlang
(Agents)
	RLang-Dyna-Q-plan,0
	RLang-Dyna-Q-effect,1
	RLang-Dyna-Q-combined,2
	Dyna-Q,3
	Random,4
(Params)
	instances : 10
	episodes : 50
	steps : 500
	track_disc_reward : False
