0 # initial state (id of the state the machine starts in)
[2] # terminal state(s), given as a list of state ids
(0,0,'!a',ConstantRewardFunction(0)) # presumably (source, target, condition, reward) -- TODO confirm field order against the loader; here: 0 -> 0 under '!a', constant 0
(0,1,'a',ConstantRewardFunction(0)) # 0 -> 1 under 'a', constant 0
(1,1,'!b',ConstantRewardFunction(0)) # 1 -> 1 under '!b', constant 0
(1,2,'b',ConstantRewardFunction(1)) # 1 -> 2 under 'b'; 2 is listed as terminal above, and this is the only entry with a non-zero constant (1)