# Configuration entry labelled 'q_learning' with two numeric parameters.
# NOTE(review): the parameter meanings noted below are inferred only from
# the key names and the 'q_learning' label; confirm against the code that
# loads this file.
name: 'q_learning'
# Presumably the learning rate (update step size) -- TODO confirm.
# If so, 1.0 would make each update fully replace the previous estimate.
alpha: 1.0
# Presumably the discount factor applied to future rewards -- TODO confirm.
gamma: 0.97