# Trainer configuration. The visible section sets two reward constants
# under the RL sub-mapping.
TRAINER:
  # NOTE(review): "RL" presumably stands for reinforcement learning;
  # confirm against the code that consumes this file.
  RL:
    # Positive float. Presumably the reward granted when the task
    # succeeds; TODO confirm where TRAINER.RL.SUCCESS_REWARD is read.
    SUCCESS_REWARD: 10.0
    # Small negative float. Presumably a penalty applied repeatedly
    # (e.g. per step) to discourage idling; TODO confirm with consumer.
    SLACK_REWARD: -0.01
