class Agent:
    def __init__(self):
        self.observation_reason_action_history = []
    
    def reset(self):
        self.observation_reason_action_history = []
    
    def update_history(self, observation, reason, action):
        self.observation_reason_action_history += [{'observation': observation, 'reason': reason, 'action': action}]

    def predict_reason_action(self, task, observation, candidate_actions, reward):
        pass
