from options.Option import Option


class Experience:
    def __init__(self, state: int, target_state: int, action: int, option: Option, reward: float, 
                 next_state: int, next_target_state: int, context_at_option_start: int = None,
                 duration_idx: int = 0, committed_duration: int = 1, mouse_direction: int = 0):
        self.state = state
        self.target_state = target_state  # Current target position (e.g. mouse) - for meta-policy
        self.action = action
        self.option = option
        self.reward = reward
        self.next_state = next_state
        self.next_target_state = next_target_state
        # Context when option started - for termination (may be stale)
        # If None, defaults to target_state (backward compatible)
        self.context_at_option_start = context_at_option_start if context_at_option_start is not None else target_state
        # Duration commitment: index into DURATIONS list and actual duration value
        self.duration_idx = duration_idx
        self.committed_duration = committed_duration
        # Mouse direction at option start (for chase environment)
        self.mouse_direction = mouse_direction