import gymnasium as gym
import numpy as np

from typing import SupportsFloat

from gymnasium.core import ActType, ObsType, WrapperObsType, WrapperActType

from loguru import logger

class NoMovementPenalizingWrapper(gym.RewardWrapper[ObsType, ActType]):
    def __init__(self, env: gym.Env[ObsType, ActType], penalty = 1.0):
        gym.RewardWrapper.__init__(self, env)
        self.penalty = penalty

    def reward(self, reward: SupportsFloat) -> SupportsFloat:
        molecule = self.env.get_wrapper_attr("current_molecule")
        translation = molecule.translated
        if not molecule.rotated and translation.x < 0.1 and translation.y < 0.1:
            return reward - self.penalty
        return reward

