from abc import ABC, abstractmethod
from typing import List, Union, Dict
import gymnasium as gym
import numpy as np
import torch
from minigrid.wrappers import FullyObsWrapper


def seed_everything(seed):
    np.random.seed(seed)
    torch.manual_seed(seed)

class DataGenerator(ABC):
    def __init__(self, env="CliffWalking-v0", type="binary_feedback", distribution="traverse"):
        self.env = gym.make(env)
        self.type = type
        self.distribution = distribution
        self.state_array = None

    @abstractmethod
    def sample_array_of_states(self, number) -> np.array:
        pass

    @abstractmethod
    def sample_array_of_trajectories(self, number) -> List[Dict]:
        pass

    @abstractmethod
    def get_expert_actions(self, state) -> List:
        pass

    @abstractmethod
    def get_expert_value(self, state) -> float:
        pass

    @abstractmethod
    def get_expert_qvalue(self, state, action) -> float:
        pass

    def get_expert_binary_feedback(self, state, action) -> int:
        """
        This function returns the binary feedback that the expert would give for a given state-action pair.
        :param state:
        :param action:
        :return: 1, positive, -1 negative
        TODO: indifferent feedback?
        """
        expert_actions = self.get_expert_actions(state)
        if action in expert_actions:
            return 1
        else:
            return -1

    def get_expert_preference(self, state, action1, action2) -> int:
        expert_q1 = self.get_expert_qvalue(state, action1)
        expert_q2 = self.get_expert_qvalue(state, action2)
        if expert_q1 > expert_q2:
            return 1
        elif expert_q1 == expert_q2:
            return 0
        else:
            return -1

    def get_expert_action_advising(self, state) -> List:
        """
        This function returns the action that the expert would advise in a given state.
        TODO: Do we want stochastic or deterministic advising?
        :param state: np.array of single action
        :return:
        """
        expert_actions = self.get_expert_actions(state)
        return (expert_actions)
