import os
os.environ['D4RL_SUPPRESS_IMPORT_ERROR'] = '1'
import sys
sys.path.insert(1, os.path.join(sys.path[0], '..'))
import gym
import d4rl
import numpy as np
from utils.utils import set_seed


class Ant:
    """Thin wrapper around the d4rl ``ant-random-v2`` Gym environment.

    Attributes:
        state_dim: Observation shape advertised to callers, ``(111,)``.
        action_dim: Number of action components advertised to callers, ``8``.
        env: The environment object returned by ``gym.make``.
        state: Observation returned by the most recent ``step`` call, or
            ``None`` if ``step`` has not been called yet.
    """

    def __init__(self, seed=None):
        """Create and seed the environment.

        Args:
            seed: Seed passed to ``set_seed`` and to the unwrapped
                environment. When ``None``, a seed in ``[0, 1e5)`` is drawn
                from NumPy's global RNG at construction time.
        """
        if seed is None:
            # Draw the fallback seed per instance. A default written as
            # `seed=np.random.randint(...)` in the signature is evaluated
            # only once, when the `def` statement runs, so every
            # default-constructed instance would share one seed.
            seed = np.random.randint(int(1e5))
        set_seed(seed)
        self.state_dim = (111,)
        self.action_dim = 8
        # The d4rl env is loaded (instead of plain 'Ant-v2') for the
        # convenience of getting the normalized score from d4rl.
        self.env = gym.make('ant-random-v2')
        self.env.unwrapped.seed(seed)
        self.env._max_episode_steps = np.inf  # control timeout setting in agent
        self.state = None

    def reset(self, seed=None):
        """Reset the environment and return whatever ``env.reset`` returns.

        Args:
            seed: Optional seed forwarded to ``env.reset``. When ``None``,
                ``env.reset`` is called without a ``seed`` keyword.
        """
        if seed is None:
            return self.env.reset()
        return self.env.reset(seed=seed)

    def step(self, a):
        """Advance the environment by one step.

        Args:
            a: Indexable container of actions; only ``a[0]`` is forwarded to
                the environment.

        Returns:
            Tuple ``(state, reward, done, info)`` where the first three
            entries are converted with ``np.asarray`` and ``info`` is passed
            through unchanged.
        """
        state, reward, done, info = self.env.step(a[0])
        self.state = state  # remember the latest observation
        return np.asarray(state), np.asarray(reward), np.asarray(done), info

    def get_visualization_segment(self):
        """Not supported for this environment."""
        raise NotImplementedError

    def get_useful(self, state=None):
        """Return ``state`` if one is given, else the environment's state.

        Args:
            state: Optional state to pass through unchanged.

        Returns:
            ``state`` when it is not ``None``; otherwise
            ``np.array(self.env.state)``.
        """
        # Compare against None explicitly: the truth value of a
        # multi-element NumPy array is ambiguous and raises ValueError.
        if state is not None:
            return state
        # NOTE(review): relies on the wrapped env exposing a `state`
        # attribute; confirm that the Ant env provides one.
        return np.array(self.env.state)

    def info(self, key):
        """Placeholder hook; ignores ``key`` and returns ``None``."""
        return None


if __name__ == "__main__":
    # Smoke test: build the environment, print its advertised dimensions,
    # then reset it and take one randomly sampled action.
    env = Ant()
    print(env.state_dim)
    print(env.action_dim)
    # Pass the seed explicitly so the call is valid whether or not
    # `Ant.reset` provides a default for it.
    print(env.reset(seed=0))
    # `Ant.step` forwards only a[0], so wrap the sampled action in a list.
    print(env.step([env.env.action_space.sample()]))
