import time

import numpy as np

import gym


def main(num_steps=500, frame_delay=0.1):
    """Render a randomly-acting LunarLander while poking at its ``state``.

    The script drives ``LunarLander-v2`` with uniformly random actions,
    rendering every frame, and performs two experiments along the way:
    a forced ``reset()`` after step 80 and an assignment of a hand-written
    state vector after step 150.

    Args:
        num_steps: Number of environment steps to run.
        frame_delay: Seconds to sleep after rendering each frame.
    """
    env = gym.make("LunarLander-v2")
    try:
        state = env.reset()

        # Write through ``unwrapped`` so the attribute lands on the base
        # environment rather than on whichever wrapper gym.make() put on top.
        # NOTE(review): whether the environment actually honors an assigned
        # ``state`` is not visible from this script -- confirm before relying
        # on it.
        env.unwrapped.state = state
        env.render()

        # Ask the environment how many discrete actions it has instead of
        # hard-coding the count.
        num_actions = env.action_space.n

        for idx in range(num_steps):
            action = np.random.randint(num_actions)
            state, _reward, is_terminal, _ = env.step(action)

            # Stepping a finished episode is undefined in Gym, so start a new
            # one as soon as the episode ends. Step 80 additionally forces a
            # reset mid-episode as part of the experiment.
            if is_terminal or idx == 80:
                state = env.reset()
            if idx == 150:
                state = np.array([0.0113451, 1.385503, 0.5683772,
                                  -0.5773779, -0.01126716,
                                  -0.09319402, 0., 0.], dtype=np.float32)
                # Same target object as the initial assignment above; setting
                # the attribute on the wrapper would never reach the base env.
                env.unwrapped.state = state
            print(idx)
            env.render()
            time.sleep(frame_delay)
    finally:
        # Always release the simulator and its render window, even if a step
        # or render call raises.
        env.close()


if __name__ == "__main__":
    main()


# for idx, state in enumerate(states):
#     env.env.state = state
#
#     env.render()
#     time.sleep(.1)
#     print(idx, env.state)
#
