import gym
from gym.wrappers import GrayScaleObservation, ResizeObservation, FrameStack, ClipAction
import numpy as np
import cv2
import pyglet

env = gym.make("CarRacing-v1")
env = ResizeObservation(env, shape=(128, 128))



done = False
obs = env.reset()

# 获取动作空间
action_space = env.action_space
# 获取动作空间的最大值和最小值
max_action = action_space.high
min_action = action_space.low

print("Maximum action values:", max_action)
print("Minimum action values:", min_action)

time_step = 0
while not done:
    action = np.array([0, 0.2, 0])
    # action = env.action_space.sample()  # 随机采样一个动作
    obs, reward, done, info = env.step(action)
    if time_step % 20 == 0:
        post_action_image = env.render(mode='rgb_array')
        print("action:", action)
        print("obs:", obs.shape)
        print("post_action_image:", post_action_image.shape)

        cv2.imwrite('C:/doctor/LLM_RL/dmc2gym/images/{}.png'.format(time_step), post_action_image)
        print("-----------------------------------------------")

    time_step = time_step + 1

    if time_step == 500:
        break

env.close()