import math
from env_MA_box import VectorEnv
import argparse
import pdb
import numpy as np
def main(args):
    robot_config = [{'lifting_robot': 2}]
    #robot_config = [{'throwing_robot': 2}]
    #robot_config = [{'lifting_robot': 2}, {'throwing_robot': 2}]

    env = VectorEnv(use_egl_renderer=False, show_gui=True, robot_config = robot_config, room_length=1, room_width=1, obs_radius = 2, termination_step = 10000,  target_pos = [0.3, 0.3], target_width = 0.4, num_cubes = 10)
    state = env.reset()
    print("state", state[0].shape)

    #pdb.set_trace()

    # while True:
    #     a = input("input:").split(" ")
    #     for i in range(300):
    #         action = [float(a[0]), float(a[1]), float(a[2]), float(a[3])]
    #         state, reward, done, _ = env.step(action)
    #         print(reward)
    #         print("state1", state[0])
    #         print("state2", state[1])
    #         if done:
    #             print("done", reward)
    #             break
    #     if done:
    #         print(reward)
    #         print("done", reward)
    #         break

    # while True:
    #     for i in range(300):
    #         action = [float(state[0][6]) * 0.85, float(state[0][7]) * 0.85, float(state[0][9]) * 0.85, float(state[0][10]) * 0.85]
    #         state, reward, done, _ = env.step(action)
    #         print(reward)
    #         if done:
    #             print("done", reward)
    #             break
    #     if done:
    #         print(reward)
    #         print("done", reward)
    #         break


    while True:
        action = np.random.randn(4)
        action = np.clip(action, -1, 1)

        state, reward, done, _ = env.step(action)
        print("state", state[0].shape)
        print(reward)
        if done:
            print("done", reward)
            break

                        

parser = argparse.ArgumentParser()
main(parser.parse_args())