import numpy as np
# Seed NumPy's global random generator with a fixed value when this module
# is imported. Nothing in the visible code draws random numbers itself.
np.random.seed(21)

class CE_policy:
    """Rule-based policy that switches two controls on the sign of two state entries.

    For each of ``state[4]`` and ``state[5]`` the matching control is set to
    8.0 when the entry is strictly negative and to 1.0 otherwise. The
    resulting pair is passed through ``env._scale_U`` before being returned.
    """

    def __init__(self, env, original_policy):
        """Store the environment and the supplied policy on the instance.

        Args:
            env: Object providing ``_scale_U``, which ``predict`` calls on
                the raw two-element control array.
            original_policy: Kept as ``self.original_policy``; no method of
                this class reads it.
        """
        self.original_policy = original_policy
        self.env = env

    def predict(self, state, deterministic=True):
        """Return the scaled action chosen for ``state``.

        Args:
            state: Indexable observation; only entries 4 and 5 are read.
            deterministic: Accepted but ignored by this method.

        Returns:
            Whatever ``env._scale_U`` returns for the control array. Note
            that only the action is returned, not an ``(action, state)``
            pair.
        """
        high, low = 8.0, 1.0
        # One control per inspected state entry, in the order (4, 5).
        controls = [high if state[idx] < 0.0 else low for idx in (4, 5)]
        return self.env._scale_U(np.array(controls))