class HumanPolicy:
    """Policy that forwards action selection to an agent owned by the environment.

    The policy stores the most recent observation handed to ``observe`` and,
    on ``act``, passes it together with the environment's current
    ``gametimestamp`` to ``env.agents[agent_id]._agent.runstep``.
    """

    def __init__(self, env, agent_id) -> None:
        """Bind the policy to an environment and one of its agents.

        Args:
            env: Environment object; ``act`` reads its ``agents`` collection
                and its ``gametimestamp`` attribute.
            agent_id: Key or index used to look this policy's agent up in
                ``env.agents``.
        """
        self.env = env
        self.agent_id = agent_id
        # Defined up front so the attribute always exists: calling ``act``
        # before the first ``observe`` forwards ``None`` instead of failing
        # with an AttributeError on a missing ``obs`` attribute.
        self.obs = None

    def observe(self, obs) -> None:
        """Store ``obs`` as the latest observation, replacing any previous one."""
        self.obs = obs

    def act(self):
        """Return the result of the wrapped agent's ``runstep`` call.

        The agent is looked up on every call, so changes to ``env.agents`` or
        ``env.gametimestamp`` between calls are picked up. The stored
        observation is ``None`` until ``observe`` has been called.
        """
        agent = self.env.agents[self.agent_id]._agent
        return agent.runstep(self.obs, self.env.gametimestamp)
