{"ep_states": [[{"players": [{"position": [1, 2], "orientation": [0, -1], "held_object": null}, {"position": [3, 1], "orientation": [0, -1], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 0}, {"players": [{"position": [1, 2], "orientation": [0, -1], "held_object": null}, {"position": [3, 1], "orientation": [0, -1], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 1}, {"players": [{"position": [1, 2], "orientation": [0, -1], "held_object": null}, {"position": [3, 1], "orientation": [0, -1], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 2}, {"players": [{"position": [1, 2], "orientation": [0, 1], "held_object": null}, {"position": [3, 1], "orientation": [0, -1], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 3}, {"players": [{"position": [1, 2], "orientation": [-1, 0], "held_object": null}, {"position": [3, 1], "orientation": [0, -1], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 4}, {"players": [{"position": [1, 1], "orientation": [0, -1], "held_object": null}, {"position": [3, 1], "orientation": [0, -1], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 5}, {"players": [{"position": [1, 1], "orientation": [-1, 0], "held_object": null}, {"position": [3, 2], "orientation": [0, 1], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 6}, {"players": [{"position": [1, 1], "orientation": [-1, 0], "held_object": {"name": "onion", "position": [1, 1]}}, {"position": [2, 2], "orientation": [-1, 0], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 7}, {"players": [{"position": [1, 1], "orientation": [-1, 0], "held_object": {"name": "onion", "position": [1, 1]}}, {"position": [2, 2], "orientation": [-1, 0], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 8}, {"players": [{"position": [2, 1], "orientation": [1, 0], "held_object": {"name": "onion", "position": [2, 1]}}, {"position": [1, 2], "orientation": [-1, 0], "held_object": null}], "objects": [], "bonus_orders": [{"ingredients": ["onion", "tomato"]}], "all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["onion", "tomato"]}], "timestep": 9}]], "ep_actions": [[["interact", "interact"], [[0, 0], [0, 0]], [[0, 1], [0, 0]], [[-1, 0], [0, 0]], [[0, -1], [0, 0]], [[-1, 0], [0, 1]], ["interact", [-1, 0]], [[0, 0], "interact"], [[1, 0], [-1, 0]], [[0, 1], [0, -1]]]], "ep_rewards": [[0, 0, 0, 0, 0, 0, 0, 20, 0, 0]], "ep_dones": [[false, false, false, false, false, false, false, false, false, true]], "ep_returns": [0], "ep_lengths": [10], "mdp_params": [{"layout_name": "cramped_room_tomato", "terrain": [["X", "X", "P", "X", "X"], ["O", " ", " ", " ", "T"], ["X", " ", " ", " ", "X"], ["X", "D", "X", "S", "X"]], "start_player_positions": [[1, 2], [3, 1]], "start_bonus_orders": [{"ingredients": ["tomato", "onion"]}], "rew_shaping_params": {"PLACEMENT_IN_POT_REW": 3, "DISH_PICKUP_REWARD": 3, "SOUP_PICKUP_REWARD": 5, "DISH_DISP_DISTANCE_REW": 0, "POT_DISTANCE_REW": 0, "SOUP_DISTANCE_REW": 0}, "start_all_orders": [{"ingredients": ["onion", "onion", "onion"]}, {"ingredients": ["tomato", "tomato", "tomato"]}, {"ingredients": ["tomato", "onion"]}]}], "env_params": [{"start_state_fn": null, "horizon": 10, "info_level": 1, "_variable_mdp": true}]}