[
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.243.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.746.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.249.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.246.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.291.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.295.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.746.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.249.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.742.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.794.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.243.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.755.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.249.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.742.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.246.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.248.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.746.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.755.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.34.748.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.742.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.246.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.794.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.295.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.291.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.246.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.794.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.248.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.249.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.755.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.794.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.248.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.34.748.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.249.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.797.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.248.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.291.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.797.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.246.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.295.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.797.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.243.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.295.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.755.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.797.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.295.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.34.748.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.246.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.246.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.797.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.295.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.755.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.249.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.246.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.742.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.295.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.755.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.246.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.28.794.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.291.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.31.755.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.246.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.755.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.243.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.252.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.248.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.246.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.291.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.27.249.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.30.797.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.34.248.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png"
    }
  },
  {
    "instruction": "Proceed from your current location through the main door, and find the refrigerator in the living room.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.755.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.291.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.33.755.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.34.748.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.29.742.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.26.243.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.32.246.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.252.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.757.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.253.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.801.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.256.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.301.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.251.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.757.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.253.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.801.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.301.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.39.754.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.256.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.759.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.253.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.801.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.256.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.802.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.301.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.251.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.759.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.801.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.256.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.759.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.800.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.39.252.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.251.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.802.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.256.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.759.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.251.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.39.252.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.301.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.757.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.253.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.759.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.251.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.802.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.252.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.757.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.800.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.39.754.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.251.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.802.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.39.252.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.757.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.301.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.35.252.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.37.759.png"
    }
  },
  {
    "instruction": "Circle around the dining room and search for the dining table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.802.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.39.252.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.39.754.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.301.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.38.251.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.36.253.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.40.800.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.257.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.802.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.304.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.296.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.295.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.802.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.304.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.779.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.808.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.257.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.304.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.779.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.305.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.298.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.779.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.257.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.808.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.305.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.807.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.303.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.305.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.808.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.295.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.792.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.305.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.808.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.303.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.295.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.52.302.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.808.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.303.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.779.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.303.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.295.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.295.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.808.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.296.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.295.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.303.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.295.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.296.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.802.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.298.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.303.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.296.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.257.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.805.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.295.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.296.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.303.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.792.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.298.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.303.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.805.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.802.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.804.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.303.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.805.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.298.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.779.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.52.775.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.302.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.295.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.805.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.298.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.792.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.303.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.779.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.303.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.298.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.295.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.801.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.296.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.805.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.52.302.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.295.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.792.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.48.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.806.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.52.775.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.807.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.295.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.792.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.296.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.52.302.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.304.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.43.792.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.41.257.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.50.792.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.296.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.807.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.49.794.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.44.305.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.47.296.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.52.775.png"
    }
  },
  {
    "instruction": "Leave the dining room, proceed into the living room, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.296.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.51.807.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.52.302.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.42.304.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.53.301.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.45.303.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.46.295.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.53.803.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.307.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.806.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.301.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.806.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.307.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.307.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.806.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.301.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.307.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.292.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.809.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.806.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.301.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.806.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.798.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.798.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.292.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.301.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.806.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.307.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.292.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.305.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.809.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.806.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.806.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.307.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.798.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.301.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.00.301.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.798.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.806.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.307.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.798.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.292.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.00.301.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.292.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.305.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.53.803.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.798.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.292.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.798.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.307.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.305.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.53.803.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.292.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.798.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.305.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.00.301.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.798.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.292.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.53.803.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.798.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.305.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.301.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.809.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.55.806.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.53.803.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.305.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.292.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.307.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.00.301.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.54.806.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.53.803.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.292.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.809.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.00.792.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.798.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.01.305.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.56.798.png"
    }
  },
  {
    "instruction": "Exit the living room, proceed to the balcony, and locate the side table there.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.292.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.59.809.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.00.301.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.58.796.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.00.792.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.37.57.798.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.01.305.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.01.789.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.306.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.792.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.308.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.290.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.799.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.306.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.792.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.308.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.290.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.292.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.292.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.792.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.308.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.807.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.803.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.306.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.799.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.308.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.290.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.292.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.807.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.287.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.290.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.803.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.807.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.799.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.807.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.290.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.803.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.287.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.799.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.292.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.04.803.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.807.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.292.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.09.793.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.799.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.807.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.807.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.292.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.09.793.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.07.284.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.306.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.01.789.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.807.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.292.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.807.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.02.792.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.292.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.292.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.807.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.07.284.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.799.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.308.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.807.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.07.284.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.292.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.09.793.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.305.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.06.292.png"
    }
  },
  {
    "instruction": "Depart from the balcony, pass through the corridor, enter the activity room on the left, and approach the billiard table.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.07.284.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.292.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.08.799.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.287.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.05.807.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.308.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.03.805.png"
    }
  },
  {
    "instruction": "Depart from the billiard table, proceed into the cat activity room that contains a cat tree, and approach the litter box.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.09.793.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.287.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.802.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.11.801.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.13.293.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.798.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.306.png"
    }
  },
  {
    "instruction": "Depart from the billiard table, proceed into the cat activity room that contains a cat tree, and approach the litter box.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.287.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.802.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.11.303.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.290.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.306.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.09.793.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.798.png"
    }
  },
  {
    "instruction": "Depart from the billiard table, proceed into the cat activity room that contains a cat tree, and approach the litter box.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.802.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.11.303.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.11.801.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.798.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.09.793.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.13.805.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.306.png"
    }
  },
  {
    "instruction": "Depart from the billiard table, proceed into the cat activity room that contains a cat tree, and approach the litter box.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.11.303.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.11.801.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.290.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.798.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.802.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.306.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.13.293.png"
    }
  },
  {
    "instruction": "Depart from the billiard table, proceed into the cat activity room that contains a cat tree, and approach the litter box.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.11.801.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.290.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.798.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.13.293.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.13.805.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.802.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.306.png"
    }
  },
  {
    "instruction": "Depart from the billiard table, proceed into the cat activity room that contains a cat tree, and approach the litter box.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.290.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.12.798.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.13.293.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.10.802.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.09.793.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.306.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.13.805.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.805.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.307.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.821.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.806.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.799.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.304.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.804.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.307.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.821.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.304.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.795.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.804.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.300.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.298.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.821.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.304.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.804.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.305.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.305.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.300.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.806.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.304.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.804.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.298.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.305.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.806.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.805.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.307.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.804.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.298.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.806.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.809.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.795.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.821.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.305.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.298.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.806.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.305.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.809.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.300.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.304.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.14.805.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.806.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.305.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.795.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.304.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.300.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.821.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.799.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.305.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.795.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.300.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.305.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.804.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.806.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.17.298.png"
    }
  },
  {
    "instruction": "Exit the cat activity room, proceed into the billiard activity room, and move toward the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.18.795.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.300.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.19.799.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.809.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.16.304.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.15.821.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.305.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.809.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.21.292.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.21.805.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.800.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.799.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.23.295.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.806.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.21.292.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.21.805.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.22.299.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.802.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.800.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.21.805.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.22.299.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.23.295.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.297.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.299.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.798.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.22.299.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.23.295.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.21.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.300.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.306.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.806.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.23.295.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.798.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.299.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.22.299.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.802.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.798.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.306.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.311.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.20.809.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.297.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.299.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.798.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.306.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.802.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.311.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.800.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.799.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.306.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.802.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.299.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.311.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.22.299.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.300.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.802.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.299.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.799.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.853.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.22.299.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.800.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.299.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.799.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.300.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.297.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.23.295.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.798.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.22.299.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.799.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.300.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.21.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.806.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.23.295.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.300.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.297.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.802.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.297.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.853.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.805.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.297.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.806.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.800.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.853.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.297.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.26.299.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.297.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.806.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.297.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.798.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.311.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.24.304.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.800.png"
    }
  },
  {
    "instruction": "Depart from the activity room, proceed into the hallway, move to the right, enter the bedroom, and find the desktop computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.28.806.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.297.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.29.853.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.27.300.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.30.800.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.23.295.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.25.306.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.31.304.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.304.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.855.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.307.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.850.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.310.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.304.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.855.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.310.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.34.304.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.854.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.849.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.855.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.310.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.850.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.34.304.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.854.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.310.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.850.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.34.304.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.351.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.849.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.854.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.850.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.34.304.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.849.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.307.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.312.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.304.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.34.304.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.351.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.304.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.31.304.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.312.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.310.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.351.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.849.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.854.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.312.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.31.304.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.350.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.351.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.849.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.312.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.31.304.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.854.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.350.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.304.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.849.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.312.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.854.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.854.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.855.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.304.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.33.310.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.312.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.854.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.350.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.35.805.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.307.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.855.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, pass the adjacent bed, proceed to the balcony, and approach the rocking chair",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.37.854.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.350.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.38.854.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.36.849.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.32.855.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.307.png"
    }
  },
  {
    "instruction": "Depart from the rocking chair on the balcony, proceed into the bedroom, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.352.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.843.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.842.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.358.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.857.png"
    }
  },
  {
    "instruction": "Depart from the rocking chair on the balcony, proceed into the bedroom, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.352.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.843.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.355.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.842.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.358.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.346.png"
    }
  },
  {
    "instruction": "Depart from the rocking chair on the balcony, proceed into the bedroom, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.843.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.355.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.857.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.352.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.842.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.346.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.358.png"
    }
  },
  {
    "instruction": "Depart from the rocking chair on the balcony, proceed into the bedroom, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.355.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.857.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.358.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.346.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.846.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.842.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.352.png"
    }
  },
  {
    "instruction": "Depart from the rocking chair on the balcony, proceed into the bedroom, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.857.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.358.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.842.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.846.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.346.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.843.png"
    }
  },
  {
    "instruction": "Depart from the rocking chair on the balcony, proceed into the bedroom, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.358.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.842.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.346.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.843.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.355.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png"
    }
  },
  {
    "instruction": "Depart from the rocking chair on the balcony, proceed into the bedroom, and approach the television.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.42.842.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.346.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.43.846.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.41.857.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.40.843.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.39.854.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.839.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, proceed into the nearby bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.839.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.356.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, proceed into the nearby bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.839.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.356.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.852.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, proceed into the nearby bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.356.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.852.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, proceed into the nearby bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.852.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.833.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.839.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, proceed into the nearby bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.839.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.852.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, proceed into the nearby bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.833.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.352.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.44.839.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, proceed into the nearby bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.45.852.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.833.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.833.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.833.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.833.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.833.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.345.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.48.341.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.844.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.47.847.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.46.340.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed past the toilet, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.850.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.348.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.00.344.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.58.858.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.844.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.341.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.350.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.844.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.350.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.342.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.844.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.57.351.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.857.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.350.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.350.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.849.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.02.845.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.342.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.350.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.844.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.58.858.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.857.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.350.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.342.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.358.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.844.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.342.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.857.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.358.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.57.351.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.00.344.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.844.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.342.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.857.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.358.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.57.351.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.844.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.58.858.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.857.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.358.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.844.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.844.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.58.858.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.344.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.00.344.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.358.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.57.351.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.341.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.02.845.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.00.344.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.844.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.57.351.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.58.858.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.344.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.857.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.849.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.350.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.57.351.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.58.858.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.341.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.344.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.00.344.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.54.844.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.58.858.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.341.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.849.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.844.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.56.358.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.02.845.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.50.349.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.341.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.849.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.00.344.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.839.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.344.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.51.354.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.49.345.png"
    }
  },
  {
    "instruction": "Depart from the toilet, enter the room, proceed into the bedroom, and approach the bench.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.59.849.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.00.344.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.02.845.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.55.857.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.344.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.38.52.853.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.352.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.850.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.856.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.841.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.353.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.352.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.850.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.359.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.847.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.351.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.351.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.850.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.359.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.856.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.852.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.353.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.359.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.856.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.351.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.841.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.856.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.351.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.852.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.351.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.847.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.359.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.351.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.852.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.351.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.847.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.359.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.351.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.852.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.847.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.850.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.844.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.841.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.847.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.351.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.840.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.844.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.351.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.847.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.351.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.841.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.841.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.852.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.351.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.841.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.351.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.856.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.351.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.841.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.351.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.841.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.353.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.359.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.351.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.841.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.352.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.353.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.09.841.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.08.351.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.840.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.352.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.06.852.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.353.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.03.856.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.04.850.png"
    }
  },
  {
    "instruction": "Depart from the bedroom, leave the bedroom, enter a hallway, enter the bathroom, and approach the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.840.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.856.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.07.357.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.844.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.05.359.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed to the bathtub, turn right, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.15.845.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.844.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.15.398.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.14.855.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed to the bathtub, turn right, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.840.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.14.855.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.15.398.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.844.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed to the bathtub, turn right, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.840.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.844.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.15.398.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.14.855.png"
    }
  },
  {
    "instruction": "Enter the bathroom, proceed to the bathtub, turn right, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.840.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.12.844.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.14.855.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.15.845.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.11.343.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.856.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.10.342.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.15.845.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.347.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.852.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.348.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.19.853.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.352.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.905.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.347.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.852.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.17.396.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.352.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.348.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.905.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.24.855.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.852.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.17.396.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.19.853.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.905.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.348.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.352.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.901.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.17.396.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.19.853.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.348.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.352.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.901.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.852.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.25.403.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.19.853.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.348.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.901.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.905.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.25.403.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.24.393.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.17.396.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.348.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.901.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.352.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.17.396.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.25.403.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.24.393.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.852.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.901.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.352.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.905.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.17.396.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.15.845.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.24.855.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.25.403.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.352.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.905.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.24.393.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.347.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.17.396.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.852.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.25.403.png"
    }
  },
  {
    "instruction": "Depart from the bathroom, proceed to the living room, locate your position, move toward the stairs, and get ready to ascend to the second floor.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.23.905.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.24.393.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.24.855.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.16.347.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.25.900.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.20.348.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.25.403.png"
    }
  },
  {
    "instruction": "Upon seeing the bathroom, enter it and proceed to the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.32.391.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.33.389.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.33.904.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.402.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.397.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.891.png"
    }
  },
  {
    "instruction": "Upon seeing the bathroom, enter it and proceed to the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.33.389.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.33.904.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.402.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.32.391.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.891.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.397.png"
    }
  },
  {
    "instruction": "Upon seeing the bathroom, enter it and proceed to the bathtub.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.33.904.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.402.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.891.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.32.391.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.33.389.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.397.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.891.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.397.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.890.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.398.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.393.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.899.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.397.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.36.890.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.398.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.896.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.408.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.901.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.36.890.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.393.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.45.400.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.395.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.897.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.891.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.36.890.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.393.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.901.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.897.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.896.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.899.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.890.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.393.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.901.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.395.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.398.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.890.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.403.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.408.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.901.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.395.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.896.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.899.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.897.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.45.400.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.395.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.896.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.408.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.403.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.45.400.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.891.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.899.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.896.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.408.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.897.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.899.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.398.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.901.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.403.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.408.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.897.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.403.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.890.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.398.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.35.899.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.901.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.42.897.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.403.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.899.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.37.393.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.34.891.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.398.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.890.png"
    }
  },
  {
    "instruction": "Leave the bathroom, proceed into the living room, walk past the large TV screen, and approach the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.403.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.43.899.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.398.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.45.400.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.44.890.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.39.896.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.39.36.890.png"
    }
  },
  {
    "instruction": "Walk along the corridor, enter the activity room, pass the treadmill, turn right, and approach the tables and chairs.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.07.950.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.08.403.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.08.904.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.908.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.948.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.945.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.455.png"
    }
  },
  {
    "instruction": "Walk along the corridor, enter the activity room, pass the treadmill, turn right, and approach the tables and chairs.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.08.403.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.08.904.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.455.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.408.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.07.950.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.907.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.945.png"
    }
  },
  {
    "instruction": "Walk along the corridor, enter the activity room, pass the treadmill, turn right, and approach the tables and chairs.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.08.904.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.455.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.948.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.908.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.415.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.408.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.945.png"
    }
  },
  {
    "instruction": "Walk along the corridor, enter the activity room, pass the treadmill, turn right, and approach the tables and chairs.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.455.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.948.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.408.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.907.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.08.403.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.945.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.453.png"
    }
  },
  {
    "instruction": "Walk along the corridor, enter the activity room, pass the treadmill, turn right, and approach the tables and chairs.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.948.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.408.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.908.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.453.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.07.950.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.945.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.907.png"
    }
  },
  {
    "instruction": "Walk along the corridor, enter the activity room, pass the treadmill, turn right, and approach the tables and chairs.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.408.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.908.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.453.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.455.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.945.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.08.904.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.415.png"
    }
  },
  {
    "instruction": "Walk along the corridor, enter the activity room, pass the treadmill, turn right, and approach the tables and chairs.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.908.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.453.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.11.907.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.415.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.10.408.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.09.455.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.12.945.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.16.455.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.16.944.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.442.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.956.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.446.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.915.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.16.944.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.442.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.909.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.446.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.442.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.909.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.446.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.441.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.456.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.451.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.909.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.446.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.955.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.25.449.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.16.455.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.441.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.446.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.451.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.441.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.952.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.451.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.955.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.954.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.442.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.952.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.451.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.955.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.441.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.915.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.955.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.441.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.952.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.456.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.16.944.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.441.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.952.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.915.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.955.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.442.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.952.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.456.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.449.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.441.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.446.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.21.914.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.456.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.915.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.442.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.954.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.956.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.456.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.915.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.449.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.956.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.955.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.16.455.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.22.915.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.449.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.954.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.446.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.956.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.20.952.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.25.449.png"
    }
  },
  {
    "instruction": "Inside the dining room, approach the dining table. Turn left and locate a refrigerator and a snack rack. Move to the refrigerator, then turn right to the snack rack. Make another right turn and proceed forward into the bathroom. Finally, walk to the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.449.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.23.954.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.24.449.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.25.449.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.19.451.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.18.943.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.17.442.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.26.447.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.454.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.960.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.945.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.32.945.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.958.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.441.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.454.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.960.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.451.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.30.457.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.957.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.447.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.945.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.960.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.451.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.945.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.959.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.30.457.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.454.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.451.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.945.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.447.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.454.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.30.457.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.32.945.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.959.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.945.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.447.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.959.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.958.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.957.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.32.945.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.447.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.959.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.30.457.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.945.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.457.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.960.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.959.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.30.457.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.32.945.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.957.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.945.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.27.960.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.30.457.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.32.945.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.441.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.944.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.457.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.957.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.32.945.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.957.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.36.443.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.958.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.447.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.441.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.957.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.457.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.451.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.30.457.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.441.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.36.443.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.957.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.457.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.958.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.959.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.944.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.28.451.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.33.457.png"
    }
  },
  {
    "instruction": "Go upstairs when you see the stairs. Once you reach the bedroom door, enter the bedroom. Upon seeing the screen, walk around it to the right. When you see the bed, approach it, then head towards the computer desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.457.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.34.958.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.441.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.35.944.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.29.959.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.36.443.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.26.447.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.36.944.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.443.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.942.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.442.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.441.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.443.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.942.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.461.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.942.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.442.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.36.944.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.451.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.961.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.442.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.945.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.954.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.942.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.442.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.451.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.451.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.945.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.451.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.945.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.452.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.951.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.443.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.49.459.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.451.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.945.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.451.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.961.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.942.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.945.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.451.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.951.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.954.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.36.944.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.451.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.951.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.451.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.452.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.954.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.951.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.954.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.952.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.441.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.36.944.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.451.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.954.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.452.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.451.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.954.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.452.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.952.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.461.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.942.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.452.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.952.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.441.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.49.459.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.952.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.49.459.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.960.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.441.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.461.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.43.952.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.49.459.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.441.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.951.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.961.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.42.453.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.441.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.461.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.451.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.441.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.38.950.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.40.945.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.461.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.961.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.960.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.37.443.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.41.951.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.461.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.961.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.441.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.48.455.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.442.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.946.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.45.441.png"
    }
  },
  {
    "instruction": "Upon seeing the stairs, ascend them and arrive at the bedroom door. Enter the bedroom, notice the folding screen, move right around it, spot the bed, approach it, then see the desk and walk toward the computer.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.46.961.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.441.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.47.960.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.450.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.49.459.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.44.962.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.39.949.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.455.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.947.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.955.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.454.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.453.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.950.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.947.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.950.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.456.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.956.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.453.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.955.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.950.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.454.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.002.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.456.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.000.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.449.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.950.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.454.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.956.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.947.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.955.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.455.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.454.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.956.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.449.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.459.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.455.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.956.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.449.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.955.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.459.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.950.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.000.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.449.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.955.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.459.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.002.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.454.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.002.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.955.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.459.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.950.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.456.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.997.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.453.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.459.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.950.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.58.503.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.455.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.56.950.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.997.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.956.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.000.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.58.503.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.997.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.58.503.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.453.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.500.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.955.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.002.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.997.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.58.503.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.000.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.55.449.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.454.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.58.503.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.000.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.500.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.997.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.002.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.57.457.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.000.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.500.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.453.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.002.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.456.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.500.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.002.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.947.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.456.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.002.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.002.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.456.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.54.956.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.453.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.52.947.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.500.png"
    }
  },
  {
    "instruction": "From the balcony, leave the balcony and enter inside. See the living room, proceed toward it, walk to the wall-mounted television, spot the piano, and move toward the piano.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.002.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.01.456.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.002.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.53.459.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.02.958.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.500.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.40.59.999.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.04.958.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.507.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.958.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.10.991.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.492.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.979.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.507.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.958.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.10.991.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.496.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.996.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.993.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.492.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.958.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.10.991.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.492.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.12.504.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.17.505.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.507.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.10.991.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.492.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.993.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.004.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.496.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.006.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.492.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.993.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.12.504.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.004.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.494.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.10.991.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.04.958.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.993.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.12.504.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.006.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.04.958.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.992.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.12.504.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.494.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.999.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.497.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.04.958.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.004.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.494.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.006.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.17.505.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.999.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.497.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.993.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.494.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.006.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.497.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.996.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.496.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.006.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.497.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.993.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.999.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.979.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.21.502.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.496.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.497.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.993.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.496.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.10.991.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.496.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.958.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.993.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.496.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.979.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.992.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.494.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.21.996.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.496.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.979.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.496.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.04.958.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.17.505.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.21.502.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.996.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.979.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.496.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.992.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.12.504.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.004.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.497.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.21.996.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.496.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.992.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.17.505.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.497.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.04.958.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.958.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.979.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.16.992.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.17.505.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.004.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.21.502.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.497.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.999.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.17.505.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.004.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.497.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.04.958.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.501.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.501.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.004.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.497.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.13.006.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.993.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.996.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.15.979.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.497.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.501.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.501.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.12.504.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.993.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.10.991.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.18.992.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.501.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.996.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.507.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.12.504.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.492.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.999.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.501.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.996.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.501.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.05.958.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.21.502.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.11.993.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.006.png"
    }
  },
  {
    "instruction": "Depart from the living room, turn right to find the bedroom door. Enter the bedroom, proceed to the window, observe the grass outside. Turn back, leave the bedroom, head to the living room, move close to the sofa, enter the bathroom, and approach the toilet.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.19.996.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.501.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.20.999.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.21.996.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.993.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.497.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/img/001/2025-03-25_22.41.14.006.png"
    }
  },
    {
    "instruction": "Slightly turn left from the bed to the bookshelf and go to it.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.06.244.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.06.748.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.07.241.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.244.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.748.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.09.749.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.09.247.png"
    }
  },
  {
    "instruction": "Slightly turn left from the bed to the bookshelf and go to it.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.06.748.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.07.241.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.07.743.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.06.244.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.244.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.748.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.09.749.png"
    }
  },
  {
    "instruction": "Slightly turn left from the bed to the bookshelf and go to it.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.07.241.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.07.743.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.244.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.748.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.06.748.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.09.247.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.09.749.png"
    }
  },
  {
    "instruction": "Slightly turn left from the bed to the bookshelf and go to it.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.07.743.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.244.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.08.748.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.06.244.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.07.241.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.09.247.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.09.749.png"
    }
  },
  {
    "instruction": "There is a bookshelf on the left. Slightly turn right, pass by the bed, and walk to the desk and chair.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.10.245.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.10.747.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.242.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.741.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.746.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.252.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.15.242.png"
    }
  },
  {
    "instruction": "There is a bookshelf on the left. Slightly turn right, pass by the bed, and walk to the desk and chair.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.10.747.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.242.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.741.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.241.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.748.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.243.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.801.png"
    }
  },
  {
    "instruction": "There is a bookshelf on the left. Slightly turn right, pass by the bed, and walk to the desk and chair.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.242.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.741.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.252.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.241.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.243.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.10.245.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.748.png"
    }
  },
  {
    "instruction": "There is a bookshelf on the left. Slightly turn right, pass by the bed, and walk to the desk and chair.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.741.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.252.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.748.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.10.245.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.746.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.242.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.241.png"
    }
  },
  {
    "instruction": "There is a bookshelf on the left. Slightly turn right, pass by the bed, and walk to the desk and chair.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.252.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.748.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.243.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.10.747.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.15.242.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.242.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.241.png"
    }
  },
  {
    "instruction": "There is a bookshelf on the left. Slightly turn right, pass by the bed, and walk to the desk and chair.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.748.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.243.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.746.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.252.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.801.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.741.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.10.245.png"
    }
  },
  {
    "instruction": "There is a bookshelf on the left. Slightly turn right, pass by the bed, and walk to the desk and chair.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.243.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.13.746.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.241.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.15.242.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.14.801.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.11.242.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.12.748.png"
    }
  },
  {
    "instruction": "Slightly turn left from the sofa, past the bed and trash can, to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.15.746.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.251.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.745.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.17.747.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.20.290.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.745.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.247.png"
    }
  },
  {
    "instruction": "Slightly turn left from the sofa, past the bed and trash can, to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.251.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.745.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.17.252.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.247.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.15.746.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.247.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.747.png"
    }
  },
  {
    "instruction": "Slightly turn left from the sofa, past the bed and trash can, to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.745.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.17.252.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.17.747.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.247.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.747.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.20.290.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.251.png"
    }
  },
  {
    "instruction": "Slightly turn left from the sofa, past the bed and trash can, to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.17.252.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.17.747.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.247.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.745.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.247.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.747.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.251.png"
    }
  },
  {
    "instruction": "Slightly turn left from the sofa, past the bed and trash can, to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.17.747.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.247.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.747.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.745.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.20.290.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.251.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.15.746.png"
    }
  },
  {
    "instruction": "Slightly turn left from the sofa, past the bed and trash can, to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.247.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.18.747.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.247.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.20.290.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.19.745.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.15.746.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.16.745.png"
    }
  },
  {
    "instruction": "There is a sofa on the left. Go around the bed and the wardrobe, and walk to the mirror in front of the wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.294.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.797.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.26.295.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.28.292.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.27.290.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.28.789.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.27.800.png"
    }
  },
  {
    "instruction": "There is a sofa on the left. Go around the bed and the wardrobe, and walk to the mirror in front of the wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.797.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.26.295.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.26.793.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.27.800.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.294.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.28.292.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.28.789.png"
    }
  },
  {
    "instruction": "There is a sofa on the left. Go around the bed and the wardrobe, and walk to the mirror in front of the wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.26.295.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.26.793.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.27.290.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.294.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.797.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.28.292.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.28.789.png"
    }
  },
  {
    "instruction": "There is a sofa on the left. Go around the bed and the wardrobe, and walk to the mirror in front of the wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.26.793.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.27.290.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.27.800.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.797.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.28.789.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.25.294.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.26.295.png"
    }
  },
  {
    "instruction": "Go around the bed from the left wardrobe to the front of the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.291.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.792.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.290.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.32.289.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.798.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.299.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.792.png"
    }
  },
  {
    "instruction": "Go around the bed from the left wardrobe to the front of the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.792.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.290.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.792.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.798.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.33.299.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.291.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.299.png"
    }
  },
  {
    "instruction": "Go around the bed from the left wardrobe to the front of the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.290.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.792.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.299.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.32.289.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.798.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.291.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.792.png"
    }
  },
  {
    "instruction": "Go around the bed from the left wardrobe to the front of the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.792.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.299.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.798.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.32.796.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.32.289.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.291.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.792.png"
    }
  },
  {
    "instruction": "Go around the bed from the left wardrobe to the front of the sofa.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.299.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.31.798.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.32.289.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.33.299.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.30.290.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.32.796.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.29.792.png"
    }
  },
  {
    "instruction": "Go from the bed to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.36.795.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.37.290.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.37.799.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.291.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.798.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.38.797.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.40.295.png"
    }
  },
  {
    "instruction": "Go from the bed to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.37.290.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.37.799.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.38.292.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.291.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.38.797.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.798.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.36.795.png"
    }
  },
  {
    "instruction": "Go from the bed to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.37.799.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.38.292.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.38.797.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.291.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.798.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.36.795.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.40.295.png"
    }
  },
  {
    "instruction": "Go from the bed to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.38.292.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.38.797.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.291.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.36.795.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.37.799.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.40.295.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.39.798.png"
    }
  },
  {
    "instruction": "Go from the desk to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.40.795.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.295.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.792.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.298.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.43.789.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.792.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.44.292.png"
    }
  },
  {
    "instruction": "Go from the desk to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.295.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.792.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.298.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.43.290.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.792.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.40.795.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.43.789.png"
    }
  },
  {
    "instruction": "Go from the desk to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.792.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.298.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.792.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.295.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.43.789.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.43.290.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.40.795.png"
    }
  },
  {
    "instruction": "Go from the desk to the bookshelf.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.298.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.42.792.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.43.290.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.44.292.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.43.789.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.295.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/10/2025-09-15_02.28.41.792.png"
    }
  },
  {
    "instruction": "From the cabinet on the right, go to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.12.045.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.12.548.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.13.046.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.14.042.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.14.550.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.041.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.543.png"
    }
  },
  {
    "instruction": "From the cabinet on the right, go to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.12.548.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.13.046.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.13.545.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.543.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.041.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.14.550.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.12.045.png"
    }
  },
  {
    "instruction": "From the cabinet on the right, go to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.13.046.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.13.545.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.14.042.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.041.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.12.045.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.12.548.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.543.png"
    }
  },
  {
    "instruction": "From the cabinet on the right, go to the desk.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.13.545.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.14.042.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.14.550.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.041.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.12.045.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.15.543.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.13.046.png"
    }
  },
  {
    "instruction": "Walk around the bed to the green wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.20.097.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.20.551.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.100.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.550.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.551.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.23.551.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.090.png"
    }
  },
  {
    "instruction": "Walk around the bed to the green wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.20.551.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.100.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.551.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.23.049.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.550.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.090.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.20.097.png"
    }
  },
  {
    "instruction": "Walk around the bed to the green wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.100.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.551.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.090.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.20.551.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.550.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.20.097.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.23.049.png"
    }
  },
  {
    "instruction": "Walk around the bed to the green wardrobe.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.551.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.090.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.22.550.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.23.049.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.20.551.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.23.551.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.21.100.png"
    }
  },
  {
    "instruction": "Go to the window by the bed.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.094.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.594.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.25.096.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.093.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.27.600.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.593.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.25.552.png"
    }
  },
  {
    "instruction": "Go to the window by the bed.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.594.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.25.096.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.25.552.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.094.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.27.600.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.093.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.593.png"
    }
  },
  {
    "instruction": "Go to the window by the bed.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "A",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.25.096.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.25.552.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.093.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.27.092.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.094.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.594.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.593.png"
    }
  },
  {
    "instruction": "Go to the window by the bed.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "C",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.25.552.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.093.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.26.593.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.094.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.24.594.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.27.600.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.27.092.png"
    }
  },
  {
    "instruction": "Go from the window to the potted plant.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.28.102.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.28.599.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.096.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.095.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.601.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.594.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.30.091.png"
    }
  },
  {
    "instruction": "Go from the window to the potted plant.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.28.599.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.096.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.594.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.095.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.30.594.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.30.091.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.601.png"
    }
  },
  {
    "instruction": "Go from the window to the potted plant.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "B",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.096.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.594.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.30.091.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.30.594.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.095.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.601.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.28.102.png"
    }
  },
  {
    "instruction": "Go from the window to the potted plant.",
    "input": "The historical images are as follows:\n<img_hist0>\n<img_hist1>\n<img_hist2>\nAnd the choices are as follows: <img_cand0>, <img_cand1>, <img_cand2>, <img_cand3>",
    "output": "D",
    "images": {
      "img_hist0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.594.png",
      "img_hist1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.30.091.png",
      "img_hist2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.30.594.png",
      "img_cand0": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.29.096.png",
      "img_cand1": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.095.png",
      "img_cand2": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.28.599.png",
      "img_cand3": "/mnt/shared-storage-user/tanxin/zhanglechao/mc_dataset/extend_vln_data/11/2025-09-15_02.49.31.601.png"
    }
  }
]