[
    {"id": 2, "image": "COCO_val2014_000000144305.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains keyboard, laptop, dining table. Based on this, is there a mouse in the image?"}]},     {
        "id": 1,
        "image": "COCO_val2014_000000144305.jpg",
        "conversations": [
            {
                "from": "human",
                "value": "Generate a short caption of the image. Generate a short caption of the image."
            },
            {
                "from": "gpt",
                "value": "Focusing on the visible elements in this image: dining table, generate a short caption for this image."
            }
        ]
    },
    {"id": 85, "image": "COCO_val2014_000000039053.jpg", "conversations": [{"from": "human", "value": "Generate a short caption of the image."}, {"from": "gpt", "value": "Focusing on the visible elements in this image: spoon, bowl, dining table, apple, cake, cell phone, cup, generate a short caption for this image."}]},
    {"id": 2, "image": "COCO_val2014_000000144305.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains keyboard, laptop, dining table. Based on this, is there a mouse in the image?"}]},
    {"id": 2, "image": "COCO_val2014_000000144305.jpg", "conversations": [{"from": "human", "value": "Is there a mouse in the image?"}, {"from": "gpt", "value": "This image contains keyboard, laptop, dining table. Based on this, is there a mouse in the image?"}]}
]