[
    {
        "id": 1,
        "image": "COCO_val2014_000000144305.jpg",
        "conversations": [
            {
                "from": "human",
                "value": "Generate a short caption of the image."
            },
            {
                "from": "gpt",
                "value": "Generate a short caption for this image, focusing on the visible elements: keyboard, laptop, dining table."
            }
        ]
    },
    {
        "id": 7,
        "image": "COCO_val2014_000000164091.jpg",
        "conversations": [
            {
                "from": "human",
                "value": "Generate a short caption of the image."
            },
            {
                "from": "gpt",
                "value": "Generate a short caption for this image, focusing on the visible elements: person, bed, teddy bear."
            }
        ]
    }
    ]