{
  "attribute": "text",
  "desc": "long_description",
  "jsonl_file": "text_eval_prompts.jsonl",
  "line_idx": 15,
  "questions": [
    "Is the text 'Spin' in the image?",
    "Is the text 'Glow' in the image?",
    "Is the text 'Play' in the image?",
    "Is the text 'Skill' in the image?",
    "Is the text 'Shine' in the image?",
    "Is the text 'Twirl' in the image?",
    "Is the text 'Fun' in the image?",
    "Is the text 'Bounce' in the image?",
    "Is the text 'Light' in the image?"
  ],
  "gt_answers": [
    "Yes",
    "Yes",
    "Yes",
    "Yes",
    "Yes",
    "Yes",
    "Yes",
    "Yes",
    "Yes"
  ],
  "model_pred": [
    "yes",
    "yes",
    "yes",
    "no",
    "yes",
    "no",
    "yes",
    "no",
    "no"
  ],
  "model_output": "Yes, the text 'Spin' is in the image.\nYes, the text 'Glow' is in the image.\nYes, the text 'Play' is in the image.\nNo, the text 'Skill' is not in the image.\nYes, the text 'Shine' is in the image.\nNo, the text 'Twirl' is not in the image.\nYes, the text 'Fun' is in the image.\nNo, the text 'Bounce' is not in the image.\nNo, the text 'Light' is not in the image."
}