{
  "attribute": "numeracy+color",
  "desc": "long_description",
  "jsonl_file": "numeracy+color_eval_prompts.jsonl",
  "line_idx": 3,
  "questions": [
    "Are there deer in the image?  ",
    "Are there apples in the image?  ",
    "Are there desks in the image?  ",
    "Are there ducks in the image?  ",
    "Are there horses in the image?  ",
    "Is the number of deer 4?  ",
    "Is the number of apples 4?  ",
    "Is the number of desks 2?  ",
    "Is the number of ducks 3?  ",
    "Is the number of horses 2?  ",
    "Are the deer blue in color?  ",
    "Are the apples red in color?  ",
    "Are the desks red in color?  ",
    "Are the ducks blue in color?  ",
    "Are the horses red in color?  "
  ],
  "gt_answers": [
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes",
    "yes"
  ],
  "model_pred": [
    "no",
    "no",
    "no",
    "no",
    "yes",
    "no",
    "no",
    "no",
    "no",
    "no",
    "no",
    "no",
    "no",
    "no",
    "no"
  ],
  "model_output": "no, there are no desks\nno, there are no apples\nno, there are no desks\nno, there are no ducks\nyes, there are horses in the image\nno, the number of deer is not 4\nno, the number of apples is not 4\nno, the number of desks is not 2\nno, the number of ducks is not 3\nno, the number of horses is not 2\nno, the deer are not blue in color\nno, the apples are not red in color\nno, the desks are not red in color\nno, the ducks are not blue in color\nno, the horses are not red in color"
}