{
    "model_name": "",
    "solutions": [
        {
            "problem_id": 1,
            "answer": "LEFT: Fashion magazine., RIGHT: NOT Fashion magazine.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 2,
            "answer": "LEFT: Solar system., RIGHT: NOT Solar system.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 3,
            "answer": "LEFT: A bunch of branches on the green plant., RIGHT: NOT A bunch of branches on the green plant.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 4,
            "answer": "LEFT: A group photo at a wedding reception., RIGHT: NOT A group photo at a wedding reception.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 5,
            "answer": "LEFT: A pile of rusty metal bolts., RIGHT: NOT A pile of rusty metal bolts.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 6,
            "answer": "LEFT: A large wheat field., RIGHT: NOT A large wheat field.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 7,
            "answer": "LEFT: Rubber kayak in the water., RIGHT: NOT Rubber kayak in the water.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 8,
            "answer": "LEFT: Strawberry leaves., RIGHT: NOT Strawberry leaves.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 9,
            "answer": "LEFT: A perched mantis hanging on a plant., RIGHT: NOT A perched mantis hanging on a plant.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 10,
            "answer": "LEFT: A group photo of the extended family., RIGHT: NOT A group photo of the extended family.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 11,
            "answer": "LEFT: Ellipsoidal fruits., RIGHT: NOT Ellipsoidal fruits.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 12,
            "answer": "LEFT: An old style bicycle., RIGHT: NOT An old style bicycle.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 13,
            "answer": "LEFT: Stamp pictures., RIGHT: NOT Stamp pictures.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 14,
            "answer": "LEFT: Branches covered with heavily falling snow., RIGHT: NOT Branches covered with heavily falling snow.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 15,
            "answer": "LEFT: A person playing a guitar., RIGHT: NOT A person playing a guitar.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 16,
            "answer": "LEFT: Bright red fish., RIGHT: NOT Bright red fish.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 17,
            "answer": "LEFT: Reeds swaying in the wind., RIGHT: NOT Reeds swaying in the wind.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 18,
            "answer": "LEFT: Instruments for quantitative measurements., RIGHT: NOT Instruments for quantitative measurements.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 19,
            "answer": "LEFT: Various colors of pigments., RIGHT: NOT Various colors of pigments.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 20,
            "answer": "LEFT: Candle chandeliers hanging above a dining room table surrounded by chairs., RIGHT: NOT Candle chandeliers hanging above a dining room table surrounded by chairs.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 21,
            "answer": "LEFT: Colorful beams of light., RIGHT: NOT Colorful beams of light.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 22,
            "answer": "LEFT: Cars on the city streets at night., RIGHT: NOT Cars on the city streets at night.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 23,
            "answer": "LEFT: Grilled steaks., RIGHT: NOT Grilled steaks.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 24,
            "answer": "LEFT: Radio towers., RIGHT: NOT Radio towers.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 25,
            "answer": "LEFT: The top of a snow covered mountain., RIGHT: NOT The top of a snow covered mountain.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 26,
            "answer": "LEFT: Steel beams of the building., RIGHT: NOT Steel beams of the building.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 27,
            "answer": "LEFT: People walking on the city street., RIGHT: NOT People walking on the city street.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 28,
            "answer": "LEFT: A christmas ornament tree with colorful lights., RIGHT: NOT A christmas ornament tree with colorful lights.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 29,
            "answer": "LEFT: Keyboard of the piano., RIGHT: NOT Keyboard of the piano.",
            "explanation": "",
            "evaluations": []
        },
        {
            "problem_id": 30,
            "answer": "LEFT: Lightning hitting through cloudy sky., RIGHT: NOT Lightning hitting through cloudy sky.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 31,
            "answer": "LEFT: Hand-held escalators on stairs., RIGHT: NOT Hand-held escalators on stairs.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 32,
            "answer": "LEFT: Kids playing in the river., RIGHT: NOT Kids playing in the river.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 33,
            "answer": "LEFT: Tractors are working on a farm field., RIGHT: NOT Tractors are working on a farm field.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 34,
            "answer": "LEFT: A bicycle is placed in the corner., RIGHT: NOT A bicycle is placed in the corner.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 35,
            "answer": "LEFT: The tungsten lamp is glowing., RIGHT: NOT The tungsten lamp is glowing.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 36,
            "answer": "LEFT: The house in the heavy snow., RIGHT: NOT The house in the heavy snow.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 37,
            "answer": "LEFT: A small wooden boat floating on a calm lake., RIGHT: NOT A small wooden boat floating on a calm lake.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 38,
            "answer": "LEFT: The girl has long and thin braids on her head., RIGHT: NOT The girl has long and thin braids on her head.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 39,
            "answer": "LEFT: Human footprints in the sand on the beach., RIGHT: NOT Human footprints in the sand on the beach.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 40,
            "answer": "LEFT: A handicap sign., RIGHT: NOT A handicap sign.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 41,
            "answer": "LEFT: Yellow trumpet flowers., RIGHT: NOT Yellow trumpet flowers.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 42,
            "answer": "LEFT: Fishing boats docked at the pier., RIGHT: NOT Fishing boats docked at the pier.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 43,
            "answer": "LEFT: Monsters in mythological stories., RIGHT: NOT Monsters in mythological stories.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 44,
            "answer": "LEFT: Lettuce in the vegetable patch., RIGHT: NOT Lettuce in the vegetable patch.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 45,
            "answer": "LEFT: Little kids steering cars., RIGHT: NOT Little kids steering cars.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 46,
            "answer": "LEFT: Dense binary numbers., RIGHT: NOT Dense binary numbers.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 47,
            "answer": "LEFT: Traces left on the sand dunes., RIGHT: NOT Traces left on the sand dunes.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 48,
            "answer": "LEFT: A closeup of a red brick wall., RIGHT: NOT A closeup of a red brick wall.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 49,
            "answer": "LEFT: Black horse., RIGHT: NOT Black horse.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 50,
            "answer": "LEFT: A soldier with a little girl., RIGHT: NOT A soldier with a little girl.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 51,
            "answer": "LEFT: Aircraft carrier., RIGHT: NOT Aircraft carrier.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 52,
            "answer": "LEFT: Mathematical formulas on a blackboard., RIGHT: NOT Mathematical formulas on a blackboard.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 53,
            "answer": "LEFT: Persons riding bicycles., RIGHT: NOT Persons riding bicycles.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 54,
            "answer": "LEFT: Men playing basketball., RIGHT: NOT Men playing basketball.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 55,
            "answer": "LEFT: Wrestling competition., RIGHT: NOT Wrestling competition.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 56,
            "answer": "LEFT: Close-up view of sprouting stamen., RIGHT: NOT Close-up view of sprouting stamen.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 57,
            "answer": "LEFT: Police officers standing in the street., RIGHT: NOT Police officers standing in the street.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 58,
            "answer": "LEFT: An aerial view of the city., RIGHT: NOT An aerial view of the city.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 59,
            "answer": "LEFT: Huge crystal chandelier hanging from the ceiling., RIGHT: NOT Huge crystal chandelier hanging from the ceiling.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 60,
            "answer": "LEFT: A little girl in a princess costume., RIGHT: NOT A little girl in a princess costume.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 61,
            "answer": "LEFT: A mesmerizing light show at the concert., RIGHT: NOT A mesmerizing light show at the concert.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 62,
            "answer": "LEFT: An abstract artwork painting., RIGHT: NOT An abstract artwork painting.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 63,
            "answer": "LEFT: A bunch of vibrant flowers., RIGHT: NOT A bunch of vibrant flowers.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 64,
            "answer": "LEFT: White snowflakes., RIGHT: NOT White snowflakes.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 65,
            "answer": "LEFT: Fried noodles., RIGHT: NOT Fried noodles.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 66,
            "answer": "LEFT: A warning board in the wild., RIGHT: NOT A warning board in the wild.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 67,
            "answer": "LEFT: A pile of bullet shells., RIGHT: NOT A pile of bullet shells.",
            "explanation": "",
            "evaluations": []
        },
        {
            "problem_id": 68,
            "answer": "LEFT: Colorful skulls., RIGHT: NOT Colorful skulls.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 69,
            "answer": "LEFT: A geometric painting in the style of abstractionist., RIGHT: NOT A geometric painting in the style of abstractionist.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 70,
            "answer": "LEFT: A person doing yoga in the wilderness., RIGHT: NOT A person doing yoga in the wilderness.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 71,
            "answer": "LEFT: Gift boxes tied with ribbons., RIGHT: NOT Gift boxes tied with ribbons.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 72,
            "answer": "LEFT: Hockey stadium., RIGHT: NOT Hockey stadium.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 73,
            "answer": "LEFT: A little girl dressed in a butterfly costume., RIGHT: NOT A little girl dressed in a butterfly costume.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 74,
            "answer": "LEFT: A group of sheep grazing on a field of green grass., RIGHT: NOT A group of sheep grazing on a field of green grass.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 75,
            "answer": "LEFT: A delicious round birthday cake., RIGHT: NOT A delicious round birthday cake.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 76,
            "answer": "LEFT: A girl leading a horse., RIGHT: NOT A girl leading a horse.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 77,
            "answer": "LEFT: Various kinds of rings., RIGHT: NOT Various kinds of rings.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 78,
            "answer": "LEFT: Waterfront terrace., RIGHT: NOT Waterfront terrace.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 79,
            "answer": "LEFT: Backlit photo couple., RIGHT: NOT Backlit photo couple.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 80,
            "answer": "LEFT: Pictures of bananas., RIGHT: NOT Pictures of bananas.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 81,
            "answer": "LEFT: A closeup view of cat., RIGHT: NOT A closeup view of cat.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 82,
            "answer": "LEFT: A closeup view of a horse head., RIGHT: NOT A closeup view of a horse head.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 83,
            "answer": "LEFT: Live coral on the sea floor., RIGHT: NOT Live coral on the sea floor.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 84,
            "answer": "LEFT: A handbag hanging somewhere., RIGHT: NOT A handbag hanging somewhere.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 85,
            "answer": "LEFT: A wooden fence surrounding a grassy field., RIGHT: NOT A wooden fence surrounding a grassy field.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 86,
            "answer": "LEFT: A building with stone columns., RIGHT: NOT A building with stone columns.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 87,
            "answer": "LEFT: A transparent glass., RIGHT: NOT A transparent glass.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 88,
            "answer": "LEFT: Knives and forks on the table., RIGHT: NOT Knives and forks on the table.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 89,
            "answer": "LEFT: Boats sailing on a serene lake., RIGHT: NOT Boats sailing on a serene lake.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 90,
            "answer": "LEFT: A person holding a camera., RIGHT: NOT A person holding a camera.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 91,
            "answer": "LEFT: Knitted sweater., RIGHT: NOT Knitted sweater.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 92,
            "answer": "LEFT: Red bows., RIGHT: NOT Red bows.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 93,
            "answer": "LEFT: A heart shaped symbol., RIGHT: NOT A heart shaped symbol.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 94,
            "answer": "LEFT: A row of red wine bottles., RIGHT: NOT A row of red wine bottles.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 95,
            "answer": "LEFT: Tennis racket or court., RIGHT: NOT Tennis racket or court.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 96,
            "answer": "LEFT: A man is training at the gym., RIGHT: NOT A man is training at the gym.",
            "explanation": "",
            "evaluations": []
        },
        {
            "problem_id": 97,
            "answer": "LEFT: Keyboard of an old typewriter., RIGHT: NOT Keyboard of an old typewriter.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 98,
            "answer": "LEFT: Shiny metal coins scattered on a table., RIGHT: NOT Shiny metal coins scattered on a table.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 99,
            "answer": "LEFT: A woman in a red dress is dancing., RIGHT: NOT A woman in a red dress is dancing.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "WRONG\n",
                    "author": "gemini-1.5-pro"
                }
            ]
        },
        {
            "problem_id": 100,
            "answer": "LEFT: A threaded light bulb., RIGHT: NOT A threaded light bulb.",
            "explanation": "",
            "evaluations": [
                {
                    "value": "OK. \n",
                    "author": "gemini-1.5-pro"
                }
            ]
        }
    ]
}