{
    "uuid": "7942e599-6cc3-59c7-89ec-2be7f578f002",
    "question": "How many samples are there in total in the dataset used by MIDGARD for Task 2 evaluation?",
    "answer_format": "Your answer should be an integer, the number of samples.",
    "tags": [
        "multiple",
        "text",
        "objective"
    ],
    "anchor_pdf": [
        "5dce7396-1032-5275-ae09-d74568a33935"
    ],
    "reference_pdf": [
        "366742fc-a2cb-56af-87b7-cb2834f6cf11",
        "c5a300ef-dacf-5505-a8b7-a6797a2eb702"
    ],
    "conference": [],
    "reasoning_steps": [
        "Find the dataset used for Task 2 evaluation in the MIDGARD paper.",
        "Read the paper describing that dataset to find the total number of samples."
    ],
    "evaluator": {
        "eval_func": "eval_int_exact_match",
        "eval_kwargs": {
            "gold": 3166
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}