{
    "uuid": "f5abd5f8-b8b0-5fcf-af97-739ca262c1c0",
    "question": "Which model gets the highest DR value in the Random Retrieval performance?",
    "answer_format": "Your answer should be plain text.",
    "tags": [
        "single",
        "table",
        "subjective"
    ],
    "anchor_pdf": ["0df4b58a-c8e7-52a3-8c84-730542241fca"],
    "reference_pdf": [],
    "conference": [],
    "reasoning_steps": [
        "First, locate the table showing the Random Retrieval performance.",
        "Then, find the model that gets the highest DR value."
    ],
    "evaluator": {
        "eval_func": "eval_reference_answer_with_llm",
        "eval_kwargs": {
            "reference_answer": "The BART-base model gets the highest DR value.",
            "question": "Which model gets the highest DR value in the Random Retrieval performance?"
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}