{
    "uuid": "3fd4d805-ae6c-527d-b6d2-30a18fb0ab12",
    "question": "On the dataset proposed by this work, how much does the GPT-3.5-turbo model improve its GPT4score after using Graph-CoT?",
    "answer_format": "Your answer should be a single float number ranging from 0 to 100, representing the subtraction result.",
    "tags": [
        "objective",
        "single",
        "table"
    ],
    "conference": [],
    "reasoning_steps": [
        "Find the name of the dataset proposed by this work.",
        "Locate the experiment table related to the proposed dataset that demonstrates the GPT4score of the GPT-3.5-turbo model before and after using Graph-CoT.",
        "Record the two GPT4scores respectively.",
        "Calculate the subtraction result."
    ],
    "evaluator": {
        "eval_func": "eval_float_exact_match",
        "eval_kwargs": {
            "gold": 16.81,
            "ndigits": 2
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human",
    "anchor_pdf": [
        "fb154467-1ce1-5c1f-9d4f-b4f5c76312ee"
    ],
    "reference_pdf": []
}