{
    "uuid": "3272942c-5db5-5122-b612-f09332a27a5a",
    "question": "How are the data in Table 5 in the paper \"Overview of the 9th Social Media Mining for Health Applications\" obtained, from the valid dataset or test dataset?",
    "answer_format": "Your answer should be a python strings of \"valid\" or \"test\".",
    "tags": [
        "multiple",
        "table",
        "text",
        "objective"
    ],
    "anchor_pdf": [
        "c43c8e72-1389-54f0-b36e-ab07d569f3e0"
    ],
    "reference_pdf": [
        "fe31ca58-7239-5d36-b623-2540d7b9b01a"
    ],
    "conference": [],
    "reasoning_steps": [],
    "evaluator": {
        "eval_func": "eval_string_exact_match",
        "eval_kwargs": {
            "gold": "test"
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}