{
    "uuid": "99cec4b0-ca19-56bb-83a0-7a79a4a14c9d",
    "question": "What is the distribution ratio of data sources for the toxicity ratings dataset used in the paper?",
    "answer_format": "Your answer should be a python dictionary about the data sources and their distribution ratio, e.g., {\"data_source_1\": 0.5, \"data_source_2\": 0.5}. YOU MUST USE THE EXACT NAMES FROM THE PDF WITHOUT CHANGING THE CAPITALIZATION.",
    "tags": [
        "multiple",
        "text",
        "objective"
    ],
    "anchor_pdf": [
        "86aea8c2-7ffe-534a-a610-d467151fe5de"
    ],
    "reference_pdf": [
        "357ecfc8-7a31-50d8-93ca-7aaf3e2ec1b1"
    ],
    "conference": [],
    "reasoning_steps": [
        "Retrieve the toxicity ratings dataset in the anchor PDF, which is usually mentioned in the dataset section.",
        "Locate the related paper about the dataset.",
        "Locate the data sources and their distribution ratio, which are mentioned in the method section."
    ],
    "evaluator": {
        "eval_func": "eval_structured_object_exact_match",
        "eval_kwargs": {
            "gold": {
                "Twitter": 0.67,
                "Reddit": 0.15,
                "4chan": 0.18
            },
            "ignore_order": true,
            "lowercase": true
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}