{
    "uuid": "a2985096-8453-5fb7-9066-6f505c734248",
    "question": "List the names of the baselines used in the paper \"On the Compositional Generalization in Versatile Open-domain Dialogue\", along with the titles of papers that proposed these baselines.",
    "answer_format": "Your answer should be a Python list of baseline-title pairs, e.g., [[\"baseline1\", \"title1\"], [\"baseline2\", \"title2\"], ...]. YOU MUST USE THE EXACT TEXT FROM THE PAPER AND THE FULL TITLE TEXT OF THE PAPERS.",
    "tags": [
        "multiple",
        "metadata",
        "objective"
    ],
    "anchor_pdf": [
        "3107f6a8-1939-5af0-b3d8-06d7aa66158d"
    ],
    "reference_pdf": [
        "f6e91a91-0b1e-5280-8522-a20492033f16",
        "e0cf46b4-e3cf-5d54-8c0b-c661214fe349",
        "21df0715-990d-58d3-b218-280ac3a84c8f",
        "60f20fa5-d268-522d-9cc2-5f7321af4f82"
    ],
    "conference": [],
    "reasoning_steps": [
        "Firstly, locate the sections that mention baselines.",
        "Identify the baselines.",
        "Find the reference for each baseline.",
        "Identify the title of each reference paper.",
        "Finally, list the baseline-title pairs."
    ],
    "evaluator": {
        "eval_func": "eval_structured_object_exact_match",
        "eval_kwargs": {
            "gold": [
                [
                    "BART",
                    "BART: Denoising Sequence-to-Sequence Pre-training for Natural Language Generation, Translation, and Comprehension"
                ],
                [
                    "R2C2",
                    "Language Models that Seek for Knowledge: Modular Search & Generation for Dialogue and Prompt Completion"
                ],
                [
                    "Prefix-Tuning",
                    "Prefix-Tuning: Optimizing Continuous Prompts for Generation"
                ],
                [
                    "Modular Skill",
                    "Combining modular skills in multitask learning"
                ]
            ],
            "lowercase": true,
            "ignore_order": true,
            "ignore_blank": true,
            "threshold": 95
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}