{
    "uuid": "f7c8f3fc-801a-5e50-9722-af38407a0b9d",
    "question": "What are the seven categories of tasks, which form the dataset used to conduct SFT on a Llama-2-7B model in section 2.1?",
    "answer_format": "Your answer should be a Python list of seven elements, containing the names of the seven categories of tasks. e.g. [\"task1\", \"task2\", ... \"task7\"]. YOU MUST USE THE EXACT AND FULL NAMES OF THE TASKS AS MENTIONED IN THE PAPER.",
    "tags": [
        "objective",
        "single",
        "text"
    ],
    "conference": [],
    "reasoning_steps": [
        "Read section 2.1 and locate the implementation details.",
        "Find the details concerning dataset.",
        "List the seven categories of tasks"
    ],
    "evaluator": {
        "eval_func": "eval_structured_object_exact_match",
        "eval_kwargs": {
            "gold": [
                "closed-book question answering",
                "coreference resolution",
                "natural language inference",
                "abstract summarization",
                "multi-lingual translation",
                "reading comprehension",
                "text classification"
            ],
            "ignore_order": true,
            "lowercase": true
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human",
    "anchor_pdf": [
        "eed48331-03ed-52de-8f87-c71da234697c"
    ],
    "reference_pdf": []
}