{
    "uuid": "896a8ab2-38ab-5ae9-95cc-2d883784e87e",
    "question": "In the main experiment of \"AN LLM CAN FOOL ITSELF: A PROMPT-BASED ADVERSARIAL ATTACK\", what high-level tasks do the five tasks used belong to, as categorized in the original paper?",
    "answer_format": "Your answer should be a python dictionary with the following format: {'task1': 'task1_category', 'task2': 'task2_category', 'task3': 'task3_category', 'task4': 'task4_category', 'task5': 'task5_category'}. YOU MUST USE THE EXACT NAMES OF THE CATEGORIES IN THE PAPER AND THE ABBREVIATION OF THE TASKS.",
    "tags": [
        "multiple",
        "text",
        "objective"
    ],
    "anchor_pdf": [
        "4cc48a5b-be5f-57af-8697-1cc75c0f67d0"
    ],
    "reference_pdf": [
        "2292ac5f-ddf9-5ed5-8009-b4f7a69a8ec9"
    ],
    "conference": [],
    "reasoning_steps": [
        "Find the five tasks used in the main experiment of the anchor paper.",
        "Locate the relevant paper proposing the five tasks.",
        "Identify the high-level tasks that the five tasks belong to, which are categorized in the Tasks section in the form of titles."
    ],
    "evaluator": {
        "eval_func": "eval_structured_object_exact_match",
        "eval_kwargs": {
            "gold": {
                "SST-2": "Single-Sentence Tasks",
                "QQP": "Similarity and Paraphrase Tasks",
                "MNLI": "Inference Tasks",
                "RTE": "Inference Tasks",
                "QNLI": "Inference Tasks"
            },
            "ignore_order": true,
            "lowercase": true,
            "threshold": 80
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}