{
    "uuid": "891093a5-a10b-5299-a421-a77713a8886e",
    "question": "According to Table 1, which baselines this paper used has the highest average score? In which paper is this method proposed? And in which conference was this paper published?",
    "answer_format": "Your answer should be a python list with three items, the first item is the name of baseline reaching the highest average score according to Table 1, the second item is the name of paper where this method proposed, and the third item is the abbreviation of the conference name where this paper was published.",
    "tags": [
        "metadata",
        "objective",
        "single"
    ],
    "conference": [],
    "reasoning_steps": [
        "First, get the content of Table 1.",
        "Second, find what baseline reaching the highest average score.",
        "Third, according to reference, get the name of paper where this method was proposed.",
        "Finally, find the name of conference where this paper was published."
    ],
    "evaluator": {
        "eval_func": "eval_structured_object_exact_match",
        "eval_kwargs": {
            "gold": [
                "SimCTG",
                "A contrastive framework for neural text generation",
                "NeurIPS"
            ],
            "ignore_order": false
        }
    },
    "state": {
        "gpt-4o-2024-05-13": false,
        "gui-gpt-4o-2024-05-13": false
    },
    "annotator": "human",
    "anchor_pdf": [
        "9c5c3a63-3042-582a-9358-d0c61de3330d"
    ],
    "reference_pdf": []
}