{
    "uuid": "127ed600-b05d-5a06-9987-3d8dfe98b135",
    "question": "Among all the given anchor PDFs, which one does not use any objective evaluation metrics? What is the difference in conversion goals between this paper and the others?",
    "answer_format": "Your answer should be a Python list where the first item is the full name of the paper (a string) and the second item describes the difference in conversion goals (a string).",
    "tags": [
        "multiple",
        "text",
        "subjective"
    ],
    "anchor_pdf": [
        "911d4572-a45c-5bb8-8662-2e2455909cd2",
        "4535464e-20c9-5370-ba5c-63e36d110e00",
        "03b37833-5723-5e55-950d-d5d25a5c539c",
        "9d047a73-dcef-5b95-8f29-d9de087dabf8",
        "8d661aa7-ec95-5977-9825-0e4c94751e52"
    ],
    "reference_pdf": [],
    "conference": [],
    "reasoning_steps": [
        "Check the evaluation metrics used in each paper to identify the one without any objective metrics.",
        "Summarize the conversion tasks from the abstracts of all papers.",
        "Identify the difference in conversion goals between the identified paper and the others."
    ],
    "evaluator": {
        "eval_func": "eval_conjunction",
        "eval_kwargs": {
            "eval_func_list": [
                "eval_string_exact_match",
                "eval_reference_answer_with_llm"
            ],
            "eval_kwargs_list": [
                {
                    "gold": "Voice-Preserving Zero-Shot Multiple Accent Conversion",
                    "lowercase": true
                },
                {
                    "reference_answer": "Other papers focus on voice conversion, while this paper focuses on accent conversion, where the speaker's voice identity should be preserved.",
                    "question": "What is the difference in conversion goals between this paper and the others?"
                }
            ]
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}