{
    "uuid": "7350bb9b-a510-5614-a994-1d99a6368e57",
    "question": "In the paper that DRAGIN follows the most in term of template prompt, which models are utilized as the CoT generator of the proposed retriever?",
    "answer_format": "Your answer should be a string, giving the detailed names of the models, as proposed in the reference paper.",
    "tags": [
        "multiple",
        "text",
        "subjective"
    ],
    "anchor_pdf": [
        "4c90f20c-5542-5573-96d2-62745066c3ca"
    ],
    "reference_pdf": [
        "6d0ea9bc-a7ee-5598-896f-02c44aa42194",
        "89b83f29-085e-5da6-a5b4-7cba324a4052",
        "f398b6e5-0ff2-59e4-9f26-eba5cea5b48c"
    ],
    "conference": [],
    "reasoning_steps": [
        "Read the section that discusses the settings of datasets.",
        "Find the paper that DRAGIN follows the most in term of template prompt.",
        "Read the section about experiment in that paper to identify specific configuration."
    ],
    "evaluator": {
        "eval_func": "eval_reference_answer_with_llm",
        "eval_kwargs": {
            "reference_answer": "We experiment with OpenAI GPT3 (code-davinci-002) and Flan-T5 of different sizes as its CoT generator.",
            "question": "In the paper that DRAGIN follows the most in term of template prompt, which models are utilized as the CoT generator of the proposed retriever?"
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}