{
    "uuid": "a3c6958b-aed2-5e28-8dea-5d0b88550ac8",
    "question": "According to the first survey of LLM for NL2Code, what're the three most recent decoder-only LLMs for NL2Code? How many programming languages do their training datasets contain respectively?",
    "answer_format": "Your answer should be a Python dictionary of 3 key-value pairs, where each key is the name of the LLM and each value is an integer indicating the number of programming languages in its training dataset. e.g. {\"LLM1\": 3, \"LLM2\": 5, \"LLM3\": 2}",
    "tags": [
        "multiple",
        "objective",
        "table",
        "text"
    ],
    "anchor_pdf": [
        "37758401-6101-554f-8f1e-4e2995443314"
    ],
    "reference_pdf": [
        "6590d875-4982-56a0-8bd7-e67f4bc777c9",
        "c1fed3f4-7a5f-5877-97e5-aa508eac885e",
        "4badd0e5-53ce-5044-b6c6-abec723c34aa",
        "01c9329e-9789-52dc-9eed-c99a8ef88a5c",
        "3c3b3cfc-e4f2-52b9-899a-2f9cac25dafc"
    ],
    "conference": [],
    "reasoning_steps": [
        "Find the table which compares different LLMs for NL2Code.",
        "Identify the three most recent decoder-only LLMs.",
        "Locate the respective papers.",
        "Find the number of programming languages in training datasets for each LLM."
    ],
    "evaluator": {
        "eval_func": "eval_structured_object_exact_match",
        "eval_kwargs": {
            "gold": {
                "CodeGeeX": 23,
                "BLOOM": 13,
                "SantaCoder": 3
            }
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}