[
    {
        "question": "from typing import List\n\n\ndef separate_paren_groups(paren_string: str) -> List[str]:\n    \"\"\" Input to this function is a string containing multiple groups of nested parentheses. Your goal is to\n    separate those group into separate strings and return the list of those.\n    Separate groups are balanced (each open brace is properly closed) and not nested within each other\n    Ignore any spaces in the input string.\n    >>> separate_paren_groups('( ) (( )) (( )( ))')\n    ['()', '(())', '(()())']\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate('(()()) ((())) () ((())()())') == [\n        '(()())', '((()))', '()', '((())()())'\n    ]\n    assert candidate('() (()) ((())) (((())))') == [\n        '()', '(())', '((()))', '(((())))'\n    ]\n    assert candidate('(()(())((())))') == [\n        '(()(())((())))'\n    ]\n    assert candidate('( ) (( )) (( )( ))') == ['()', '(())', '(()())']",
        "ground_truth_code": "result = []\n    current_string = []\n    current_depth = 0\n\n    for c in paren_string:\n        if c == '(':\n            current_depth += 1\n            current_string.append(c)\n        elif c == ')':\n            current_depth -= 1\n            current_string.append(c)\n\n            if current_depth == 0:\n                result.append(''.join(current_string))\n                current_string.clear()\n\n    return result\n",
        "generation": "result = []\n    current_string = []\n    current_depth = 0\n\n    for c in paren_string:\n        if c == '(':\n            current_depth += 1\n            current_string.append(c)\n        elif c == ')':\n            current_depth -= 1\n            current_string.append(c)\n\n            if current_depth == 0:\n                result.append(''.join(current_string))\n                current_string.clear()\n\n    return result\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmpb2s_t735.py\", line 70, in <module>\\n    check(separate_paren_groups)\\n  File \"/tmp/tmpb2s_t735.py\", line 59, in check\\n    assert candidate(\\'(()()) ((())) () ((())()())\\') == [\\nAssertionError\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "baichuan2-13b"
        }
    },
    {
        "question": "def string_sequence(n: int) -> str:\n    \"\"\" Return a string containing space-delimited numbers starting from 0 upto n inclusive.\n    >>> string_sequence(0)\n    '0'\n    >>> string_sequence(5)\n    '0 1 2 3 4 5'\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate(0) == '0'\n    assert candidate(3) == '0 1 2 3'\n    assert candidate(10) == '0 1 2 3 4 5 6 7 8 9 10'",
        "ground_truth_code": "return ' '.join([str(x) for x in range(n + 1)])\n",
        "generation": "return ' '.join([str(x) for x in range(n + 1)])\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmptwv6ob4b.py\", line 42, in <module>\\n    check(string_sequence)\\n  File \"/tmp/tmptwv6ob4b.py\", line 38, in check\\n    assert candidate(0) == \\'0\\'\\nAssertionError\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "baichuan2-13b"
        }
    },
    {
        "question": "from typing import List\n\n\ndef intersperse(numbers: List[int], delimeter: int) -> List[int]:\n    \"\"\" Insert a number 'delimeter' between every two consecutive elements of input list `numbers'\n    >>> intersperse([], 4)\n    []\n    >>> intersperse([1, 2, 3], 4)\n    [1, 4, 2, 4, 3]\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate([], 7) == []\n    assert candidate([5, 6, 3, 2], 8) == [5, 8, 6, 8, 3, 8, 2]\n    assert candidate([2, 2, 2], 2) == [2, 2, 2, 2, 2]",
        "ground_truth_code": "if not numbers:\n        return []\n\n    result = []\n\n    for n in numbers[:-1]:\n        result.append(n)\n        result.append(delimeter)\n\n    result.append(numbers[-1])\n\n    return result\n",
        "generation": "if not numbers:\n        return []\n\n    result = []\n\n    for n in numbers[:-1]:\n        result.append(n)\n        result.append(delimeter)\n\n    result.append(numbers[-1])\n\n    return result\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmp9xpatx5j.py\", line 51, in <module>\\n    check(intersperse)\\n  File \"/tmp/tmp9xpatx5j.py\", line 48, in check\\n    assert candidate([5, 6, 3, 2], 8) == [5, 8, 6, 8, 3, 8, 2]\\nAssertionError\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "vicuna-33b"
        }
    },
    {
        "question": "def is_palindrome(string: str) -> bool:\n    \"\"\" Test if given string is a palindrome \"\"\"\n    return string == string[::-1]\n\n\ndef make_palindrome(string: str) -> str:\n    \"\"\" Find the shortest palindrome that begins with a supplied string.\n    Algorithm idea is simple:\n    - Find the longest postfix of supplied string that is a palindrome.\n    - Append to the end of the string reverse of a string prefix that comes before the palindromic suffix.\n    >>> make_palindrome('')\n    ''\n    >>> make_palindrome('cat')\n    'catac'\n    >>> make_palindrome('cata')\n    'catac'\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate('') == ''\n    assert candidate('x') == 'x'\n    assert candidate('xyz') == 'xyzyx'\n    assert candidate('xyx') == 'xyx'\n    assert candidate('jerry') == 'jerryrrej'",
        "ground_truth_code": "if not string:\n        return ''\n\n    beginning_of_suffix = 0\n\n    while not is_palindrome(string[beginning_of_suffix:]):\n        beginning_of_suffix += 1\n\n    return string + string[:beginning_of_suffix][::-1]\n",
        "generation": "if not string:\n        return ''\n\n    beginning_of_suffix = 0\n\n    while not is_palindrome(string[beginning_of_suffix:]):\n        beginning_of_suffix += 1\n\n    return string + string[:beginning_of_suffix][::-1]\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmpkyr5e687.py\", line 63, in <module>\\n    check(is_palindrome)\\n  File \"/tmp/tmpkyr5e687.py\", line 57, in check\\n    assert candidate(\\'\\') == \\'\\'\\nAssertionError\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "vicuna-33b"
        }
    },
    {
        "question": "from typing import List\n\n\ndef intersperse(numbers: List[int], delimeter: int) -> List[int]:\n    \"\"\" Insert a number 'delimeter' between every two consecutive elements of input list `numbers'\n    >>> intersperse([], 4)\n    []\n    >>> intersperse([1, 2, 3], 4)\n    [1, 4, 2, 4, 3]\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate([], 7) == []\n    assert candidate([5, 6, 3, 2], 8) == [5, 8, 6, 8, 3, 8, 2]\n    assert candidate([2, 2, 2], 2) == [2, 2, 2, 2, 2]",
        "ground_truth_code": "if not numbers:\n        return []\n\n    result = []\n\n    for n in numbers[:-1]:\n        result.append(n)\n        result.append(delimeter)\n\n    result.append(numbers[-1])\n\n    return result\n",
        "generation": "if not numbers:\n        return []\n\n    result = []\n\n    for n in numbers[:-1]:\n        result.append(n)\n        result.append(delimeter)\n\n    result.append(numbers[-1])\n\n    return result\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmppz9d9_qp.py\", line 42, in <module>\\n    check(intersperse)\\n  File \"/tmp/tmppz9d9_qp.py\", line 39, in check\\n    assert candidate([5, 6, 3, 2], 8) == [5, 8, 6, 8, 3, 8, 2]\\nAssertionError\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "qwen-7b"
        }
    },
    {
        "question": "from typing import List\n\n\ndef parse_nested_parens(paren_string: str) -> List[int]:\n    \"\"\" Input to this function is a string represented multiple groups for nested parentheses separated by spaces.\n    For each of the group, output the deepest level of nesting of parentheses.\n    E.g. (()()) has maximum two levels of nesting while ((())) has three.\n\n    >>> parse_nested_parens('(()()) ((())) () ((())()())')\n    [2, 3, 1, 3]\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate('(()()) ((())) () ((())()())') == [2, 3, 1, 3]\n    assert candidate('() (()) ((())) (((())))') == [1, 2, 3, 4]\n    assert candidate('(()(())((())))') == [4]",
        "ground_truth_code": "def parse_paren_group(s):\n        depth = 0\n        max_depth = 0\n        for c in s:\n            if c == '(':\n                depth += 1\n                max_depth = max(depth, max_depth)\n            else:\n                depth -= 1\n\n        return max_depth\n\n    return [parse_paren_group(x) for x in paren_string.split(' ') if x]\n",
        "generation": "def parse_paren_group(s):\n        depth = 0\n        max_depth = 0\n        for c in s:\n            if c == '(':\n                depth += 1\n                max_depth = max(depth, max_depth)\n            else:\n                depth -= 1\n\n        return max_depth\n\n    return [parse_paren_group(x) for x in paren_string.split(' ') if x]\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmpdey4hofr.py\", line 48, in <module>\\n    check(parse_nested_parens)\\n  File \"/tmp/tmpdey4hofr.py\", line 44, in check\\n    assert candidate(\\'(()()) ((())) () ((())()())\\') == [2, 3, 1, 3]\\nAssertionError\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "qwen-7b"
        }
    },
    {
        "question": "from typing import List\n\n\ndef separate_paren_groups(paren_string: str) -> List[str]:\n    \"\"\" Input to this function is a string containing multiple groups of nested parentheses. Your goal is to\n    separate those group into separate strings and return the list of those.\n    Separate groups are balanced (each open brace is properly closed) and not nested within each other\n    Ignore any spaces in the input string.\n    >>> separate_paren_groups('( ) (( )) (( )( ))')\n    ['()', '(())', '(()())']\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate('(()()) ((())) () ((())()())') == [\n        '(()())', '((()))', '()', '((())()())'\n    ]\n    assert candidate('() (()) ((())) (((())))') == [\n        '()', '(())', '((()))', '(((())))'\n    ]\n    assert candidate('(()(())((())))') == [\n        '(()(())((())))'\n    ]\n    assert candidate('( ) (( )) (( )( ))') == ['()', '(())', '(()())']",
        "ground_truth_code": "result = []\n    current_string = []\n    current_depth = 0\n\n    for c in paren_string:\n        if c == '(':\n            current_depth += 1\n            current_string.append(c)\n        elif c == ')':\n            current_depth -= 1\n            current_string.append(c)\n\n            if current_depth == 0:\n                result.append(''.join(current_string))\n                current_string.clear()\n\n    return result\n",
        "generation": "result = []\n    current_string = []\n    current_depth = 0\n\n    for c in paren_string:\n        if c == '(':\n            current_depth += 1\n            current_string.append(c)\n        elif c == ')':\n            current_depth -= 1\n            current_string.append(c)\n\n            if current_depth == 0:\n                result.append(''.join(current_string))\n                current_string.clear()\n\n    return result\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmpelxx7d63.py\", line 68, in <module>\\n    check(separate_paren_groups)\\n  File \"/tmp/tmpelxx7d63.py\", line 57, in check\\n    assert candidate(\\'(()()) ((())) () ((())()())\\') == [\\n  File \"/tmp/tmpelxx7d63.py\", line 36, in separate_paren_groups\\n    raise ValueError(\"Unmatched parentheses\")\\nValueError: Unmatched parentheses\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "internlm-20b"
        }
    },
    {
        "question": "from typing import List, Tuple\n\n\ndef sum_product(numbers: List[int]) -> Tuple[int, int]:\n    \"\"\" For a given list of integers, return a tuple consisting of a sum and a product of all the integers in a list.\n    Empty sum should be equal to 0 and empty product should be equal to 1.\n    >>> sum_product([])\n    (0, 1)\n    >>> sum_product([1, 2, 3, 4])\n    (10, 24)\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate([]) == (0, 1)\n    assert candidate([1, 1, 1]) == (3, 1)\n    assert candidate([100, 0]) == (100, 0)\n    assert candidate([3, 5, 7]) == (3 + 5 + 7, 3 * 5 * 7)\n    assert candidate([10]) == (10, 10)",
        "ground_truth_code": "sum_value = 0\n    prod_value = 1\n\n    for n in numbers:\n        sum_value += n\n        prod_value *= n\n    return sum_value, prod_value\n",
        "generation": "sum_value = 0\n    prod_value = 1\n\n    for n in numbers:\n        sum_value += n\n        prod_value *= n\n    return sum_value, prod_value\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmpgcoqg_zh.py\", line 17, in <module>\\n    def sum_product(numbers: List[int]) -> Tuple[int, int]:\\nTypeError: \\'type\\' object is not subscriptable\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "internlm-20b"
        }
    },
    {
        "question": "from typing import List, Tuple\n\n\ndef rolling_max(numbers: List[int]) -> List[int]:\n    \"\"\" From a given list of integers, generate a list of rolling maximum element found until given moment\n    in the sequence.\n    >>> rolling_max([1, 2, 3, 2, 3, 4, 2])\n    [1, 2, 3, 3, 3, 4, 4]\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate([]) == []\n    assert candidate([1, 2, 3, 4]) == [1, 2, 3, 4]\n    assert candidate([4, 3, 2, 1]) == [4, 4, 4, 4]\n    assert candidate([3, 2, 3, 100, 3]) == [3, 3, 3, 100, 100]",
        "ground_truth_code": "running_max = None\n    result = []\n\n    for n in numbers:\n        if running_max is None:\n            running_max = n\n        else:\n            running_max = max(running_max, n)\n\n        result.append(running_max)\n\n    return result\n",
        "generation": "running_max = None\n    result = []\n\n    for n in numbers:\n        if running_max is None:\n            running_max = n\n        else:\n            running_max = max(running_max, n)\n\n        result.append(running_max)\n\n    return result\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmp145tpl6y.py\", line 43, in <module>\\n    check(rolling_max)\\n  File \"/tmp/tmp145tpl6y.py\", line 38, in check\\n    assert candidate([]) == []\\n  File \"/tmp/tmp145tpl6y.py\", line 25, in rolling_max\\n    result = [numbers[0]]\\nIndexError: list index out of range\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "internlm-20b"
        }
    },
    {
        "question": "from typing import List\n\n\ndef intersperse(numbers: List[int], delimeter: int) -> List[int]:\n    \"\"\" Insert a number 'delimeter' between every two consecutive elements of input list `numbers'\n    >>> intersperse([], 4)\n    []\n    >>> intersperse([1, 2, 3], 4)\n    [1, 4, 2, 4, 3]\n    \"\"\"\n",
        "unit_test": "METADATA = {\n    'author': 'jt',\n    'dataset': 'test'\n}\n\n\ndef check(candidate):\n    assert candidate([], 7) == []\n    assert candidate([5, 6, 3, 2], 8) == [5, 8, 6, 8, 3, 8, 2]\n    assert candidate([2, 2, 2], 2) == [2, 2, 2, 2, 2]",
        "ground_truth_code": "if not numbers:\n        return []\n\n    result = []\n\n    for n in numbers[:-1]:\n        result.append(n)\n        result.append(delimeter)\n\n    result.append(numbers[-1])\n\n    return result\n",
        "generation": "if not numbers:\n        return []\n\n    result = []\n\n    for n in numbers[:-1]:\n        result.append(n)\n        result.append(delimeter)\n\n    result.append(numbers[-1])\n\n    return result\n",
        "exec_rest": "{'status': 'NOT PASSED', 'detail': 'Traceback (most recent call last):\\n  File \"/tmp/tmpyst7o6um.py\", line 30, in <module>\\n    assert intersperse([1, 2, 3], 4) == [1, 4, 2, 4, 3]\\nAssertionError\\n'}",
        "data_source": "humaneval",
        "metadata": {
            "quality": "super-high",
            "llm_name": "wizardlm-70b"
        }
    }
]