{
    "name": "multistep_arithmetic",
    "description": "Solve multi-step arithmetic problems",
    "instances": {
        "123": {
            "template": "\"To evaluate the expression '(-5 - 0 - 9)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '(-5 - 0 - 9)' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "-14",
            "subtask": "[] depth_levels and 3 operations."
        },
        "1043": {
            "template": "\"To evaluate the expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "83",
            "subtask": "[2, 2, 2] depth_levels and 3 operations."
        },
        "425": {
            "template": "\"To evaluate the expression '((-5 - -2 * 0) - (4 + 3 + -3))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '((-5 - -2 * 0) - (4 + 3 + -3))' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "-9",
            "subtask": "[2] depth_levels and 3 operations."
        },
        "37": {
            "template": "\"To evaluate the expression '(-9 * -5)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '(-9 * -5)' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "45",
            "subtask": "[] depth_levels and 2 operations."
        },
        "33": {
            "template": "\"To evaluate the expression '(-1 * -1)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '(-1 * -1)' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "1",
            "subtask": "[] depth_levels and 2 operations."
        },
        "175": {
            "template": "\"To evaluate the expression '(-9 + -2 - -2)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '(-9 + -2 - -2)' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "-9",
            "subtask": "[] depth_levels and 3 operations."
        },
        "1186": {
            "template": "\"To evaluate the expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "278",
            "subtask": "[2, 2, 2] depth_levels and 4 operations."
        },
        "923": {
            "template": "\"To evaluate the expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "-21",
            "subtask": "[2, 2, 2] depth_levels and 2 operations."
        },
        "1158": {
            "template": "\"To evaluate the expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "1528",
            "subtask": "[2, 2, 2] depth_levels and 4 operations."
        },
        "697": {
            "template": "\"To evaluate the expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]\" \n num_eval_steps = 0 \n while num_eval_steps < 4 and control_var.startswith(\" The next\"):\n \t\" one is '[subexpression] and evaluates to '[subeval]'.[control_var]\"\n \t num_eval_steps +=1 \n \" the full expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' evaluates to '[answer]'\"",
            "condition": "control_var in [\" The next\", \" To conclude, \"] and STOPS_AT (subexpression, \"'\") and not \"\\n\" in subexpression and STOPS_AT(subeval, \"'\") and STOPS_AT(answer, \"'\")",
            "target": "-1287",
            "subtask": "[2, 2] depth_levels and 2 operations."
        }
    }
}