decoder,distribution,executor,lmql_hash,model,model_result,model_stats,prediction,query,query_file,repo_hash,shots,target,task_name,timestamp
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '(((-7 - 0) + (-2 - 9)) * ((-5 * 6) + (5 * 2)))' you split it into multiple subexpressions. The first one is '(-7 - 0)'. and evaluates to '-7'.'. The next one is '(-2 - 9)', and evaluates to '-11'.'. The next one is '(-5 * 6)', and evaluates to '-30'.'. The next one is '5 * 2', and evaluates to '10'.'. The next one is '((-7 - 0) + (-2 - 9))', and evaluates to '-18'.'. The next the full expression '(((-7 - 0) + (-2 - 9)) * ((-5 * 6) + (5 * 2)))' evaluates to '-180'.'",,-180',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-7 - 0) + (-2 - 9)) * ((-5 * 6) + (5 * 2)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-7 - 0) + (-2 - 9)) * ((-5 * 6) + (5 * 2)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/600.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,360,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((-1 - 3) - (-5 * -5)) - ((0 * -3) - (5 * 5)))' you split it into multiple subexpressions. The first one is '-1 - 3'. and evaluates to '-4'.'. The next one is '-5 * -5' and evaluates to '25'.'. The next one is '0 * -3' and evaluates to '0'.'. The next one is '5 * 5' and evaluates to '25'.'. The next one is '-4 - 25' and evaluates to '-29'.'. The next the full expression '(((-1 - 3) - (-5 * -5)) - ((0 * -3) - (5 * 5)))' evaluates to '-29'.',"{'tokens': 33386, 'model': 'openai/text-davinci-003', 'req.': 239, 'avb': '1.16', 'step': 134}",-29',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-1 - 3) - (-5 * -5)) - ((0 * -3) - (5 * 5)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-1 - 3) - (-5 * -5)) - ((0 * -3) - (5 * 5)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/654.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-4,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-2 * 7 + -6) * (8 - 7 - 5)) - ((6 * -2 + 1) * (-8 * 3 * -1))) + (((9 - -7 - -7) - (0 + -7 - -3)) - ((8 * -2 + -6) * (-3 - 3 - 8))))' you split it into multiple subexpressions. The first one is '((-2 * 7 + -6) * (8 - 7 - 5))'. and evaluates to '-42'.'. The next one is '((6 * -2 + 1) * (-8 * 3 * -1))' and evaluates to '48'.'. The next one is '((9 - -7 - -7) - (0 + -7 - -3))' and evaluates to '-4'.'. The next one is '((8 * -2 + -6) * (-3 - 3 - 8))' and evaluates to '-144'.'. The next one is '-42 - 48 - 4 - 144' and evaluates to '-238'.'. The next the full expression '((((-2 * 7 + -6) * (8 - 7 - 5)) - ((6 * -2 + 1) * (-8 * 3 * -1))) + (((9 - -7 - -7) - (0 + -7 - -3)) - ((8 * -2 + -6) * (-3 - 3 - 8))))' evaluates to '-238'.',,-238',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-2 * 7 + -6) * (8 - 7 - 5)) - ((6 * -2 + 1) * (-8 * 3 * -1))) + (((9 - -7 - -7) - (0 + -7 - -3)) - ((8 * -2 + -6) * (-3 - 3 - 8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-2 * 7 + -6) * (8 - 7 - 5)) - ((6 * -2 + 1) * (-8 * 3 * -1))) + (((9 - -7 - -7) - (0 + -7 - -3)) - ((8 * -2 + -6) * (-3 - 3 - 8))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1009.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,63,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((5 + 0) - (0 + 4)) - ((-1 + 4) * (6 - 0)))' you split it into multiple subexpressions. The first one is '5 + 0' and evaluates to '5'.'. The next one is '0 + 4' and evaluates to '4'.'. The next one is '5 - 4' and evaluates to '1'.'. The next one is '-1 + 4' and evaluates to '3'.'. The next one is '6 - 0' and evaluates to '6'.'. The next the full expression '(((5 + 0) - (0 + 4)) - ((-1 + 4) * (6 - 0)))' evaluates to '-17'.',,-17',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((5 + 0) - (0 + 4)) - ((-1 + 4) * (6 - 0)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((5 + 0) - (0 + 4)) - ((-1 + 4) * (6 - 0)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/618.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-17,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' you split it into multiple subexpressions. The first one is '3 - -6 + -5'. and evaluates to '4'.'. The next one is '-6 * -5 - 5' and evaluates to '35'.'. The next one is '-4 * 0 - 6' and evaluates to '-6'.'. The next one is '4 + 5 - 8' and evaluates to '1'.'. The next one is '-6 * 2 + 9' and evaluates to '3'.'. The next the full expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' evaluates to '-541'.',,-541',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1043.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,83,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-4 * 5 + -5) - (-8 - 2 - 9)) * ((7 + 4 * 8) * (-5 - 2 - -2))) + (((-4 + 5 + -4) * (2 + 9 + -8)) + ((3 * 3 - -4) + (2 + -3 - 5))))' you split it into multiple subexpressions. The first one is '-4 * 5 + -5 - -8 - 2 - 9'. and evaluates to '-4'.'. The next one is '7 + 4 * 8 * -5 - 2 - -2' and evaluates to '-14'.'. The next one is '-4 + 5 + -4 * 2 + 9 + -8' and evaluates to '-2'.'. The next one is '3 * 3 - -4 + 2 + -3 - 5' and evaluates to '-3'.'. The next one is '((-4 * 5 + -5) - (-8 - 2 - 9)) * ((7 + 4 * 8) * (-5 - 2 - -2))' and evaluates to '56'.'. The next the full expression '((((-4 * 5 + -5) - (-8 - 2 - 9)) * ((7 + 4 * 8) * (-5 - 2 - -2))) + (((-4 + 5 + -4) * (2 + 9 + -8)) + ((3 * 3 - -4) + (2 + -3 - 5))))' evaluates to '51'.',,51',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-4 * 5 + -5) - (-8 - 2 - 9)) * ((7 + 4 * 8) * (-5 - 2 - -2))) + (((-4 + 5 + -4) * (2 + 9 + -8)) + ((3 * 3 - -4) + (2 + -3 - 5))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-4 * 5 + -5) - (-8 - 2 - 9)) * ((7 + 4 * 8) * (-5 - 2 - -2))) + (((-4 + 5 + -4) * (2 + 9 + -8)) + ((3 * 3 - -4) + (2 + -3 - 5))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1046.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,1168,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((9 + -4) * (-9 - 6)) * ((1 + 0) * (-1 * 4)))' you split it into multiple subexpressions. The first one is '9 + -4'. and evaluates to '5'.'. The next one is '-9 - 6' and evaluates to '-15'.'. The next one is '1 + 0' and evaluates to '1'.'. The next one is '-1 * 4' and evaluates to '-4'.'. The next one is '((5) * (-15)) * ((1) * (-4))' and evaluates to '-300'.'. The next the full expression '(((9 + -4) * (-9 - 6)) * ((1 + 0) * (-1 * 4)))' evaluates to '-300'.',,-300',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((9 + -4) * (-9 - 6)) * ((1 + 0) * (-1 * 4)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((9 + -4) * (-9 - 6)) * ((1 + 0) * (-1 * 4)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/616.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,300,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '(((-1 + -7) + (9 - 1)) * ((4 + 8) + (6 * 5)))' you split it into multiple subexpressions. The first one is '(-1 + -7)'. and evaluates to '-8'.'. The next one is '9 - 1' and evaluates to '8'.'. The next one is '4 + 8' and evaluates to '12'.'. The next one is '6 * 5' and evaluates to '30'.'. The next one is '(-8 + 8)', and evaluates to '0'.'. The next the full expression '(((-1 + -7) + (9 - 1)) * ((4 + 8) + (6 * 5)))' evaluates to '0 * 42''",,0 * 42',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-1 + -7) + (9 - 1)) * ((4 + 8) + (6 * 5)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-1 + -7) + (9 - 1)) * ((4 + 8) + (6 * 5)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/648.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,0,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((-7 * 1) + (3 * 7)) - ((-8 + 0) - (1 + 9)))' you split it into multiple subexpressions. The first one is '(-7 * 1)'. and evaluates to '-7'.'. The next one is '3 * 7' and evaluates to '21'.'. The next one is '-8 + 0' and evaluates to '-8'.'. The next one is '1 + 9' and evaluates to '10'.'. The next one is '-7 + 21' and evaluates to '14'.'. The next the full expression '(((-7 * 1) + (3 * 7)) - ((-8 + 0) - (1 + 9)))' evaluates to '14'.',,14',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-7 * 1) + (3 * 7)) - ((-8 + 0) - (1 + 9)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-7 * 1) + (3 * 7)) - ((-8 + 0) - (1 + 9)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/619.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,32,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((5 + 7 - -2 - 3) * (4 * 5 * 3 * -5))' you split it into multiple subexpressions. The first one is '5 + 7 - -2 - 3'. and evaluates to '13 - -2 - 3''. The next one is '13 - -2' and evaluates to '15'.'. The next one is '4 * 5 * 3 * -5' and evaluates to '-300'.'. The next one is '15 * -300' and evaluates to '-4500'.'. The next one is '((5 + 7 - -2 - 3) * (4 * 5 * 3 * -5))' and evaluates to '-4500'.'. The next the full expression '((5 + 7 - -2 - 3) * (4 * 5 * 3 * -5))' evaluates to '-4500'.',,-4500',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((5 + 7 - -2 - 3) * (4 * 5 * 3 * -5))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((5 + 7 - -2 - 3) * (4 * 5 * 3 * -5))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/591.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-3300,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-4 * 3 * 1) + (-2 * 3 + -4)) * ((6 - 5 - -8) - (6 + 5 * -6))) + (((7 * -4 - 8) * (0 - -4 * -6)) + ((6 - -2 * 9) - (7 + 3 * -8))))' you split it into multiple subexpressions. The first one is '-4 * 3 * 1'. and evaluates to '-12'.'. The next one is '-2 * 3 + -4' and evaluates to '-10'.'. The next one is '6 - 5 - -8' and evaluates to '9'.'. The next one is '6 + 5 * -6' and evaluates to '-36'.'. The next one is '7 * -4 - 8' and evaluates to '-36'.'. The next the full expression '((((-4 * 3 * 1) + (-2 * 3 + -4)) * ((6 - 5 - -8) - (6 + 5 * -6))) + (((7 * -4 - 8) * (0 - -4 * -6)) + ((6 - -2 * 9) - (7 + 3 * -8))))' evaluates to '-744'.',"{'tokens': 37905, 'model': 'openai/text-davinci-003', 'req.': 264, 'avb': '1.16', 'step': 123}",-744',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-4 * 3 * 1) + (-2 * 3 + -4)) * ((6 - 5 - -8) - (6 + 5 * -6))) + (((7 * -4 - 8) * (0 - -4 * -6)) + ((6 - -2 * 9) - (7 + 3 * -8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-4 * 3 * 1) + (-2 * 3 + -4)) * ((6 - 5 - -8) - (6 + 5 * -6))) + (((7 * -4 - 8) * (0 - -4 * -6)) + ((6 - -2 * 9) - (7 + 3 * -8))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1052.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,179,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((2 + 7) - (4 - -1)) + ((1 - 5) + (1 + 8)))' you split it into multiple subexpressions. The first one is '2 + 7' and evaluates to '9'.'. The next one is '4 - -1' and evaluates to '5'.'. The next one is '1 - 5' and evaluates to '-4'.'. The next one is '1 + 8' and evaluates to '9'.'. The next one is '9 - 5' and evaluates to '4'.'. The next the full expression '(((2 + 7) - (4 - -1)) + ((1 - 5) + (1 + 8)))' evaluates to '12'.',"{'tokens': 43160, 'model': 'openai/text-davinci-003', 'req.': 291, 'avb': '1.16', 'step': 232}",12',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((2 + 7) - (4 - -1)) + ((1 - 5) + (1 + 8)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((2 + 7) - (4 - -1)) + ((1 - 5) + (1 + 8)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/658.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,9,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((-8 + 6) - (7 - 4)) * ((5 - -7) * (9 + 2)))' you split it into multiple subexpressions. The first one is '(-8 + 6)'. and evaluates to '2'.'. The next one is '7 - 4' and evaluates to '3'.'. The next one is '5 - -7' and evaluates to '12'.'. The next one is '9 + 2' and evaluates to '11'.'. The next one is '2 * 12' and evaluates to '24'.'. The next the full expression '(((-8 + 6) - (7 - 4)) * ((5 - -7) * (9 + 2)))' evaluates to '-24'.',"{'tokens': 46582, 'model': 'openai/text-davinci-003', 'req.': 310, 'avb': '1.16', 'step': 179}",-24',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-8 + 6) - (7 - 4)) * ((5 - -7) * (9 + 2)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-8 + 6) - (7 - 4)) * ((5 - -7) * (9 + 2)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/692.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-660,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((-1 * -3) * (8 * -3)) + ((-9 + 4) - (-3 - -3)))' you split it into multiple subexpressions. The first one is '(-1 * -3)'. and evaluates to '3'.'. The next one is '8 * -3' and evaluates to '-24'.'. The next one is '-9 + 4' and evaluates to '-5'.'. The next one is '-3 - -3' and evaluates to '0'.'. The next one is '3 * -24' and evaluates to '-72'.'. The next the full expression '(((-1 * -3) * (8 * -3)) + ((-9 + 4) - (-3 - -3)))' evaluates to '-72'.',"{'tokens': 67103, 'model': 'openai/text-davinci-003', 'req.': 443, 'avb': '1.19', 'step': 35}",-72',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-1 * -3) * (8 * -3)) + ((-9 + 4) - (-3 - -3)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-1 * -3) * (8 * -3)) + ((-9 + 4) - (-3 - -3)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/698.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-77,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-6 + 8 - 0) - (-7 * 8 * -2)) - ((-9 - 3 + 2) * (8 + 3 * 0))) + (((-4 + 0 * -1) * (4 * -3 * -8)) - ((-4 + -5 + 9) * (-4 - 0 * 4))))' you split it into multiple subexpressions. The first one is '-6 + 8 - 0'. and evaluates to '2'.'. The next one is '-7 * 8 * -2' and evaluates to '112'.'. The next one is '-9 - 3 + 2' and evaluates to '-10'.'. The next one is '8 + 3 * 0' and evaluates to '8'.'. The next one is '-4 + 0 * -1' and evaluates to '-4'.'. The next the full expression '((((-6 + 8 - 0) - (-7 * 8 * -2)) - ((-9 - 3 + 2) * (8 + 3 * 0))) + (((-4 + 0 * -1) * (4 * -3 * -8)) - ((-4 + -5 + 9) * (-4 - 0 * 4))))' evaluates to '-856'.',"{'tokens': 47143, 'model': 'openai/text-davinci-003', 'req.': 313, 'avb': '1.16', 'step': 238}",-856',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-6 + 8 - 0) - (-7 * 8 * -2)) - ((-9 - 3 + 2) * (8 + 3 * 0))) + (((-4 + 0 * -1) * (4 * -3 * -8)) - ((-4 + -5 + 9) * (-4 - 0 * 4))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-6 + 8 - 0) - (-7 * 8 * -2)) - ((-9 - 3 + 2) * (8 + 3 * 0))) + (((-4 + 0 * -1) * (4 * -3 * -8)) - ((-4 + -5 + 9) * (-4 - 0 * 4))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1077.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-414,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' you split it into multiple subexpressions. The first one is '(-8 * -9) * (-4 * 6)'. and evaluates to '288'.'. The next one is '(-7 * -7) * (-8 + -1)', and evaluates to '49'.'. The next one is '288 - 49', and evaluates to '239'.'. The next one is '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))', and evaluates to '239'.'. The next one is '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))', and evaluates to '239'.'. The next the full expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' evaluates to '239'.'","{'tokens': 48916, 'model': 'openai/text-davinci-003', 'req.': 327, 'avb': '1.16', 'step': 133}",239',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/697.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-1287,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((9 * -8 - 7) + (-4 * -1 * -5)) - ((5 + 9 - -6) - (-2 - 3 * -3))) * (((2 - -1 * -2) * (-6 - 3 * -3)) - ((2 - -7 * 2) * (5 - 0 - 3))))' you split it into multiple subexpressions. The first one is '9 * -8 - 7'. and evaluates to '-55'.'. The next one is '-4 * -1 * -5' and evaluates to '20'.'. The next one is '5 + 9 - -6' and evaluates to '18'.'. The next one is '-2 - 3 * -3' and evaluates to '7'.'. The next one is '2 - -1 * -2' and evaluates to '4'.'. The next the full expression '((((9 * -8 - 7) + (-4 * -1 * -5)) - ((5 + 9 - -6) - (-2 - 3 * -3))) * (((2 - -1 * -2) * (-6 - 3 * -3)) - ((2 - -7 * 2) * (5 - 0 - 3))))' evaluates to '-1400'.',"{'tokens': 72428, 'model': 'openai/text-davinci-003', 'req.': 472, 'avb': '1.19', 'step': 152}",-1400',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((9 * -8 - 7) + (-4 * -1 * -5)) - ((5 + 9 - -6) - (-2 - 3 * -3))) * (((2 - -1 * -2) * (-6 - 3 * -3)) - ((2 - -7 * 2) * (5 - 0 - 3))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((9 * -8 - 7) + (-4 * -1 * -5)) - ((5 + 9 - -6) - (-2 - 3 * -3))) * (((2 - -1 * -2) * (-6 - 3 * -3)) - ((2 - -7 * 2) * (5 - 0 - 3))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1084.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,3584,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((3 - 7 - 7) - (4 + -2 - 3)) - ((6 - 6 - -6) * (-4 - -4 - -5))) * (((-1 * -4 - 6) * (1 + 5 - -1)) * ((9 + 9 - -1) * (-6 - -1 * 5))))' you split it into multiple subexpressions. The first one is '3 - 7 - 7'. and evaluates to '-11'.'. The next one is '4 + -2 - 3' and evaluates to '-1'.'. The next one is '6 - 6 - -6' and evaluates to '12'.'. The next one is '-4 - -4 - -5' and evaluates to '-1'.'. The next one is '-1 * -4 - 6' and evaluates to '2'.'. The next the full expression '((((3 - 7 - 7) - (4 + -2 - 3)) - ((6 - 6 - -6) * (-4 - -4 - -5))) * (((-1 * -4 - 6) * (1 + 5 - -1)) * ((9 + 9 - -1) * (-6 - -1 * 5))))' evaluates to '-17280'.',"{'tokens': 52279, 'model': 'openai/text-davinci-003', 'req.': 349, 'avb': '1.17', 'step': 122}",-17280',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((3 - 7 - 7) - (4 + -2 - 3)) - ((6 - 6 - -6) * (-4 - -4 - -5))) * (((-1 * -4 - 6) * (1 + 5 - -1)) * ((9 + 9 - -1) * (-6 - -1 * 5))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((3 - 7 - 7) - (4 + -2 - 3)) - ((6 - 6 - -6) * (-4 - -4 - -5))) * (((-1 * -4 - 6) * (1 + 5 - -1)) * ((9 + 9 - -1) * (-6 - -1 * 5))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1081.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-10640,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((-9 + 7 * -9) + (3 - -1 * -7)) - ((1 - 2 + 3) + (0 * -6 * 7)))' you split it into multiple subexpressions. The first one is '(-9 + 7 * -9)'. and evaluates to '-72'.'. The next one is '3 - -1 * -7' and evaluates to '24'.'. The next one is '1 - 2 + 3' and evaluates to '2'.'. The next one is '0 * -6 * 7' and evaluates to '0'.'. The next one is '-72 + 24' and evaluates to '-48'.'. The next the full expression '(((-9 + 7 * -9) + (3 - -1 * -7)) - ((1 - 2 + 3) + (0 * -6 * 7)))' evaluates to '-48'.',"{'tokens': 83091, 'model': 'openai/text-davinci-003', 'req.': 534, 'avb': '1.20', 'step': 118}",-48',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-9 + 7 * -9) + (3 - -1 * -7)) - ((1 - 2 + 3) + (0 * -6 * 7)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-9 + 7 * -9) + (3 - -1 * -7)) - ((1 - 2 + 3) + (0 * -6 * 7)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/746.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-78,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((9 * 0 - 8) + (5 * -7 * 1)) - ((8 + -4 * 3) + (-5 - 3 - -2))) + (((5 * -9 - -8) - (9 * 4 - -1)) + ((-2 + 6 - 0) + (-4 - 7 + 6))))' you split it into multiple subexpressions. The first one is '9 * 0 - 8'. and evaluates to '-8'.'. The next one is '5 * -7 * 1' and evaluates to '-35'.'. The next one is '8 + -4 * 3' and evaluates to '-8'.'. The next one is '-5 - 3 - -2' and evaluates to '-4'.'. The next one is '5 * -9 - -8' and evaluates to '-43'.'. The next the full expression '((((9 * 0 - 8) + (5 * -7 * 1)) - ((8 + -4 * 3) + (-5 - 3 - -2))) + (((5 * -9 - -8) - (9 * 4 - -1)) + ((-2 + 6 - 0) + (-4 - 7 + 6))))' evaluates to '-87'.',"{'tokens': 44747, 'model': 'openai/text-davinci-003', 'req.': 300, 'avb': '1.16', 'step': 116}",-87',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((9 * 0 - 8) + (5 * -7 * 1)) - ((8 + -4 * 3) + (-5 - 3 - -2))) + (((5 * -9 - -8) - (9 * 4 - -1)) + ((-2 + 6 - 0) + (-4 - 7 + 6))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((9 * 0 - 8) + (5 * -7 * 1)) - ((8 + -4 * 3) + (-5 - 3 - -2))) + (((5 * -9 - -8) - (9 * 4 - -1)) + ((-2 + 6 - 0) + (-4 - 7 + 6))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1056.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-108,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-9 - 6 * -8 - 6) - (3 * 0 + -2 - -5)) - ((-4 - 7 - 7 + 7) + (7 + 3 * -3 - -4))) + (((4 * -1 * 8 - 0) - (-7 + -7 + -5 * -7)) + ((-7 * -6 * -8 - -5) * (-8 * 5 * 0 - -9))))' you split it into multiple subexpressions. The first one is '-9 - 6 * -8 - 6'. and evaluates to '-9 - 48 - 6''. The next one is '3 * 0 + -2 - -5' and evaluates to '-2 - -5''. The next one is '-4 - 7 - 7 + 7' and evaluates to '-4 - 7 + 7''. The next one is '7 + 3 * -3 - -4' and evaluates to '7 - 9 - -4''. The next one is '4 * -1 * 8 - 0' and evaluates to '-32 - 0''. The next the full expression '((((-9 - 6 * -8 - 6) - (3 * 0 + -2 - -5)) - ((-4 - 7 - 7 + 7) + (7 + 3 * -3 - -4))) + (((4 * -1 * 8 - 0) - (-7 + -7 + -5 * -7)) + ((-7 * -6 * -8 - -5) * (-8 * 5 * 0 - -9))))' evaluates to '-90'.',"{'tokens': 95425, 'model': 'openai/text-davinci-003', 'req.': 599, 'avb': '1.20', 'step': 186}",-90',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-9 - 6 * -8 - 6) - (3 * 0 + -2 - -5)) - ((-4 - 7 - 7 + 7) + (7 + 3 * -3 - -4))) + (((4 * -1 * 8 - 0) - (-7 + -7 + -5 * -7)) + ((-7 * -6 * -8 - -5) * (-8 * 5 * 0 - -9))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-9 - 6 * -8 - 6) - (3 * 0 + -2 - -5)) - ((-4 - 7 - 7 + 7) + (7 + 3 * -3 - -4))) + (((4 * -1 * 8 - 0) - (-7 + -7 + -5 * -7)) + ((-7 * -6 * -8 - -5) * (-8 * 5 * 0 - -9))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1125.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-2993,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '(5 - 1 + -9)' you split it into multiple subexpressions. The first one is '5 - 1', and evaluates to '4'.'. The next one is '4 + -9', and evaluates to '-5'.'. The next one is '-5 + -9', and evaluates to '-14'.'. The next one is '-14 + -9', and evaluates to '-23'.'. The next one is '-23 + -9', and evaluates to '-32'.'. The next the full expression '(5 - 1 + -9)' evaluates to '-32'.'","{'tokens': 78640, 'model': 'openai/text-davinci-003', 'req.': 505, 'avb': '1.20', 'step': 116}",-32',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(5 - 1 + -9)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(5 - 1 + -9)' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/110.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-5,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((2 + -7 - -1) - (-8 - -7 - -6)) + ((9 + -3 * -1) - (-1 * 2 * -8)))' you split it into multiple subexpressions. The first one is '2 + -7 - -1'. and evaluates to '2 + -7 + 1''. The next one is '-8 - -7 - -6' and evaluates to '-8 - -7 + 6'.'. The next one is '9 + -3 * -1' and evaluates to '9 - 3'.'. The next one is '-1 * 2 * -8' and evaluates to '-16'.'. The next one is '((2 + -7 + 1) - (-8 - -7 + 6)) + (9 - 3 - -16)' and evaluates to '-1 + 6 + 12''. The next the full expression '(((2 + -7 - -1) - (-8 - -7 - -6)) + ((9 + -3 * -1) - (-1 * 2 * -8)))' evaluates to '17'.',,17',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((2 + -7 - -1) - (-8 - -7 - -6)) + ((9 + -3 * -1) - (-1 * 2 * -8)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((2 + -7 - -1) - (-8 - -7 - -6)) + ((9 + -3 * -1) - (-1 * 2 * -8)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/754.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-13,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '(((-8 - -5 + 1) + (-7 * 7 - -9)) * ((4 + 9 * 1) * (-8 + -7 - -3)))' you split it into multiple subexpressions. The first one is '(-8 - -5 + 1)'. and evaluates to '-2'.'. The next one is '(-7 * 7 - -9)', and evaluates to '42'.'. The next one is '4 + 9 * 1', and evaluates to '13'.'. The next one is '-8 + -7 - -3', and evaluates to '-2'.'. The next one is '-2 + 42 * 13 -2', and evaluates to '532'.'. The next the full expression '(((-8 - -5 + 1) + (-7 * 7 - -9)) * ((4 + 9 * 1) * (-8 + -7 - -3)))' evaluates to '532'.'","{'tokens': 110192, 'model': 'openai/text-davinci-003', 'req.': 692, 'avb': '1.18', 'step': 185}",532',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-8 - -5 + 1) + (-7 * 7 - -9)) * ((4 + 9 * 1) * (-8 + -7 - -3)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-8 - -5 + 1) + (-7 * 7 - -9)) * ((4 + 9 * 1) * (-8 + -7 - -3)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/764.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,6552,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '((((-8 - 6 * 1 - -4) * (6 + -7 + -7 - 7)) * ((-8 - 0 * 6 * 6) - (-1 + 9 - -9 - 6))) - (((8 * -9 - 9 - 9) * (-2 + -1 * 4 + 7)) - ((6 - -8 * 0 - 9) + (4 * 1 + -3 * 7))))' you split it into multiple subexpressions. The first one is '-8 - 6 * 1 - -4'. and evaluates to '-8 - 6 * 1 + 4''. The next one is '6 + -7 + -7 - 7' and evaluates to '-8'.'. The next one is '-8 - 0 * 6 * 6' and evaluates to '-8 - 0 * 6 * 6''. The next one is '-1 + 9 - -9 - 6' and evaluates to '3'.'. The next one is '8 * -9 - 9 - 9' and evaluates to '-90'.'. The next the full expression '((((-8 - 6 * 1 - -4) * (6 + -7 + -7 - 7)) * ((-8 - 0 * 6 * 6) - (-1 + 9 - -9 - 6))) - (((8 * -9 - 9 - 9) * (-2 + -1 * 4 + 7)) - ((6 - -8 * 0 - 9) + (4 * 1 + -3 * 7))))' evaluates to '-7,890'.'","{'tokens': 90299, 'model': 'openai/text-davinci-003', 'req.': 572, 'avb': '1.20', 'step': 182}","-7,890'","BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-8 - 6 * 1 - -4) * (6 + -7 + -7 - 7)) * ((-8 - 0 * 6 * 6) - (-1 + 9 - -9 - 6))) - (((8 * -9 - 9 - 9) * (-2 + -1 * 4 + 7)) - ((6 - -8 * 0 - 9) + (4 * 1 + -3 * 7))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-8 - 6 * 1 - -4) * (6 + -7 + -7 - 7)) * ((-8 - 0 * 6 * 6) - (-1 + 9 - -9 - 6))) - (((8 * -9 - 9 - 9) * (-2 + -1 * 4 + 7)) - ((6 - -8 * 0 - 9) + (4 * 1 + -3 * 7))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1119.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-2780,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((4 - 2 - 2) * (4 - -1 - 7)) + ((-7 - 9 + 2) * (-6 - 3 - 0)))' you split it into multiple subexpressions. The first one is '4 - 2 - 2'. and evaluates to '0'.'. The next one is '4 - -1 - 7' and evaluates to '10'.'. The next one is '-7 - 9 + 2' and evaluates to '-14'.'. The next one is '-6 - 3 - 0' and evaluates to '-9'.'. The next one is '((0) * (10)) + ((-14) * (-9))' and evaluates to '126'.'. The next the full expression '(((4 - 2 - 2) * (4 - -1 - 7)) + ((-7 - 9 + 2) * (-6 - 3 - 0)))' evaluates to '126'.',"{'tokens': 78177, 'model': 'openai/text-davinci-003', 'req.': 502, 'avb': '1.20', 'step': 185}",126',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((4 - 2 - 2) * (4 - -1 - 7)) + ((-7 - 9 + 2) * (-6 - 3 - 0)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((4 - 2 - 2) * (4 - -1 - 7)) + ((-7 - 9 + 2) * (-6 - 3 - 0)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/708.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,126,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((-5 + -5 + -4) - (-8 + -4 + -7)) + ((-9 * -5 + 9) + (9 * 2 - -5)))' you split it into multiple subexpressions. The first one is '(-5 + -5 + -4) - (-8 + -4 + -7)'. and evaluates to '-10 - -15''. The next one is '-9 * -5 + 9' and evaluates to '45'.'. The next one is '9 * 2 - -5' and evaluates to '23'.'. The next one is '-10 - -15 + 45 + 23' and evaluates to '53'.'. The next one is '((-5 + -5 + -4) - (-8 + -4 + -7)) + ((-9 * -5 + 9) + (9 * 2 - -5))' and evaluates to '53'.'. The next the full expression '(((-5 + -5 + -4) - (-8 + -4 + -7)) + ((-9 * -5 + 9) + (9 * 2 - -5)))' evaluates to '53'.',"{'tokens': 118829, 'model': 'openai/text-davinci-003', 'req.': 745, 'avb': '1.17', 'step': 143}",53',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-5 + -5 + -4) - (-8 + -4 + -7)) + ((-9 * -5 + 9) + (9 * 2 - -5)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-5 + -5 + -4) - (-8 + -4 + -7)) + ((-9 * -5 + 9) + (9 * 2 - -5)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/765.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,82,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((-2 - 2 * 7) + (8 * -6 + -1)) - ((-8 + -4 * -4) * (-9 * -9 + -4)))' you split it into multiple subexpressions. The first one is '-2 - 2 * 7'. and evaluates to '-16'.'. The next one is '8 * -6 + -1' and evaluates to '-49'.'. The next one is '-8 + -4 * -4' and evaluates to '0'.'. The next one is '-9 * -9 + -4' and evaluates to '-85'.'. The next one is '((-16) + (-49)) - ((0) * (-85))' and evaluates to '-145'.'. The next the full expression '(((-2 - 2 * 7) + (8 * -6 + -1)) - ((-8 + -4 * -4) * (-9 * -9 + -4)))' evaluates to '-145'.',"{'tokens': 132024, 'model': 'openai/text-davinci-003', 'req.': 823, 'avb': '1.16', 'step': 237}",-145',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((-2 - 2 * 7) + (8 * -6 + -1)) - ((-8 + -4 * -4) * (-9 * -9 + -4)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((-2 - 2 * 7) + (8 * -6 + -1)) - ((-8 + -4 * -4) * (-9 * -9 + -4)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/770.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-681,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((3 * 0 + 4 * 2) * (0 * -1 * -8 + -2)) + ((-2 + -4 - 3 + -4) * (6 - 7 + 2 - 9))) - (((2 - -4 + -5 + -7) - (-2 - 5 + 0 * -1)) - ((-5 * -1 - 9 + -9) * (-9 - 1 + -3 - 5))))' you split it into multiple subexpressions. The first one is '((3 * 0 + 4 * 2) * (0 * -1 * -8 + -2))'. and evaluates to '-24'.'. The next one is '((-2 + -4 - 3 + -4) * (6 - 7 + 2 - 9))' and evaluates to '-48'.'. The next one is '((2 - -4 + -5 + -7) - (-2 - 5 + 0 * -1))' and evaluates to '-4'.'. The next one is '((-5 * -1 - 9 + -9) * (-9 - 1 + -3 - 5))' and evaluates to '-360'.'. The next one is '-24 - 48 - 4 - 360' and evaluates to '-436'.'. The next the full expression '((((3 * 0 + 4 * 2) * (0 * -1 * -8 + -2)) + ((-2 + -4 - 3 + -4) * (6 - 7 + 2 - 9))) - (((2 - -4 + -5 + -7) - (-2 - 5 + 0 * -1)) - ((-5 * -1 - 9 + -9) * (-9 - 1 + -3 - 5))))' evaluates to '-436'.',"{'tokens': 113458, 'model': 'openai/text-davinci-003', 'req.': 712, 'avb': '1.18', 'step': 184}",-436',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((3 * 0 + 4 * 2) * (0 * -1 * -8 + -2)) + ((-2 + -4 - 3 + -4) * (6 - 7 + 2 - 9))) - (((2 - -4 + -5 + -7) - (-2 - 5 + 0 * -1)) - ((-5 * -1 - 9 + -9) * (-9 - 1 + -3 - 5))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((3 * 0 + 4 * 2) * (0 * -1 * -8 + -2)) + ((-2 + -4 - 3 + -4) * (6 - 7 + 2 - 9))) - (((2 - -4 + -5 + -7) - (-2 - 5 + 0 * -1)) - ((-5 * -1 - 9 + -9) * (-9 - 1 + -3 - 5))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1129.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,321,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((9 - -6 * -7 + 0) - (-3 * 9 - 4 + 1)) * ((7 * 1 - 4 - -4) * (-1 - -7 + 2 * -6))) + (((0 - -3 - -3 * 8) + (8 + 1 + 7 - -1)) + ((6 + -7 * -2 - -4) * (-4 + -5 + -1 + 9))))' you split it into multiple subexpressions. The first one is '9 - -6 * -7 + 0'. and evaluates to '51'.'. The next one is '-3 * 9 - 4 + 1' and evaluates to '-20'.'. The next one is '7 * 1 - 4 - -4' and evaluates to '4'.'. The next one is '-1 - -7 + 2 * -6' and evaluates to '-17'.'. The next one is '0 - -3 - -3 * 8' and evaluates to '-19'.'. The next the full expression '((((9 - -6 * -7 + 0) - (-3 * 9 - 4 + 1)) * ((7 * 1 - 4 - -4) * (-1 - -7 + 2 * -6))) + (((0 - -3 - -3 * 8) + (8 + 1 + 7 - -1)) + ((6 + -7 * -2 - -4) * (-4 + -5 + -1 + 9))))' evaluates to '-1445'.',"{'tokens': 124621, 'model': 'openai/text-davinci-003', 'req.': 779, 'avb': '1.17', 'step': 183}",-1445',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((9 - -6 * -7 + 0) - (-3 * 9 - 4 + 1)) * ((7 * 1 - 4 - -4) * (-1 - -7 + 2 * -6))) + (((0 - -3 - -3 * 8) + (8 + 1 + 7 - -1)) + ((6 + -7 * -2 - -4) * (-4 + -5 + -1 + 9))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((9 - -6 * -7 + 0) - (-3 * 9 - 4 + 1)) * ((7 * 1 - 4 - -4) * (-1 - -7 + 2 * -6))) + (((0 - -3 - -3 * 8) + (8 + 1 + 7 - -1)) + ((6 + -7 * -2 - -4) * (-4 + -5 + -1 + 9))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1142.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,146,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '((((8 * 7 * -3 + 9) * (-3 * 5 * -8 * 9)) + ((5 + 5 * 2 * -3) * (1 + -7 + -8 * -3))) - (((-5 * 2 - 7 * -2) * (-8 + -4 + 3 + -2)) * ((5 + 8 - 7 - 3) + (-7 * -3 + 2 * 1))))' you split it into multiple subexpressions. The first one is '8 * 7 * -3 + 9'. and evaluates to '-153'.'. The next one is '-3 * 5 * -8 * 9' and evaluates to '1080'.'. The next one is '5 + 5 * 2 * -3' and evaluates to '-10'.'. The next one is '1 + -7 + -8 * -3' and evaluates to '-22'.'. The next one is '-5 * 2 - 7 * -2' and evaluates to '-3'.'. The next the full expression '((((8 * 7 * -3 + 9) * (-3 * 5 * -8 * 9)) + ((5 + 5 * 2 * -3) * (1 + -7 + -8 * -3))) - (((-5 * 2 - 7 * -2) * (-8 + -4 + 3 + -2)) * ((5 + 8 - 7 - 3) + (-7 * -3 + 2 * 1))))' evaluates to '-14,976'.'","{'tokens': 136089, 'model': 'openai/text-davinci-003', 'req.': 844, 'avb': '1.16', 'step': 112}","-14,976'","BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((8 * 7 * -3 + 9) * (-3 * 5 * -8 * 9)) + ((5 + 5 * 2 * -3) * (1 + -7 + -8 * -3))) - (((-5 * 2 - 7 * -2) * (-8 + -4 + 3 + -2)) * ((5 + 8 - 7 - 3) + (-7 * -3 + 2 * 1))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((8 * 7 * -3 + 9) * (-3 * 5 * -8 * 9)) + ((5 + 5 * 2 * -3) * (1 + -7 + -8 * -3))) - (((-5 * 2 - 7 * -2) * (-8 + -4 + 3 + -2)) * ((5 + 8 - 7 - 3) + (-7 * -3 + 2 * 1))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1144.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-171026,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((1 - 4 - 1 - 7) * (6 + 3 + 1 * -4)) + ((-4 + -5 * 8 - 5) - (-5 - -6 - -3 - 6)))' you split it into multiple subexpressions. The first one is '1 - 4 - 1 - 7'. and evaluates to '-11'.'. The next one is '6 + 3 + 1 * -4' and evaluates to '-5'.'. The next one is '-4 + -5 * 8 - 5' and evaluates to '-37'.'. The next one is '-5 - -6 - -3 - 6' and evaluates to '2'.'. The next one is '-11 * -5' and evaluates to '55'.'. The next the full expression '(((1 - 4 - 1 - 7) * (6 + 3 + 1 * -4)) + ((-4 + -5 * 8 - 5) - (-5 - -6 - -3 - 6)))' evaluates to '53'.',"{'tokens': 144461, 'model': 'openai/text-davinci-003', 'req.': 890, 'avb': '1.16', 'step': 134}",53',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((1 - 4 - 1 - 7) * (6 + 3 + 1 * -4)) + ((-4 + -5 * 8 - 5) - (-5 - -6 - -3 - 6)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((1 - 4 - 1 - 7) * (6 + 3 + 1 * -4)) + ((-4 + -5 * 8 - 5) - (-5 - -6 - -3 - 6)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/828.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-102,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' you split it into multiple subexpressions. The first one is '7 + 6 + -2 * 5'. and evaluates to '7 + 6 + -10''. The next one is '9 + 5 + -5 + 6' and evaluates to '15'.'. The next one is '1 + -4 - 7 + 7' and evaluates to '1 - 7 + 7''. The next one is '-5 + -3 - -4 - 3' and evaluates to '-5 - -1 - 3''.'. The next one is '1 - -8 - 9 + 6' and evaluates to '1 + 8 + 9 + 6''.'. The next the full expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' evaluates to '-7 - 8 - 54'.',"{'tokens': 149279, 'model': 'openai/text-davinci-003', 'req.': 913, 'avb': '1.16', 'step': 151}",-7 - 8 - 54',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1158.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,1528,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((3 * 9 - -7 - -5) + (-3 + -8 + 0 - 2)) - ((-7 - 0 + -1 + -7) + (-2 - 7 * 6 - 1))) - (((-1 * 5 * 8 + 5) - (-8 - 5 - 9 - 3)) - ((1 - -8 + 3 - -9) - (-5 + -3 + 3 * -4))))' you split it into multiple subexpressions. The first one is '3 * 9 - -7 - -5'. and evaluates to '25'.'. The next one is '-3 + -8 + 0 - 2' and evaluates to '-13'.'. The next one is '-7 - 0 + -1 + -7' and evaluates to '-15'.'. The next one is '-2 - 7 * 6 - 1' and evaluates to '-47'.'. The next one is '-1 * 5 * 8 + 5' and evaluates to '37'.'. The next the full expression '((((3 * 9 - -7 - -5) + (-3 + -8 + 0 - 2)) - ((-7 - 0 + -1 + -7) + (-2 - 7 * 6 - 1))) - (((-1 * 5 * 8 + 5) - (-8 - 5 - 9 - 3)) - ((1 - -8 + 3 - -9) - (-5 + -3 + 3 * -4))))' evaluates to '-90'.',"{'tokens': 156964, 'model': 'openai/text-davinci-003', 'req.': 953, 'avb': '1.16', 'step': 149}",-90',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((3 * 9 - -7 - -5) + (-3 + -8 + 0 - 2)) - ((-7 - 0 + -1 + -7) + (-2 - 7 * 6 - 1))) - (((-1 * 5 * 8 + 5) - (-8 - 5 - 9 - 3)) - ((1 - -8 + 3 - -9) - (-5 + -3 + 3 * -4))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((3 * 9 - -7 - -5) + (-3 + -8 + 0 - 2)) - ((-7 - 0 + -1 + -7) + (-2 - 7 * 6 - 1))) - (((-1 * 5 * 8 + 5) - (-8 - 5 - 9 - 3)) - ((1 - -8 + 3 - -9) - (-5 + -3 + 3 * -4))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1165.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,137,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(-8 - -7)' you split it into multiple subexpressions. The first one is '-8'. and evaluates to '-8'.'. The next one is '-7' and evaluates to '-7'.'. The next one is '-8 - -7' and evaluates to '1'.'. The next one is '(-8 - -7)' and evaluates to '1'.'. The next one is '(-8 - -7)' and evaluates to '1'.'. The next the full expression '(-8 - -7)' evaluates to '1'.',"{'tokens': 164893, 'model': 'openai/text-davinci-003', 'req.': 999, 'avb': '1.16', 'step': 197}",1',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(-8 - -7)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(-8 - -7)' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/85.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-1,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((8 - 0 + 0 + -7) * (-1 - 9 - 4 + -7)) - ((-9 - -1 + -8 * 6) * (9 + 5 - 1 + -3)))' you split it into multiple subexpressions. The first one is '8 - 0 + 0 + -7'. and evaluates to '1'.'. The next one is '-1 - 9 - 4 + -7' and evaluates to '-21'.'. The next one is '-9 - -1 + -8 * 6' and evaluates to '-53'.'. The next one is '9 + 5 - 1 + -3' and evaluates to '10'.'. The next one is '((1) * (-21)) - ((-53) * (10))' and evaluates to '-2313'.'. The next the full expression '(((8 - 0 + 0 + -7) * (-1 - 9 - 4 + -7)) - ((-9 - -1 + -8 * 6) * (9 + 5 - 1 + -3)))' evaluates to '-2313'.',"{'tokens': 150460, 'model': 'openai/text-davinci-003', 'req.': 919, 'avb': '1.16', 'step': 228}",-2313',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((8 - 0 + 0 + -7) * (-1 - 9 - 4 + -7)) - ((-9 - -1 + -8 * 6) * (9 + 5 - 1 + -3)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((8 - 0 + 0 + -7) * (-1 - 9 - 4 + -7)) - ((-9 - -1 + -8 * 6) * (9 + 5 - 1 + -3)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/839.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,539,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '((((6 - 7 + -3 + 1) + (-8 * 9 - -5 * 9)) * ((-4 * 4 + -8 + 1) - (-3 + 4 - -9 - 2))) * (((-5 - -2 * -6 * 2) - (0 - 6 * -2 * -2)) + ((-4 * -2 + 0 + 1) + (-7 - -2 - 2 + 6))))' you split it into multiple subexpressions. The first one is '6 - 7 + -3 + 1'. and evaluates to '-3'.'. The next one is '-8 * 9 - -5 * 9' and evaluates to '-27'.'. The next one is '-4 * 4 + -8 + 1' and evaluates to '-29'.'. The next one is '-3 + 4 - -9 - 2' and evaluates to '2'.'. The next one is '-5 - -2 * -6 * 2' and evaluates to '-17'.'. The next the full expression '((((6 - 7 + -3 + 1) + (-8 * 9 - -5 * 9)) * ((-4 * 4 + -8 + 1) - (-3 + 4 - -9 - 2))) * (((-5 - -2 * -6 * 2) - (0 - 6 * -2 * -2)) + ((-4 * -2 + 0 + 1) + (-7 - -2 - 2 + 6))))' evaluates to '-7,844'.'","{'tokens': 178365, 'model': 'openai/text-davinci-003', 'req.': 1080, 'avb': '1.15', 'step': 163}","-7,844'","BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((6 - 7 + -3 + 1) + (-8 * 9 - -5 * 9)) * ((-4 * 4 + -8 + 1) - (-3 + 4 - -9 - 2))) * (((-5 - -2 * -6 * 2) - (0 - 6 * -2 * -2)) + ((-4 * -2 + 0 + 1) + (-7 - -2 - 2 + 6))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((6 - 7 + -3 + 1) + (-8 * 9 - -5 * 9)) * ((-4 * 4 + -8 + 1) - (-3 + 4 - -9 - 2))) * (((-5 - -2 * -6 * 2) - (0 - 6 * -2 * -2)) + ((-4 * -2 + 0 + 1) + (-7 - -2 - 2 + 6))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1168.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,2790,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(((0 - -1 + 7 + 7) + (2 - 0 * 9 + -8)) * ((-3 - 5 * -4 * -4) * (6 - -3 - 1 - -3)))' you split it into multiple subexpressions. The first one is '0 - -1 + 7 + 7'. and evaluates to '15'.'. The next one is '2 - 0 * 9 + -8' and evaluates to '-14'.'. The next one is '-3 - 5 * -4 * -4' and evaluates to '-3'.'. The next one is '6 - -3 - 1 - -3' and evaluates to '7'.'. The next one is '((15) + (-14)) * ((-3) * (7))' and evaluates to '-189'.'. The next the full expression '(((0 - -1 + 7 + 7) + (2 - 0 * 9 + -8)) * ((-3 - 5 * -4 * -4) * (6 - -3 - 1 - -3)))' evaluates to '-189'.',"{'tokens': 188870, 'model': 'openai/text-davinci-003', 'req.': 1137, 'avb': '1.14', 'step': 273}",-189',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(((0 - -1 + 7 + 7) + (2 - 0 * 9 + -8)) * ((-3 - 5 * -4 * -4) * (6 - -3 - 1 - -3)))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(((0 - -1 + 7 + 7) + (2 - 0 * 9 + -8)) * ((-3 - 5 * -4 * -4) * (6 - -3 - 1 - -3)))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/858.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-8217,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(-2 + -9 + -3)' you split it into multiple subexpressions. The first one is '-2 + -9'. and evaluates to '-11'.'. The next one is '-11 + -3' and evaluates to '-14'.'. The next one is '-14'. and evaluates to '-14'.'. The next one is '-14'. and evaluates to '-14'.'. The next one is '-14'. and evaluates to '-14'.'. The next the full expression '(-2 + -9 + -3)' evaluates to '-14'.',"{'tokens': 194182, 'model': 'openai/text-davinci-003', 'req.': 1163, 'avb': '1.14', 'step': 217}",-14',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(-2 + -9 + -3)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(-2 + -9 + -3)' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/117.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-14,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-7 - -6 + 9 + 8) + (6 - 9 + 0 - 4)) - ((-7 * 6 + 2 * 9) * (3 * 6 * -8 * -6))) + (((-9 + -5 - 2 - -4) + (7 - 3 * 9 + 7)) + ((8 - 1 * 7 + 8) * (-3 * -9 - -2 * -8))))' you split it into multiple subexpressions. The first one is '-7 - -6 + 9 + 8'. and evaluates to '10'.'. The next one is '6 - 9 + 0 - 4' and evaluates to '-7'.'. The next one is '-7 * 6 + 2 * 9' and evaluates to '48'.'. The next one is '3 * 6 * -8 * -6' and evaluates to '-864'.'. The next one is '-9 + -5 - 2 - -4' and evaluates to '-2'.'. The next the full expression '((((-7 - -6 + 9 + 8) + (6 - 9 + 0 - 4)) - ((-7 * 6 + 2 * 9) * (3 * 6 * -8 * -6))) + (((-9 + -5 - 2 - -4) + (7 - 3 * 9 + 7)) + ((8 - 1 * 7 + 8) * (-3 * -9 - -2 * -8))))' evaluates to '-822'.',"{'tokens': 196496, 'model': 'openai/text-davinci-003', 'req.': 1176, 'avb': '1.14', 'step': 161}",-822',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-7 - -6 + 9 + 8) + (6 - 9 + 0 - 4)) - ((-7 * 6 + 2 * 9) * (3 * 6 * -8 * -6))) + (((-9 + -5 - 2 - -4) + (7 - 3 * 9 + 7)) + ((8 - 1 * 7 + 8) * (-3 * -9 - -2 * -8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-7 - -6 + 9 + 8) + (6 - 9 + 0 - 4)) - ((-7 * 6 + 2 * 9) * (3 * 6 * -8 * -6))) + (((-9 + -5 - 2 - -4) + (7 - 3 * 9 + 7)) + ((8 - 1 * 7 + 8) * (-3 * -9 - -2 * -8))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1176.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,20819,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((7 + -5) - (5 + 7)) + ((5 - -4) + (6 + -1))) * (((-5 * -9) - (4 + 9)) + ((-9 + 4) * (-4 * -4))))' you split it into multiple subexpressions. The first one is '7 + -5'. and evaluates to '2'.'. The next one is '5 + 7' and evaluates to '12'.'. The next one is '5 - -4' and evaluates to '9'.'. The next one is '6 + -1' and evaluates to '5'.'. The next one is '-5 * -9' and evaluates to '45'.'. The next the full expression '((((7 + -5) - (5 + 7)) + ((5 - -4) + (6 + -1))) * (((-5 * -9) - (4 + 9)) + ((-9 + 4) * (-4 * -4))))' evaluates to '-1485'.',"{'tokens': 195360, 'model': 'openai/text-davinci-003', 'req.': 1169, 'avb': '1.14', 'step': 217}",-1485',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((7 + -5) - (5 + 7)) + ((5 - -4) + (6 + -1))) * (((-5 * -9) - (4 + 9)) + ((-9 + 4) * (-4 * -4))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((7 + -5) - (5 + 7)) + ((5 - -4) + (6 + -1))) * (((-5 * -9) - (4 + 9)) + ((-9 + 4) * (-4 * -4))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/902.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-192,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((9 * -2) * (2 * -8)) + ((7 * 3) + (-4 + 1))) - (((6 * 7) + (-6 + 4)) - ((4 + 1) - (8 + 8))))' you split it into multiple subexpressions. The first one is '((9 * -2) * (2 * -8))'. and evaluates to '144'.'. The next one is '((7 * 3) + (-4 + 1))' and evaluates to '22'.'. The next one is '((6 * 7) + (-6 + 4))' and evaluates to '44'.'. The next one is '((4 + 1) - (8 + 8))' and evaluates to '-13'.'. The next one is '((((9 * -2) * (2 * -8)) + ((7 * 3) + (-4 + 1))) - (((6 * 7) + (-6 + 4)) - ((4 + 1) - (8 + 8))))' and evaluates to '153'.'. The next the full expression '((((9 * -2) * (2 * -8)) + ((7 * 3) + (-4 + 1))) - (((6 * 7) + (-6 + 4)) - ((4 + 1) - (8 + 8))))' evaluates to '153'.',"{'tokens': 201261, 'model': 'openai/text-davinci-003', 'req.': 1204, 'avb': '1.13', 'step': 235}",153',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((9 * -2) * (2 * -8)) + ((7 * 3) + (-4 + 1))) - (((6 * 7) + (-6 + 4)) - ((4 + 1) - (8 + 8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((9 * -2) * (2 * -8)) + ((7 * 3) + (-4 + 1))) - (((6 * 7) + (-6 + 4)) - ((4 + 1) - (8 + 8))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/907.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,255,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '((((-3 - 6) - (-7 + 4)) - ((-7 - 9) * (2 - -5))) - (((-1 + 3) * (9 * 6)) - ((-7 * -4) - (3 - 0))))' you split it into multiple subexpressions. The first one is '-3 - 6'. and evaluates to '-9'.'. The next one is '-7 + 4' and evaluates to '-3'.'. The next one is '-7 - 9' and evaluates to '-16'.'. The next one is '2 - -5' and evaluates to '7'.'. The next one is '-1 + 3' and evaluates to '2'.'. The next the full expression '((((-3 - 6) - (-7 + 4)) - ((-7 - 9) * (2 - -5))) - (((-1 + 3) * (9 * 6)) - ((-7 * -4) - (3 - 0))))' evaluates to '-14,902'.'","{'tokens': 210620, 'model': 'openai/text-davinci-003', 'req.': 1267, 'avb': '1.13', 'step': 100}","-14,902'","BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-3 - 6) - (-7 + 4)) - ((-7 - 9) * (2 - -5))) - (((-1 + 3) * (9 * 6)) - ((-7 * -4) - (3 - 0))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-3 - 6) - (-7 + 4)) - ((-7 - 9) * (2 - -5))) - (((-1 + 3) * (9 * 6)) - ((-7 * -4) - (3 - 0))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/911.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,23,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-5 * 4 - -3 + -2) - (-2 * 3 - 9 * -8)) + ((-4 + -1 * -5 + -3) - (-6 * 8 - 7 - -6))) - (((6 - -5 + -8 - -6) * (7 + 9 * -7 - -5)) - ((-4 * 7 - 2 + 8) * (-6 * -1 - 2 - 5))))' you split it into multiple subexpressions. The first one is '-5 * 4 - -3 + -2'. and evaluates to '-17'.'. The next one is '-2 * 3 - 9 * -8' and evaluates to '-6'.'. The next one is '-4 + -1 * -5 + -3' and evaluates to '-22'.'. The next one is '-6 * 8 - 7 - -6' and evaluates to '-47'.'. The next one is '6 - -5 + -8 - -6' and evaluates to '-3'.'. The next the full expression '((((-5 * 4 - -3 + -2) - (-2 * 3 - 9 * -8)) + ((-4 + -1 * -5 + -3) - (-6 * 8 - 7 - -6))) - (((6 - -5 + -8 - -6) * (7 + 9 * -7 - -5)) - ((-4 * 7 - 2 + 8) * (-6 * -1 - 2 - 5))))' evaluates to '-541'.',"{'tokens': 204560, 'model': 'openai/text-davinci-003', 'req.': 1223, 'avb': '1.13', 'step': 213}",-541',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-5 * 4 - -3 + -2) - (-2 * 3 - 9 * -8)) + ((-4 + -1 * -5 + -3) - (-6 * 8 - 7 - -6))) - (((6 - -5 + -8 - -6) * (7 + 9 * -7 - -5)) - ((-4 * 7 - 2 + 8) * (-6 * -1 - 2 - 5))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-5 * 4 - -3 + -2) - (-2 * 3 - 9 * -8)) + ((-4 + -1 * -5 + -3) - (-6 * 8 - 7 - -6))) - (((6 - -5 + -8 - -6) * (7 + 9 * -7 - -5)) - ((-4 * 7 - 2 + 8) * (-6 * -1 - 2 - 5))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1183.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,443,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' you split it into multiple subexpressions. The first one is '-9 - 5 + 1 - -5'. and evaluates to '2'.'. The next one is '9 - -3 + 2 - -8' and evaluates to '20'.'. The next one is '-1 - -6 * 7 * -2' and evaluates to '13'.'. The next one is '-8 * -9 - 9 + 5' and evaluates to '-72'.'. The next one is '-7 - 6 - 8 - 8' and evaluates to '-29'.'. The next the full expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' evaluates to '-1445'.',"{'tokens': 213443, 'model': 'openai/text-davinci-003', 'req.': 1286, 'avb': '1.13', 'step': 177}",-1445',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/1186.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,278,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,"To evaluate the expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' you split it into multiple subexpressions. The first one is '(-3 + -2) * (5 + 3)'. and evaluates to '-1 * 8''. The next one is '(-5 + -3) - (-8 * -3)', and evaluates to '-8 - 24'.'. The next one is '(-2 + 8) - (6 - 2)', and evaluates to '6 - 4'.'. The next one is '(-5 - -4) * (-3 - 8)', and evaluates to '-1 * -11'.'. The next one is '-1 * 8 - 8 - 24 + 6 - 4 - 1 * -11', and evaluates to '-1'.'. The next the full expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' evaluates to '-1'.'","{'tokens': 231992, 'model': 'openai/text-davinci-003', 'req.': 1405, 'avb': '1.12', 'step': 220}",-1',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/923.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-21,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(-1 * 8)' you split it into multiple subexpressions. The first one is '-1'. and evaluates to '-1'.'. The next one is '* 8' and evaluates to '-8'.'. The next one is '-1 * 8' and evaluates to '-8'.'. The next one is '(-1 * 8)' and evaluates to '-8'.'. The next one is '(-1 * 8)' and evaluates to '-8'.'. The next the full expression '(-1 * 8)' evaluates to '-8'.',"{'tokens': 236634, 'model': 'openai/text-davinci-003', 'req.': 1434, 'avb': '1.12', 'step': 176}",-8',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(-1 * 8)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(-1 * 8)' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/12.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-8,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(-5 - 0 - 9)' you split it into multiple subexpressions. The first one is '-5'. and evaluates to '-5'.'. The next one is '0' and evaluates to '0'.'. The next one is '-9' and evaluates to '-9'.'. The next one is '-5 - 0' and evaluates to '-5'.'. The next one is '-5 - 0 - 9' and evaluates to '-14'.'. The next the full expression '(-5 - 0 - 9)' evaluates to '-14'.',"{'tokens': 248146, 'model': 'openai/text-davinci-003', 'req.': 1497, 'avb': '1.12', 'step': 213}",-14',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(-5 - 0 - 9)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(-5 - 0 - 9)' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/123.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-14,multiarith@guided_medium,2023:01:25_16:40:42
argmax,,anon-System-Product-Name,9c993383dbf56690fab46eb2665eda8df7fe9f6b,openai/text-davinci-003,To evaluate the expression '(-5 + -5 - 9)' you split it into multiple subexpressions. The first one is '-5 + -5'. and evaluates to '-10'.'. The next one is '-10 - 9' and evaluates to '-19'.'. The next one is '-19'. and evaluates to '-19'.'. The next one is '-19'. and evaluates to '-19'.'. The next one is '-19'. and evaluates to '-19'.'. The next the full expression '(-5 + -5 - 9)' evaluates to '-19'.',"{'tokens': 258779, 'model': 'openai/text-davinci-003', 'req.': 1566, 'avb': '1.11', 'step': 223}",-19',"BEAM(dclib_decoder=""argmax"", max_length=512, top1_distribution=True)
    ""To evaluate the expression '(-5 + -5 - 9)' you split it into multiple subexpressions. The first one is '[subexpression] and evaluates to '[subeval]'.[control_var]"" 
    num_eval_steps = 0 
    while num_eval_steps < 4 and control_var.startswith("" The next""):
        "" one is '[subexpression] and evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1 
    "" the full expression '(-5 + -5 - 9)' evaluates to '[answer]'""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"","" To conclude,""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpzzb321nr/148.lmql,8dae26f05ee9b4fecfdbfd0849d3a0d51888ea0c,0,-19,multiarith@guided_medium,2023:01:25_16:40:42
