decoder,distribution,executor,lmql_hash,model,model_result,prediction,query,query_file,repo_hash,shots,target,task_name,timestamp
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '(-5 - 0 - 9)' you split it into multiple subexpressions. The first subexpression is '-5 - 0',. This evaluates to '-5'.. The next subexpression is '-5 - 9',. This evaluates to '-14'.'. To conclude,  the full expression '(-5 - 0 - 9)' evaluates to '-14'.",-14',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '(-5 - 0 - 9)' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '(-5 - 0 - 9)' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/123.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,-14,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '((-5 - -2 * 0) - (4 + 3 + -3))' you split it into multiple subexpressions. The first subexpression is '-5 - -2 * 0',. This evaluates to '-5 - 0',. The next subexpression is '4 + 3 + -3',. This evaluates to '4 + 0','. To conclude,  the full expression '((-5 - -2 * 0) - (4 + 3 + -3))' evaluates to '-5 - 4',","-5 - 4',","BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '((-5 - -2 * 0) - (4 + 3 + -3))' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '((-5 - -2 * 0) - (4 + 3 + -3))' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/425.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,-9,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '(-9 * -5)' you split it into multiple subexpressions. The first subexpression is '-9'. This evaluates to '-9'.. The next subexpression is '-5'.. This evaluates to '-5'.'. To conclude,  the full expression '(-9 * -5)' evaluates to '45'.",45',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '(-9 * -5)' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '(-9 * -5)' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/37.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,45,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '(-1 * -1)' you split it into multiple subexpressions. The first subexpression is '-1'. This evaluates to '-1'.. The next subexpression is '-1'.. This evaluates to '-1'.'. To conclude,  the full expression '(-1 * -1)' evaluates to '1'.",1',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '(-1 * -1)' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '(-1 * -1)' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/33.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,1,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '(-9 + -2 - -2)' you split it into multiple subexpressions. The first subexpression is '-9 + -2'. This evaluates to '-11'.. The next subexpression is '-11 - -2'.. This evaluates to '-9'.'. To conclude,  the full expression '(-9 + -2 - -2)' evaluates to '-9'.",-9',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '(-9 + -2 - -2)' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '(-9 + -2 - -2)' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/175.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,-9,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' you split it into multiple subexpressions. The first subexpression is '3 - -6 + -5'. This evaluates to '4'.. The next subexpression is '-6 * -5 - 5'. This evaluates to '35'.'. The next subexpression is '-4 * 0 - 6'. This evaluates to '-6'.'. The next subexpression is '4 + 5 - 8'.. This evaluates to '1'.'. The next subexpression is '-6 * 2 + 9'.. This evaluates to '3'.'. The next subexpression is '3 * 2 * -7'.. This evaluates to '-42'.'. The next subexpression is '8 * 9 + 0'.. This evaluates to '72'.'. The next subexpression is '5 * -1 * 9'.. This evaluates to '-45'.'. To conclude,  the full expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' evaluates to '-7'.",-7',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '((((3 - -6 + -5) * (-6 * -5 - 5)) + ((-4 * 0 - 6) + (4 + 5 - 8))) - (((-6 * 2 + 9) - (3 * 2 * -7)) - ((8 * 9 + 0) + (5 * -1 * 9))))' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/1043.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,83,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' you split it into multiple subexpressions. The first subexpression is '(-3 + -2) * (5 + 3)',. This evaluates to '-5 * 8',. The next subexpression is '(-5 + -3) - (-8 * -3)',. This evaluates to '-8 - 24','. The next subexpression is '(-2 + 8) - (6 - 2)',. This evaluates to '6 - 4','. The next subexpression is '(-5 - -4) * (-3 - 8)',. This evaluates to '-1 * -11','. To conclude,  the full expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' evaluates to '-5 * 8 - 8 - 24 + 6 - 4 - 1 * -11',","-5 * 8 - 8 - 24 + 6 - 4 - 1 * -11',","BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '((((-3 + -2) * (5 + 3)) - ((-5 + -3) - (-8 * -3))) - (((-2 + 8) - (6 - 2)) + ((-5 - -4) * (-3 - 8))))' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/923.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,-21,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' you split it into multiple subexpressions. The first subexpression is '-9 - 5 + 1 - -5'. This evaluates to '-8'.. The next subexpression is '9 - -3 + 2 - -8',. This evaluates to '20'.'. The next subexpression is '-1 - -6 * 7 * -2',. This evaluates to '13'.'. The next subexpression is '-8 * -9 - 9 + 5',. This evaluates to '-64'.'. The next subexpression is '-7 - 6 - 8 - 8',. This evaluates to '-29'.'. The next subexpression is '-3 * 4 + 8 * 0',. This evaluates to '-12'.'. The next subexpression is '8 + 4 - 0 - 5',. This evaluates to '7'.'. The next subexpression is '-1 - 7 + 4 * -8',. This evaluates to '-41'.'. To conclude,  the full expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' evaluates to '-945'.",-945',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '((((-9 - 5 + 1 - -5) * (9 - -3 + 2 - -8)) - ((-1 - -6 * 7 * -2) - (-8 * -9 - 9 + 5))) + (((-7 - 6 - 8 - 8) * (-3 * 4 + 8 * 0)) - ((8 + 4 - 0 - 5) - (-1 - 7 + 4 * -8))))' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/1186.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,278,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' you split it into multiple subexpressions. The first subexpression is '(-8 * -9)',. This evaluates to '72'.. The next subexpression is '(-4 * 6)',. This evaluates to '-24'.'. The next subexpression is '(-7 * -7)',. This evaluates to '49'.'. The next subexpression is '(-8 + -1)',. This evaluates to '-9'.'. The next subexpression is '((-8 * -9) * (-4 * 6))',. This evaluates to '1728'.'. The next subexpression is '((-7 * -7) * (-8 + -1))',. This evaluates to '441'.'. To conclude,  the full expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' evaluates to '1287'.",1287',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '(((-8 * -9) * (-4 * 6)) - ((-7 * -7) * (-8 + -1)))' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/697.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,-1287,multistep_arithmetic_mini,2023:01:20_15:14:35
argmax,,anon-System-Product-Name,863282e0421ebbbcdda56f97bc80e2950b9d0866,openai/text-davinci-003,"Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.To evaluate the expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' you split it into multiple subexpressions. The first subexpression is '7 + 6 + -2 * 5'. This evaluates to '7 + 6 + -10'. The next subexpression is '9 + 5 + -5 + 6'. This evaluates to '13 + 1'.'. The next subexpression is '1 + -4 - 7 + 7'.. This evaluates to '-3 + 7''. The next subexpression is '-5 + -3 - -4 - 3'.. This evaluates to '-5 + -3 - 4 - 3'.'. The next subexpression is '1 - -8 - 9 + 6'.. This evaluates to '1 - -8 - 3'.'. The next subexpression is '0 + 4 * -6 * -1'.. This evaluates to '0 + 24'.'. The next subexpression is '-1 - -6 * -6 + -9'.. This evaluates to '-1 - 36 + -9'.'. The next subexpression is '9 * 0 - 4 - 0'.. This evaluates to '-4'.'. To conclude,  the full expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' evaluates to '-37'.",-37',"BEAM(dclib_decoder=""argmax"", max_length=512)
    ""Evaluate the following arithmetic expression by evaluating subexpressions first. When you are done, begin the last sentence with 'To conclude' and end on a new line.""
    ""To evaluate the expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' you split it into multiple subexpressions. The first subexpression is '[subexpression]. This evaluates to '[subeval].[control_var]""
    num_eval_steps = 0
    while num_eval_steps < 8 and control_var.startswith("" The next""):
        "" subexpression is '[subexpression]. This evaluates to '[subeval]'.[control_var]""
        num_eval_steps +=1
    "" the full expression '((((7 + 6 + -2 * 5) + (9 + 5 + -5 + 6)) - ((1 + -4 - 7 + 7) + (-5 + -3 - -4 - 3))) - (((1 - -8 - 9 + 6) + (0 + 4 * -6 * -1)) * ((-1 - -6 * -6 + -9) + (9 * 0 - 4 - 0))))' evaluates to '[answer]""
FROM 
    ""openai/text-davinci-003""
WHERE
    control_var in ["" The next"", "" To conclude, ""] and STOPS_AT (subexpression, ""'"") and not ""\n"" in subexpression and STOPS_AT(subeval, ""'"") and STOPS_AT(answer, ""'"")",/tmp/tmpwiaqq1mf/1158.lmql,efaa54f0d67c4a8560583492cab7a84eb2dfd118,0,1528,multistep_arithmetic_mini,2023:01:20_15:14:35
