,Accuracy,model,execmode,prompt,icl
model=Meta-Llama-3.1-8B-Instruct-Turbo_execmode=trace_prompt=standard_icl=6_output.json,0.6299212598425197,Meta-Llama-3.1-8B-Instruct-Turbo,trace,standard,6
model=command-r-plus_execmode=trace_prompt=standard_icl=2_output.json,0.5590551181102362,command-r-plus,trace,standard,2
model=gpt-3.5-turbo_execmode=trace_prompt=standard_icl=2_output.json,0.5511811023622047,gpt-3.5-turbo,trace,standard,2
model=command-r-plus_execmode=plan_only_prompt=standard_icl=4_output.json,0.5511811023622047,command-r-plus,plan,standard,4
model=gpt-3.5-turbo_execmode=plan_only_prompt=standard_icl=4_output.json,0.5433070866141733,gpt-3.5-turbo,plan,standard,4
model=gpt-3.5-turbo_execmode=plan_only_prompt=standard_icl=6_output.json,0.531496062992126,gpt-3.5-turbo,plan,standard,6
model=command-r-plus_execmode=plan_only_prompt=standard_icl=6_output.json,0.5196850393700787,command-r-plus,plan,standard,6
model=gpt-3.5-turbo_execmode=trace_prompt=standard_icl=4_output.json,0.5196850393700787,gpt-3.5-turbo,trace,standard,4
model=command-r-plus_execmode=trace_prompt=standard_icl=6_output.json,0.5196850393700787,command-r-plus,trace,standard,6
model=command-r-plus_execmode=plan_only_prompt=standard_icl=2_output.json,0.515748031496063,command-r-plus,plan,standard,2
model=command-r-plus_execmode=trace_prompt=standard_icl=4_output.json,0.5039370078740157,command-r-plus,trace,standard,4
model=gpt-3.5-turbo_execmode=plan_only_prompt=standard_icl=2_output.json,0.48031496062992124,gpt-3.5-turbo,plan,standard,2
model=command-r_execmode=trace_prompt=standard_icl=4_output.json,0.43700787401574803,command-r,trace,standard,4
model=command-r_execmode=trace_prompt=standard_icl=6_output.json,0.3858267716535433,command-r,trace,standard,6
model=gpt-3.5-turbo_execmode=trace_prompt=standard_icl=6_output.json,0.3543307086614173,gpt-3.5-turbo,trace,standard,6
model=command-r_execmode=plan_only_prompt=standard_icl=4_output.json,0.35039370078740156,command-r,plan,standard,4
model=command-r_execmode=plan_only_prompt=standard_icl=6_output.json,0.3464566929133858,command-r,plan,standard,6
model=command-r_execmode=trace_prompt=standard_icl=2_output.json,0.3464566929133858,command-r,trace,standard,2
model=command-r_execmode=plan_only_prompt=standard_icl=2_output.json,0.3346456692913386,command-r,plan,standard,2
model=Meta-Llama-3-8B_execmode=trace_prompt=standard_icl=2_output.json,0.1732283464566929,Meta-Llama-3-8B,trace,standard,2
model=Meta-Llama-3-8B_execmode=trace_prompt=standard_icl=1_output.json,0.14173228346456693,Meta-Llama-3-8B,trace,standard,1
model=Mixtral-8x7B-v0.1_execmode=trace_prompt=standard_icl=4_output.json,0.14173228346456693,Mixtral-8x7B-v0.1,trace,standard,4
model=Mixtral-8x7B-v0.1_execmode=trace_prompt=standard_icl=6_output.json,0.12992125984251968,Mixtral-8x7B-v0.1,trace,standard,6
model=Mixtral-8x7B-v0.1_execmode=trace_prompt=standard_icl=2_output.json,0.12598425196850394,Mixtral-8x7B-v0.1,trace,standard,2
