,Accuracy,model,execmode,prompt,icl
model=Meta-Llama-3.1-8B-Instruct-Turbo_execmode=trace_prompt=standard_icl=8_output.json,0.7270659590598939,Meta-Llama-3.1-8B-Instruct-Turbo,trace,standard,8
model=command-r-plus_execmode=trace_prompt=standard_icl=4_output.json,0.714177407126611,command-r-plus,trace,standard,4
model=command-r-plus_execmode=trace_prompt=standard_icl=2_output.json,0.7134192570128886,command-r-plus,trace,standard,2
model=command-r-plus_execmode=trace_prompt=standard_icl=6_output.json,0.7028051554207733,command-r-plus,trace,standard,6
model=command-r-plus_execmode=trace_prompt=standard_icl=8_output.json,0.6868840030326004,command-r-plus,trace,standard,8
model=gpt-3.5-turbo_execmode=trace_prompt=standard_icl=2_output.json,0.6815769522365428,gpt-3.5-turbo,trace,standard,2
model=gpt-3.5-turbo_execmode=trace_prompt=standard_icl=6_output.json,0.6724791508718726,gpt-3.5-turbo,trace,standard,6
model=gpt-3.5-turbo_execmode=trace_prompt=standard_icl=4_output.json,0.6633813495072024,gpt-3.5-turbo,trace,standard,4
model=command-r_execmode=trace_prompt=standard_icl=8_output.json,0.5246398786959818,command-r,trace,standard,8
model=command-r_execmode=trace_prompt=standard_icl=6_output.json,0.5079605761940864,command-r,trace,standard,6
model=command-r_execmode=trace_prompt=standard_icl=4_output.json,0.49962092494313876,command-r,trace,standard,4
model=command-r_execmode=trace_prompt=standard_icl=2_output.json,0.4564063684609553,command-r,trace,standard,2
model=command-r-plus_execmode=plan_only_prompt=standard_icl=8_output.json,0.40788476118271416,command-r-plus,plan,standard,8
model=command-r-plus_execmode=plan_only_prompt=standard_icl=6_output.json,0.3980288097043215,command-r-plus,plan,standard,6
model=gpt-3.5-turbo_execmode=plan_only_prompt=standard_icl=8_output.json,0.3616376042456406,gpt-3.5-turbo,plan,standard,8
model=gpt-3.5-turbo_execmode=plan_only_prompt=standard_icl=6_output.json,0.34420015163002277,gpt-3.5-turbo,plan,standard,6
model=command-r_execmode=plan_only_prompt=standard_icl=8_output.json,0.3115996967399545,command-r,plan,standard,8
model=Meta-Llama-3-8B_execmode=trace_prompt=standard_icl=1_output.json,0.26914329037149354,Meta-Llama-3-8B,trace,standard,1
model=command-r_execmode=plan_only_prompt=standard_icl=6_output.json,0.24715693707354056,command-r,plan,standard,6
model=Meta-Llama-3-8B_execmode=trace_prompt=standard_icl=2_output.json,0.2441243366186505,Meta-Llama-3-8B,trace,standard,2
model=Mixtral-8x7B-v0.1_execmode=trace_prompt=standard_icl=2_output.json,0.11751326762699014,Mixtral-8x7B-v0.1,trace,standard,2
model=Mixtral-8x7B-v0.1_execmode=trace_prompt=standard_icl=4_output.json,0.10841546626231995,Mixtral-8x7B-v0.1,trace,standard,4
model=Mixtral-8x7B-v0.1_execmode=trace_prompt=standard_icl=6_output.json,0.0932524639878696,Mixtral-8x7B-v0.1,trace,standard,6
