group,MA-f1_mean,MA-f1_std,wMA-f1_mean,wMA-f1_std,MI-f1_mean,MI-f1_std,wMI-f1_mean,wMI-f1_std,dtype,model,MA-f1,wMA-f1,MI-f1,wMI-f1
language_claude_3_5_sonnet_temp0.0,49.5,12.6,48.4,13.4,55.4,10.0,49.4,11.9,language,claude_3_5_sonnet_temp0.0,49.5±12.6,48.4±13.4,55.4±10.0,49.4±11.9
language_claude_3_5_sonnet_temp0.25,50.7,12.5,49.2,13.6,57.3,11.9,50.7,12.1,language,claude_3_5_sonnet_temp0.25,50.7±12.5,49.2±13.6,57.3±11.9,50.7±12.1
language_claude_3_5_sonnet_temp0.5,50.9,12.5,49.3,13.8,56.9,10.7,50.5,12.1,language,claude_3_5_sonnet_temp0.5,50.9±12.5,49.3±13.8,56.9±10.7,50.5±12.1
language_claude_3_5_sonnet_temp0.75,49.6,13.3,48.4,14.8,55.9,11.0,49.7,12.8,language,claude_3_5_sonnet_temp0.75,49.6±13.3,48.4±14.8,55.9±11.0,49.7±12.8
language_claude_3_5_sonnet_temp1.0,48.8,11.2,47.1,12.2,55.3,9.8,48.5,10.5,language,claude_3_5_sonnet_temp1.0,48.8±11.2,47.1±12.2,55.3±9.8,48.5±10.5
language_claude_3_haiku_temp0.0,41.4,9.0,49.8,8.5,44.1,7.8,55.8,10.0,language,claude_3_haiku_temp0.0,41.4±9.0,49.8±8.5,44.1±7.8,55.8±10.0
language_claude_3_haiku_temp0.25,41.9,5.9,50.2,4.8,43.3,4.7,55.4,4.5,language,claude_3_haiku_temp0.25,41.9±5.9,50.2±4.8,43.3±4.7,55.4±4.5
language_claude_3_haiku_temp0.5,40.5,6.8,49.0,7.1,42.6,5.7,55.3,7.5,language,claude_3_haiku_temp0.5,40.5±6.8,49.0±7.1,42.6±5.7,55.3±7.5
language_claude_3_haiku_temp0.75,41.9,3.7,49.7,4.7,42.6,4.0,53.9,6.6,language,claude_3_haiku_temp0.75,41.9±3.7,49.7±4.7,42.6±4.0,53.9±6.6
language_claude_3_haiku_temp1.0,39.6,6.7,48.1,7.4,42.6,6.8,54.9,8.1,language,claude_3_haiku_temp1.0,39.6±6.7,48.1±7.4,42.6±6.8,54.9±8.1
language_gpt_4o_mini_temp0.0,43.9,9.0,48.4,9.3,45.2,9.6,49.1,9.4,language,gpt_4o_mini_temp0.0,43.9±9.0,48.4±9.3,45.2±9.6,49.1±9.4
language_gpt_4o_mini_temp0.25,39.8,8.1,45.7,8.5,40.4,7.1,47.3,8.1,language,gpt_4o_mini_temp0.25,39.8±8.1,45.7±8.5,40.4±7.1,47.3±8.1
language_gpt_4o_mini_temp0.5,39.3,8.2,43.9,10.5,40.0,7.0,45.5,10.8,language,gpt_4o_mini_temp0.5,39.3±8.2,43.9±10.5,40.0±7.0,45.5±10.8
language_gpt_4o_mini_temp0.75,40.4,8.6,45.3,8.4,41.5,9.7,45.9,8.1,language,gpt_4o_mini_temp0.75,40.4±8.6,45.3±8.4,41.5±9.7,45.9±8.1
language_gpt_4o_mini_temp1.0,43.7,10.1,49.3,11.1,44.1,9.3,50.2,11.6,language,gpt_4o_mini_temp1.0,43.7±10.1,49.3±11.1,44.1±9.3,50.2±11.6
language_gpt_4o_temp0.0,60.8,7.8,67.2,8.2,62.2,7.3,68.7,8.7,language,gpt_4o_temp0.0,60.8±7.8,67.2±8.2,62.2±7.3,68.7±8.7
language_gpt_4o_temp0.25,60.6,7.5,65.4,8.0,61.9,8.7,66.0,8.3,language,gpt_4o_temp0.25,60.6±7.5,65.4±8.0,61.9±8.7,66.0±8.3
language_gpt_4o_temp0.5,64.4,10.9,69.6,11.1,65.6,10.5,70.2,11.2,language,gpt_4o_temp0.5,64.4±10.9,69.6±11.1,65.6±10.5,70.2±11.2
language_gpt_4o_temp0.75,63.2,8.5,68.5,7.5,64.8,10.4,70.1,7.7,language,gpt_4o_temp0.75,63.2±8.5,68.5±7.5,64.8±10.4,70.1±7.7
language_gpt_4o_temp1.0,62.2,6.6,68.0,7.3,63.3,6.2,69.4,7.8,language,gpt_4o_temp1.0,62.2±6.6,68.0±7.3,63.3±6.2,69.4±7.8
symbolic_claude_3_5_sonnet_temp0.0,59.5,9.7,59.2,11.9,63.6,7.5,59.4,10.5,symbolic,claude_3_5_sonnet_temp0.0,59.5±9.7,59.2±11.9,63.6±7.5,59.4±10.5
symbolic_claude_3_5_sonnet_temp0.25,56.6,10.0,55.7,12.3,61.2,7.8,56.0,11.5,symbolic,claude_3_5_sonnet_temp0.25,56.6±10.0,55.7±12.3,61.2±7.8,56.0±11.5
symbolic_claude_3_5_sonnet_temp0.5,55.6,11.6,54.5,13.8,60.9,9.3,55.2,12.9,symbolic,claude_3_5_sonnet_temp0.5,55.6±11.6,54.5±13.8,60.9±9.3,55.2±12.9
symbolic_claude_3_5_sonnet_temp0.75,57.7,9.6,56.6,11.6,63.2,7.6,57.5,10.9,symbolic,claude_3_5_sonnet_temp0.75,57.7±9.6,56.6±11.6,63.2±7.6,57.5±10.9
symbolic_claude_3_5_sonnet_temp1.0,55.0,12.3,54.4,15.4,59.3,9.9,54.9,14.0,symbolic,claude_3_5_sonnet_temp1.0,55.0±12.3,54.4±15.4,59.3±9.9,54.9±14.0
symbolic_claude_3_haiku_temp0.0,21.3,6.4,22.9,7.1,23.7,6.5,25.3,7.3,symbolic,claude_3_haiku_temp0.0,21.3±6.4,22.9±7.1,23.7±6.5,25.3±7.3
symbolic_claude_3_haiku_temp0.25,22.7,3.4,25.4,5.1,24.8,2.4,27.4,5.4,symbolic,claude_3_haiku_temp0.25,22.7±3.4,25.4±5.1,24.8±2.4,27.4±5.4
symbolic_claude_3_haiku_temp0.5,24.5,7.7,27.5,8.9,26.7,7.5,30.0,8.2,symbolic,claude_3_haiku_temp0.5,24.5±7.7,27.5±8.9,26.7±7.5,30.0±8.2
symbolic_claude_3_haiku_temp0.75,25.3,6.8,26.2,9.2,29.3,6.6,29.5,9.2,symbolic,claude_3_haiku_temp0.75,25.3±6.8,26.2±9.2,29.3±6.6,29.5±9.2
symbolic_claude_3_haiku_temp1.0,18.5,3.7,20.5,4.9,21.5,5.6,23.2,5.7,symbolic,claude_3_haiku_temp1.0,18.5±3.7,20.5±4.9,21.5±5.6,23.2±5.7
symbolic_gpt_4o_mini_temp0.0,22.8,6.0,26.2,8.9,23.3,6.0,27.3,9.9,symbolic,gpt_4o_mini_temp0.0,22.8±6.0,26.2±8.9,23.3±6.0,27.3±9.9
symbolic_gpt_4o_mini_temp0.25,25.4,8.2,26.7,9.7,26.3,9.2,26.9,10.3,symbolic,gpt_4o_mini_temp0.25,25.4±8.2,26.7±9.7,26.3±9.2,26.9±10.3
symbolic_gpt_4o_mini_temp0.5,23.6,11.4,25.0,12.8,24.4,11.5,25.5,13.1,symbolic,gpt_4o_mini_temp0.5,23.6±11.4,25.0±12.8,24.4±11.5,25.5±13.1
symbolic_gpt_4o_mini_temp0.75,21.9,5.0,23.8,6.7,22.2,5.1,24.8,7.9,symbolic,gpt_4o_mini_temp0.75,21.9±5.0,23.8±6.7,22.2±5.1,24.8±7.9
symbolic_gpt_4o_mini_temp1.0,21.9,5.8,24.7,7.0,22.2,6.3,25.1,6.5,symbolic,gpt_4o_mini_temp1.0,21.9±5.8,24.7±7.0,22.2±6.3,25.1±6.5
symbolic_gpt_4o_temp0.0,37.5,7.4,35.9,8.3,42.6,9.1,38.1,8.2,symbolic,gpt_4o_temp0.0,37.5±7.4,35.9±8.3,42.6±9.1,38.1±8.2
symbolic_gpt_4o_temp0.25,38.0,5.8,37.0,6.7,42.6,8.0,39.2,6.6,symbolic,gpt_4o_temp0.25,38.0±5.8,37.0±6.7,42.6±8.0,39.2±6.6
symbolic_gpt_4o_temp0.5,35.7,6.8,34.0,6.8,39.6,9.0,35.8,6.4,symbolic,gpt_4o_temp0.5,35.7±6.8,34.0±6.8,39.6±9.0,35.8±6.4
symbolic_gpt_4o_temp0.75,39.5,8.2,40.5,8.5,42.6,11.0,41.5,8.8,symbolic,gpt_4o_temp0.75,39.5±8.2,40.5±8.5,42.6±11.0,41.5±8.8
symbolic_gpt_4o_temp1.0,34.1,10.4,33.2,11.0,37.8,12.1,34.6,11.0,symbolic,gpt_4o_temp1.0,34.1±10.4,33.2±11.0,37.8±12.1,34.6±11.0
