group,MA-f1_mean,MA-f1_std,wMA-f1_mean,wMA-f1_std,MI-f1_mean,MI-f1_std,wMI-f1_mean,wMI-f1_std,dtype,model,MA-f1,wMA-f1,MI-f1,wMI-f1
random_str_language_claude_3_5_sonnet,80.1,0.1,81.6,0.3,81.6,0.4,81.3,0.4,random_str_language,claude_3_5_sonnet,80.1±0.1,81.6±0.3,81.6±0.4,81.3±0.4
random_str_language_claude_3_haiku,53.0,0.6,61.7,0.3,52.8,0.4,64.7,1.1,random_str_language,claude_3_haiku,53.0±0.6,61.7±0.3,52.8±0.4,64.7±1.1
random_str_language_gpt_4o,72.8,1.3,78.7,1.1,73.0,1.4,79.1,1.1,random_str_language,gpt_4o,72.8±1.3,78.7±1.1,73.0±1.4,79.1±1.1
random_str_language_gpt_4o_mini,58.0,1.4,63.8,1.7,56.8,1.2,64.0,1.7,random_str_language,gpt_4o_mini,58.0±1.4,63.8±1.7,56.8±1.2,64.0±1.7
random_str_language_ollama_llama3_8b,47.8,1.7,51.6,1.6,48.8,1.7,52.2,1.4,random_str_language,ollama_llama3_8b,47.8±1.7,51.6±1.6,48.8±1.7,52.2±1.4
random_str_language_ollama_mistral_7b,28.1,1.0,22.9,0.8,49.6,1.7,32.9,0.7,random_str_language,ollama_mistral_7b,28.1±1.0,22.9±0.8,49.6±1.7,32.9±0.7
random_str_language_ollama_qwen2_7b,41.4,1.3,49.5,1.0,42.4,1.5,54.6,1.0,random_str_language,ollama_qwen2_7b,41.4±1.3,49.5±1.0,42.4±1.5,54.6±1.0
random_str_symbolic_claude_3_5_sonnet,70.8,0.9,75.4,1.1,72.3,0.5,75.7,1.2,random_str_symbolic,claude_3_5_sonnet,70.8±0.9,75.4±1.1,72.3±0.5,75.7±1.2
random_str_symbolic_claude_3_haiku,38.3,1.5,46.1,1.2,40.2,1.5,51.7,0.9,random_str_symbolic,claude_3_haiku,38.3±1.5,46.1±1.2,40.2±1.5,51.7±0.9
random_str_symbolic_gpt_4o,54.2,0.7,57.6,0.9,57.5,0.9,58.9,0.9,random_str_symbolic,gpt_4o,54.2±0.7,57.6±0.9,57.5±0.9,58.9±0.9
random_str_symbolic_gpt_4o_mini,39.9,0.3,44.3,0.2,40.7,0.3,46.1,0.2,random_str_symbolic,gpt_4o_mini,39.9±0.3,44.3±0.2,40.7±0.3,46.1±0.2
random_str_symbolic_ollama_llama3_8b,30.8,1.5,31.8,1.9,36.4,0.9,36.7,1.5,random_str_symbolic,ollama_llama3_8b,30.8±1.5,31.8±1.9,36.4±0.9,36.7±1.5
random_str_symbolic_ollama_mistral_7b,29.4,1.7,23.7,2.1,51.2,0.9,33.6,1.6,random_str_symbolic,ollama_mistral_7b,29.4±1.7,23.7±2.1,51.2±0.9,33.6±1.6
random_str_symbolic_ollama_qwen2_7b,41.2,0.4,40.8,0.2,47.8,0.7,43.9,0.4,random_str_symbolic,ollama_qwen2_7b,41.2±0.4,40.8±0.2,47.8±0.7,43.9±0.4
random_word_language_claude_3_5_sonnet,82.4,1.3,82.4,2.0,84.4,1.3,82.0,2.0,random_word_language,claude_3_5_sonnet,82.4±1.3,82.4±2.0,84.4±1.3,82.0±2.0
random_word_language_claude_3_haiku,58.9,0.5,66.7,0.9,59.0,0.4,68.1,1.1,random_word_language,claude_3_haiku,58.9±0.5,66.7±0.9,59.0±0.4,68.1±1.1
random_word_language_gpt_4o,75.3,0.4,81.2,0.3,76.2,0.2,81.5,0.4,random_word_language,gpt_4o,75.3±0.4,81.2±0.3,76.2±0.2,81.5±0.4
random_word_language_gpt_4o_mini,57.8,0.6,63.5,1.3,57.8,0.4,63.5,1.7,random_word_language,gpt_4o_mini,57.8±0.6,63.5±1.3,57.8±0.4,63.5±1.7
random_word_language_ollama_llama3_8b,44.7,3.2,47.5,2.9,46.9,3.3,48.3,2.9,random_word_language,ollama_llama3_8b,44.7±3.2,47.5±2.9,46.9±3.3,48.3±2.9
random_word_language_ollama_mistral_7b,28.5,0.7,23.7,1.0,50.2,0.6,33.6,0.6,random_word_language,ollama_mistral_7b,28.5±0.7,23.7±1.0,50.2±0.6,33.6±0.6
random_word_language_ollama_qwen2_7b,35.4,2.2,41.1,2.5,37.6,1.9,45.2,2.3,random_word_language,ollama_qwen2_7b,35.4±2.2,41.1±2.5,37.6±1.9,45.2±2.3
random_word_symbolic_claude_3_5_sonnet,75.0,2.4,78.9,2.4,77.1,2.1,78.9,2.4,random_word_symbolic,claude_3_5_sonnet,75.0±2.4,78.9±2.4,77.1±2.1,78.9±2.4
random_word_symbolic_claude_3_haiku,39.4,1.5,47.4,1.4,41.2,1.7,52.3,1.1,random_word_symbolic,claude_3_haiku,39.4±1.5,47.4±1.4,41.2±1.7,52.3±1.1
random_word_symbolic_gpt_4o,48.6,2.2,52.2,2.7,51.4,1.8,53.7,2.7,random_word_symbolic,gpt_4o,48.6±2.2,52.2±2.7,51.4±1.8,53.7±2.7
random_word_symbolic_gpt_4o_mini,34.2,2.6,37.4,2.8,35.1,2.4,39.4,2.6,random_word_symbolic,gpt_4o_mini,34.2±2.6,37.4±2.8,35.1±2.4,39.4±2.6
random_word_symbolic_ollama_llama3_8b,32.1,0.4,33.3,0.8,37.5,0.3,37.9,1.1,random_word_symbolic,ollama_llama3_8b,32.1±0.4,33.3±0.8,37.5±0.3,37.9±1.1
random_word_symbolic_ollama_mistral_7b,29.4,2.5,24.0,2.9,51.2,1.2,33.9,2.0,random_word_symbolic,ollama_mistral_7b,29.4±2.5,24.0±2.9,51.2±1.2,33.9±2.0
random_word_symbolic_ollama_qwen2_7b,27.0,1.3,27.2,1.2,35.8,1.2,35.1,0.8,random_word_symbolic,ollama_qwen2_7b,27.0±1.3,27.2±1.2,35.8±1.2,35.1±0.8
related_word_language_claude_3_5_sonnet,79.9,2.5,80.3,2.9,82.5,2.0,79.8,3.0,related_word_language,claude_3_5_sonnet,79.9±2.5,80.3±2.9,82.5±2.0,79.8±3.0
related_word_language_claude_3_haiku,55.7,3.0,64.6,3.0,55.6,3.0,66.1,2.8,related_word_language,claude_3_haiku,55.7±3.0,64.6±3.0,55.6±3.0,66.1±2.8
related_word_language_gpt_4o,72.9,0.6,79.2,0.9,74.2,0.5,79.4,0.9,related_word_language,gpt_4o,72.9±0.6,79.2±0.9,74.2±0.5,79.4±0.9
related_word_language_gpt_4o_mini,57.1,1.8,63.6,1.7,56.8,2.2,63.7,1.6,related_word_language,gpt_4o_mini,57.1±1.8,63.6±1.7,56.8±2.2,63.7±1.6
related_word_language_ollama_llama3_8b,48.7,0.6,52.8,0.8,51.1,0.5,53.5,0.6,related_word_language,ollama_llama3_8b,48.7±0.6,52.8±0.8,51.1±0.5,53.5±0.6
related_word_language_ollama_mistral_7b,30.0,0.6,24.6,0.8,53.1,1.1,34.6,1.0,related_word_language,ollama_mistral_7b,30.0±0.6,24.6±0.8,53.1±1.1,34.6±1.0
related_word_language_ollama_qwen2_7b,39.0,0.2,47.8,0.4,39.7,0.2,51.6,0.6,related_word_language,ollama_qwen2_7b,39.0±0.2,47.8±0.4,39.7±0.2,51.6±0.6
related_word_symbolic_claude_3_5_sonnet,73.1,2.0,77.0,2.6,76.3,1.4,77.2,2.6,related_word_symbolic,claude_3_5_sonnet,73.1±2.0,77.0±2.6,76.3±1.4,77.2±2.6
related_word_symbolic_claude_3_haiku,38.4,0.9,46.5,0.7,40.0,1.2,50.9,1.0,related_word_symbolic,claude_3_haiku,38.4±0.9,46.5±0.7,40.0±1.2,50.9±1.0
related_word_symbolic_gpt_4o,52.0,1.9,56.1,1.9,55.3,2.2,57.3,1.9,related_word_symbolic,gpt_4o,52.0±1.9,56.1±1.9,55.3±2.2,57.3±1.9
related_word_symbolic_gpt_4o_mini,35.3,2.0,39.5,2.7,36.0,1.8,41.8,2.9,related_word_symbolic,gpt_4o_mini,35.3±2.0,39.5±2.7,36.0±1.8,41.8±2.9
related_word_symbolic_ollama_llama3_8b,31.0,0.1,32.7,0.3,35.7,0.7,37.1,0.4,related_word_symbolic,ollama_llama3_8b,31.0±0.1,32.7±0.3,35.7±0.7,37.1±0.4
related_word_symbolic_ollama_mistral_7b,29.5,0.2,24.6,0.3,51.0,0.5,33.7,0.5,related_word_symbolic,ollama_mistral_7b,29.5±0.2,24.6±0.3,51.0±0.5,33.7±0.5
related_word_symbolic_ollama_qwen2_7b,31.4,0.6,31.4,0.6,39.4,1.8,37.7,0.9,related_word_symbolic,ollama_qwen2_7b,31.4±0.6,31.4±0.6,39.4±1.8,37.7±0.9
