group,MA-f1_mean,MA-f1_std,wMA-f1_mean,wMA-f1_std,MI-f1_mean,MI-f1_std,wMI-f1_mean,wMI-f1_std,dtype,model,MA-f1,wMA-f1,MI-f1,wMI-f1
random_str_language_claude_3_5_sonnet,79.8,1.7,81.9,1.2,81.1,1.7,81.5,1.2,random_str_language,claude_3_5_sonnet,79.8±1.7,81.9±1.2,81.1±1.7,81.5±1.2
random_str_language_claude_3_haiku,52.6,1.3,62.7,0.8,52.7,1.1,67.7,0.3,random_str_language,claude_3_haiku,52.6±1.3,62.7±0.8,52.7±1.1,67.7±0.3
random_str_language_gpt_4o,75.8,1.0,80.9,1.3,76.3,0.5,81.1,1.5,random_str_language,gpt_4o,75.8±1.0,80.9±1.3,76.3±0.5,81.1±1.5
random_str_language_gpt_4o_mini,59.1,2.3,65.0,2.6,58.1,2.3,65.2,2.8,random_str_language,gpt_4o_mini,59.1±2.3,65.0±2.6,58.1±2.3,65.2±2.8
random_str_language_ollama_llama3_8b,51.5,2.2,52.8,2.6,54.5,2.2,52.6,2.5,random_str_language,ollama_llama3_8b,51.5±2.2,52.8±2.6,54.5±2.2,52.6±2.5
random_str_language_ollama_mistral_7b,41.1,2.4,39.8,2.8,49.3,0.8,41.3,2.0,random_str_language,ollama_mistral_7b,41.1±2.4,39.8±2.8,49.3±0.8,41.3±2.0
random_str_language_ollama_qwen2_7b,53.4,1.4,52.6,0.9,59.2,1.7,53.2,1.1,random_str_language,ollama_qwen2_7b,53.4±1.4,52.6±0.9,59.2±1.7,53.2±1.1
random_str_symbolic_claude_3_5_sonnet,71.5,1.4,76.0,1.4,73.0,1.5,76.3,1.3,random_str_symbolic,claude_3_5_sonnet,71.5±1.4,76.0±1.4,73.0±1.5,76.3±1.3
random_str_symbolic_claude_3_haiku,36.6,0.7,44.1,1.0,38.9,0.9,50.3,1.0,random_str_symbolic,claude_3_haiku,36.6±0.7,44.1±1.0,38.9±0.9,50.3±1.0
random_str_symbolic_gpt_4o,56.1,0.6,59.4,0.7,59.8,0.6,60.4,0.6,random_str_symbolic,gpt_4o,56.1±0.6,59.4±0.7,59.8±0.6,60.4±0.6
random_str_symbolic_gpt_4o_mini,39.0,1.9,43.0,2.3,39.7,1.7,44.9,2.2,random_str_symbolic,gpt_4o_mini,39.0±1.9,43.0±2.3,39.7±1.7,44.9±2.2
random_str_symbolic_ollama_llama3_8b,31.1,1.1,32.4,1.5,36.1,0.9,37.2,1.5,random_str_symbolic,ollama_llama3_8b,31.1±1.1,32.4±1.5,36.1±0.9,37.2±1.5
random_str_symbolic_ollama_mistral_7b,38.1,0.4,36.3,0.6,47.1,0.5,38.3,0.5,random_str_symbolic,ollama_mistral_7b,38.1±0.4,36.3±0.6,47.1±0.5,38.3±0.5
random_str_symbolic_ollama_qwen2_7b,39.2,1.4,38.1,1.4,46.5,1.9,41.1,1.5,random_str_symbolic,ollama_qwen2_7b,39.2±1.4,38.1±1.4,46.5±1.9,41.1±1.5
random_word_language_claude_3_5_sonnet,82.7,0.9,84.0,0.8,84.6,1.0,83.7,0.9,random_word_language,claude_3_5_sonnet,82.7±0.9,84.0±0.8,84.6±1.0,83.7±0.9
random_word_language_claude_3_haiku,57.8,0.6,66.0,0.5,57.9,0.5,67.9,0.5,random_word_language,claude_3_haiku,57.8±0.6,66.0±0.5,57.9±0.5,67.9±0.5
random_word_language_gpt_4o,77.8,1.8,82.9,1.8,78.9,2.2,83.1,1.8,random_word_language,gpt_4o,77.8±1.8,82.9±1.8,78.9±2.2,83.1±1.8
random_word_language_gpt_4o_mini,58.2,1.4,63.9,1.1,58.3,1.2,64.0,1.0,random_word_language,gpt_4o_mini,58.2±1.4,63.9±1.1,58.3±1.2,64.0±1.0
random_word_language_ollama_llama3_8b,48.3,0.2,49.6,0.6,52.1,0.9,50.0,0.1,random_word_language,ollama_llama3_8b,48.3±0.2,49.6±0.6,52.1±0.9,50.0±0.1
random_word_language_ollama_mistral_7b,39.6,1.1,38.3,1.2,48.8,1.6,40.1,1.0,random_word_language,ollama_mistral_7b,39.6±1.1,38.3±1.2,48.8±1.6,40.1±1.0
random_word_language_ollama_qwen2_7b,50.5,1.1,47.7,1.2,59.4,2.1,49.2,1.1,random_word_language,ollama_qwen2_7b,50.5±1.1,47.7±1.2,59.4±2.1,49.2±1.1
random_word_symbolic_claude_3_5_sonnet,74.7,1.4,78.8,1.3,76.7,0.9,78.9,1.3,random_word_symbolic,claude_3_5_sonnet,74.7±1.4,78.8±1.3,76.7±0.9,78.9±1.3
random_word_symbolic_claude_3_haiku,38.4,0.7,46.4,0.8,40.0,0.8,51.4,1.0,random_word_symbolic,claude_3_haiku,38.4±0.7,46.4±0.8,40.0±0.8,51.4±1.0
random_word_symbolic_gpt_4o,50.6,1.8,54.3,1.7,53.5,1.6,55.5,1.7,random_word_symbolic,gpt_4o,50.6±1.8,54.3±1.7,53.5±1.6,55.5±1.7
random_word_symbolic_gpt_4o_mini,34.8,0.8,38.3,1.1,35.9,1.0,40.6,1.4,random_word_symbolic,gpt_4o_mini,34.8±0.8,38.3±1.1,35.9±1.0,40.6±1.4
random_word_symbolic_ollama_llama3_8b,31.5,0.6,32.6,0.1,37.1,1.5,37.2,0.6,random_word_symbolic,ollama_llama3_8b,31.5±0.6,32.6±0.1,37.1±1.5,37.2±0.6
random_word_symbolic_ollama_mistral_7b,37.5,1.9,35.8,2.0,46.6,1.6,37.7,1.6,random_word_symbolic,ollama_mistral_7b,37.5±1.9,35.8±2.0,46.6±1.6,37.7±1.6
random_word_symbolic_ollama_qwen2_7b,39.4,0.6,35.9,0.7,51.1,0.7,40.2,0.7,random_word_symbolic,ollama_qwen2_7b,39.4±0.6,35.9±0.7,51.1±0.7,40.2±0.7
related_word_language_claude_3_5_sonnet,80.0,0.4,81.9,0.7,82.1,0.4,81.5,0.8,related_word_language,claude_3_5_sonnet,80.0±0.4,81.9±0.7,82.1±0.4,81.5±0.8
related_word_language_claude_3_haiku,56.1,2.3,65.5,2.5,55.9,2.5,67.5,2.5,related_word_language,claude_3_haiku,56.1±2.3,65.5±2.5,55.9±2.5,67.5±2.5
related_word_language_gpt_4o,74.6,1.5,80.4,0.3,76.0,1.7,80.5,0.4,related_word_language,gpt_4o,74.6±1.5,80.4±0.3,76.0±1.7,80.5±0.4
related_word_language_gpt_4o_mini,56.4,1.5,63.4,1.6,55.6,1.8,63.6,1.7,related_word_language,gpt_4o_mini,56.4±1.5,63.4±1.6,55.6±1.8,63.6±1.7
related_word_language_ollama_llama3_8b,50.3,0.9,51.3,1.1,55.4,0.8,51.6,1.0,related_word_language,ollama_llama3_8b,50.3±0.9,51.3±1.1,55.4±0.8,51.6±1.0
related_word_language_ollama_mistral_7b,42.1,1.5,41.2,1.9,51.0,0.8,42.3,1.6,related_word_language,ollama_mistral_7b,42.1±1.5,41.2±1.9,51.0±0.8,42.3±1.6
related_word_language_ollama_qwen2_7b,54.5,1.7,53.4,2.4,61.9,1.2,53.9,2.0,related_word_language,ollama_qwen2_7b,54.5±1.7,53.4±2.4,61.9±1.2,53.9±2.0
related_word_symbolic_claude_3_5_sonnet,73.5,0.9,77.8,1.7,76.5,0.4,78.0,1.7,related_word_symbolic,claude_3_5_sonnet,73.5±0.9,77.8±1.7,76.5±0.4,78.0±1.7
related_word_symbolic_claude_3_haiku,37.0,0.3,45.1,0.4,38.9,0.3,50.2,0.7,related_word_symbolic,claude_3_haiku,37.0±0.3,45.1±0.4,38.9±0.3,50.2±0.7
related_word_symbolic_gpt_4o,53.0,0.9,56.6,1.6,56.7,0.8,57.8,1.3,related_word_symbolic,gpt_4o,53.0±0.9,56.6±1.6,56.7±0.8,57.8±1.3
related_word_symbolic_gpt_4o_mini,35.8,2.1,39.6,1.6,36.5,2.2,41.5,1.1,related_word_symbolic,gpt_4o_mini,35.8±2.1,39.6±1.6,36.5±2.2,41.5±1.1
related_word_symbolic_ollama_llama3_8b,31.3,1.7,32.5,1.8,36.8,1.4,36.9,1.4,related_word_symbolic,ollama_llama3_8b,31.3±1.7,32.5±1.8,36.8±1.4,36.9±1.4
related_word_symbolic_ollama_mistral_7b,36.6,1.0,34.1,1.3,48.5,0.6,37.2,0.7,related_word_symbolic,ollama_mistral_7b,36.6±1.0,34.1±1.3,48.5±0.6,37.2±0.7
related_word_symbolic_ollama_qwen2_7b,42.1,2.0,38.7,2.3,54.2,1.6,42.6,2.2,related_word_symbolic,ollama_qwen2_7b,42.1±2.0,38.7±2.3,54.2±1.6,42.6±2.2
