group,MA-f1_mean,MA-f1_std,wMA-f1_mean,wMA-f1_std,MI-f1_mean,MI-f1_std,wMI-f1_mean,wMI-f1_std,dtype,model,MA-f1,wMA-f1,MI-f1,wMI-f1
random_str_language_claude_3_5_sonnet,48.0,0.6,47.4,0.7,51.8,0.4,46.9,0.5,random_str_language,claude_3_5_sonnet,48.0±0.6,47.4±0.7,51.8±0.4,46.9±0.5
random_str_language_claude_3_haiku,41.6,0.9,49.3,0.8,43.4,0.5,54.9,0.5,random_str_language,claude_3_haiku,41.6±0.9,49.3±0.8,43.4±0.5,54.9±0.5
random_str_language_gpt_4o,62.9,1.4,68.6,1.5,63.1,1.1,70.0,1.7,random_str_language,gpt_4o,62.9±1.4,68.6±1.5,63.1±1.1,70.0±1.7
random_str_language_gpt_4o_mini,43.1,1.8,48.1,1.9,42.2,1.7,48.0,2.2,random_str_language,gpt_4o_mini,43.1±1.8,48.1±1.9,42.2±1.7,48.0±2.2
random_str_language_ollama_llama3_8b,37.4,0.5,38.9,0.3,38.2,0.9,38.7,0.4,random_str_language,ollama_llama3_8b,37.4±0.5,38.9±0.3,38.2±0.9,38.7±0.4
random_str_language_ollama_mistral_7b,26.3,1.1,23.0,1.2,42.0,1.3,31.3,1.3,random_str_language,ollama_mistral_7b,26.3±1.1,23.0±1.2,42.0±1.3,31.3±1.3
random_str_language_ollama_qwen2_7b,40.7,1.1,45.9,1.0,42.6,0.7,49.8,0.6,random_str_language,ollama_qwen2_7b,40.7±1.1,45.9±1.0,42.6±0.7,49.8±0.6
random_str_symbolic_claude_3_5_sonnet,57.1,0.9,57.6,0.6,60.0,1.0,57.2,0.8,random_str_symbolic,claude_3_5_sonnet,57.1±0.9,57.6±0.6,60.0±1.0,57.2±0.8
random_str_symbolic_claude_3_haiku,25.3,0.4,28.6,0.3,27.0,1.0,30.5,0.7,random_str_symbolic,claude_3_haiku,25.3±0.4,28.6±0.3,27.0±1.0,30.5±0.7
random_str_symbolic_gpt_4o,44.4,0.7,43.6,1.3,48.2,0.6,44.7,0.8,random_str_symbolic,gpt_4o,44.4±0.7,43.6±1.3,48.2±0.6,44.7±0.8
random_str_symbolic_gpt_4o_mini,25.2,1.6,26.6,1.9,25.3,1.6,26.1,2.0,random_str_symbolic,gpt_4o_mini,25.2±1.6,26.6±1.9,25.3±1.6,26.1±2.0
random_str_symbolic_ollama_llama3_8b,25.4,1.4,25.8,1.3,32.4,1.0,32.5,0.8,random_str_symbolic,ollama_llama3_8b,25.4±1.4,25.8±1.3,32.4±1.0,32.5±0.8
random_str_symbolic_ollama_mistral_7b,25.2,1.2,20.4,1.4,46.1,0.7,32.1,0.9,random_str_symbolic,ollama_mistral_7b,25.2±1.2,20.4±1.4,46.1±0.7,32.1±0.9
random_str_symbolic_ollama_qwen2_7b,33.7,0.3,31.9,0.5,39.8,0.6,34.7,0.6,random_str_symbolic,ollama_qwen2_7b,33.7±0.3,31.9±0.5,39.8±0.6,34.7±0.6
random_word_language_claude_3_5_sonnet,59.0,1.2,58.4,1.7,61.3,0.8,57.5,1.5,random_word_language,claude_3_5_sonnet,59.0±1.2,58.4±1.7,61.3±0.8,57.5±1.5
random_word_language_claude_3_haiku,44.2,1.0,51.1,1.4,44.7,1.2,55.2,2.0,random_word_language,claude_3_haiku,44.2±1.0,51.1±1.4,44.7±1.2,55.2±2.0
random_word_language_gpt_4o,64.5,1.0,69.2,0.6,64.4,0.9,70.1,0.8,random_word_language,gpt_4o,64.5±1.0,69.2±0.6,64.4±0.9,70.1±0.8
random_word_language_gpt_4o_mini,42.1,1.4,46.6,1.7,41.2,1.5,46.8,1.7,random_word_language,gpt_4o_mini,42.1±1.4,46.6±1.7,41.2±1.5,46.8±1.7
random_word_language_ollama_llama3_8b,38.1,0.6,39.4,0.5,39.3,0.7,40.0,0.5,random_word_language,ollama_llama3_8b,38.1±0.6,39.4±0.5,39.3±0.7,40.0±0.5
random_word_language_ollama_mistral_7b,27.9,0.9,24.3,1.0,45.3,0.5,33.7,0.5,random_word_language,ollama_mistral_7b,27.9±0.9,24.3±1.0,45.3±0.5,33.7±0.5
random_word_language_ollama_qwen2_7b,39.1,0.7,42.8,0.8,40.3,0.5,45.3,0.8,random_word_language,ollama_qwen2_7b,39.1±0.7,42.8±0.8,40.3±0.5,45.3±0.8
random_word_symbolic_claude_3_5_sonnet,55.7,1.7,55.0,2.5,59.5,1.0,54.9,2.3,random_word_symbolic,claude_3_5_sonnet,55.7±1.7,55.0±2.5,59.5±1.0,54.9±2.3
random_word_symbolic_claude_3_haiku,25.9,1.3,29.3,1.4,26.7,1.6,30.9,1.8,random_word_symbolic,claude_3_haiku,25.9±1.3,29.3±1.4,26.7±1.6,30.9±1.8
random_word_symbolic_gpt_4o,36.9,0.6,37.4,0.5,37.9,0.6,37.6,0.5,random_word_symbolic,gpt_4o,36.9±0.6,37.4±0.5,37.9±0.6,37.6±0.5
random_word_symbolic_gpt_4o_mini,25.0,0.8,27.1,0.9,24.2,0.7,26.7,0.9,random_word_symbolic,gpt_4o_mini,25.0±0.8,27.1±0.9,24.2±0.7,26.7±0.9
random_word_symbolic_ollama_llama3_8b,28.4,1.2,29.1,1.1,33.4,0.7,33.9,0.3,random_word_symbolic,ollama_llama3_8b,28.4±1.2,29.1±1.1,33.4±0.7,33.9±0.3
random_word_symbolic_ollama_mistral_7b,26.6,0.9,22.2,1.1,45.7,0.3,32.6,0.4,random_word_symbolic,ollama_mistral_7b,26.6±0.9,22.2±1.1,45.7±0.3,32.6±0.4
random_word_symbolic_ollama_qwen2_7b,25.1,0.3,24.7,0.3,32.9,0.3,31.7,0.7,random_word_symbolic,ollama_qwen2_7b,25.1±0.3,24.7±0.3,32.9±0.3,31.7±0.7
related_word_language_claude_3_5_sonnet,54.8,1.9,53.9,1.5,58.5,2.1,53.4,1.5,related_word_language,claude_3_5_sonnet,54.8±1.9,53.9±1.5,58.5±2.1,53.4±1.5
related_word_language_claude_3_haiku,40.9,1.1,48.6,1.0,41.8,1.1,53.1,1.4,related_word_language,claude_3_haiku,40.9±1.1,48.6±1.0,41.8±1.1,53.1±1.4
related_word_language_gpt_4o,63.1,1.8,67.4,1.7,63.4,1.9,67.6,1.6,related_word_language,gpt_4o,63.1±1.8,67.4±1.7,63.4±1.9,67.6±1.6
related_word_language_gpt_4o_mini,40.5,1.1,45.4,1.2,39.6,1.0,45.3,1.7,related_word_language,gpt_4o_mini,40.5±1.1,45.4±1.2,39.6±1.0,45.3±1.7
related_word_language_ollama_llama3_8b,35.5,0.7,37.0,0.9,36.6,0.3,36.9,0.7,related_word_language,ollama_llama3_8b,35.5±0.7,37.0±0.9,36.6±0.3,36.9±0.7
related_word_language_ollama_mistral_7b,26.6,0.2,23.1,0.2,44.1,0.6,32.7,0.2,related_word_language,ollama_mistral_7b,26.6±0.2,23.1±0.2,44.1±0.6,32.7±0.2
related_word_language_ollama_qwen2_7b,37.3,1.7,42.0,2.3,38.9,1.8,45.0,2.4,related_word_language,ollama_qwen2_7b,37.3±1.7,42.0±2.3,38.9±1.8,45.0±2.4
related_word_symbolic_claude_3_5_sonnet,51.9,1.8,51.1,2.3,56.5,0.9,51.4,2.0,related_word_symbolic,claude_3_5_sonnet,51.9±1.8,51.1±2.3,56.5±0.9,51.4±2.0
related_word_symbolic_claude_3_haiku,24.4,0.6,27.6,1.0,25.4,0.4,28.9,0.8,related_word_symbolic,claude_3_haiku,24.4±0.6,27.6±1.0,25.4±0.4,28.9±0.8
related_word_symbolic_gpt_4o,37.2,0.4,37.2,0.6,38.8,0.2,37.4,0.5,related_word_symbolic,gpt_4o,37.2±0.4,37.2±0.6,38.8±0.2,37.4±0.5
related_word_symbolic_gpt_4o_mini,23.2,1.2,25.2,1.1,22.4,1.2,24.9,0.9,related_word_symbolic,gpt_4o_mini,23.2±1.2,25.2±1.1,22.4±1.2,24.9±0.9
related_word_symbolic_ollama_llama3_8b,26.1,0.8,26.3,0.6,32.4,1.2,31.9,0.8,related_word_symbolic,ollama_llama3_8b,26.1±0.8,26.3±0.6,32.4±1.2,31.9±0.8
related_word_symbolic_ollama_mistral_7b,27.8,1.1,24.4,1.3,44.6,1.0,33.3,1.0,related_word_symbolic,ollama_mistral_7b,27.8±1.1,24.4±1.3,44.6±1.0,33.3±1.0
related_word_symbolic_ollama_qwen2_7b,30.1,1.0,29.3,1.3,36.2,0.2,34.0,0.9,related_word_symbolic,ollama_qwen2_7b,30.1±1.0,29.3±1.3,36.2±0.2,34.0±0.9
