group,MA-f1_mean,MA-f1_std,wMA-f1_mean,wMA-f1_std,MI-f1_mean,MI-f1_std,wMI-f1_mean,wMI-f1_std,dtype,model,MA-f1,wMA-f1,MI-f1,wMI-f1
random_str_language_claude_3_5_sonnet,48.6,2.0,48.0,2.1,52.6,1.5,47.5,1.9,random_str_language,claude_3_5_sonnet,48.6±2.0,48.0±2.1,52.6±1.5,47.5±1.9
random_str_language_claude_3_haiku,41.9,1.2,49.9,1.1,44.5,0.9,57.0,1.1,random_str_language,claude_3_haiku,41.9±1.2,49.9±1.1,44.5±0.9,57.0±1.1
random_str_language_gpt_4o,64.7,0.6,69.0,0.7,65.0,0.9,69.2,0.7,random_str_language,gpt_4o,64.7±0.6,69.0±0.7,65.0±0.9,69.2±0.7
random_str_language_gpt_4o_mini,44.8,2.2,49.8,1.9,44.0,2.5,49.7,1.6,random_str_language,gpt_4o_mini,44.8±2.2,49.8±1.9,44.0±2.5,49.7±1.6
random_str_language_ollama_llama3_8b,38.9,1.7,38.9,1.9,41.6,1.5,39.0,1.7,random_str_language,ollama_llama3_8b,38.9±1.7,38.9±1.9,41.6±1.5,39.0±1.7
random_str_language_ollama_mistral_7b,36.7,0.6,35.9,0.8,42.9,0.6,37.5,0.7,random_str_language,ollama_mistral_7b,36.7±0.6,35.9±0.8,42.9±0.6,37.5±0.7
random_str_language_ollama_qwen2_7b,36.7,1.4,34.9,1.3,42.2,1.6,36.2,1.4,random_str_language,ollama_qwen2_7b,36.7±1.4,34.9±1.3,42.2±1.6,36.2±1.4
random_str_symbolic_claude_3_5_sonnet,55.9,0.9,56.7,0.8,58.4,0.9,56.2,0.8,random_str_symbolic,claude_3_5_sonnet,55.9±0.9,56.7±0.8,58.4±0.9,56.2±0.8
random_str_symbolic_claude_3_haiku,23.6,0.4,26.5,0.4,25.2,0.4,28.1,0.3,random_str_symbolic,claude_3_haiku,23.6±0.4,26.5±0.4,25.2±0.4,28.1±0.3
random_str_symbolic_gpt_4o,45.8,3.0,44.8,3.5,50.2,2.8,45.9,3.3,random_str_symbolic,gpt_4o,45.8±3.0,44.8±3.5,50.2±2.8,45.9±3.3
random_str_symbolic_gpt_4o_mini,23.5,0.9,25.0,0.8,23.3,1.0,24.5,0.9,random_str_symbolic,gpt_4o_mini,23.5±0.9,25.0±0.8,23.3±1.0,24.5±0.9
random_str_symbolic_ollama_llama3_8b,28.9,1.7,28.7,1.7,33.6,1.5,32.2,1.5,random_str_symbolic,ollama_llama3_8b,28.9±1.7,28.7±1.7,33.6±1.5,32.2±1.5
random_str_symbolic_ollama_mistral_7b,29.8,0.4,27.0,0.5,41.6,0.8,32.3,0.6,random_str_symbolic,ollama_mistral_7b,29.8±0.4,27.0±0.5,41.6±0.8,32.3±0.6
random_str_symbolic_ollama_qwen2_7b,31.7,1.4,29.3,1.4,39.0,1.3,32.3,1.3,random_str_symbolic,ollama_qwen2_7b,31.7±1.4,29.3±1.4,39.0±1.3,32.3±1.3
random_word_language_claude_3_5_sonnet,59.6,0.8,59.0,0.6,62.0,1.1,58.1,0.6,random_word_language,claude_3_5_sonnet,59.6±0.8,59.0±0.6,62.0±1.1,58.1±0.6
random_word_language_claude_3_haiku,42.5,1.0,49.4,1.0,43.0,0.8,53.3,1.2,random_word_language,claude_3_haiku,42.5±1.0,49.4±1.0,43.0±0.8,53.3±1.2
random_word_language_gpt_4o,68.1,0.8,71.8,0.6,68.1,0.7,72.1,0.6,random_word_language,gpt_4o,68.1±0.8,71.8±0.6,68.1±0.7,72.1±0.6
random_word_language_gpt_4o_mini,41.8,0.8,46.4,0.8,40.8,0.8,46.6,1.0,random_word_language,gpt_4o_mini,41.8±0.8,46.4±0.8,40.8±0.8,46.6±1.0
random_word_language_ollama_llama3_8b,37.6,0.1,37.7,0.4,39.9,0.7,38.1,0.2,random_word_language,ollama_llama3_8b,37.6±0.1,37.7±0.4,39.9±0.7,38.1±0.2
random_word_language_ollama_mistral_7b,38.5,1.9,37.7,2.4,44.1,0.6,39.0,1.5,random_word_language,ollama_mistral_7b,38.5±1.9,37.7±2.4,44.1±0.6,39.0±1.5
random_word_language_ollama_qwen2_7b,34.8,0.6,31.6,0.6,44.8,0.9,35.6,0.7,random_word_language,ollama_qwen2_7b,34.8±0.6,31.6±0.6,44.8±0.9,35.6±0.7
random_word_symbolic_claude_3_5_sonnet,57.3,2.1,57.0,2.6,60.5,2.1,56.8,2.6,random_word_symbolic,claude_3_5_sonnet,57.3±2.1,57.0±2.6,60.5±2.1,56.8±2.6
random_word_symbolic_claude_3_haiku,25.3,0.8,28.8,1.4,25.9,1.1,30.2,1.8,random_word_symbolic,claude_3_haiku,25.3±0.8,28.8±1.4,25.9±1.1,30.2±1.8
random_word_symbolic_gpt_4o,39.1,1.3,39.1,1.7,40.6,1.3,39.3,1.7,random_word_symbolic,gpt_4o,39.1±1.3,39.1±1.7,40.6±1.3,39.3±1.7
random_word_symbolic_gpt_4o_mini,24.6,1.3,26.6,1.5,23.8,1.5,26.3,1.7,random_word_symbolic,gpt_4o_mini,24.6±1.3,26.6±1.5,23.8±1.5,26.3±1.7
random_word_symbolic_ollama_llama3_8b,29.9,1.5,30.4,1.6,33.9,1.4,33.8,1.2,random_word_symbolic,ollama_llama3_8b,29.9±1.5,30.4±1.6,33.9±1.4,33.8±1.2
random_word_symbolic_ollama_mistral_7b,30.9,0.6,28.3,0.7,40.8,0.7,32.4,0.7,random_word_symbolic,ollama_mistral_7b,30.9±0.6,28.3±0.7,40.8±0.7,32.4±0.7
random_word_symbolic_ollama_qwen2_7b,31.0,1.1,28.2,1.4,40.2,0.2,31.9,0.7,random_word_symbolic,ollama_qwen2_7b,31.0±1.1,28.2±1.4,40.2±0.2,31.9±0.7
related_word_language_claude_3_5_sonnet,55.7,1.2,54.7,1.4,59.6,0.3,54.1,1.2,related_word_language,claude_3_5_sonnet,55.7±1.2,54.7±1.4,59.6±0.3,54.1±1.2
related_word_language_claude_3_haiku,40.3,1.8,48.1,1.6,41.3,1.9,52.9,2.0,related_word_language,claude_3_haiku,40.3±1.8,48.1±1.6,41.3±1.9,52.9±2.0
related_word_language_gpt_4o,64.4,0.3,68.4,0.5,64.7,0.5,68.4,0.5,related_word_language,gpt_4o,64.4±0.3,68.4±0.5,64.7±0.5,68.4±0.5
related_word_language_gpt_4o_mini,39.4,2.1,44.5,1.5,38.4,2.2,44.5,1.3,related_word_language,gpt_4o_mini,39.4±2.1,44.5±1.5,38.4±2.2,44.5±1.3
related_word_language_ollama_llama3_8b,36.5,1.6,36.7,2.1,38.8,0.8,36.8,1.9,related_word_language,ollama_llama3_8b,36.5±1.6,36.7±2.1,38.8±0.8,36.8±1.9
related_word_language_ollama_mistral_7b,37.5,1.3,37.4,1.3,42.3,1.3,38.2,1.3,related_word_language,ollama_mistral_7b,37.5±1.3,37.4±1.3,42.3±1.3,38.2±1.3
related_word_language_ollama_qwen2_7b,37.6,0.6,35.5,0.8,44.5,0.5,37.3,0.5,related_word_language,ollama_qwen2_7b,37.6±0.6,35.5±0.8,44.5±0.5,37.3±0.5
related_word_symbolic_claude_3_5_sonnet,53.9,0.6,53.3,0.5,58.1,0.9,53.5,0.6,related_word_symbolic,claude_3_5_sonnet,53.9±0.6,53.3±0.5,58.1±0.9,53.5±0.6
related_word_symbolic_claude_3_haiku,23.9,1.0,27.0,1.4,24.9,0.8,28.3,1.3,related_word_symbolic,claude_3_haiku,23.9±1.0,27.0±1.4,24.9±0.8,28.3±1.3
related_word_symbolic_gpt_4o,38.8,1.1,38.6,0.9,40.8,1.6,38.8,1.0,related_word_symbolic,gpt_4o,38.8±1.1,38.6±0.9,40.8±1.6,38.8±1.0
related_word_symbolic_gpt_4o_mini,23.8,1.5,26.5,1.8,22.7,1.4,26.4,2.0,related_word_symbolic,gpt_4o_mini,23.8±1.5,26.5±1.8,22.7±1.4,26.4±2.0
related_word_symbolic_ollama_llama3_8b,29.7,0.3,29.3,0.2,35.7,0.4,33.8,0.4,related_word_symbolic,ollama_llama3_8b,29.7±0.3,29.3±0.2,35.7±0.4,33.8±0.4
related_word_symbolic_ollama_mistral_7b,31.0,0.8,28.1,0.9,42.1,0.8,32.8,0.7,related_word_symbolic,ollama_mistral_7b,31.0±0.8,28.1±0.9,42.1±0.8,32.8±0.7
related_word_symbolic_ollama_qwen2_7b,28.8,0.7,26.0,0.7,37.5,0.8,29.5,0.6,related_word_symbolic,ollama_qwen2_7b,28.8±0.7,26.0±0.7,37.5±0.8,29.5±0.6
