{
  "claude-4-sonnet": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 926,
      "line0_exact_match_rate": 51.44,
      "avg_cosine": 0.65
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 161,
        "line0_exact_match_rate": 53.67,
        "avg_cosine": 0.66
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 156,
        "line0_exact_match_rate": 52.0,
        "avg_cosine": 0.58
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 109,
        "line0_exact_match_rate": 36.33,
        "avg_cosine": 0.57
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 172,
        "line0_exact_match_rate": 57.33,
        "avg_cosine": 0.71
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 142,
        "line0_exact_match_rate": 47.33,
        "avg_cosine": 0.61
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 186,
        "line0_exact_match_rate": 62.0,
        "avg_cosine": 0.75
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 152,
        "line0_exact_match_rate": 50.67,
        "avg_cosine": 0.65
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 153,
        "line0_exact_match_rate": 51.0,
        "avg_cosine": 0.68
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 116,
        "line0_exact_match_rate": 38.67,
        "avg_cosine": 0.53
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 195,
        "line0_exact_match_rate": 65.0,
        "avg_cosine": 0.74
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 177,
        "line0_exact_match_rate": 59.0,
        "avg_cosine": 0.72
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 133,
        "line0_exact_match_rate": 44.33,
        "avg_cosine": 0.56
      }
    }
  },
  "DeepSeek-V3.1": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 939,
      "line0_exact_match_rate": 52.17,
      "avg_cosine": 0.64
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 172,
        "line0_exact_match_rate": 57.33,
        "avg_cosine": 0.69
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 145,
        "line0_exact_match_rate": 48.33,
        "avg_cosine": 0.5
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 119,
        "line0_exact_match_rate": 39.67,
        "avg_cosine": 0.56
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 168,
        "line0_exact_match_rate": 56.0,
        "avg_cosine": 0.68
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 150,
        "line0_exact_match_rate": 50.0,
        "avg_cosine": 0.62
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 185,
        "line0_exact_match_rate": 61.67,
        "avg_cosine": 0.77
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 146,
        "line0_exact_match_rate": 48.67,
        "avg_cosine": 0.63
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 161,
        "line0_exact_match_rate": 53.67,
        "avg_cosine": 0.71
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 124,
        "line0_exact_match_rate": 41.33,
        "avg_cosine": 0.51
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 183,
        "line0_exact_match_rate": 61.0,
        "avg_cosine": 0.7
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 187,
        "line0_exact_match_rate": 62.33,
        "avg_cosine": 0.72
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 138,
        "line0_exact_match_rate": 46.0,
        "avg_cosine": 0.54
      }
    }
  },
  "Ministral-3B": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 510,
      "line0_exact_match_rate": 28.33,
      "avg_cosine": 0.47
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 89,
        "line0_exact_match_rate": 29.67,
        "avg_cosine": 0.53
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 81,
        "line0_exact_match_rate": 27.0,
        "avg_cosine": 0.36
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 62,
        "line0_exact_match_rate": 20.67,
        "avg_cosine": 0.41
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 106,
        "line0_exact_match_rate": 35.33,
        "avg_cosine": 0.53
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 71,
        "line0_exact_match_rate": 23.67,
        "avg_cosine": 0.43
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 101,
        "line0_exact_match_rate": 33.67,
        "avg_cosine": 0.55
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 92,
        "line0_exact_match_rate": 30.67,
        "avg_cosine": 0.49
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 86,
        "line0_exact_match_rate": 28.67,
        "avg_cosine": 0.51
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 54,
        "line0_exact_match_rate": 18.0,
        "avg_cosine": 0.35
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 105,
        "line0_exact_match_rate": 35.0,
        "avg_cosine": 0.54
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 105,
        "line0_exact_match_rate": 35.0,
        "avg_cosine": 0.52
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 68,
        "line0_exact_match_rate": 22.67,
        "avg_cosine": 0.4
      }
    }
  },
  "claude-3-7-sonnet": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 890,
      "line0_exact_match_rate": 49.44,
      "avg_cosine": 0.63
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 159,
        "line0_exact_match_rate": 53.0,
        "avg_cosine": 0.7
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 159,
        "line0_exact_match_rate": 53.0,
        "avg_cosine": 0.59
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 95,
        "line0_exact_match_rate": 31.67,
        "avg_cosine": 0.5
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 157,
        "line0_exact_match_rate": 52.33,
        "avg_cosine": 0.65
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 133,
        "line0_exact_match_rate": 44.33,
        "avg_cosine": 0.59
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 187,
        "line0_exact_match_rate": 62.33,
        "avg_cosine": 0.75
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 151,
        "line0_exact_match_rate": 50.33,
        "avg_cosine": 0.64
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 139,
        "line0_exact_match_rate": 46.33,
        "avg_cosine": 0.64
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 109,
        "line0_exact_match_rate": 36.33,
        "avg_cosine": 0.5
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 181,
        "line0_exact_match_rate": 60.33,
        "avg_cosine": 0.71
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 175,
        "line0_exact_match_rate": 58.33,
        "avg_cosine": 0.71
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 135,
        "line0_exact_match_rate": 45.0,
        "avg_cosine": 0.57
      }
    }
  },
  "gpt-4.1": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 887,
      "line0_exact_match_rate": 49.28,
      "avg_cosine": 0.64
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 159,
        "line0_exact_match_rate": 53.0,
        "avg_cosine": 0.7
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 129,
        "line0_exact_match_rate": 43.0,
        "avg_cosine": 0.48
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 115,
        "line0_exact_match_rate": 38.33,
        "avg_cosine": 0.57
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 157,
        "line0_exact_match_rate": 52.33,
        "avg_cosine": 0.69
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 138,
        "line0_exact_match_rate": 46.0,
        "avg_cosine": 0.62
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 189,
        "line0_exact_match_rate": 63.0,
        "avg_cosine": 0.77
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 146,
        "line0_exact_match_rate": 48.67,
        "avg_cosine": 0.65
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 146,
        "line0_exact_match_rate": 48.67,
        "avg_cosine": 0.68
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 100,
        "line0_exact_match_rate": 33.33,
        "avg_cosine": 0.5
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 179,
        "line0_exact_match_rate": 59.67,
        "avg_cosine": 0.71
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 181,
        "line0_exact_match_rate": 60.33,
        "avg_cosine": 0.72
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 135,
        "line0_exact_match_rate": 45.0,
        "avg_cosine": 0.57
      }
    }
  },
  "gpt-4.1-mini": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 899,
      "line0_exact_match_rate": 49.94,
      "avg_cosine": 0.64
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 156,
        "line0_exact_match_rate": 52.0,
        "avg_cosine": 0.67
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 133,
        "line0_exact_match_rate": 44.33,
        "avg_cosine": 0.49
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 111,
        "line0_exact_match_rate": 37.0,
        "avg_cosine": 0.57
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 170,
        "line0_exact_match_rate": 56.67,
        "avg_cosine": 0.72
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 136,
        "line0_exact_match_rate": 45.33,
        "avg_cosine": 0.61
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 193,
        "line0_exact_match_rate": 64.33,
        "avg_cosine": 0.79
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 144,
        "line0_exact_match_rate": 48.0,
        "avg_cosine": 0.65
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 159,
        "line0_exact_match_rate": 53.0,
        "avg_cosine": 0.71
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 109,
        "line0_exact_match_rate": 36.33,
        "avg_cosine": 0.5
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 171,
        "line0_exact_match_rate": 57.0,
        "avg_cosine": 0.72
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 180,
        "line0_exact_match_rate": 60.0,
        "avg_cosine": 0.72
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 136,
        "line0_exact_match_rate": 45.33,
        "avg_cosine": 0.57
      }
    }
  },
  "DeepSeek-V3-0324": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 930,
      "line0_exact_match_rate": 51.67,
      "avg_cosine": 0.67
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 180,
        "line0_exact_match_rate": 60.0,
        "avg_cosine": 0.75
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 142,
        "line0_exact_match_rate": 47.33,
        "avg_cosine": 0.53
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 112,
        "line0_exact_match_rate": 37.33,
        "avg_cosine": 0.58
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 162,
        "line0_exact_match_rate": 54.0,
        "avg_cosine": 0.71
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 146,
        "line0_exact_match_rate": 48.67,
        "avg_cosine": 0.65
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 188,
        "line0_exact_match_rate": 62.67,
        "avg_cosine": 0.79
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 146,
        "line0_exact_match_rate": 48.67,
        "avg_cosine": 0.66
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 151,
        "line0_exact_match_rate": 50.33,
        "avg_cosine": 0.7
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 130,
        "line0_exact_match_rate": 43.33,
        "avg_cosine": 0.57
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 192,
        "line0_exact_match_rate": 64.0,
        "avg_cosine": 0.75
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 177,
        "line0_exact_match_rate": 59.0,
        "avg_cosine": 0.73
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 134,
        "line0_exact_match_rate": 44.67,
        "avg_cosine": 0.58
      }
    }
  },
  "gpt-4.1-nano": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 693,
      "line0_exact_match_rate": 38.5,
      "avg_cosine": 0.56
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 125,
        "line0_exact_match_rate": 41.67,
        "avg_cosine": 0.59
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 98,
        "line0_exact_match_rate": 32.67,
        "avg_cosine": 0.39
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 76,
        "line0_exact_match_rate": 25.33,
        "avg_cosine": 0.49
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 137,
        "line0_exact_match_rate": 45.67,
        "avg_cosine": 0.64
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 103,
        "line0_exact_match_rate": 34.33,
        "avg_cosine": 0.53
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 154,
        "line0_exact_match_rate": 51.33,
        "avg_cosine": 0.71
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 107,
        "line0_exact_match_rate": 35.67,
        "avg_cosine": 0.55
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 115,
        "line0_exact_match_rate": 38.33,
        "avg_cosine": 0.59
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 86,
        "line0_exact_match_rate": 28.67,
        "avg_cosine": 0.42
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 139,
        "line0_exact_match_rate": 46.33,
        "avg_cosine": 0.64
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 148,
        "line0_exact_match_rate": 49.33,
        "avg_cosine": 0.64
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 98,
        "line0_exact_match_rate": 32.67,
        "avg_cosine": 0.49
      }
    }
  },
  "gpt-4o": {
    "overall": {
      "total_comparisons": 1800,
      "line0_exact_matches": 903,
      "line0_exact_match_rate": 50.17,
      "avg_cosine": 0.65
    },
    "categories": {
      "pattern_matching": {
        "total_comparisons": 300,
        "line0_exact_matches": 163,
        "line0_exact_match_rate": 54.33,
        "avg_cosine": 0.7
      },
      "code2NL_NL2code": {
        "total_comparisons": 300,
        "line0_exact_matches": 127,
        "line0_exact_match_rate": 42.33,
        "avg_cosine": 0.48
      },
      "api_usage": {
        "total_comparisons": 300,
        "line0_exact_matches": 112,
        "line0_exact_match_rate": 37.33,
        "avg_cosine": 0.56
      },
      "code_purpose_understanding": {
        "total_comparisons": 300,
        "line0_exact_matches": 168,
        "line0_exact_match_rate": 56.0,
        "avg_cosine": 0.72
      },
      "syntax_completion": {
        "total_comparisons": 300,
        "line0_exact_matches": 141,
        "line0_exact_match_rate": 47.0,
        "avg_cosine": 0.63
      },
      "low_context": {
        "total_comparisons": 300,
        "line0_exact_matches": 192,
        "line0_exact_match_rate": 64.0,
        "avg_cosine": 0.77
      }
    },
    "languages": {
      "c_sharp": {
        "total_comparisons": 300,
        "line0_exact_matches": 139,
        "line0_exact_match_rate": 46.33,
        "avg_cosine": 0.64
      },
      "python": {
        "total_comparisons": 300,
        "line0_exact_matches": 144,
        "line0_exact_match_rate": 48.0,
        "avg_cosine": 0.68
      },
      "typescript": {
        "total_comparisons": 300,
        "line0_exact_matches": 120,
        "line0_exact_match_rate": 40.0,
        "avg_cosine": 0.53
      },
      "java": {
        "total_comparisons": 300,
        "line0_exact_matches": 182,
        "line0_exact_match_rate": 60.67,
        "avg_cosine": 0.72
      },
      "cpp": {
        "total_comparisons": 300,
        "line0_exact_matches": 180,
        "line0_exact_match_rate": 60.0,
        "avg_cosine": 0.72
      },
      "javascript": {
        "total_comparisons": 300,
        "line0_exact_matches": 138,
        "line0_exact_match_rate": 46.0,
        "avg_cosine": 0.58
      }
    }
  }
}