{
  "slug": "accuracy_of_automated_evaluation_for_llms",
  "init": [
    "2208.05950",
    "2212.13138",
    "2303.07263",
    "2303.16750",
    "2305.14752",
    "2305.16344",
    "2307.03875",
    "2307.16139",
    "2308.05012",
    "2308.13577"
  ],
  "evolution": {
    "2024-01": [
      "2402.14245",
      "2402.13740",
      "2402.12038",
      "2402.10767",
      "2402.05904",
      "2402.01411",
      "2401.17019"
    ],
    "2024-03": [
      "2404.03732",
      "2404.15320",
      "2404.02183",
      "2404.01549",
      "2403.18802",
      "2403.14965",
      "2403.12844",
      "2403.12196"
    ],
    "2024-05": [
      "2406.06591",
      "2406.06559",
      "2405.20585",
      "2405.19456",
      "2405.13219"
    ],
    "2024-07": [
      "2408.04650",
      "2408.01667",
      "2407.21429",
      "2407.20906",
      "2407.19056",
      "2407.15353",
      "2407.13166"
    ],
    "2024-09": [
      "2409.19006",
      "2409.12962",
      "2409.12405",
      "2409.11703",
      "2409.10504",
      "2409.10574",
      "2409.13727"
    ],
    "2024-11": [
      "2411.14258",
      "2411.13163",
      "2411.10213",
      "2411.09590",
      "2411.09269",
      "2411.09255",
      "2411.06852"
    ]
  },
  "validation": [
    "2405.14445",
    "2406.01943",
    "2406.06657",
    "2407.14567",
    "2409.05768",
    "2411.06691",
    "2501.00826",
    "2501.00940",
    "2501.01014",
    "2501.01588",
    "2501.01743",
    "2501.06496",
    "2501.08208",
    "2501.09126",
    "2501.09158",
    "2501.10421",
    "2501.11006",
    "2501.11496",
    "2501.13957",
    "2501.14499",
    "2501.14983",
    "2501.15581",
    "2501.16309",
    "2501.17183",
    "2501.18638",
    "2501.18908",
    "2502.00025",
    "2502.00562",
    "2502.01691",
    "2502.02715",
    "2502.04349",
    "2502.04355",
    "2502.05675",
    "2502.06111",
    "2502.07912",
    "2502.08909",
    "2502.10263",
    "2502.10953",
    "2502.12183",
    "2502.15702",
    "2502.15745",
    "2507.00769",
    "2507.02983",
    "2507.03410",
    "2507.03616",
    "2507.03834",
    "2507.05613",
    "2507.05816",
    "2507.05962",
    "2507.06920",
    "2507.10646",
    "2507.10803",
    "2507.11014",
    "2507.11527",
    "2507.13758",
    "2507.14107",
    "2507.14221",
    "2507.15268",
    "2507.16037",
    "2507.18476",
    "2507.19027",
    "2507.19969",
    "2507.20553",
    "2507.21103",
    "2507.21340",
    "2507.22936",
    "2508.05650",
    "2601.00254",
    "2601.00559",
    "2601.01196",
    "2601.02669",
    "2601.03232",
    "2601.03594",
    "2601.04680",
    "2601.05187",
    "2601.06615",
    "2601.06818",
    "2601.07019",
    "2601.07754",
    "2601.07954",
    "2601.09053",
    "2601.10173",
    "2601.16280",
    "2601.19913",
    "2601.20868",
    "2603.22625"
  ],
  "_provenance": {
    "init_count": 10,
    "evolution_window_count": 6,
    "evolution_total_papers": 41,
    "validation_count": 86,
    "cached_total": 137
  }
}