{
  "slug": "reinforcement_learning_from_human_feedback",
  "init": [
    "1902.00719",
    "1902.04257",
    "1904.08621",
    "1908.00169",
    "1909.06682",
    "1909.07502",
    "1909.09209",
    "1910.00682",
    "2001.07549",
    "2001.06781",
    "2002.10904",
    "2003.02638",
    "2007.00192",
    "2007.03363",
    "2007.12904",
    "2009.01325",
    "2009.02476",
    "2101.11333",
    "2102.02639",
    "2102.07024",
    "2102.07615",
    "2107.00359",
    "2107.10253",
    "2107.11965",
    "2108.01358",
    "2108.02839",
    "2201.00469",
    "2201.01251",
    "2201.08102",
    "2202.02465",
    "2208.02932",
    "2208.08241",
    "2209.14010",
    "2209.14375",
    "2301.00964",
    "2301.10528",
    "2301.11270",
    "2301.11774",
    "2307.00360",
    "2307.05532",
    "2307.04098"
  ],
  "evolution": {
    "2024-01": [
      "2401.15043",
      "2402.01698",
      "2401.13136",
      "2401.12086",
      "2401.11977",
      "2401.11458",
      "2401.11206",
      "2401.10882"
    ],
    "2024-03": [
      "2403.08694",
      "2403.08635",
      "2403.08309",
      "2403.07865",
      "2403.07708",
      "2403.06754",
      "2403.06516",
      "2403.05171"
    ],
    "2024-07": [
      "2407.14622",
      "2407.14503",
      "2407.14477",
      "2407.13887",
      "2407.08770",
      "2407.08213"
    ],
    "2024-09": [
      "2409.12914",
      "2409.12798",
      "2409.11741",
      "2410.00033",
      "2409.11704",
      "2409.15360",
      "2409.10164",
      "2409.09603"
    ],
    "2024-11": [
      "2411.08302",
      "2411.08923",
      "2411.07618",
      "2411.07595",
      "2411.07317",
      "2411.05273",
      "2411.04625",
      "2411.04712"
    ]
  },
  "validation": [
    "1903.03064",
    "1905.04127",
    "2001.08703",
    "2101.11071",
    "2203.02155",
    "2209.07858",
    "2307.00593",
    "2407.06902",
    "2407.13399",
    "2501.01332",
    "2501.02790",
    "2501.03262",
    "2501.03486",
    "2501.03884",
    "2501.05790",
    "2501.06416",
    "2501.07886",
    "2501.08617",
    "2501.09254",
    "2501.09620",
    "2501.11463",
    "2501.12698",
    "2501.12735",
    "2501.13927",
    "2501.15453",
    "2501.17112",
    "2501.18663",
    "2501.18873",
    "2501.19266",
    "2501.19358",
    "2502.00666",
    "2502.00814",
    "2502.01819",
    "2502.02671",
    "2502.03095",
    "2502.04270",
    "2502.04354",
    "2502.04357",
    "2502.06861",
    "2507.00665",
    "2507.01352",
    "2507.01915",
    "2507.02778",
    "2507.04136",
    "2507.04340",
    "2507.04453",
    "2507.04730",
    "2507.04736",
    "2507.07375",
    "2507.08027",
    "2507.09016",
    "2507.09406",
    "2507.09973",
    "2507.13171",
    "2507.13579",
    "2507.15507",
    "2507.16331",
    "2507.18802",
    "2507.21931",
    "2508.01612",
    "2508.01930",
    "2508.02618",
    "2508.03058",
    "2508.04149",
    "2508.05242",
    "2508.07126",
    "2508.07137",
    "2601.04736",
    "2601.05633",
    "2601.06108",
    "2601.06700",
    "2601.07349",
    "2601.09236",
    "2601.09992",
    "2601.10599",
    "2601.16403",
    "2601.18730",
    "2601.18824",
    "2601.19063",
    "2601.21350",
    "2601.22664",
    "2602.00426",
    "2602.01137",
    "2602.01685",
    "2602.01750",
    "2602.02383",
    "2602.02482",
    "2602.02488",
    "2602.02530",
    "2602.03876",
    "2602.04000",
    "2602.04651",
    "2602.05472",
    "2602.11180"
  ],
  "_provenance": {
    "init_count": 41,
    "evolution_window_count": 5,
    "evolution_total_papers": 38,
    "validation_count": 94,
    "cached_total": 173
  }
}