{
  "experiment_name": "async_staleness_seed456",
  "total_timesteps": 10000,
  "total_time": 454.54545454545456,
  "avg_throughput": 22,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.022068486102478434,
      "avg_reward": 0.046089401275991176,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.04640412901945819,
      "avg_reward": 0.11860272985526682,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.035130233327018194,
      "avg_reward": 0.05057834549463397,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.031871656448526825,
      "avg_reward": 0.009735783673206221,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.10522012900785976,
      "avg_reward": 0.027664541373084703,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.12587616796379233,
      "avg_reward": 0.11259348983104846,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.14420903035599347,
      "avg_reward": 0.21260234394550037,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.19164820541662375,
      "avg_reward": 0.19933598212525586,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.17470974000791437,
      "avg_reward": 0.1976453939047832,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.15652821155893712,
      "avg_reward": 0.1207849875153718,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.1419162097011488,
      "avg_reward": 0.09432994314644635,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.1868592978109897,
      "avg_reward": 0.15630602925013523,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.15946060019843003,
      "avg_reward": 0.11251420580501681,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.17171123838084829,
      "avg_reward": 0.19445073268810947,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.1461472693073841,
      "avg_reward": 0.10319877062545245,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.19243385165523627,
      "avg_reward": 0.08195267812657553,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.20445149297362764,
      "avg_reward": 0.1219059429080333,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.1941983105092468,
      "avg_reward": 0.15967597558135482,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.19074680145359252,
      "avg_reward": 0.09197231307793699,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.18892584246083385,
      "avg_reward": 0.1331966596430544,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.21340517428432612,
      "avg_reward": 0.1436699478571013,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.1920747558938083,
      "avg_reward": 0.13909662035281706,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.20301082045453853,
      "avg_reward": 0.2224902006594795,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.19848316002211547,
      "avg_reward": 0.18105812916494257,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.18048142515929028,
      "avg_reward": 0.14774176815764317,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.17979118211887968,
      "avg_reward": 0.09899210779879183,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.23196297745994496,
      "avg_reward": 0.18160664240617488,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.19726819081971217,
      "avg_reward": 0.1585046760260598,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.18504840070128234,
      "avg_reward": 0.234345490385517,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.20615213907047675,
      "avg_reward": 0.17763198703984145,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.21362992795862906,
      "avg_reward": 0.1675763570580254,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.20165043406019162,
      "avg_reward": 0.14501367390132067,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.23844089951283515,
      "avg_reward": 0.15907044643105384,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.22532948735039726,
      "avg_reward": 0.2709471505912692,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.23267340271011083,
      "avg_reward": 0.14201658692873567,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.25714552355084597,
      "avg_reward": 0.24841333340229638,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.2546504114051777,
      "avg_reward": 0.21830447784994622,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.24513601430676862,
      "avg_reward": 0.265379159210696,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.23822984221615723,
      "avg_reward": 0.24110258589494787,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.2523562046932508,
      "avg_reward": 0.24219246796917243,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.2506722289007057,
      "avg_reward": 0.18818894960731494,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.23679483861535758,
      "avg_reward": 0.14635353508390414,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.2779593831110348,
      "avg_reward": 0.18287141430270076,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.26932265981929365,
      "avg_reward": 0.20115323007053842,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.2459632633092099,
      "avg_reward": 0.25149283991927995,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.29638842686976213,
      "avg_reward": 0.14156471864772496,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.26988683034784544,
      "avg_reward": 0.24721944804373555,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.27195511458666716,
      "avg_reward": 0.3336960900982403,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.3189626907988161,
      "avg_reward": 0.2750124070404892,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.26143561518494,
      "avg_reward": 0.16647964988325886
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.23840096857715642,
      "avg_reward": 0.24943553190905077
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.2631158410105439,
      "avg_reward": 0.24501844540934742
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.3003641828956397,
      "avg_reward": 0.2166889319993186
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.27219481959490843,
      "avg_reward": 0.21419308179616905
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.28611172967484505,
      "avg_reward": 0.28276803214780205
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.33663428816934127,
      "avg_reward": 0.28691183644196794
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.3154491817766203,
      "avg_reward": 0.19462717655767175
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.3303498986266128,
      "avg_reward": 0.39290790388102403
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.31527289676869114,
      "avg_reward": 0.21204252045151414
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.3023532648177482,
      "avg_reward": 0.19227724958697215
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.290088608117453,
      "avg_reward": 0.1979250205190122
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.3345975306908187,
      "avg_reward": 0.24045315050986174
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.3186674220246289,
      "avg_reward": 0.22184592325368452
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.3119445673413167,
      "avg_reward": 0.17410684141264013
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.29738443728029995,
      "avg_reward": 0.2570056612499287
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.32572348781124566,
      "avg_reward": 0.28986785238636775
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.35200195736824635,
      "avg_reward": 0.4020462409190145
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.32644898196701644,
      "avg_reward": 0.1965051688344121
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.33248629581787786,
      "avg_reward": 0.35830915495763643
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.31784956310543505,
      "avg_reward": 0.217854831031714
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.33217482748235544,
      "avg_reward": 0.28333282223579515
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.3602450005804543,
      "avg_reward": 0.3324190735094573
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.35190281014839514,
      "avg_reward": 0.16549724515272135
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.339878306281188,
      "avg_reward": 0.22226272059432783
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.3421991352018797,
      "avg_reward": 0.24559367730949602
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.3451532278172135,
      "avg_reward": 0.318801256241514
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.34637099990422643,
      "avg_reward": 0.190172560273278
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.36492422358485394,
      "avg_reward": 0.2511382137794292
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.3476551414275517,
      "avg_reward": 0.2626272051564233
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.33363672075723555,
      "avg_reward": 0.18322343314899656
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.36046142870938835,
      "avg_reward": 0.3258362492880387
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.37903787745330353,
      "avg_reward": 0.15672142896929428
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.35563376114394923,
      "avg_reward": 0.32134269198994897
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.40617079568147896,
      "avg_reward": 0.3820857800163438
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.34292729270654376,
      "avg_reward": 0.2507656296709699
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.3935048811442505,
      "avg_reward": 0.27485487484356386
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.3279326765573924,
      "avg_reward": 0.2390275299933834
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.3741456942821547,
      "avg_reward": 0.32062326797538226
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.36546727254223066,
      "avg_reward": 0.33146539494667604
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.37185657330489597,
      "avg_reward": 0.3264476550797999
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.3811745218348157,
      "avg_reward": 0.21397902551111198
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.3451959496997376,
      "avg_reward": 0.18136983157688097
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.3915344041649047,
      "avg_reward": 0.31507107988546984
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.3654054325594142,
      "avg_reward": 0.32139003895714785
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.36695700062171477,
      "avg_reward": 0.2028406224189277
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.39216125190548295,
      "avg_reward": 0.368344815819818
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.40547714133893525,
      "avg_reward": 0.2822104950838327
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.35883156881549716,
      "avg_reward": 0.2839710885790014
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.42486847735208955,
      "avg_reward": 0.3893675930438712
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.42486847735208955,
      "avg_reward": 0.3893675930438712
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 11.0,
      "update": 1,
      "cumulative_wall_time": 4.545454545454546
    },
    {
      "timestep": 101,
      "throughput": 12.100000000000001,
      "update": 2,
      "cumulative_wall_time": 9.090909090909092
    },
    {
      "timestep": 202,
      "throughput": 13.2,
      "update": 3,
      "cumulative_wall_time": 13.636363636363637
    },
    {
      "timestep": 303,
      "throughput": 14.3,
      "update": 4,
      "cumulative_wall_time": 18.181818181818183
    },
    {
      "timestep": 404,
      "throughput": 15.399999999999999,
      "update": 5,
      "cumulative_wall_time": 22.72727272727273
    },
    {
      "timestep": 505,
      "throughput": 16.5,
      "update": 6,
      "cumulative_wall_time": 27.272727272727277
    },
    {
      "timestep": 606,
      "throughput": 17.6,
      "update": 7,
      "cumulative_wall_time": 31.818181818181824
    },
    {
      "timestep": 707,
      "throughput": 18.7,
      "update": 8,
      "cumulative_wall_time": 36.36363636363637
    },
    {
      "timestep": 808,
      "throughput": 19.8,
      "update": 9,
      "cumulative_wall_time": 40.909090909090914
    },
    {
      "timestep": 909,
      "throughput": 20.9,
      "update": 10,
      "cumulative_wall_time": 45.45454545454546
    },
    {
      "timestep": 1010,
      "throughput": 23.119961514633832,
      "update": 11,
      "cumulative_wall_time": 50.00000000000001
    },
    {
      "timestep": 1111,
      "throughput": 20.028546254838638,
      "update": 12,
      "cumulative_wall_time": 54.545454545454554
    },
    {
      "timestep": 1212,
      "throughput": 19.432426060549396,
      "update": 13,
      "cumulative_wall_time": 59.0909090909091
    },
    {
      "timestep": 1313,
      "throughput": 23.515230527828248,
      "update": 14,
      "cumulative_wall_time": 63.63636363636365
    },
    {
      "timestep": 1414,
      "throughput": 18.834855170723817,
      "update": 15,
      "cumulative_wall_time": 68.18181818181819
    },
    {
      "timestep": 1515,
      "throughput": 26.325108196401533,
      "update": 16,
      "cumulative_wall_time": 72.72727272727273
    },
    {
      "timestep": 1616,
      "throughput": 24.015328248417987,
      "update": 17,
      "cumulative_wall_time": 77.27272727272728
    },
    {
      "timestep": 1717,
      "throughput": 19.997239273035227,
      "update": 18,
      "cumulative_wall_time": 81.81818181818183
    },
    {
      "timestep": 1818,
      "throughput": 21.7604296756139,
      "update": 19,
      "cumulative_wall_time": 86.36363636363637
    },
    {
      "timestep": 1919,
      "throughput": 18.49514949714797,
      "update": 20,
      "cumulative_wall_time": 90.90909090909092
    },
    {
      "timestep": 2020,
      "throughput": 21.2788762793894,
      "update": 21,
      "cumulative_wall_time": 95.45454545454547
    },
    {
      "timestep": 2121,
      "throughput": 24.75857117258385,
      "update": 22,
      "cumulative_wall_time": 100.00000000000001
    },
    {
      "timestep": 2222,
      "throughput": 26.062581438349568,
      "update": 23,
      "cumulative_wall_time": 104.54545454545456
    },
    {
      "timestep": 2323,
      "throughput": 23.51114693465213,
      "update": 24,
      "cumulative_wall_time": 109.09090909090911
    },
    {
      "timestep": 2424,
      "throughput": 16.797628931062683,
      "update": 25,
      "cumulative_wall_time": 113.63636363636365
    },
    {
      "timestep": 2525,
      "throughput": 23.068700519255884,
      "update": 26,
      "cumulative_wall_time": 118.1818181818182
    },
    {
      "timestep": 2626,
      "throughput": 23.08259057277522,
      "update": 27,
      "cumulative_wall_time": 122.72727272727275
    },
    {
      "timestep": 2727,
      "throughput": 21.07315984675114,
      "update": 28,
      "cumulative_wall_time": 127.2727272727273
    },
    {
      "timestep": 2828,
      "throughput": 23.99943079899622,
      "update": 29,
      "cumulative_wall_time": 131.81818181818184
    },
    {
      "timestep": 2929,
      "throughput": 19.404235120830826,
      "update": 30,
      "cumulative_wall_time": 136.36363636363637
    },
    {
      "timestep": 3030,
      "throughput": 23.468115287597918,
      "update": 31,
      "cumulative_wall_time": 140.9090909090909
    },
    {
      "timestep": 3131,
      "throughput": 21.742923573904267,
      "update": 32,
      "cumulative_wall_time": 145.45454545454544
    },
    {
      "timestep": 3232,
      "throughput": 23.127331247579015,
      "update": 33,
      "cumulative_wall_time": 149.99999999999997
    },
    {
      "timestep": 3333,
      "throughput": 27.15009897378207,
      "update": 34,
      "cumulative_wall_time": 154.5454545454545
    },
    {
      "timestep": 3434,
      "throughput": 22.76053679384033,
      "update": 35,
      "cumulative_wall_time": 159.09090909090904
    },
    {
      "timestep": 3535,
      "throughput": 20.95431123251723,
      "update": 36,
      "cumulative_wall_time": 163.63636363636357
    },
    {
      "timestep": 3636,
      "throughput": 19.97912553769357,
      "update": 37,
      "cumulative_wall_time": 168.1818181818181
    },
    {
      "timestep": 3737,
      "throughput": 21.39671910205124,
      "update": 38,
      "cumulative_wall_time": 172.72727272727263
    },
    {
      "timestep": 3838,
      "throughput": 22.042157832145747,
      "update": 39,
      "cumulative_wall_time": 177.27272727272717
    },
    {
      "timestep": 3939,
      "throughput": 20.77523628002092,
      "update": 40,
      "cumulative_wall_time": 181.8181818181817
    },
    {
      "timestep": 4040,
      "throughput": 26.26452011851967,
      "update": 41,
      "cumulative_wall_time": 186.36363636363623
    },
    {
      "timestep": 4141,
      "throughput": 23.265378204734663,
      "update": 42,
      "cumulative_wall_time": 190.90909090909076
    },
    {
      "timestep": 4242,
      "throughput": 21.12830435732508,
      "update": 43,
      "cumulative_wall_time": 195.4545454545453
    },
    {
      "timestep": 4343,
      "throughput": 25.10512594929253,
      "update": 44,
      "cumulative_wall_time": 199.99999999999983
    },
    {
      "timestep": 4444,
      "throughput": 18.338566213164498,
      "update": 45,
      "cumulative_wall_time": 204.54545454545436
    },
    {
      "timestep": 4545,
      "throughput": 24.906359542928147,
      "update": 46,
      "cumulative_wall_time": 209.0909090909089
    },
    {
      "timestep": 4646,
      "throughput": 24.775447457030012,
      "update": 47,
      "cumulative_wall_time": 213.63636363636343
    },
    {
      "timestep": 4747,
      "throughput": 26.518754927887713,
      "update": 48,
      "cumulative_wall_time": 218.18181818181796
    },
    {
      "timestep": 4848,
      "throughput": 22.42664471711029,
      "update": 49,
      "cumulative_wall_time": 222.7272727272725
    },
    {
      "timestep": 4949,
      "throughput": 24.48016013202159,
      "update": 50,
      "cumulative_wall_time": 227.27272727272702
    },
    {
      "timestep": 5050,
      "throughput": 23.037563175481417,
      "update": 51,
      "cumulative_wall_time": 231.81818181818156
    },
    {
      "timestep": 5151,
      "throughput": 23.363671207673534,
      "update": 52,
      "cumulative_wall_time": 236.3636363636361
    },
    {
      "timestep": 5252,
      "throughput": 19.805453214883464,
      "update": 53,
      "cumulative_wall_time": 240.90909090909062
    },
    {
      "timestep": 5353,
      "throughput": 25.311270101278975,
      "update": 54,
      "cumulative_wall_time": 245.45454545454515
    },
    {
      "timestep": 5454,
      "throughput": 22.750430460245727,
      "update": 55,
      "cumulative_wall_time": 249.9999999999997
    },
    {
      "timestep": 5555,
      "throughput": 19.231028039986743,
      "update": 56,
      "cumulative_wall_time": 254.54545454545422
    },
    {
      "timestep": 5656,
      "throughput": 21.770663264815322,
      "update": 57,
      "cumulative_wall_time": 259.0909090909088
    },
    {
      "timestep": 5757,
      "throughput": 17.850186425443077,
      "update": 58,
      "cumulative_wall_time": 263.63636363636334
    },
    {
      "timestep": 5858,
      "throughput": 18.13668868075986,
      "update": 59,
      "cumulative_wall_time": 268.1818181818179
    },
    {
      "timestep": 5959,
      "throughput": 19.913801993031722,
      "update": 60,
      "cumulative_wall_time": 272.72727272727246
    },
    {
      "timestep": 6060,
      "throughput": 23.59453757550456,
      "update": 61,
      "cumulative_wall_time": 277.272727272727
    },
    {
      "timestep": 6161,
      "throughput": 24.855141362144526,
      "update": 62,
      "cumulative_wall_time": 281.8181818181816
    },
    {
      "timestep": 6262,
      "throughput": 20.085577340165692,
      "update": 63,
      "cumulative_wall_time": 286.36363636363615
    },
    {
      "timestep": 6363,
      "throughput": 21.203780131786825,
      "update": 64,
      "cumulative_wall_time": 290.9090909090907
    },
    {
      "timestep": 6464,
      "throughput": 22.421590971464045,
      "update": 65,
      "cumulative_wall_time": 295.45454545454527
    },
    {
      "timestep": 6565,
      "throughput": 21.853913650971247,
      "update": 66,
      "cumulative_wall_time": 299.99999999999983
    },
    {
      "timestep": 6666,
      "throughput": 22.431564725664625,
      "update": 67,
      "cumulative_wall_time": 304.5454545454544
    },
    {
      "timestep": 6767,
      "throughput": 19.326877691458524,
      "update": 68,
      "cumulative_wall_time": 309.09090909090895
    },
    {
      "timestep": 6868,
      "throughput": 23.20497875921956,
      "update": 69,
      "cumulative_wall_time": 313.6363636363635
    },
    {
      "timestep": 6969,
      "throughput": 21.540938100137282,
      "update": 70,
      "cumulative_wall_time": 318.1818181818181
    },
    {
      "timestep": 7070,
      "throughput": 20.99614914908322,
      "update": 71,
      "cumulative_wall_time": 322.72727272727263
    },
    {
      "timestep": 7171,
      "throughput": 23.390661012872748,
      "update": 72,
      "cumulative_wall_time": 327.2727272727272
    },
    {
      "timestep": 7272,
      "throughput": 22.569309788567264,
      "update": 73,
      "cumulative_wall_time": 331.81818181818176
    },
    {
      "timestep": 7373,
      "throughput": 23.011807207093774,
      "update": 74,
      "cumulative_wall_time": 336.3636363636363
    },
    {
      "timestep": 7474,
      "throughput": 21.600558277502362,
      "update": 75,
      "cumulative_wall_time": 340.9090909090909
    },
    {
      "timestep": 7575,
      "throughput": 25.250383326952296,
      "update": 76,
      "cumulative_wall_time": 345.45454545454544
    },
    {
      "timestep": 7676,
      "throughput": 21.277277411723382,
      "update": 77,
      "cumulative_wall_time": 350.0
    },
    {
      "timestep": 7777,
      "throughput": 25.034766460068436,
      "update": 78,
      "cumulative_wall_time": 354.54545454545456
    },
    {
      "timestep": 7878,
      "throughput": 21.327955603629576,
      "update": 79,
      "cumulative_wall_time": 359.0909090909091
    },
    {
      "timestep": 7979,
      "throughput": 23.49317246741433,
      "update": 80,
      "cumulative_wall_time": 363.6363636363637
    },
    {
      "timestep": 8080,
      "throughput": 19.751230163348986,
      "update": 81,
      "cumulative_wall_time": 368.18181818181824
    },
    {
      "timestep": 8181,
      "throughput": 17.884203997017938,
      "update": 82,
      "cumulative_wall_time": 372.7272727272728
    },
    {
      "timestep": 8282,
      "throughput": 24.11731829218486,
      "update": 83,
      "cumulative_wall_time": 377.27272727272737
    },
    {
      "timestep": 8383,
      "throughput": 21.073231636634773,
      "update": 84,
      "cumulative_wall_time": 381.8181818181819
    },
    {
      "timestep": 8484,
      "throughput": 23.77462368108833,
      "update": 85,
      "cumulative_wall_time": 386.3636363636365
    },
    {
      "timestep": 8585,
      "throughput": 25.037178328355015,
      "update": 86,
      "cumulative_wall_time": 390.90909090909105
    },
    {
      "timestep": 8686,
      "throughput": 20.35406668589609,
      "update": 87,
      "cumulative_wall_time": 395.4545454545456
    },
    {
      "timestep": 8787,
      "throughput": 20.660803197488015,
      "update": 88,
      "cumulative_wall_time": 400.00000000000017
    },
    {
      "timestep": 8888,
      "throughput": 22.30386899028124,
      "update": 89,
      "cumulative_wall_time": 404.54545454545473
    },
    {
      "timestep": 8989,
      "throughput": 21.463631532468742,
      "update": 90,
      "cumulative_wall_time": 409.0909090909093
    },
    {
      "timestep": 9090,
      "throughput": 22.237135763568098,
      "update": 91,
      "cumulative_wall_time": 413.63636363636385
    },
    {
      "timestep": 9191,
      "throughput": 24.03151901191627,
      "update": 92,
      "cumulative_wall_time": 418.1818181818184
    },
    {
      "timestep": 9292,
      "throughput": 19.887109371463495,
      "update": 93,
      "cumulative_wall_time": 422.727272727273
    },
    {
      "timestep": 9393,
      "throughput": 21.778048008536704,
      "update": 94,
      "cumulative_wall_time": 427.27272727272754
    },
    {
      "timestep": 9494,
      "throughput": 24.739041156234553,
      "update": 95,
      "cumulative_wall_time": 431.8181818181821
    },
    {
      "timestep": 9595,
      "throughput": 24.03033255920702,
      "update": 96,
      "cumulative_wall_time": 436.36363636363666
    },
    {
      "timestep": 9696,
      "throughput": 24.103116915457246,
      "update": 97,
      "cumulative_wall_time": 440.9090909090912
    },
    {
      "timestep": 9797,
      "throughput": 20.585385663133664,
      "update": 98,
      "cumulative_wall_time": 445.4545454545458
    },
    {
      "timestep": 9898,
      "throughput": 22.33775950539584,
      "update": 99,
      "cumulative_wall_time": 450.00000000000034
    },
    {
      "timestep": 10000,
      "throughput": 23.221001747891705,
      "update": 100,
      "cumulative_wall_time": 454.5454545454549
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.774535753066723,
        "recent_gradient": 0.00880228815501225
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6076855357527491,
        "recent_gradient": 0.021498278466352168
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.3831754599108145,
        "recent_gradient": 0.03149706388174175
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.28015326432172166,
        "recent_gradient": 0.019275276932362185
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.13334041455555007,
        "recent_gradient": 0.012821048819579189
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.269411344381984
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.280264511263108
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.37398672115195
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 4.826192872277722
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "uniform",
    "use_csc": true
  }
}