{
  "experiment_name": "async_staleness_seed42",
  "total_timesteps": 10000,
  "total_time": 454.54545454545456,
  "avg_throughput": 22,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.022650740458983548,
      "avg_reward": 0.09427208518758812,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.014710871899472674,
      "avg_reward": 6.184967211911134e-05,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.06067516540105691,
      "avg_reward": 0.08691186877849097,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.029398391069179745,
      "avg_reward": 0.050646715034642034,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.13627120206138654,
      "avg_reward": 0.08573047397059638,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.15295233470895173,
      "avg_reward": 0.026697855534271495,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.11621326704358825,
      "avg_reward": 0.06485623717282198,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.13307806237689995,
      "avg_reward": 0.12217481653128366,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.13782129187311734,
      "avg_reward": 0.0396418484317293,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.18796534106448662,
      "avg_reward": 0.1390834578272625,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.16269647751768954,
      "avg_reward": 0.0589197727034788,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.15317418961401466,
      "avg_reward": 0.12808548117670504,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.14377968974527666,
      "avg_reward": 0.13380865271350492,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.15754567115199986,
      "avg_reward": 0.11145184943193605,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.1603037195666754,
      "avg_reward": 0.22085688487878724,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.1748671713321704,
      "avg_reward": 0.0870081906179413,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.1944064468902683,
      "avg_reward": 0.09448297501366351,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.18496971206332063,
      "avg_reward": 0.049992263456667727,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.15708333810655103,
      "avg_reward": 0.135509732278697,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.20128798518546676,
      "avg_reward": 0.16959880220787193,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.18709348633821707,
      "avg_reward": 0.13461960429110922,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.1627392236771602,
      "avg_reward": 0.09419916852199273,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.18601470351916982,
      "avg_reward": 0.20166787412628165,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.20503143747923927,
      "avg_reward": 0.07587314221525474,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.20758527781252228,
      "avg_reward": 0.146814108229202,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.19052176009548602,
      "avg_reward": 0.1830012225184322,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.2276479933331238,
      "avg_reward": 0.22868240062230896,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.1932217686687666,
      "avg_reward": 0.1391167961424526,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.21961891706654743,
      "avg_reward": 0.22447239000935593,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.20640619390884027,
      "avg_reward": 0.15584200629388137,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.19686658756926723,
      "avg_reward": 0.09768293885138027,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.23825405775492958,
      "avg_reward": 0.2584152476324848,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.22357929834899032,
      "avg_reward": 0.2290400835737935,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.23527293810038397,
      "avg_reward": 0.155962362750051,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.23829264997320676,
      "avg_reward": 0.2675359483018639,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.23337558205760056,
      "avg_reward": 0.26493264843678077,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.18472644809699978,
      "avg_reward": 0.18887628369636103,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.24189245649614946,
      "avg_reward": 0.1785635976736262,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.24501684730999618,
      "avg_reward": 0.0966350321179523,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.2418172965090429,
      "avg_reward": 0.21130946578282164,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.27879573892168924,
      "avg_reward": 0.19712308022366903,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.23609216896079444,
      "avg_reward": 0.16378588298940874,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.27359036729238256,
      "avg_reward": 0.23530984931689028,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.2477025523593436,
      "avg_reward": 0.2238254135431427,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.26324893929236515,
      "avg_reward": 0.25903140096053656,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.2502692188004057,
      "avg_reward": 0.18383226771043618,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.2594633391080536,
      "avg_reward": 0.13439492387983695,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.27621453657276257,
      "avg_reward": 0.23402439286720453,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.27337152538344417,
      "avg_reward": 0.206967863637998,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.24792856380455247,
      "avg_reward": 0.17731058490537405
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.27233712158419443,
      "avg_reward": 0.1777558338062746
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.2789089694241874,
      "avg_reward": 0.24332971838007686
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.32278865438282967,
      "avg_reward": 0.2669598141478557
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.2931323361487184,
      "avg_reward": 0.2307835731306664
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.25250761033210534,
      "avg_reward": 0.20068039449322345
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.29497385212391175,
      "avg_reward": 0.35914118732339373
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.2927919599761502,
      "avg_reward": 0.2493109350976008
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.2987978235568456,
      "avg_reward": 0.18060435696449986
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.3251835934502633,
      "avg_reward": 0.2977435263945494
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.320964323641925,
      "avg_reward": 0.21130208617380308
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.33599687983178445,
      "avg_reward": 0.1987049507258135
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.32245551962943086,
      "avg_reward": 0.36748719699404364
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.29366444682764936,
      "avg_reward": 0.2066166709819809
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.31820376668554506,
      "avg_reward": 0.2293892306426261
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.2879111895957403,
      "avg_reward": 0.23375710041689363
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.3003696615013904,
      "avg_reward": 0.26397535073287137
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.30589551729360714,
      "avg_reward": 0.3222131340857627
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.3112636451464902,
      "avg_reward": 0.2329078403069084
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.34581968581737416,
      "avg_reward": 0.2151125328322016
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.33669459541007757,
      "avg_reward": 0.33471281404218345
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.3025667401470449,
      "avg_reward": 0.2512850850442511
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.3424595746923032,
      "avg_reward": 0.3130588033427081
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.31504250229711406,
      "avg_reward": 0.18601117118347743
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.35271363206719053,
      "avg_reward": 0.2970201393154117
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.3497512561825116,
      "avg_reward": 0.2971234154208581
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.33358046975168254,
      "avg_reward": 0.2784770606593962
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.355454622273077,
      "avg_reward": 0.24864612691714322
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.38929321674695894,
      "avg_reward": 0.33512621944315657
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.3305082811014131,
      "avg_reward": 0.29723430531282197
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.3371691626630571,
      "avg_reward": 0.30908956031756823
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.3821347465679561,
      "avg_reward": 0.2646736813367794
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.38050178717275845,
      "avg_reward": 0.32504047608503167
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.3799181078865503,
      "avg_reward": 0.3987741354419376
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.36078283544373185,
      "avg_reward": 0.250939460137111
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.3500849199637493,
      "avg_reward": 0.23927742172272753
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.3684885894416738,
      "avg_reward": 0.31184847029417123
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.377690566914506,
      "avg_reward": 0.343511615983406
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.3745135571347664,
      "avg_reward": 0.372287549565679
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.371027741331753,
      "avg_reward": 0.43283065139488336
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.3908721431412089,
      "avg_reward": 0.269839836692153
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.35894941243986345,
      "avg_reward": 0.31128315071405
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.37787702830702496,
      "avg_reward": 0.3380016473502246
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.39376063917010995,
      "avg_reward": 0.31136706570324435
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.3692802394118455,
      "avg_reward": 0.21968183029518318
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.37917672678309217,
      "avg_reward": 0.3461613211426474
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.3942505748141219,
      "avg_reward": 0.25311352091569816
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.3952648476989417,
      "avg_reward": 0.33547774714559525
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.3759275733394191,
      "avg_reward": 0.3084283139688117
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3965434762427287,
      "avg_reward": 0.2600862661026518
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3965434762427287,
      "avg_reward": 0.2600862661026518
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 11.0,
      "update": 1,
      "cumulative_wall_time": 4.545454545454546
    },
    {
      "timestep": 101,
      "throughput": 12.100000000000001,
      "update": 2,
      "cumulative_wall_time": 9.090909090909092
    },
    {
      "timestep": 202,
      "throughput": 13.2,
      "update": 3,
      "cumulative_wall_time": 13.636363636363637
    },
    {
      "timestep": 303,
      "throughput": 14.3,
      "update": 4,
      "cumulative_wall_time": 18.181818181818183
    },
    {
      "timestep": 404,
      "throughput": 15.399999999999999,
      "update": 5,
      "cumulative_wall_time": 22.72727272727273
    },
    {
      "timestep": 505,
      "throughput": 16.5,
      "update": 6,
      "cumulative_wall_time": 27.272727272727277
    },
    {
      "timestep": 606,
      "throughput": 17.6,
      "update": 7,
      "cumulative_wall_time": 31.818181818181824
    },
    {
      "timestep": 707,
      "throughput": 18.7,
      "update": 8,
      "cumulative_wall_time": 36.36363636363637
    },
    {
      "timestep": 808,
      "throughput": 19.8,
      "update": 9,
      "cumulative_wall_time": 40.909090909090914
    },
    {
      "timestep": 909,
      "throughput": 20.9,
      "update": 10,
      "cumulative_wall_time": 45.45454545454546
    },
    {
      "timestep": 1010,
      "throughput": 22.787132192766222,
      "update": 11,
      "cumulative_wall_time": 50.00000000000001
    },
    {
      "timestep": 1111,
      "throughput": 23.233725958010115,
      "update": 12,
      "cumulative_wall_time": 54.545454545454554
    },
    {
      "timestep": 1212,
      "throughput": 24.38271273498561,
      "update": 13,
      "cumulative_wall_time": 59.0909090909091
    },
    {
      "timestep": 1313,
      "throughput": 24.318364514476784,
      "update": 14,
      "cumulative_wall_time": 63.63636363636365
    },
    {
      "timestep": 1414,
      "throughput": 18.9691273904944,
      "update": 15,
      "cumulative_wall_time": 68.18181818181819
    },
    {
      "timestep": 1515,
      "throughput": 19.936784912186727,
      "update": 16,
      "cumulative_wall_time": 72.72727272727273
    },
    {
      "timestep": 1616,
      "throughput": 23.13307758785905,
      "update": 17,
      "cumulative_wall_time": 77.27272727272728
    },
    {
      "timestep": 1717,
      "throughput": 23.13032909200686,
      "update": 18,
      "cumulative_wall_time": 81.81818181818183
    },
    {
      "timestep": 1818,
      "throughput": 23.133104909873303,
      "update": 19,
      "cumulative_wall_time": 86.36363636363637
    },
    {
      "timestep": 1919,
      "throughput": 30.476009279440387,
      "update": 20,
      "cumulative_wall_time": 90.90909090909092
    },
    {
      "timestep": 2020,
      "throughput": 23.255959123524967,
      "update": 21,
      "cumulative_wall_time": 95.45454545454547
    },
    {
      "timestep": 2121,
      "throughput": 24.498244408397316,
      "update": 22,
      "cumulative_wall_time": 100.00000000000001
    },
    {
      "timestep": 2222,
      "throughput": 24.098803879685043,
      "update": 23,
      "cumulative_wall_time": 104.54545454545456
    },
    {
      "timestep": 2323,
      "throughput": 23.433060752872755,
      "update": 24,
      "cumulative_wall_time": 109.09090909090911
    },
    {
      "timestep": 2424,
      "throughput": 21.30640766179124,
      "update": 25,
      "cumulative_wall_time": 113.63636363636365
    },
    {
      "timestep": 2525,
      "throughput": 23.66973228508519,
      "update": 26,
      "cumulative_wall_time": 118.1818181818182
    },
    {
      "timestep": 2626,
      "throughput": 20.299784528017344,
      "update": 27,
      "cumulative_wall_time": 122.72727272727275
    },
    {
      "timestep": 2727,
      "throughput": 21.47899906517198,
      "update": 28,
      "cumulative_wall_time": 127.2727272727273
    },
    {
      "timestep": 2828,
      "throughput": 20.932200194775973,
      "update": 29,
      "cumulative_wall_time": 131.81818181818184
    },
    {
      "timestep": 2929,
      "throughput": 22.18012310664991,
      "update": 30,
      "cumulative_wall_time": 136.36363636363637
    },
    {
      "timestep": 3030,
      "throughput": 27.09224884668172,
      "update": 31,
      "cumulative_wall_time": 140.9090909090909
    },
    {
      "timestep": 3131,
      "throughput": 17.892016576298154,
      "update": 32,
      "cumulative_wall_time": 145.45454545454544
    },
    {
      "timestep": 3232,
      "throughput": 23.50977241882393,
      "update": 33,
      "cumulative_wall_time": 149.99999999999997
    },
    {
      "timestep": 3333,
      "throughput": 18.452025083382765,
      "update": 34,
      "cumulative_wall_time": 154.5454545454545
    },
    {
      "timestep": 3434,
      "throughput": 20.961749895263246,
      "update": 35,
      "cumulative_wall_time": 159.09090909090904
    },
    {
      "timestep": 3535,
      "throughput": 24.395691313328207,
      "update": 36,
      "cumulative_wall_time": 163.63636363636357
    },
    {
      "timestep": 3636,
      "throughput": 22.141416042010015,
      "update": 37,
      "cumulative_wall_time": 168.1818181818181
    },
    {
      "timestep": 3737,
      "throughput": 19.628961488555525,
      "update": 38,
      "cumulative_wall_time": 172.72727272727263
    },
    {
      "timestep": 3838,
      "throughput": 20.42633183962807,
      "update": 39,
      "cumulative_wall_time": 177.27272727272717
    },
    {
      "timestep": 3939,
      "throughput": 23.495115047656284,
      "update": 40,
      "cumulative_wall_time": 181.8181818181817
    },
    {
      "timestep": 4040,
      "throughput": 20.3931934102223,
      "update": 41,
      "cumulative_wall_time": 186.36363636363623
    },
    {
      "timestep": 4141,
      "throughput": 22.476208897080348,
      "update": 42,
      "cumulative_wall_time": 190.90909090909076
    },
    {
      "timestep": 4242,
      "throughput": 22.100258047788387,
      "update": 43,
      "cumulative_wall_time": 195.4545454545453
    },
    {
      "timestep": 4343,
      "throughput": 20.566479235267202,
      "update": 44,
      "cumulative_wall_time": 199.99999999999983
    },
    {
      "timestep": 4444,
      "throughput": 26.71667699651572,
      "update": 45,
      "cumulative_wall_time": 204.54545454545436
    },
    {
      "timestep": 4545,
      "throughput": 23.39462184909962,
      "update": 46,
      "cumulative_wall_time": 209.0909090909089
    },
    {
      "timestep": 4646,
      "throughput": 17.544686309353267,
      "update": 47,
      "cumulative_wall_time": 213.63636363636343
    },
    {
      "timestep": 4747,
      "throughput": 22.410199492492744,
      "update": 48,
      "cumulative_wall_time": 218.18181818181796
    },
    {
      "timestep": 4848,
      "throughput": 20.544069777509545,
      "update": 49,
      "cumulative_wall_time": 222.7272727272725
    },
    {
      "timestep": 4949,
      "throughput": 23.87535333655169,
      "update": 50,
      "cumulative_wall_time": 227.27272727272702
    },
    {
      "timestep": 5050,
      "throughput": 20.256454375448058,
      "update": 51,
      "cumulative_wall_time": 231.81818181818156
    },
    {
      "timestep": 5151,
      "throughput": 21.74757982877282,
      "update": 52,
      "cumulative_wall_time": 236.3636363636361
    },
    {
      "timestep": 5252,
      "throughput": 23.110972013757006,
      "update": 53,
      "cumulative_wall_time": 240.90909090909062
    },
    {
      "timestep": 5353,
      "throughput": 23.90466142717427,
      "update": 54,
      "cumulative_wall_time": 245.45454545454515
    },
    {
      "timestep": 5454,
      "throughput": 19.359347904477293,
      "update": 55,
      "cumulative_wall_time": 249.9999999999997
    },
    {
      "timestep": 5555,
      "throughput": 21.264097281149915,
      "update": 56,
      "cumulative_wall_time": 254.54545454545422
    },
    {
      "timestep": 5656,
      "throughput": 20.955120315445896,
      "update": 57,
      "cumulative_wall_time": 259.0909090909088
    },
    {
      "timestep": 5757,
      "throughput": 20.562675688337833,
      "update": 58,
      "cumulative_wall_time": 263.63636363636334
    },
    {
      "timestep": 5858,
      "throughput": 25.883999328618412,
      "update": 59,
      "cumulative_wall_time": 268.1818181818179
    },
    {
      "timestep": 5959,
      "throughput": 22.890959764114104,
      "update": 60,
      "cumulative_wall_time": 272.72727272727246
    },
    {
      "timestep": 6060,
      "throughput": 19.2260553004629,
      "update": 61,
      "cumulative_wall_time": 277.272727272727
    },
    {
      "timestep": 6161,
      "throughput": 24.019296283520507,
      "update": 62,
      "cumulative_wall_time": 281.8181818181816
    },
    {
      "timestep": 6262,
      "throughput": 26.66874363342779,
      "update": 63,
      "cumulative_wall_time": 286.36363636363615
    },
    {
      "timestep": 6363,
      "throughput": 24.271423573212523,
      "update": 64,
      "cumulative_wall_time": 290.9090909090907
    },
    {
      "timestep": 6464,
      "throughput": 18.65738607490117,
      "update": 65,
      "cumulative_wall_time": 295.45454545454527
    },
    {
      "timestep": 6565,
      "throughput": 20.934685039694244,
      "update": 66,
      "cumulative_wall_time": 299.99999999999983
    },
    {
      "timestep": 6666,
      "throughput": 24.78720452821057,
      "update": 67,
      "cumulative_wall_time": 304.5454545454544
    },
    {
      "timestep": 6767,
      "throughput": 20.443127175638683,
      "update": 68,
      "cumulative_wall_time": 309.09090909090895
    },
    {
      "timestep": 6868,
      "throughput": 22.976402741921703,
      "update": 69,
      "cumulative_wall_time": 313.6363636363635
    },
    {
      "timestep": 6969,
      "throughput": 23.70419491754454,
      "update": 70,
      "cumulative_wall_time": 318.1818181818181
    },
    {
      "timestep": 7070,
      "throughput": 19.96075296252822,
      "update": 71,
      "cumulative_wall_time": 322.72727272727263
    },
    {
      "timestep": 7171,
      "throughput": 21.86904421666404,
      "update": 72,
      "cumulative_wall_time": 327.2727272727272
    },
    {
      "timestep": 7272,
      "throughput": 14.86921185184804,
      "update": 73,
      "cumulative_wall_time": 331.81818181818176
    },
    {
      "timestep": 7373,
      "throughput": 19.74634718906456,
      "update": 74,
      "cumulative_wall_time": 336.3636363636363
    },
    {
      "timestep": 7474,
      "throughput": 21.444350066935048,
      "update": 75,
      "cumulative_wall_time": 340.9090909090909
    },
    {
      "timestep": 7575,
      "throughput": 19.25487699967733,
      "update": 76,
      "cumulative_wall_time": 345.45454545454544
    },
    {
      "timestep": 7676,
      "throughput": 25.591304868649598,
      "update": 77,
      "cumulative_wall_time": 350.0
    },
    {
      "timestep": 7777,
      "throughput": 18.85368896848661,
      "update": 78,
      "cumulative_wall_time": 354.54545454545456
    },
    {
      "timestep": 7878,
      "throughput": 21.031902129266633,
      "update": 79,
      "cumulative_wall_time": 359.0909090909091
    },
    {
      "timestep": 7979,
      "throughput": 22.2876292700294,
      "update": 80,
      "cumulative_wall_time": 363.6363636363637
    },
    {
      "timestep": 8080,
      "throughput": 25.170801235945454,
      "update": 81,
      "cumulative_wall_time": 368.18181818181824
    },
    {
      "timestep": 8181,
      "throughput": 18.841103267405234,
      "update": 82,
      "cumulative_wall_time": 372.7272727272728
    },
    {
      "timestep": 8282,
      "throughput": 24.55896025474091,
      "update": 83,
      "cumulative_wall_time": 377.27272727272737
    },
    {
      "timestep": 8383,
      "throughput": 22.02251273424309,
      "update": 84,
      "cumulative_wall_time": 381.8181818181819
    },
    {
      "timestep": 8484,
      "throughput": 19.840680967694507,
      "update": 85,
      "cumulative_wall_time": 386.3636363636365
    },
    {
      "timestep": 8585,
      "throughput": 23.016627643379195,
      "update": 86,
      "cumulative_wall_time": 390.90909090909105
    },
    {
      "timestep": 8686,
      "throughput": 22.437931330261634,
      "update": 87,
      "cumulative_wall_time": 395.4545454545456
    },
    {
      "timestep": 8787,
      "throughput": 20.67952287025065,
      "update": 88,
      "cumulative_wall_time": 400.00000000000017
    },
    {
      "timestep": 8888,
      "throughput": 22.15356458697804,
      "update": 89,
      "cumulative_wall_time": 404.54545454545473
    },
    {
      "timestep": 8989,
      "throughput": 21.152310086904127,
      "update": 90,
      "cumulative_wall_time": 409.0909090909093
    },
    {
      "timestep": 9090,
      "throughput": 22.249738159552745,
      "update": 91,
      "cumulative_wall_time": 413.63636363636385
    },
    {
      "timestep": 9191,
      "throughput": 23.456687483946304,
      "update": 92,
      "cumulative_wall_time": 418.1818181818184
    },
    {
      "timestep": 9292,
      "throughput": 25.489236995519775,
      "update": 93,
      "cumulative_wall_time": 422.727272727273
    },
    {
      "timestep": 9393,
      "throughput": 19.276805902580932,
      "update": 94,
      "cumulative_wall_time": 427.27272727272754
    },
    {
      "timestep": 9494,
      "throughput": 26.69267342424379,
      "update": 95,
      "cumulative_wall_time": 431.8181818181821
    },
    {
      "timestep": 9595,
      "throughput": 17.705406841050497,
      "update": 96,
      "cumulative_wall_time": 436.36363636363666
    },
    {
      "timestep": 9696,
      "throughput": 21.666072790921717,
      "update": 97,
      "cumulative_wall_time": 440.9090909090912
    },
    {
      "timestep": 9797,
      "throughput": 23.29429785426607,
      "update": 98,
      "cumulative_wall_time": 445.4545454545458
    },
    {
      "timestep": 9898,
      "throughput": 22.61818210901707,
      "update": 99,
      "cumulative_wall_time": 450.00000000000034
    },
    {
      "timestep": 10000,
      "throughput": 20.63006105639469,
      "update": 100,
      "cumulative_wall_time": 454.5454545454549
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.7608375549928545,
        "recent_gradient": 0.009013998130682335
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.5732127048611159,
        "recent_gradient": 0.02169920419404205
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.412140309719301,
        "recent_gradient": 0.028614180809478692
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.2699919975086651,
        "recent_gradient": 0.02061459904175322
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.1512572423767792,
        "recent_gradient": 0.011259257683847225
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.5855024945389635
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.719909479901515
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.373646802561631
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.3051851327167325
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "uniform",
    "use_csc": true
  }
}