{
  "experiment_name": "async_seed123",
  "total_timesteps": 10000,
  "total_time": 400.0,
  "avg_throughput": 25,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.013740378041847924,
      "avg_reward": -0.06432243326242626,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.004589611122245438,
      "avg_reward": 0.0862435157526539,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.0,
      "avg_reward": -0.021445631442808866,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.05764195749734301,
      "avg_reward": 0.0027765458846193206,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.12221031280485325,
      "avg_reward": 0.09303280179703806,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.16743362248574867,
      "avg_reward": 0.10200179815436639,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.13055547726142347,
      "avg_reward": 0.08272681802821291,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.18539422951526321,
      "avg_reward": 0.2576546880608999,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.16320816678971306,
      "avg_reward": 0.14987585339051326,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.15973658775574215,
      "avg_reward": 0.20232587161213367,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.12814504193010134,
      "avg_reward": 0.16130748578318627,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.1236666863719069,
      "avg_reward": 0.06704577397485502,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.16877875580056836,
      "avg_reward": 0.06358896962915624,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.1497370885389715,
      "avg_reward": 0.07670192603819292,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.1493370256484754,
      "avg_reward": -0.02045983475425589,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.12093851347281007,
      "avg_reward": 0.06175694904835219,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.17684666578700844,
      "avg_reward": 0.13279554849009598,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.16029071641518872,
      "avg_reward": 0.16264370868726521,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.14458724560157254,
      "avg_reward": 0.12985116267162258,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.1480222579636393,
      "avg_reward": 0.03203433166488108,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.15827029214429045,
      "avg_reward": 0.15530652683568527,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.17482548939561054,
      "avg_reward": 0.13926886679254744,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.21787278629487392,
      "avg_reward": 0.19494383705133808,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.19157795253665472,
      "avg_reward": 0.2651695289542214,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.14810487811998385,
      "avg_reward": 0.06654449198573942,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.21084939942046865,
      "avg_reward": 0.12877638277432182,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.1785622213240379,
      "avg_reward": 0.19631557553044776,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.1977805272471501,
      "avg_reward": 0.24596873089677557,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.21188117164870726,
      "avg_reward": 0.22297457080425265,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.16851965352062043,
      "avg_reward": 0.17455885620615724,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.19226805568949443,
      "avg_reward": 0.08750117155457274,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.21634023087850732,
      "avg_reward": 0.21343401143173418,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.19091812662104596,
      "avg_reward": 0.1410798982476161,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.16805841085655027,
      "avg_reward": 0.14442293236317183,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.20341094968375525,
      "avg_reward": 0.12117101053484025,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.21930519641991092,
      "avg_reward": 0.12058400481177704,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.15561885998574818,
      "avg_reward": 0.17648144253323356,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.1920336893303795,
      "avg_reward": 0.14732547219865286,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.1853707981309512,
      "avg_reward": 0.06799850046889082,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.2292455698150509,
      "avg_reward": 0.14895300665969466,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.23937871725670223,
      "avg_reward": 0.23186838311589825,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.20188209406338384,
      "avg_reward": 0.10721055519436376,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.19554394101212366,
      "avg_reward": 0.09580899625494047,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.2539492972018572,
      "avg_reward": 0.21138149927297703,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.2372225085956151,
      "avg_reward": 0.12641040442598073,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.2198475815122781,
      "avg_reward": 0.2347711621502514,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.21153185560619917,
      "avg_reward": 0.22078120743104646,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.1985422152436705,
      "avg_reward": 0.09066019496400719,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.2298190020173903,
      "avg_reward": 0.16489637988528463,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.2370650197286681,
      "avg_reward": 0.09075761920691205
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.24045728450598108,
      "avg_reward": 0.32228102396825065
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.22770228140484067,
      "avg_reward": 0.18386893156936462
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.2337629612235678,
      "avg_reward": 0.0939115834392649
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.24066605842364677,
      "avg_reward": 0.1122623595381192
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.2255542984516332,
      "avg_reward": 0.24258691624149342
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.22136155885722866,
      "avg_reward": 0.20215169656415294
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.25827156677378554,
      "avg_reward": 0.22055429622382844
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.2125412270548757,
      "avg_reward": 0.15340921787632988
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.2810840057807684,
      "avg_reward": 0.12361491647474118
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.2383074675194332,
      "avg_reward": 0.1630405704411412
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.24815703121463648,
      "avg_reward": 0.23593640583107073
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.27982595411267475,
      "avg_reward": 0.2103491436896819
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.26579984079849833,
      "avg_reward": 0.23762687988205733
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.26093134910117743,
      "avg_reward": 0.18054888270461833
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.23337956009382047,
      "avg_reward": 0.13170149244402152
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.24006872407641108,
      "avg_reward": 0.20813930805444023
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.27227752984916764,
      "avg_reward": 0.2339954662721789
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.24792981869106834,
      "avg_reward": 0.28864236044947844
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.2911256342638031,
      "avg_reward": 0.21520050177353384
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.24610784282992845,
      "avg_reward": 0.20339702197184126
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.28973907433793616,
      "avg_reward": 0.2484295083330548
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.2773289287174847,
      "avg_reward": 0.2112591368602065
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.2771161978844765,
      "avg_reward": 0.29892018088038813
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.26497795957714476,
      "avg_reward": 0.21914775428710945
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.2766157157933448,
      "avg_reward": 0.23547884042322773
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.24505692993214295,
      "avg_reward": 0.10220211115201966
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.2546439800632503,
      "avg_reward": 0.21211229882068364
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.28784342280588193,
      "avg_reward": 0.20374101025602437
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.30602731073226175,
      "avg_reward": 0.23766304986950004
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.28059079431421846,
      "avg_reward": 0.21477444192374165
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.2845535917682961,
      "avg_reward": 0.26286657711681705
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.29686079963317846,
      "avg_reward": 0.19256749267606327
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.31568160836898507,
      "avg_reward": 0.19779396382384218
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.2884392441728605,
      "avg_reward": 0.21703156666217077
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.26750686101988086,
      "avg_reward": 0.21024945941721312
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.2752878883518995,
      "avg_reward": 0.22387567284532223
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.29976869819436697,
      "avg_reward": 0.31341142700415714
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.2994427000386189,
      "avg_reward": 0.20899289301565388
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.2870357615922566,
      "avg_reward": 0.23662751457953346
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.29829551407006893,
      "avg_reward": 0.3116158746674762
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.32587639348478165,
      "avg_reward": 0.24275431847571224
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.2885243356985696,
      "avg_reward": 0.1029667383554628
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.2900313354990127,
      "avg_reward": 0.183122183094996
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.2954104662441561,
      "avg_reward": 0.25590758511283046
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.30753259151173357,
      "avg_reward": 0.24452767285700974
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.3094466939233628,
      "avg_reward": 0.24125146647714069
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.31084620126185075,
      "avg_reward": 0.087124210613515
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.302955142136475,
      "avg_reward": 0.23682157765652967
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3029353468815797,
      "avg_reward": 0.2314509644001167
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3029353468815797,
      "avg_reward": 0.2314509644001167
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 12.5,
      "update": 1,
      "cumulative_wall_time": 4.0
    },
    {
      "timestep": 101,
      "throughput": 13.750000000000002,
      "update": 2,
      "cumulative_wall_time": 8.0
    },
    {
      "timestep": 202,
      "throughput": 15.0,
      "update": 3,
      "cumulative_wall_time": 12.0
    },
    {
      "timestep": 303,
      "throughput": 16.25,
      "update": 4,
      "cumulative_wall_time": 16.0
    },
    {
      "timestep": 404,
      "throughput": 17.5,
      "update": 5,
      "cumulative_wall_time": 20.0
    },
    {
      "timestep": 505,
      "throughput": 18.75,
      "update": 6,
      "cumulative_wall_time": 24.0
    },
    {
      "timestep": 606,
      "throughput": 20.0,
      "update": 7,
      "cumulative_wall_time": 28.0
    },
    {
      "timestep": 707,
      "throughput": 21.25,
      "update": 8,
      "cumulative_wall_time": 32.0
    },
    {
      "timestep": 808,
      "throughput": 22.5,
      "update": 9,
      "cumulative_wall_time": 36.0
    },
    {
      "timestep": 909,
      "throughput": 23.75,
      "update": 10,
      "cumulative_wall_time": 40.0
    },
    {
      "timestep": 1010,
      "throughput": 26.758275294516825,
      "update": 11,
      "cumulative_wall_time": 44.0
    },
    {
      "timestep": 1111,
      "throughput": 23.504736671647937,
      "update": 12,
      "cumulative_wall_time": 48.0
    },
    {
      "timestep": 1212,
      "throughput": 30.501755248042823,
      "update": 13,
      "cumulative_wall_time": 52.0
    },
    {
      "timestep": 1313,
      "throughput": 26.720742325555218,
      "update": 14,
      "cumulative_wall_time": 56.0
    },
    {
      "timestep": 1414,
      "throughput": 24.98423187271532,
      "update": 15,
      "cumulative_wall_time": 60.0
    },
    {
      "timestep": 1515,
      "throughput": 24.483344242006083,
      "update": 16,
      "cumulative_wall_time": 64.0
    },
    {
      "timestep": 1616,
      "throughput": 24.783694284044664,
      "update": 17,
      "cumulative_wall_time": 68.0
    },
    {
      "timestep": 1717,
      "throughput": 22.71173232514005,
      "update": 18,
      "cumulative_wall_time": 72.0
    },
    {
      "timestep": 1818,
      "throughput": 24.761993651854976,
      "update": 19,
      "cumulative_wall_time": 76.0
    },
    {
      "timestep": 1919,
      "throughput": 25.696708791817635,
      "update": 20,
      "cumulative_wall_time": 80.0
    },
    {
      "timestep": 2020,
      "throughput": 26.448854038933074,
      "update": 21,
      "cumulative_wall_time": 84.0
    },
    {
      "timestep": 2121,
      "throughput": 26.449224447860836,
      "update": 22,
      "cumulative_wall_time": 88.0
    },
    {
      "timestep": 2222,
      "throughput": 24.312806133585163,
      "update": 23,
      "cumulative_wall_time": 92.0
    },
    {
      "timestep": 2323,
      "throughput": 21.459794368695174,
      "update": 24,
      "cumulative_wall_time": 96.0
    },
    {
      "timestep": 2424,
      "throughput": 23.327243434416385,
      "update": 25,
      "cumulative_wall_time": 100.0
    },
    {
      "timestep": 2525,
      "throughput": 29.030482607030972,
      "update": 26,
      "cumulative_wall_time": 104.0
    },
    {
      "timestep": 2626,
      "throughput": 27.240145783524873,
      "update": 27,
      "cumulative_wall_time": 108.0
    },
    {
      "timestep": 2727,
      "throughput": 25.924048965760438,
      "update": 28,
      "cumulative_wall_time": 112.0
    },
    {
      "timestep": 2828,
      "throughput": 23.09676438809969,
      "update": 29,
      "cumulative_wall_time": 116.0
    },
    {
      "timestep": 2929,
      "throughput": 25.009112887434444,
      "update": 30,
      "cumulative_wall_time": 120.0
    },
    {
      "timestep": 3030,
      "throughput": 21.860828285843795,
      "update": 31,
      "cumulative_wall_time": 124.0
    },
    {
      "timestep": 3131,
      "throughput": 23.620157810759814,
      "update": 32,
      "cumulative_wall_time": 128.0
    },
    {
      "timestep": 3232,
      "throughput": 24.386991645787013,
      "update": 33,
      "cumulative_wall_time": 132.0
    },
    {
      "timestep": 3333,
      "throughput": 24.095900170336968,
      "update": 34,
      "cumulative_wall_time": 136.0
    },
    {
      "timestep": 3434,
      "throughput": 27.391504827640027,
      "update": 35,
      "cumulative_wall_time": 140.0
    },
    {
      "timestep": 3535,
      "throughput": 21.453185214911368,
      "update": 36,
      "cumulative_wall_time": 144.0
    },
    {
      "timestep": 3636,
      "throughput": 22.836419321212116,
      "update": 37,
      "cumulative_wall_time": 148.0
    },
    {
      "timestep": 3737,
      "throughput": 21.563280072444453,
      "update": 38,
      "cumulative_wall_time": 152.0
    },
    {
      "timestep": 3838,
      "throughput": 21.906616968280364,
      "update": 39,
      "cumulative_wall_time": 156.0
    },
    {
      "timestep": 3939,
      "throughput": 25.310139741116622,
      "update": 40,
      "cumulative_wall_time": 160.0
    },
    {
      "timestep": 4040,
      "throughput": 20.99889866735932,
      "update": 41,
      "cumulative_wall_time": 164.0
    },
    {
      "timestep": 4141,
      "throughput": 26.88467194709409,
      "update": 42,
      "cumulative_wall_time": 168.0
    },
    {
      "timestep": 4242,
      "throughput": 24.382960557647312,
      "update": 43,
      "cumulative_wall_time": 172.0
    },
    {
      "timestep": 4343,
      "throughput": 25.171970831314944,
      "update": 44,
      "cumulative_wall_time": 176.0
    },
    {
      "timestep": 4444,
      "throughput": 25.80644184499301,
      "update": 45,
      "cumulative_wall_time": 180.0
    },
    {
      "timestep": 4545,
      "throughput": 23.914583699371022,
      "update": 46,
      "cumulative_wall_time": 184.0
    },
    {
      "timestep": 4646,
      "throughput": 27.581199289383445,
      "update": 47,
      "cumulative_wall_time": 188.0
    },
    {
      "timestep": 4747,
      "throughput": 24.514143183180913,
      "update": 48,
      "cumulative_wall_time": 192.0
    },
    {
      "timestep": 4848,
      "throughput": 26.485175638097676,
      "update": 49,
      "cumulative_wall_time": 196.0
    },
    {
      "timestep": 4949,
      "throughput": 24.50221904310687,
      "update": 50,
      "cumulative_wall_time": 200.0
    },
    {
      "timestep": 5050,
      "throughput": 25.72718596856231,
      "update": 51,
      "cumulative_wall_time": 204.0
    },
    {
      "timestep": 5151,
      "throughput": 25.699156675394903,
      "update": 52,
      "cumulative_wall_time": 208.0
    },
    {
      "timestep": 5252,
      "throughput": 25.62492484863883,
      "update": 53,
      "cumulative_wall_time": 212.0
    },
    {
      "timestep": 5353,
      "throughput": 22.5642303759477,
      "update": 54,
      "cumulative_wall_time": 216.0
    },
    {
      "timestep": 5454,
      "throughput": 26.0896894263686,
      "update": 55,
      "cumulative_wall_time": 220.0
    },
    {
      "timestep": 5555,
      "throughput": 24.20260752725101,
      "update": 56,
      "cumulative_wall_time": 224.0
    },
    {
      "timestep": 5656,
      "throughput": 26.576220076224793,
      "update": 57,
      "cumulative_wall_time": 228.0
    },
    {
      "timestep": 5757,
      "throughput": 19.618766388969238,
      "update": 58,
      "cumulative_wall_time": 232.0
    },
    {
      "timestep": 5858,
      "throughput": 21.337209444862623,
      "update": 59,
      "cumulative_wall_time": 236.0
    },
    {
      "timestep": 5959,
      "throughput": 25.908613905337575,
      "update": 60,
      "cumulative_wall_time": 240.0
    },
    {
      "timestep": 6060,
      "throughput": 29.657318962763075,
      "update": 61,
      "cumulative_wall_time": 244.0
    },
    {
      "timestep": 6161,
      "throughput": 27.08764686702809,
      "update": 62,
      "cumulative_wall_time": 248.0
    },
    {
      "timestep": 6262,
      "throughput": 23.29387266450005,
      "update": 63,
      "cumulative_wall_time": 252.0
    },
    {
      "timestep": 6363,
      "throughput": 20.76986896155511,
      "update": 64,
      "cumulative_wall_time": 256.0
    },
    {
      "timestep": 6464,
      "throughput": 26.85671555290405,
      "update": 65,
      "cumulative_wall_time": 260.0
    },
    {
      "timestep": 6565,
      "throughput": 24.798541944892623,
      "update": 66,
      "cumulative_wall_time": 264.0
    },
    {
      "timestep": 6666,
      "throughput": 26.47676054473596,
      "update": 67,
      "cumulative_wall_time": 268.0
    },
    {
      "timestep": 6767,
      "throughput": 25.288246805526978,
      "update": 68,
      "cumulative_wall_time": 272.0
    },
    {
      "timestep": 6868,
      "throughput": 25.074107312801235,
      "update": 69,
      "cumulative_wall_time": 276.0
    },
    {
      "timestep": 6969,
      "throughput": 32.39656361473294,
      "update": 70,
      "cumulative_wall_time": 280.0
    },
    {
      "timestep": 7070,
      "throughput": 24.984675097386052,
      "update": 71,
      "cumulative_wall_time": 284.0
    },
    {
      "timestep": 7171,
      "throughput": 24.601886976866837,
      "update": 72,
      "cumulative_wall_time": 288.0
    },
    {
      "timestep": 7272,
      "throughput": 24.696378311489944,
      "update": 73,
      "cumulative_wall_time": 292.0
    },
    {
      "timestep": 7373,
      "throughput": 23.541158208230858,
      "update": 74,
      "cumulative_wall_time": 296.0
    },
    {
      "timestep": 7474,
      "throughput": 27.47533223678828,
      "update": 75,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 7575,
      "throughput": 24.115614165546628,
      "update": 76,
      "cumulative_wall_time": 304.0
    },
    {
      "timestep": 7676,
      "throughput": 26.589856764111474,
      "update": 77,
      "cumulative_wall_time": 308.0
    },
    {
      "timestep": 7777,
      "throughput": 25.711507574533893,
      "update": 78,
      "cumulative_wall_time": 312.0
    },
    {
      "timestep": 7878,
      "throughput": 28.047464655331066,
      "update": 79,
      "cumulative_wall_time": 316.0
    },
    {
      "timestep": 7979,
      "throughput": 26.050448992470905,
      "update": 80,
      "cumulative_wall_time": 320.0
    },
    {
      "timestep": 8080,
      "throughput": 21.96653804763088,
      "update": 81,
      "cumulative_wall_time": 324.0
    },
    {
      "timestep": 8181,
      "throughput": 21.68378053736515,
      "update": 82,
      "cumulative_wall_time": 328.0
    },
    {
      "timestep": 8282,
      "throughput": 28.520922865192254,
      "update": 83,
      "cumulative_wall_time": 332.0
    },
    {
      "timestep": 8383,
      "throughput": 23.478222991838894,
      "update": 84,
      "cumulative_wall_time": 336.0
    },
    {
      "timestep": 8484,
      "throughput": 21.698493550525868,
      "update": 85,
      "cumulative_wall_time": 340.0
    },
    {
      "timestep": 8585,
      "throughput": 23.325953500325607,
      "update": 86,
      "cumulative_wall_time": 344.0
    },
    {
      "timestep": 8686,
      "throughput": 28.161563217420017,
      "update": 87,
      "cumulative_wall_time": 348.0
    },
    {
      "timestep": 8787,
      "throughput": 21.449467502628718,
      "update": 88,
      "cumulative_wall_time": 352.0
    },
    {
      "timestep": 8888,
      "throughput": 22.833761990600976,
      "update": 89,
      "cumulative_wall_time": 356.0
    },
    {
      "timestep": 8989,
      "throughput": 23.332981228008702,
      "update": 90,
      "cumulative_wall_time": 360.0
    },
    {
      "timestep": 9090,
      "throughput": 21.87202531631701,
      "update": 91,
      "cumulative_wall_time": 364.0
    },
    {
      "timestep": 9191,
      "throughput": 22.039181653720842,
      "update": 92,
      "cumulative_wall_time": 368.0
    },
    {
      "timestep": 9292,
      "throughput": 21.204730061840856,
      "update": 93,
      "cumulative_wall_time": 372.0
    },
    {
      "timestep": 9393,
      "throughput": 23.847031467158196,
      "update": 94,
      "cumulative_wall_time": 376.0
    },
    {
      "timestep": 9494,
      "throughput": 24.11272792064979,
      "update": 95,
      "cumulative_wall_time": 380.0
    },
    {
      "timestep": 9595,
      "throughput": 23.293654614491736,
      "update": 96,
      "cumulative_wall_time": 384.0
    },
    {
      "timestep": 9696,
      "throughput": 20.865755402580895,
      "update": 97,
      "cumulative_wall_time": 388.0
    },
    {
      "timestep": 9797,
      "throughput": 28.133339867139988,
      "update": 98,
      "cumulative_wall_time": 392.0
    },
    {
      "timestep": 9898,
      "throughput": 21.677302927069597,
      "update": 99,
      "cumulative_wall_time": 396.0
    },
    {
      "timestep": 10000,
      "throughput": 25.69508428005718,
      "update": 100,
      "cumulative_wall_time": 400.0
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.7435046681376225,
        "recent_gradient": 0.011336633733483056
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6041166471033433,
        "recent_gradient": 0.01824477282674469
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.3665256854060575,
        "recent_gradient": 0.03139157463827921
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.28951601093427276,
        "recent_gradient": 0.02083138907978487
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.13821088842959436,
        "recent_gradient": 0.011639521219220378
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 5.382527422998509
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.585505583119495
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 4.670424344651676
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.305561775027956
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "uniform"
  }
}