{
  "experiment_name": "async_seed42",
  "total_timesteps": 10000,
  "total_time": 400.0,
  "avg_throughput": 25,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.021034578842821932,
      "avg_reward": 0.09297915589465883,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.011478548667149445,
      "avg_reward": -0.0025240089137394707,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.055826680552572075,
      "avg_reward": 0.0830330808997031,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.022933744604533287,
      "avg_reward": 0.04547499786292486,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.1265196819810451,
      "avg_reward": 0.07792925790632324,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.1424450753945836,
      "avg_reward": 0.018292048082776985,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.10493675980408412,
      "avg_reward": 0.055835031381218675,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.12101900545406562,
      "avg_reward": 0.11252757099301619,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.12496660732171129,
      "avg_reward": 0.029358100790604455,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.17430219161624838,
      "avg_reward": 0.1281529382686719,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.14821228339190765,
      "avg_reward": 0.04733241740285328,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.1378566452363835,
      "avg_reward": 0.11583144567460012,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.1276167803361163,
      "avg_reward": 0.12087832518617664,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.14052568914436872,
      "avg_reward": 0.09783586382583115,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.1424152808144994,
      "avg_reward": 0.2065461338770464,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.15609923106824833,
      "avg_reward": 0.07199383840680365,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.17474831539390057,
      "avg_reward": 0.07875646981656934,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.16441106999734761,
      "avg_reward": 0.033545349803889304,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.13561425148378498,
      "avg_reward": 0.11833446298048417,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.17889891992485982,
      "avg_reward": 0.15168754999938638,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.16377532237162765,
      "avg_reward": 0.11596507311783769,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.13848326856826595,
      "avg_reward": 0.07479440443487734,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.16081270555692365,
      "avg_reward": 0.1815062757564847,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.17887559820927704,
      "avg_reward": 0.05494847079928494,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.18046826397110474,
      "avg_reward": 0.12512049715606796,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.16243671491189088,
      "avg_reward": 0.16053318637155609,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.19858854716789032,
      "avg_reward": 0.2054348436901222,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.1631820489568339,
      "avg_reward": 0.1150850203729064,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.18859355753610915,
      "avg_reward": 0.1996521023850053,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.17439034304865847,
      "avg_reward": 0.1302293256057359,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.16385591631923654,
      "avg_reward": 0.0712744018513557,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.20424476639685424,
      "avg_reward": 0.23120781454602457,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.18856812257681735,
      "avg_reward": 0.20103114295605512,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.1992571542515187,
      "avg_reward": 0.12714973567095872,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.20127007940501063,
      "avg_reward": 0.237917891847307,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.1953445946557213,
      "avg_reward": 0.23450785851527736,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.14568596490480212,
      "avg_reward": 0.1576438971426029,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.2018419514571851,
      "avg_reward": 0.1465231936424547,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.2039563481181623,
      "avg_reward": 0.06378663276448521,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.19974738456381627,
      "avg_reward": 0.17765353622664035,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.23571754838857376,
      "avg_reward": 0.16266052779717663,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.1920073849398693,
      "avg_reward": 0.12851805577266862,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.2285012231005743,
      "avg_reward": 0.19923853396344368,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.20161182593475274,
      "avg_reward": 0.18695283240347002,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.21615994873164326,
      "avg_reward": 0.2213602085119591,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.20218581704279096,
      "avg_reward": 0.14536554630434437,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.21038990778221633,
      "avg_reward": 0.09513617881916714,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.22615597902507736,
      "avg_reward": 0.19397754682905635,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.2223332589086768,
      "avg_reward": 0.16613725045818412,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.1959165111022232,
      "avg_reward": 0.1357009427435106
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.21935770146603534,
      "avg_reward": 0.13537229771174733
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.2249690868001501,
      "avg_reward": 0.20017781228084702
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.2678956895550048,
      "avg_reward": 0.2230454422855958
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.23729413344429587,
      "avg_reward": 0.18611301096712835
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.19573246610812844,
      "avg_reward": 0.15526027911404194
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.23727050217805074,
      "avg_reward": 0.3129785073667049
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.23416956639903566,
      "avg_reward": 0.20241302023590915
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.23926596106266296,
      "avg_reward": 0.13297886696915376
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.2647522352233031,
      "avg_reward": 0.24939843981298118
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.25964382673761766,
      "avg_reward": 0.16224568865035718
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.27379797017141566,
      "avg_reward": 0.1489458229975185
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.2593892766282391,
      "avg_reward": 0.3170342025930902
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.22974228769634816,
      "avg_reward": 0.15547894367693993
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.25343743044549427,
      "avg_reward": 0.17757616165058546
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.22231272084801584,
      "avg_reward": 0.18127832541871405
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.23395139398987144,
      "avg_reward": 0.21084073672365622
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.23867005730192498,
      "avg_reward": 0.26843276609241695
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.2432438547682584,
      "avg_reward": 0.17849200800432297
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.2770186661385657,
      "avg_reward": 0.1600717170891548
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.26712566964172435,
      "avg_reward": 0.2790576734275009
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.2322434367456246,
      "avg_reward": 0.1950264423231149
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.27139561050425226,
      "avg_reward": 0.2562076319922673
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.24325176576287028,
      "avg_reward": 0.1285785819560824
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.28021016651903696,
      "avg_reward": 0.23901736687688888
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.2765492432692698,
      "avg_reward": 0.23856180509026462
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.2596942130219977,
      "avg_reward": 0.21936805527564834
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.2808985309476607,
      "avg_reward": 0.1890012538568102
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.31408178970871287,
      "avg_reward": 0.2749570778125597
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.2546560911308627,
      "avg_reward": 0.23655255333638164
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.2606908409449796,
      "avg_reward": 0.24790690294310627
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.3050449674935109,
      "avg_reward": 0.2030018580772232
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.3028152534598183,
      "avg_reward": 0.26289124911467954
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.3016495360393043,
      "avg_reward": 0.3361592779641408
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.2819469415709908,
      "avg_reward": 0.18787074503891818
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.2706964059737401,
      "avg_reward": 0.17576661053072018
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.28856212962946537,
      "avg_reward": 0.2479073024444045
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.29724079495657996,
      "avg_reward": 0.27915179841706517
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.2935550535036287,
      "avg_reward": 0.3075207466607688
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.2895750211418895,
      "avg_reward": 0.3676684752429925
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.308939644436126,
      "avg_reward": 0.20429383772808668
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.2765514849284203,
      "avg_reward": 0.24536480870489552
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.29502792255577653,
      "avg_reward": 0.27172236274922584
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.310474496256928,
      "avg_reward": 0.2447381513726988
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.28557108104468437,
      "avg_reward": 0.15271450360145428
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.2950584458864134,
      "avg_reward": 0.2788666964253044
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.3097369265841966,
      "avg_reward": 0.18550260233175792
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.31036944112800485,
      "avg_reward": 0.26756142188884574
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.29066386320746745,
      "avg_reward": 0.2402173458632504
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.31092475557463145,
      "avg_reward": 0.191591289568174
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.31092475557463145,
      "avg_reward": 0.191591289568174
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 12.5,
      "update": 1,
      "cumulative_wall_time": 4.0
    },
    {
      "timestep": 101,
      "throughput": 13.750000000000002,
      "update": 2,
      "cumulative_wall_time": 8.0
    },
    {
      "timestep": 202,
      "throughput": 15.0,
      "update": 3,
      "cumulative_wall_time": 12.0
    },
    {
      "timestep": 303,
      "throughput": 16.25,
      "update": 4,
      "cumulative_wall_time": 16.0
    },
    {
      "timestep": 404,
      "throughput": 17.5,
      "update": 5,
      "cumulative_wall_time": 20.0
    },
    {
      "timestep": 505,
      "throughput": 18.75,
      "update": 6,
      "cumulative_wall_time": 24.0
    },
    {
      "timestep": 606,
      "throughput": 20.0,
      "update": 7,
      "cumulative_wall_time": 28.0
    },
    {
      "timestep": 707,
      "throughput": 21.25,
      "update": 8,
      "cumulative_wall_time": 32.0
    },
    {
      "timestep": 808,
      "throughput": 22.5,
      "update": 9,
      "cumulative_wall_time": 36.0
    },
    {
      "timestep": 909,
      "throughput": 23.75,
      "update": 10,
      "cumulative_wall_time": 40.0
    },
    {
      "timestep": 1010,
      "throughput": 25.894468400870707,
      "update": 11,
      "cumulative_wall_time": 44.0
    },
    {
      "timestep": 1111,
      "throughput": 26.401961315920587,
      "update": 12,
      "cumulative_wall_time": 48.0
    },
    {
      "timestep": 1212,
      "throughput": 27.70762810793819,
      "update": 13,
      "cumulative_wall_time": 52.0
    },
    {
      "timestep": 1313,
      "throughput": 27.634505130087256,
      "update": 14,
      "cumulative_wall_time": 56.0
    },
    {
      "timestep": 1414,
      "throughput": 21.555826580107272,
      "update": 15,
      "cumulative_wall_time": 60.0
    },
    {
      "timestep": 1515,
      "throughput": 22.655437400212193,
      "update": 16,
      "cumulative_wall_time": 64.0
    },
    {
      "timestep": 1616,
      "throughput": 26.287588168021646,
      "update": 17,
      "cumulative_wall_time": 68.0
    },
    {
      "timestep": 1717,
      "throughput": 26.284464877280524,
      "update": 18,
      "cumulative_wall_time": 72.0
    },
    {
      "timestep": 1818,
      "throughput": 26.28761921576512,
      "update": 19,
      "cumulative_wall_time": 76.0
    },
    {
      "timestep": 1919,
      "throughput": 34.631828726636805,
      "update": 20,
      "cumulative_wall_time": 80.0
    },
    {
      "timestep": 2020,
      "throughput": 26.427226276732917,
      "update": 21,
      "cumulative_wall_time": 84.0
    },
    {
      "timestep": 2121,
      "throughput": 27.838914100451497,
      "update": 22,
      "cumulative_wall_time": 88.0
    },
    {
      "timestep": 2222,
      "throughput": 27.385004408733003,
      "update": 23,
      "cumulative_wall_time": 92.0
    },
    {
      "timestep": 2323,
      "throughput": 26.628478128264494,
      "update": 24,
      "cumulative_wall_time": 96.0
    },
    {
      "timestep": 2424,
      "throughput": 24.211826888399134,
      "update": 25,
      "cumulative_wall_time": 100.0
    },
    {
      "timestep": 2525,
      "throughput": 26.897423051233172,
      "update": 26,
      "cumulative_wall_time": 104.0
    },
    {
      "timestep": 2626,
      "throughput": 23.06793696365607,
      "update": 27,
      "cumulative_wall_time": 108.0
    },
    {
      "timestep": 2727,
      "throughput": 24.407953483149978,
      "update": 28,
      "cumulative_wall_time": 112.0
    },
    {
      "timestep": 2828,
      "throughput": 23.786591130427244,
      "update": 29,
      "cumulative_wall_time": 116.0
    },
    {
      "timestep": 2929,
      "throughput": 25.204685348465805,
      "update": 30,
      "cumulative_wall_time": 120.0
    },
    {
      "timestep": 3030,
      "throughput": 30.786646416683773,
      "update": 31,
      "cumulative_wall_time": 124.0
    },
    {
      "timestep": 3131,
      "throughput": 20.33183701852063,
      "update": 32,
      "cumulative_wall_time": 128.0
    },
    {
      "timestep": 3232,
      "throughput": 26.715650475936283,
      "update": 33,
      "cumulative_wall_time": 132.0
    },
    {
      "timestep": 3333,
      "throughput": 20.96821032202587,
      "update": 34,
      "cumulative_wall_time": 136.0
    },
    {
      "timestep": 3434,
      "throughput": 23.820170335526416,
      "update": 35,
      "cumulative_wall_time": 140.0
    },
    {
      "timestep": 3535,
      "throughput": 27.722376492418416,
      "update": 36,
      "cumulative_wall_time": 144.0
    },
    {
      "timestep": 3636,
      "throughput": 25.160700047738654,
      "update": 37,
      "cumulative_wall_time": 148.0
    },
    {
      "timestep": 3737,
      "throughput": 22.305638055176736,
      "update": 38,
      "cumulative_wall_time": 152.0
    },
    {
      "timestep": 3838,
      "throughput": 23.21174072685008,
      "update": 39,
      "cumulative_wall_time": 156.0
    },
    {
      "timestep": 3939,
      "throughput": 26.69899437233669,
      "update": 40,
      "cumulative_wall_time": 160.0
    },
    {
      "timestep": 4040,
      "throughput": 23.17408342070716,
      "update": 41,
      "cumulative_wall_time": 164.0
    },
    {
      "timestep": 4141,
      "throughput": 25.54114647395494,
      "update": 42,
      "cumulative_wall_time": 168.0
    },
    {
      "timestep": 4242,
      "throughput": 25.113929599759533,
      "update": 43,
      "cumulative_wall_time": 172.0
    },
    {
      "timestep": 4343,
      "throughput": 23.370999130985457,
      "update": 44,
      "cumulative_wall_time": 176.0
    },
    {
      "timestep": 4444,
      "throughput": 30.35986022331332,
      "update": 45,
      "cumulative_wall_time": 180.0
    },
    {
      "timestep": 4545,
      "throughput": 26.584797555795024,
      "update": 46,
      "cumulative_wall_time": 184.0
    },
    {
      "timestep": 4646,
      "throughput": 19.937143533355982,
      "update": 47,
      "cumulative_wall_time": 188.0
    },
    {
      "timestep": 4747,
      "throughput": 25.466135786923573,
      "update": 48,
      "cumulative_wall_time": 192.0
    },
    {
      "timestep": 4848,
      "throughput": 23.34553383807903,
      "update": 49,
      "cumulative_wall_time": 196.0
    },
    {
      "timestep": 4949,
      "throughput": 27.131083336990557,
      "update": 50,
      "cumulative_wall_time": 200.0
    },
    {
      "timestep": 5050,
      "throughput": 23.018698153918248,
      "update": 51,
      "cumulative_wall_time": 204.0
    },
    {
      "timestep": 5151,
      "throughput": 24.71315889633275,
      "update": 52,
      "cumulative_wall_time": 208.0
    },
    {
      "timestep": 5252,
      "throughput": 26.262468197451145,
      "update": 53,
      "cumulative_wall_time": 212.0
    },
    {
      "timestep": 5353,
      "throughput": 27.164387985425304,
      "update": 54,
      "cumulative_wall_time": 216.0
    },
    {
      "timestep": 5454,
      "throughput": 21.99925898236056,
      "update": 55,
      "cumulative_wall_time": 220.0
    },
    {
      "timestep": 5555,
      "throughput": 24.16374691039763,
      "update": 56,
      "cumulative_wall_time": 224.0
    },
    {
      "timestep": 5656,
      "throughput": 23.81263672209761,
      "update": 57,
      "cumulative_wall_time": 228.0
    },
    {
      "timestep": 5757,
      "throughput": 23.36667691856572,
      "update": 58,
      "cumulative_wall_time": 232.0
    },
    {
      "timestep": 5858,
      "throughput": 29.413635600702744,
      "update": 59,
      "cumulative_wall_time": 236.0
    },
    {
      "timestep": 5959,
      "throughput": 26.01245427740239,
      "update": 60,
      "cumulative_wall_time": 240.0
    },
    {
      "timestep": 6060,
      "throughput": 21.847790114162386,
      "update": 61,
      "cumulative_wall_time": 244.0
    },
    {
      "timestep": 6161,
      "throughput": 27.294654867636943,
      "update": 62,
      "cumulative_wall_time": 248.0
    },
    {
      "timestep": 6262,
      "throughput": 30.30539049253158,
      "update": 63,
      "cumulative_wall_time": 252.0
    },
    {
      "timestep": 6363,
      "throughput": 27.58116315137787,
      "update": 64,
      "cumulative_wall_time": 256.0
    },
    {
      "timestep": 6464,
      "throughput": 21.201575085114964,
      "update": 65,
      "cumulative_wall_time": 260.0
    },
    {
      "timestep": 6565,
      "throughput": 23.78941481783437,
      "update": 66,
      "cumulative_wall_time": 264.0
    },
    {
      "timestep": 6666,
      "throughput": 28.167277872966558,
      "update": 67,
      "cumulative_wall_time": 268.0
    },
    {
      "timestep": 6767,
      "throughput": 23.230826335953047,
      "update": 68,
      "cumulative_wall_time": 272.0
    },
    {
      "timestep": 6868,
      "throughput": 26.109548570365572,
      "update": 69,
      "cumulative_wall_time": 276.0
    },
    {
      "timestep": 6969,
      "throughput": 26.93658513357334,
      "update": 70,
      "cumulative_wall_time": 280.0
    },
    {
      "timestep": 7070,
      "throughput": 22.682673821054795,
      "update": 71,
      "cumulative_wall_time": 284.0
    },
    {
      "timestep": 7171,
      "throughput": 24.8511866098455,
      "update": 72,
      "cumulative_wall_time": 288.0
    },
    {
      "timestep": 7272,
      "throughput": 16.89683164982732,
      "update": 73,
      "cumulative_wall_time": 292.0
    },
    {
      "timestep": 7373,
      "throughput": 22.439030896664274,
      "update": 74,
      "cumulative_wall_time": 296.0
    },
    {
      "timestep": 7474,
      "throughput": 24.3685796215171,
      "update": 75,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 7575,
      "throughput": 21.880542045087875,
      "update": 76,
      "cumulative_wall_time": 304.0
    },
    {
      "timestep": 7676,
      "throughput": 29.08102825982909,
      "update": 77,
      "cumulative_wall_time": 308.0
    },
    {
      "timestep": 7777,
      "throughput": 21.424646555098416,
      "update": 78,
      "cumulative_wall_time": 312.0
    },
    {
      "timestep": 7878,
      "throughput": 23.899888783257538,
      "update": 79,
      "cumulative_wall_time": 316.0
    },
    {
      "timestep": 7979,
      "throughput": 25.326851443215226,
      "update": 80,
      "cumulative_wall_time": 320.0
    },
    {
      "timestep": 8080,
      "throughput": 28.60318322266529,
      "update": 81,
      "cumulative_wall_time": 324.0
    },
    {
      "timestep": 8181,
      "throughput": 21.410344622051404,
      "update": 82,
      "cumulative_wall_time": 328.0
    },
    {
      "timestep": 8282,
      "throughput": 27.907909380387398,
      "update": 83,
      "cumulative_wall_time": 332.0
    },
    {
      "timestep": 8383,
      "throughput": 25.025582652548966,
      "update": 84,
      "cumulative_wall_time": 336.0
    },
    {
      "timestep": 8484,
      "throughput": 22.546228372380124,
      "update": 85,
      "cumulative_wall_time": 340.0
    },
    {
      "timestep": 8585,
      "throughput": 26.15525868565818,
      "update": 86,
      "cumulative_wall_time": 344.0
    },
    {
      "timestep": 8686,
      "throughput": 25.497649238933672,
      "update": 87,
      "cumulative_wall_time": 348.0
    },
    {
      "timestep": 8787,
      "throughput": 23.499457807103013,
      "update": 88,
      "cumulative_wall_time": 352.0
    },
    {
      "timestep": 8888,
      "throughput": 25.174505212475047,
      "update": 89,
      "cumulative_wall_time": 356.0
    },
    {
      "timestep": 8989,
      "throughput": 24.036716007845598,
      "update": 90,
      "cumulative_wall_time": 360.0
    },
    {
      "timestep": 9090,
      "throughput": 25.283793363128122,
      "update": 91,
      "cumulative_wall_time": 364.0
    },
    {
      "timestep": 9191,
      "throughput": 26.655326686302615,
      "update": 92,
      "cumulative_wall_time": 368.0
    },
    {
      "timestep": 9292,
      "throughput": 28.965042040363382,
      "update": 93,
      "cumulative_wall_time": 372.0
    },
    {
      "timestep": 9393,
      "throughput": 21.905461252932877,
      "update": 94,
      "cumulative_wall_time": 376.0
    },
    {
      "timestep": 9494,
      "throughput": 30.332583436640668,
      "update": 95,
      "cumulative_wall_time": 380.0
    },
    {
      "timestep": 9595,
      "throughput": 20.119780501193745,
      "update": 96,
      "cumulative_wall_time": 384.0
    },
    {
      "timestep": 9696,
      "throughput": 24.62053726241104,
      "update": 97,
      "cumulative_wall_time": 388.0
    },
    {
      "timestep": 9797,
      "throughput": 26.47079301621144,
      "update": 98,
      "cumulative_wall_time": 392.0
    },
    {
      "timestep": 9898,
      "throughput": 25.70247966933758,
      "update": 99,
      "cumulative_wall_time": 396.0
    },
    {
      "timestep": 10000,
      "throughput": 23.443251200448515,
      "update": 100,
      "cumulative_wall_time": 400.0
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.7608375549928545,
        "recent_gradient": 0.009013998130682335
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.5732127048611159,
        "recent_gradient": 0.02169920419404205
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.412140309719301,
        "recent_gradient": 0.028614180809478692
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.2699919975086651,
        "recent_gradient": 0.02061459904175322
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.1512572423767792,
        "recent_gradient": 0.011259257683847225
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.5855024945389635
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.719909479901515
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.373646802561631
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.3051851327167325
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "uniform"
  }
}