{
  "experiment_name": "sync_seed456",
  "total_timesteps": 10000,
  "total_time": 1000.0,
  "avg_throughput": 10,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.02146242549641783,
      "avg_reward": 0.0456045527911427,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.045192007807336974,
      "avg_reward": 0.11763303288556984,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.03331205150883638,
      "avg_reward": 0.04912380004008852,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.029447414024284406,
      "avg_reward": 0.007796389733812286,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.08083831321899532,
      "avg_reward": 0.008159088741993142,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.1016224524048974,
      "avg_reward": 0.0931905173839325,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.12009546413932808,
      "avg_reward": 0.19331149097216804,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.16768679635704128,
      "avg_reward": 0.18016685487758988,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.1509124315696906,
      "avg_reward": 0.1786075471542042,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.13290685935105545,
      "avg_reward": 0.10188790574906646,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.11848255758815326,
      "avg_reward": 0.07558302145604993,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.1636249537106741,
      "avg_reward": 0.13771855396988275,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.13643701164154398,
      "avg_reward": 0.09409533495950798,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.1489096679116321,
      "avg_reward": 0.1762094763127365,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.12357876980705361,
      "avg_reward": 0.08514397102518806,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.17010924167348854,
      "avg_reward": 0.06409299014117734,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.18238133215579544,
      "avg_reward": 0.10424981425376753,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.17239287520885632,
      "avg_reward": 0.14223162734104244,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.16921606062174532,
      "avg_reward": 0.07474772041245922,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.1676794339050134,
      "avg_reward": 0.11619953279839804,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.19245238138988913,
      "avg_reward": 0.12690771354155173,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.17142448490155082,
      "avg_reward": 0.12257640355901107,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.18267157838729528,
      "avg_reward": 0.2062188070056849,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.17846303335235636,
      "avg_reward": 0.16504202782913527,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.16078805930810453,
      "avg_reward": 0.13198707547669458,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.16043176187458433,
      "avg_reward": 0.08350457160335556,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.21294420840182285,
      "avg_reward": 0.1663916271596772,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.17859628182907958,
      "avg_reward": 0.14356714883355373,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.16672904763822252,
      "avg_reward": 0.21969000793506915,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.18819050969016843,
      "avg_reward": 0.16326268353559478,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.19603064813627435,
      "avg_reward": 0.15349693320014163,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.1844175753881292,
      "avg_reward": 0.13122738696367073,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.22157796832755086,
      "avg_reward": 0.1455801014828264,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.20883941524084973,
      "avg_reward": 0.2577550929036312,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.21655853855211654,
      "avg_reward": 0.12912469560234022,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.24140762710526656,
      "avg_reward": 0.23582301624583285,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.2392906485103674,
      "avg_reward": 0.20601666753409797,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.23015495368822797,
      "avg_reward": 0.2533943107158635,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.22362745392865505,
      "avg_reward": 0.22942067526494614,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.2381318602028766,
      "avg_reward": 0.23081299237687303,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.2368247028064598,
      "avg_reward": 0.17711092873191825,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.22332231200203295,
      "avg_reward": 0.1355755137932444,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.26485944851735327,
      "avg_reward": 0.17239146662775554,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.2565923277975919,
      "avg_reward": 0.19096896445317701,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.23359897054547651,
      "avg_reward": 0.24160140570829322,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.28438604582557003,
      "avg_reward": 0.1319628138123713,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.25824168037875145,
      "avg_reward": 0.23790332806846035,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.26066197448501494,
      "avg_reward": 0.32466157801691853,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.3080158127026228,
      "avg_reward": 0.2662549045635345,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.2508287397887175,
      "avg_reward": 0.15799414956628086
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.22812734157514797,
      "avg_reward": 0.241216630307444
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.2531682306979827,
      "avg_reward": 0.23706035715929846
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.2907348988492821,
      "avg_reward": 0.20898550476223252
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.26287573235028483,
      "avg_reward": 0.20673781200047017
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.2770942913144255,
      "avg_reward": 0.27555408145946636
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.3279095537331365,
      "avg_reward": 0.27993204889300416
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.30700783140464527,
      "avg_reward": 0.18787409626009174
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.32218226034112285,
      "avg_reward": 0.386373793252632
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.3073689698031632,
      "avg_reward": 0.20571937887909178
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.29470274339920755,
      "avg_reward": 0.18615683245213963
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.28268090560892456,
      "avg_reward": 0.19199885851218942
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.3274218040014,
      "avg_reward": 0.23471256915832675
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.3117125961959081,
      "avg_reward": 0.21628206259070787
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.3051993602205731,
      "avg_reward": 0.16871067571604526
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.2908373841930967,
      "avg_reward": 0.251768018780166
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.3193629661486211,
      "avg_reward": 0.28477943505626807
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.3458162110066988,
      "avg_reward": 0.3970976438297764
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.3204261454428198,
      "avg_reward": 0.19168689961505475
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.32661441818092485,
      "avg_reward": 0.35361165284807405
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.31211663138174767,
      "avg_reward": 0.21326848565276407
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.32656878967857655,
      "avg_reward": 0.27884799199277205
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.35475378816801767,
      "avg_reward": 0.328026103579508
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.3465143599696102,
      "avg_reward": 0.1611864850096934
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.33458058182414113,
      "avg_reward": 0.2180245410286904
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.3369801471958043,
      "avg_reward": 0.24141848690463572
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.340001054104781,
      "avg_reward": 0.31467951727156795
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.3412738045520276,
      "avg_reward": 0.18609480399151895
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.3598702751981387,
      "avg_reward": 0.247095055070057
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.34263283064004657,
      "avg_reward": 0.2586093565264192
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.3286345768715339,
      "avg_reward": 0.17922171804043527
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.3554681354679814,
      "avg_reward": 0.3218416146949131
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.3740422879247667,
      "avg_reward": 0.15272495734646482
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.35062491171309973,
      "avg_reward": 0.31733561244526937
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.4011379191364503,
      "avg_reward": 0.37805947878032087
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.33785983041967815,
      "avg_reward": 0.24671165984147742
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.3883924943474602,
      "avg_reward": 0.27076496540613165
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.322765256716191,
      "avg_reward": 0.23489359412042227
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.36891337257588525,
      "avg_reward": 0.3164374106103667
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.3601604284611251,
      "avg_reward": 0.3272199196817916
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.36646584237747587,
      "avg_reward": 0.3221350703378638
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.3756908025017887,
      "avg_reward": 0.2095920500446904
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.3396104093529568,
      "avg_reward": 0.1769013992994563
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.3858384843721386,
      "avg_reward": 0.31051434405125694
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.35959085349762754,
      "avg_reward": 0.3167383757077185
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.3610157647432847,
      "avg_reward": 0.1980876337161836
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.3860856468632853,
      "avg_reward": 0.3634843317860599
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.3992597421975254,
      "avg_reward": 0.2772365757707049
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.35246523957669795,
      "avg_reward": 0.27887802518796206
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.4183463718241885,
      "avg_reward": 0.38414990862155035
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.4183463718241885,
      "avg_reward": 0.38414990862155035
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 5.0,
      "update": 1,
      "cumulative_wall_time": 10.0
    },
    {
      "timestep": 101,
      "throughput": 5.5,
      "update": 2,
      "cumulative_wall_time": 20.0
    },
    {
      "timestep": 202,
      "throughput": 6.0,
      "update": 3,
      "cumulative_wall_time": 30.0
    },
    {
      "timestep": 303,
      "throughput": 6.5,
      "update": 4,
      "cumulative_wall_time": 40.0
    },
    {
      "timestep": 404,
      "throughput": 7.0,
      "update": 5,
      "cumulative_wall_time": 50.0
    },
    {
      "timestep": 505,
      "throughput": 7.5,
      "update": 6,
      "cumulative_wall_time": 60.0
    },
    {
      "timestep": 606,
      "throughput": 8.0,
      "update": 7,
      "cumulative_wall_time": 70.0
    },
    {
      "timestep": 707,
      "throughput": 8.5,
      "update": 8,
      "cumulative_wall_time": 80.0
    },
    {
      "timestep": 808,
      "throughput": 9.0,
      "update": 9,
      "cumulative_wall_time": 90.0
    },
    {
      "timestep": 909,
      "throughput": 9.5,
      "update": 10,
      "cumulative_wall_time": 100.0
    },
    {
      "timestep": 1010,
      "throughput": 10.509073415742652,
      "update": 11,
      "cumulative_wall_time": 110.0
    },
    {
      "timestep": 1111,
      "throughput": 9.103884661290289,
      "update": 12,
      "cumulative_wall_time": 120.0
    },
    {
      "timestep": 1212,
      "throughput": 8.832920936613363,
      "update": 13,
      "cumulative_wall_time": 130.0
    },
    {
      "timestep": 1313,
      "throughput": 10.68874114901284,
      "update": 14,
      "cumulative_wall_time": 140.0
    },
    {
      "timestep": 1414,
      "throughput": 8.561297804874462,
      "update": 15,
      "cumulative_wall_time": 150.0
    },
    {
      "timestep": 1515,
      "throughput": 11.965958271091605,
      "update": 16,
      "cumulative_wall_time": 160.0
    },
    {
      "timestep": 1616,
      "throughput": 10.91605829473545,
      "update": 17,
      "cumulative_wall_time": 170.0
    },
    {
      "timestep": 1717,
      "throughput": 9.089654215016012,
      "update": 18,
      "cumulative_wall_time": 180.0
    },
    {
      "timestep": 1818,
      "throughput": 9.891104398006318,
      "update": 19,
      "cumulative_wall_time": 190.0
    },
    {
      "timestep": 1919,
      "throughput": 8.40688613506726,
      "update": 20,
      "cumulative_wall_time": 200.0
    },
    {
      "timestep": 2020,
      "throughput": 9.672216490631547,
      "update": 21,
      "cumulative_wall_time": 210.0
    },
    {
      "timestep": 2121,
      "throughput": 11.253895987538113,
      "update": 22,
      "cumulative_wall_time": 220.0
    },
    {
      "timestep": 2222,
      "throughput": 11.84662792652253,
      "update": 23,
      "cumulative_wall_time": 230.0
    },
    {
      "timestep": 2323,
      "throughput": 10.686884970296422,
      "update": 24,
      "cumulative_wall_time": 240.0
    },
    {
      "timestep": 2424,
      "throughput": 7.6352858777557655,
      "update": 25,
      "cumulative_wall_time": 250.0
    },
    {
      "timestep": 2525,
      "throughput": 10.48577296329813,
      "update": 26,
      "cumulative_wall_time": 260.0
    },
    {
      "timestep": 2626,
      "throughput": 10.492086623988737,
      "update": 27,
      "cumulative_wall_time": 270.0
    },
    {
      "timestep": 2727,
      "throughput": 9.578709021250518,
      "update": 28,
      "cumulative_wall_time": 280.0
    },
    {
      "timestep": 2828,
      "throughput": 10.908832181361918,
      "update": 29,
      "cumulative_wall_time": 290.0
    },
    {
      "timestep": 2929,
      "throughput": 8.82010687310492,
      "update": 30,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 3030,
      "throughput": 10.667325130726326,
      "update": 31,
      "cumulative_wall_time": 310.0
    },
    {
      "timestep": 3131,
      "throughput": 9.883147079047394,
      "update": 32,
      "cumulative_wall_time": 320.0
    },
    {
      "timestep": 3232,
      "throughput": 10.512423294354099,
      "update": 33,
      "cumulative_wall_time": 330.0
    },
    {
      "timestep": 3333,
      "throughput": 12.34095407899185,
      "update": 34,
      "cumulative_wall_time": 340.0
    },
    {
      "timestep": 3434,
      "throughput": 10.345698542654695,
      "update": 35,
      "cumulative_wall_time": 350.0
    },
    {
      "timestep": 3535,
      "throughput": 9.524686923871467,
      "update": 36,
      "cumulative_wall_time": 360.0
    },
    {
      "timestep": 3636,
      "throughput": 9.081420698951623,
      "update": 37,
      "cumulative_wall_time": 370.0
    },
    {
      "timestep": 3737,
      "throughput": 9.725781410023291,
      "update": 38,
      "cumulative_wall_time": 380.0
    },
    {
      "timestep": 3838,
      "throughput": 10.019162650975339,
      "update": 39,
      "cumulative_wall_time": 390.0
    },
    {
      "timestep": 3939,
      "throughput": 9.443289218191328,
      "update": 40,
      "cumulative_wall_time": 400.0
    },
    {
      "timestep": 4040,
      "throughput": 11.93841823569076,
      "update": 41,
      "cumulative_wall_time": 410.0
    },
    {
      "timestep": 4141,
      "throughput": 10.575171911243029,
      "update": 42,
      "cumulative_wall_time": 420.0
    },
    {
      "timestep": 4242,
      "throughput": 9.603774707875036,
      "update": 43,
      "cumulative_wall_time": 430.0
    },
    {
      "timestep": 4343,
      "throughput": 11.411420886042059,
      "update": 44,
      "cumulative_wall_time": 440.0
    },
    {
      "timestep": 4444,
      "throughput": 8.335711915074771,
      "update": 45,
      "cumulative_wall_time": 450.0
    },
    {
      "timestep": 4545,
      "throughput": 11.321072519512793,
      "update": 46,
      "cumulative_wall_time": 460.0
    },
    {
      "timestep": 4646,
      "throughput": 11.261567025922732,
      "update": 47,
      "cumulative_wall_time": 470.0
    },
    {
      "timestep": 4747,
      "throughput": 12.053979512676234,
      "update": 48,
      "cumulative_wall_time": 480.0
    },
    {
      "timestep": 4848,
      "throughput": 10.193929416868313,
      "update": 49,
      "cumulative_wall_time": 490.0
    },
    {
      "timestep": 4949,
      "throughput": 11.12734551455527,
      "update": 50,
      "cumulative_wall_time": 500.0
    },
    {
      "timestep": 5050,
      "throughput": 10.471619625218826,
      "update": 51,
      "cumulative_wall_time": 510.0
    },
    {
      "timestep": 5151,
      "throughput": 10.619850548942516,
      "update": 52,
      "cumulative_wall_time": 520.0
    },
    {
      "timestep": 5252,
      "throughput": 9.002478734037938,
      "update": 53,
      "cumulative_wall_time": 530.0
    },
    {
      "timestep": 5353,
      "throughput": 11.505122773308624,
      "update": 54,
      "cumulative_wall_time": 540.0
    },
    {
      "timestep": 5454,
      "throughput": 10.341104754657149,
      "update": 55,
      "cumulative_wall_time": 550.0
    },
    {
      "timestep": 5555,
      "throughput": 8.741376381812156,
      "update": 56,
      "cumulative_wall_time": 560.0
    },
    {
      "timestep": 5656,
      "throughput": 9.89575602946151,
      "update": 57,
      "cumulative_wall_time": 570.0
    },
    {
      "timestep": 5757,
      "throughput": 8.113721102474125,
      "update": 58,
      "cumulative_wall_time": 580.0
    },
    {
      "timestep": 5858,
      "throughput": 8.243949400345391,
      "update": 59,
      "cumulative_wall_time": 590.0
    },
    {
      "timestep": 5959,
      "throughput": 9.051728178650784,
      "update": 60,
      "cumulative_wall_time": 600.0
    },
    {
      "timestep": 6060,
      "throughput": 10.724789807047529,
      "update": 61,
      "cumulative_wall_time": 610.0
    },
    {
      "timestep": 6161,
      "throughput": 11.297791528247512,
      "update": 62,
      "cumulative_wall_time": 620.0
    },
    {
      "timestep": 6262,
      "throughput": 9.129807881893496,
      "update": 63,
      "cumulative_wall_time": 630.0
    },
    {
      "timestep": 6363,
      "throughput": 9.638081878084922,
      "update": 64,
      "cumulative_wall_time": 640.0
    },
    {
      "timestep": 6464,
      "throughput": 10.191632259756386,
      "update": 65,
      "cumulative_wall_time": 650.0
    },
    {
      "timestep": 6565,
      "throughput": 9.93359711407784,
      "update": 66,
      "cumulative_wall_time": 660.0
    },
    {
      "timestep": 6666,
      "throughput": 10.196165784393012,
      "update": 67,
      "cumulative_wall_time": 670.0
    },
    {
      "timestep": 6767,
      "throughput": 8.784944405208421,
      "update": 68,
      "cumulative_wall_time": 680.0
    },
    {
      "timestep": 6868,
      "throughput": 10.547717617827072,
      "update": 69,
      "cumulative_wall_time": 690.0
    },
    {
      "timestep": 6969,
      "throughput": 9.7913355000624,
      "update": 70,
      "cumulative_wall_time": 700.0
    },
    {
      "timestep": 7070,
      "throughput": 9.54370415867419,
      "update": 71,
      "cumulative_wall_time": 710.0
    },
    {
      "timestep": 7171,
      "throughput": 10.632118642214884,
      "update": 72,
      "cumulative_wall_time": 720.0
    },
    {
      "timestep": 7272,
      "throughput": 10.258777176621482,
      "update": 73,
      "cumulative_wall_time": 730.0
    },
    {
      "timestep": 7373,
      "throughput": 10.459912366860806,
      "update": 74,
      "cumulative_wall_time": 740.0
    },
    {
      "timestep": 7474,
      "throughput": 9.818435580682891,
      "update": 75,
      "cumulative_wall_time": 750.0
    },
    {
      "timestep": 7575,
      "throughput": 11.4774469667965,
      "update": 76,
      "cumulative_wall_time": 760.0
    },
    {
      "timestep": 7676,
      "throughput": 9.671489732601536,
      "update": 77,
      "cumulative_wall_time": 770.0
    },
    {
      "timestep": 7777,
      "throughput": 11.379439300031107,
      "update": 78,
      "cumulative_wall_time": 780.0
    },
    {
      "timestep": 7878,
      "throughput": 9.69452527437708,
      "update": 79,
      "cumulative_wall_time": 790.0
    },
    {
      "timestep": 7979,
      "throughput": 10.678714757915603,
      "update": 80,
      "cumulative_wall_time": 800.0
    },
    {
      "timestep": 8080,
      "throughput": 8.977831892431357,
      "update": 81,
      "cumulative_wall_time": 810.0
    },
    {
      "timestep": 8181,
      "throughput": 8.129183635008154,
      "update": 82,
      "cumulative_wall_time": 820.0
    },
    {
      "timestep": 8282,
      "throughput": 10.962417405538572,
      "update": 83,
      "cumulative_wall_time": 830.0
    },
    {
      "timestep": 8383,
      "throughput": 9.578741653015806,
      "update": 84,
      "cumulative_wall_time": 840.0
    },
    {
      "timestep": 8484,
      "throughput": 10.806647127767421,
      "update": 85,
      "cumulative_wall_time": 850.0
    },
    {
      "timestep": 8585,
      "throughput": 11.380535603797735,
      "update": 86,
      "cumulative_wall_time": 860.0
    },
    {
      "timestep": 8686,
      "throughput": 9.251848493589133,
      "update": 87,
      "cumulative_wall_time": 870.0
    },
    {
      "timestep": 8787,
      "throughput": 9.39127418067637,
      "update": 88,
      "cumulative_wall_time": 880.0
    },
    {
      "timestep": 8888,
      "throughput": 10.138122268309655,
      "update": 89,
      "cumulative_wall_time": 890.0
    },
    {
      "timestep": 8989,
      "throughput": 9.756196151122156,
      "update": 90,
      "cumulative_wall_time": 900.0
    },
    {
      "timestep": 9090,
      "throughput": 10.107788983440045,
      "update": 91,
      "cumulative_wall_time": 910.0
    },
    {
      "timestep": 9191,
      "throughput": 10.923417732689213,
      "update": 92,
      "cumulative_wall_time": 920.0
    },
    {
      "timestep": 9292,
      "throughput": 9.039595168847043,
      "update": 93,
      "cumulative_wall_time": 930.0
    },
    {
      "timestep": 9393,
      "throughput": 9.899112731153046,
      "update": 94,
      "cumulative_wall_time": 940.0
    },
    {
      "timestep": 9494,
      "throughput": 11.24501870737934,
      "update": 95,
      "cumulative_wall_time": 950.0
    },
    {
      "timestep": 9595,
      "throughput": 10.922878436003192,
      "update": 96,
      "cumulative_wall_time": 960.0
    },
    {
      "timestep": 9696,
      "throughput": 10.955962234298749,
      "update": 97,
      "cumulative_wall_time": 970.0
    },
    {
      "timestep": 9797,
      "throughput": 9.356993483242576,
      "update": 98,
      "cumulative_wall_time": 980.0
    },
    {
      "timestep": 9898,
      "throughput": 10.1535270479072,
      "update": 99,
      "cumulative_wall_time": 990.0
    },
    {
      "timestep": 10000,
      "throughput": 10.55500079449623,
      "update": 100,
      "cumulative_wall_time": 1000.0
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.774535753066723,
        "recent_gradient": 0.00880228815501225
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6076855357527491,
        "recent_gradient": 0.021498278466352168
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.3831754599108145,
        "recent_gradient": 0.03149706388174175
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.28015326432172166,
        "recent_gradient": 0.019275276932362185
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.13334041455555007,
        "recent_gradient": 0.012821048819579189
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.269411344381984
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.280264511263108
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.37398672115195
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 4.826192872277722
      }
    }
  },
  "config": {
    "use_async": false,
    "curriculum_strategy": "uniform"
  }
}