{
  "experiment_name": "sync_curriculum_seed42",
  "total_timesteps": 10000,
  "total_time": 1111.111111111111,
  "avg_throughput": 9,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.5703496647219384,
      "difficulty_2_ratio": 0.34593455841067655,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.006336012450983674,
      "difficulty_5_ratio": 0.00019133099735093797
    },
    {
      "timestep": 101,
      "pass_at_1": 0.024064881873124964,
      "avg_reward": 0.09540339831890125,
      "difficulty_1_ratio": 0.545817584309558,
      "difficulty_2_ratio": 0.3592137008263376,
      "difficulty_3_ratio": 0.0869688606806755,
      "difficulty_4_ratio": 0.007746048051242527,
      "difficulty_5_ratio": 0.00025380613218624814
    },
    {
      "timestep": 202,
      "pass_at_1": 0.017539154727755506,
      "avg_reward": 0.0023244759347453778,
      "difficulty_1_ratio": 0.5207065136269264,
      "difficulty_2_ratio": 0.3718356202546844,
      "difficulty_3_ratio": 0.09768198799373931,
      "difficulty_4_ratio": 0.009440250235689705,
      "difficulty_5_ratio": 0.00033562788896017117
    },
    {
      "timestep": 303,
      "pass_at_1": 0.06491758964348116,
      "avg_reward": 0.09030580817243036,
      "difficulty_1_ratio": 0.4951092343136047,
      "difficulty_2_ratio": 0.38362916613190773,
      "difficulty_3_ratio": 0.10935225097641152,
      "difficulty_4_ratio": 0.011466987914927423,
      "difficulty_5_ratio": 0.00044236066314863343
    },
    {
      "timestep": 404,
      "pass_at_1": 0.035054956725745406,
      "avg_reward": 0.055171967559894564,
      "difficulty_1_ratio": 0.469130336180388,
      "difficulty_2_ratio": 0.3944179935925989,
      "difficulty_3_ratio": 0.12199033943415045,
      "difficulty_4_ratio": 0.013880326375356456,
      "difficulty_5_ratio": 0.0005810044175062076
    },
    {
      "timestep": 505,
      "pass_at_1": 0.10564987861168393,
      "avg_reward": 0.0612334152108343,
      "difficulty_1_ratio": 0.4428854101147015,
      "difficulty_2_ratio": 0.40402402094501866,
      "difficulty_3_ratio": 0.13559026749360029,
      "difficulty_4_ratio": 0.0167399966441195,
      "difficulty_5_ratio": 0.0007603048025599198
    },
    {
      "timestep": 606,
      "pass_at_1": 0.12347368305774217,
      "avg_reward": 0.0031149342133038466,
      "difficulty_1_ratio": 0.4164998456831705,
      "difficulty_2_ratio": 0.41227145735706794,
      "difficulty_3_ratio": 0.15012644832783253,
      "difficulty_4_ratio": 0.02011113911124073,
      "difficulty_5_ratio": 0.0009911095206882054
    },
    {
      "timestep": 707,
      "pass_at_1": 0.08793864177496254,
      "avg_reward": 0.0422365369579214,
      "difficulty_1_ratio": 0.390107224895361,
      "difficulty_2_ratio": 0.4189913219593774,
      "difficulty_3_ratio": 0.1655509131479823,
      "difficulty_4_ratio": 0.024063769070528613,
      "difficulty_5_ratio": 0.0012867709267507749
    },
    {
      "timestep": 808,
      "pass_at_1": 0.10606912597061448,
      "avg_reward": 0.10056766740625528,
      "difficulty_1_ratio": 0.3638473227132847,
      "difficulty_2_ratio": 0.42402633368046766,
      "difficulty_3_ratio": 0.18179083819928793,
      "difficulty_4_ratio": 0.028671913216506643,
      "difficulty_5_ratio": 0.0016635921904528722
    },
    {
      "timestep": 909,
      "pass_at_1": 0.11213988802547346,
      "avg_reward": 0.019096725353614202,
      "difficulty_1_ratio": 0.337863746670805,
      "difficulty_2_ratio": 0.4272360092470168,
      "difficulty_3_ratio": 0.19874656153923254,
      "difficulty_4_ratio": 0.03401237165049899,
      "difficulty_5_ratio": 0.0021413108924466314
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.16367336192510767,
      "avg_reward": 0.11964987451575936,
      "difficulty_1_ratio": 0.31230127114431194,
      "difficulty_2_ratio": 0.4285017684753959,
      "difficulty_3_ratio": 0.21629028030484038,
      "difficulty_4_ratio": 0.04016307038955698,
      "difficulty_5_ratio": 0.0027436096858948753
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.13985572517238434,
      "avg_reward": 0.04064717082723464,
      "difficulty_1_ratio": 0.2873029447333821,
      "difficulty_2_ratio": 0.4277318152433385,
      "difficulty_3_ratio": 0.23426561605703436,
      "difficulty_4_ratio": 0.04720098526509968,
      "difficulty_5_ratio": 0.0034986387011453407
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.13184623220126726,
      "avg_reward": 0.11102311524650713,
      "difficulty_1_ratio": 0.2630070699260558,
      "difficulty_2_ratio": 0.4248655434002136,
      "difficulty_3_ratio": 0.2524882182255638,
      "difficulty_4_ratio": 0.05519963957750222,
      "difficulty_5_ratio": 0.004439528870664513
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.12402571265177376,
      "avg_reward": 0.11800547103870261,
      "difficulty_1_ratio": 0.23954417068994155,
      "difficulty_2_ratio": 0.41987721294759744,
      "difficulty_3_ratio": 0.2707475422306048,
      "difficulty_4_ratio": 0.06422620455155005,
      "difficulty_5_ratio": 0.005604869580306165
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.13942632379040085,
      "avg_reward": 0.09695637154265685,
      "difficulty_1_ratio": 0.21703407392185683,
      "difficulty_2_ratio": 0.412778655730858,
      "difficulty_3_ratio": 0.2888098894295048,
      "difficulty_4_ratio": 0.07433826251589389,
      "difficulty_5_ratio": 0.0070391184018864465
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.14387895829589525,
      "avg_reward": 0.2077170758621631,
      "difficulty_1_ratio": 0.1955832332539105,
      "difficulty_2_ratio": 0.4036208028084852,
      "difficulty_3_ratio": 0.3064227321494006,
      "difficulty_4_ratio": 0.08558032615731795,
      "difficulty_5_ratio": 0.008792905630886071
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.1601960991360906,
      "avg_reward": 0.07527133286107746,
      "difficulty_1_ratio": 0.17528241761460614,
      "difficulty_2_ratio": 0.39249387697759325,
      "difficulty_3_ratio": 0.3233202719632032,
      "difficulty_4_ratio": 0.09798024091278032,
      "difficulty_5_ratio": 0.010923192531817163
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.1815471504842922,
      "avg_reward": 0.08419553788888265,
      "difficulty_1_ratio": 0.15620487203762,
      "difficulty_2_ratio": 0.3795261610306469,
      "difficulty_3_ratio": 0.3392300979084394,
      "difficulty_4_ratio": 0.11154562879642933,
      "difficulty_5_ratio": 0.013493240226864338
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.17397909714879203,
      "avg_reward": 0.04119977152504485,
      "difficulty_1_ratio": 0.13840503524267814,
      "difficulty_2_ratio": 0.36488133073132456,
      "difficulty_3_ratio": 0.3538807296736819,
      "difficulty_4_ratio": 0.12626055765373156,
      "difficulty_5_ratio": 0.016572346698583963
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.14801696353999572,
      "avg_reward": 0.12825663262545275,
      "difficulty_1_ratio": 0.12191786908589192,
      "difficulty_2_ratio": 0.3487544252621549,
      "difficulty_3_ratio": 0.36700975575577915,
      "difficulty_4_ratio": 0.1420826368959247,
      "difficulty_5_ratio": 0.02023531300024945
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.1941998968721299,
      "avg_reward": 0.16392833155720246,
      "difficulty_1_ratio": 0.10675882140395278,
      "difficulty_2_ratio": 0.33136661015926444,
      "difficulty_3_ratio": 0.37837221513402225,
      "difficulty_4_ratio": 0.158940746377412,
      "difficulty_5_ratio": 0.02456160692534847
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.1820360516966936,
      "avg_reward": 0.13057365657789044,
      "difficulty_1_ratio": 0.09292440882580433,
      "difficulty_2_ratio": 0.3129589615253456,
      "difficulty_3_ratio": 0.38774882932075583,
      "difficulty_4_ratio": 0.1767335970180918,
      "difficulty_5_ratio": 0.02963420331000244
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.15976296755332597,
      "avg_reward": 0.09181816362292536,
      "difficulty_1_ratio": 0.08039337269830067,
      "difficulty_2_ratio": 0.29378555928253614,
      "difficulty_3_ratio": 0.3949536745312958,
      "difficulty_4_ratio": 0.19532929872471466,
      "difficulty_5_ratio": 0.03553809476315268
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.18516814645242355,
      "avg_reward": 0.20099062847288462,
      "difficulty_1_ratio": 0.0691283320657602,
      "difficulty_2_ratio": 0.2741062164565189,
      "difficulty_3_ratio": 0.39984089400061734,
      "difficulty_4_ratio": 0.21456607296103805,
      "difficulty_5_ratio": 0.04235848451606555
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.20636093724162372,
      "avg_reward": 0.07693674202516229,
      "difficulty_1_ratio": 0.05907783484757915,
      "difficulty_2_ratio": 0.2541791879471294,
      "difficulty_3_ratio": 0.40231008867116286,
      "difficulty_4_ratio": 0.23425419509772658,
      "difficulty_5_ratio": 0.05017869343640206
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.21113487515104515,
      "avg_reward": 0.14965378610002028,
      "difficulty_1_ratio": 0.050178693436402015,
      "difficulty_2_ratio": 0.2342541950977265,
      "difficulty_3_ratio": 0.40231008867116286,
      "difficulty_4_ratio": 0.2541791879471295,
      "difficulty_5_ratio": 0.059077834847579204
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.19633302960941781,
      "avg_reward": 0.18765023812957765,
      "difficulty_1_ratio": 0.04235848451606552,
      "difficulty_2_ratio": 0.21456607296103797,
      "difficulty_3_ratio": 0.3998408940006174,
      "difficulty_4_ratio": 0.274106216456519,
      "difficulty_5_ratio": 0.06912833206576029
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.23575990041083747,
      "avg_reward": 0.23517192628447992,
      "difficulty_1_ratio": 0.03553809476315264,
      "difficulty_2_ratio": 0.1953292987247146,
      "difficulty_3_ratio": 0.3949536745312958,
      "difficulty_4_ratio": 0.2937855592825363,
      "difficulty_5_ratio": 0.08039337269830077
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.20367053339251862,
      "avg_reward": 0.14747580792145418,
      "difficulty_1_ratio": 0.029634203310002414,
      "difficulty_2_ratio": 0.17673359701809171,
      "difficulty_3_ratio": 0.38774882932075583,
      "difficulty_4_ratio": 0.31295896152534575,
      "difficulty_5_ratio": 0.09292440882580441
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.23243788596833537,
      "avg_reward": 0.23472756513078627,
      "difficulty_1_ratio": 0.02456160692534847,
      "difficulty_2_ratio": 0.158940746377412,
      "difficulty_3_ratio": 0.37837221513402225,
      "difficulty_4_ratio": 0.33136661015926444,
      "difficulty_5_ratio": 0.10675882140395278
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.2216257204260815,
      "avg_reward": 0.16801762750767435,
      "difficulty_1_ratio": 0.020235313000249448,
      "difficulty_2_ratio": 0.14208263689592468,
      "difficulty_3_ratio": 0.3670097557557791,
      "difficulty_4_ratio": 0.34875442526215483,
      "difficulty_5_ratio": 0.12191786908589189
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.21451392200563918,
      "avg_reward": 0.11180080640047782,
      "difficulty_1_ratio": 0.016572346698583963,
      "difficulty_2_ratio": 0.12626055765373156,
      "difficulty_3_ratio": 0.35388072967368184,
      "difficulty_4_ratio": 0.3648813307313245,
      "difficulty_5_ratio": 0.13840503524267814
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.25835324749954347,
      "avg_reward": 0.27449459942817594,
      "difficulty_1_ratio": 0.013493240226864338,
      "difficulty_2_ratio": 0.11154562879642933,
      "difficulty_3_ratio": 0.3392300979084394,
      "difficulty_4_ratio": 0.3795261610306469,
      "difficulty_5_ratio": 0.15620487203762
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.24615109904653054,
      "avg_reward": 0.24709752413182567,
      "difficulty_1_ratio": 0.010923192531817153,
      "difficulty_2_ratio": 0.09798024091278025,
      "difficulty_3_ratio": 0.32332027196320307,
      "difficulty_4_ratio": 0.39249387697759325,
      "difficulty_5_ratio": 0.17528241761460625
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.2603347363964557,
      "avg_reward": 0.17601180138690836,
      "difficulty_1_ratio": 0.00879290563088607,
      "difficulty_2_ratio": 0.08558032615731792,
      "difficulty_3_ratio": 0.3064227321494005,
      "difficulty_4_ratio": 0.40362080280848517,
      "difficulty_5_ratio": 0.19558323325391047
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.2658583983835631,
      "avg_reward": 0.28958854703014897,
      "difficulty_1_ratio": 0.007039118401886442,
      "difficulty_2_ratio": 0.07433826251589386,
      "difficulty_3_ratio": 0.2888098894295048,
      "difficulty_4_ratio": 0.41277865573085804,
      "difficulty_5_ratio": 0.21703407392185695
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.2634557464279372,
      "avg_reward": 0.28899677993305006,
      "difficulty_1_ratio": 0.00560486958030616,
      "difficulty_2_ratio": 0.06422620455155001,
      "difficulty_3_ratio": 0.2707475422306047,
      "difficulty_4_ratio": 0.41987721294759744,
      "difficulty_5_ratio": 0.2395441706899417
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.21732796803251705,
      "avg_reward": 0.21495749964477484,
      "difficulty_1_ratio": 0.004439528870664501,
      "difficulty_2_ratio": 0.05519963957750214,
      "difficulty_3_ratio": 0.2524882182255636,
      "difficulty_4_ratio": 0.42486554340021365,
      "difficulty_5_ratio": 0.2630070699260561
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.2770187190480687,
      "avg_reward": 0.2066646077151616,
      "difficulty_1_ratio": 0.0034986387011453407,
      "difficulty_2_ratio": 0.04720098526509968,
      "difficulty_3_ratio": 0.23426561605703436,
      "difficulty_4_ratio": 0.4277318152433385,
      "difficulty_5_ratio": 0.2873029447333821
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.2826676741107592,
      "avg_reward": 0.12675569355856273,
      "difficulty_1_ratio": 0.0027436096858948753,
      "difficulty_2_ratio": 0.04016307038955698,
      "difficulty_3_ratio": 0.21629028030484038,
      "difficulty_4_ratio": 0.4285017684753959,
      "difficulty_5_ratio": 0.31230127114431194
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.28198894445015027,
      "avg_reward": 0.24344678413570753,
      "difficulty_1_ratio": 0.0021413108924466314,
      "difficulty_2_ratio": 0.03401237165049899,
      "difficulty_3_ratio": 0.19874656153923254,
      "difficulty_4_ratio": 0.4272360092470168,
      "difficulty_5_ratio": 0.337863746670805
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.32148091436922327,
      "avg_reward": 0.23127122058169625,
      "difficulty_1_ratio": 0.0016635921904528726,
      "difficulty_2_ratio": 0.02867191321650665,
      "difficulty_3_ratio": 0.18179083819928796,
      "difficulty_4_ratio": 0.42402633368046766,
      "difficulty_5_ratio": 0.3638473227132848
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.28128005540482287,
      "avg_reward": 0.19993619214463149,
      "difficulty_1_ratio": 0.0012867709267507727,
      "difficulty_2_ratio": 0.02406376907052859,
      "difficulty_3_ratio": 0.16555091314798218,
      "difficulty_4_ratio": 0.41899132195937727,
      "difficulty_5_ratio": 0.3901072248953611
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.3212666662288457,
      "avg_reward": 0.27345088846606075,
      "difficulty_1_ratio": 0.0009911095206882065,
      "difficulty_2_ratio": 0.020111139111240753,
      "difficulty_3_ratio": 0.15012644832783265,
      "difficulty_4_ratio": 0.41227145735706805,
      "difficulty_5_ratio": 0.4164998456831704
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.2978495371078624,
      "avg_reward": 0.2639430013419577,
      "difficulty_1_ratio": 0.0007603048025599186,
      "difficulty_2_ratio": 0.01673999664411949,
      "difficulty_3_ratio": 0.1355902674936002,
      "difficulty_4_ratio": 0.40402402094501866,
      "difficulty_5_ratio": 0.44288541011470167
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.3158455213618025,
      "avg_reward": 0.3011086666160865,
      "difficulty_1_ratio": 0.0005810044175062084,
      "difficulty_2_ratio": 0.013880326375356472,
      "difficulty_3_ratio": 0.12199033943415054,
      "difficulty_4_ratio": 0.3944179935925989,
      "difficulty_5_ratio": 0.4691303361803878
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.3052910263270296,
      "avg_reward": 0.2278497137317353,
      "difficulty_1_ratio": 0.00044236066314863197,
      "difficulty_2_ratio": 0.011466987914927403,
      "difficulty_3_ratio": 0.10935225097641141,
      "difficulty_4_ratio": 0.3836291661319077,
      "difficulty_5_ratio": 0.49510923431360493
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.31688280680977227,
      "avg_reward": 0.18033049804121187,
      "difficulty_1_ratio": 0.0003356278889601711,
      "difficulty_2_ratio": 0.009440250235689705,
      "difficulty_3_ratio": 0.09768198799373934,
      "difficulty_4_ratio": 0.3718356202546845,
      "difficulty_5_ratio": 0.5207065136269263
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.3360010065880148,
      "avg_reward": 0.2818535688794063,
      "difficulty_1_ratio": 0.00025380613218624744,
      "difficulty_2_ratio": 0.007746048051242511,
      "difficulty_3_ratio": 0.08696886068067541,
      "difficulty_4_ratio": 0.3592137008263375,
      "difficulty_5_ratio": 0.5458175843095583
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.3354913582956962,
      "avg_reward": 0.2566637299677996,
      "difficulty_1_ratio": 0.00019133099735093795,
      "difficulty_2_ratio": 0.006336012450983673,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.3459345584106765,
      "difficulty_5_ratio": 0.5703496647219383
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.31234525909362726,
      "avg_reward": 0.22884394113663387
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.3390114466943541,
      "avg_reward": 0.23109529389440234
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.34779909659637576,
      "avg_reward": 0.29844182011782755
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.393850304365003,
      "avg_reward": 0.32380913413359436
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.36631892787383813,
      "avg_reward": 0.2893328465107622
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.32777041563811093,
      "avg_reward": 0.2608906387380279
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.37226215458365386,
      "avg_reward": 0.4209718292911874
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.3720532169075757,
      "avg_reward": 0.31271994064274117
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.3799778302942769,
      "avg_reward": 0.2455483623544449
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.4082266489759283,
      "avg_reward": 0.3641779708150814
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.40581339670238326,
      "avg_reward": 0.2791813446221697
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.42259377469593085,
      "avg_reward": 0.26798246661713065
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.4107410406826342,
      "avg_reward": 0.4381156138366063
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.3835785612395736,
      "avg_reward": 0.27854796251152036
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.40968576443654253,
      "avg_reward": 0.3025748288434241
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.3808998401976321,
      "avg_reward": 0.30814802089840704
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.39480336680220035,
      "avg_reward": 0.33952231497351937
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.40171245981163195,
      "avg_reward": 0.39886668810018255
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.4084019314362599,
      "avg_reward": 0.31061846933872417
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.4442174844278841,
      "avg_reward": 0.29383077172060956
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.4362902690535208,
      "avg_reward": 0.41438935295693813
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.40329897175354124,
      "avg_reward": 0.3318708703294482
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.4442674870822712,
      "avg_reward": 0.3945051332546825
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.4178657712574805,
      "avg_reward": 0.26826978635177057
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.4564925926701584,
      "avg_reward": 0.38004330779778606
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.45442700223574806,
      "avg_reward": 0.38086401226344724
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.4390949463162419,
      "avg_reward": 0.3628886419110437
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.4617507112299003,
      "avg_reward": 0.3336829980826019
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.496314815434198,
      "avg_reward": 0.4207434983929478
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.43820037408299173,
      "avg_reward": 0.3833879796980849
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.4454778867237105,
      "avg_reward": 0.395736539566091
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.4910074490614545,
      "avg_reward": 0.35177184333157807
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.48988707787812324,
      "avg_reward": 0.4125487086493235
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.48976590455185354,
      "avg_reward": 0.4866523727741802
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.47104440321860785,
      "avg_reward": 0.33914871435701177
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.4607129049401453,
      "avg_reward": 0.32777980970384435
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.47943704653774677,
      "avg_reward": 0.4006072359710296
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.4889149823490904,
      "avg_reward": 0.43249114833107355
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.4859708657496384,
      "avg_reward": 0.46145339645757655
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.48267633902619234,
      "avg_reward": 0.5221495295504348
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.5026718946882761,
      "avg_reward": 0.35927963792980677
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.47086165495655613,
      "avg_reward": 0.40081294472740414
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.48986457065124694,
      "avg_reward": 0.42759168122560215
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.5057877575363601,
      "avg_reward": 0.4009887603962444
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.4813126693948933,
      "avg_reward": 0.30930777428162143
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.49118165217484294,
      "avg_reward": 0.435765261456048
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.5061966133935483,
      "avg_reward": 0.34267035177923927
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.5071220342685439,
      "avg_reward": 0.42496349640127695
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.48766734025432884,
      "avg_reward": 0.3978201275007395
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5081386316704389,
      "avg_reward": 0.34936239044482
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.5703496647219384,
      "difficulty_2_ratio": 0.34593455841067655,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.006336012450983674,
      "difficulty_5_ratio": 0.00019133099735093797
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5081386316704389,
      "avg_reward": 0.34936239044482
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 4.5,
      "update": 1,
      "cumulative_wall_time": 11.11111111111111
    },
    {
      "timestep": 101,
      "throughput": 4.95,
      "update": 2,
      "cumulative_wall_time": 22.22222222222222
    },
    {
      "timestep": 202,
      "throughput": 5.3999999999999995,
      "update": 3,
      "cumulative_wall_time": 33.33333333333333
    },
    {
      "timestep": 303,
      "throughput": 5.8500000000000005,
      "update": 4,
      "cumulative_wall_time": 44.44444444444444
    },
    {
      "timestep": 404,
      "throughput": 6.3,
      "update": 5,
      "cumulative_wall_time": 55.55555555555556
    },
    {
      "timestep": 505,
      "throughput": 6.75,
      "update": 6,
      "cumulative_wall_time": 66.66666666666667
    },
    {
      "timestep": 606,
      "throughput": 7.2,
      "update": 7,
      "cumulative_wall_time": 77.77777777777779
    },
    {
      "timestep": 707,
      "throughput": 7.6499999999999995,
      "update": 8,
      "cumulative_wall_time": 88.8888888888889
    },
    {
      "timestep": 808,
      "throughput": 8.1,
      "update": 9,
      "cumulative_wall_time": 100.00000000000001
    },
    {
      "timestep": 909,
      "throughput": 8.549999999999999,
      "update": 10,
      "cumulative_wall_time": 111.11111111111113
    },
    {
      "timestep": 1010,
      "throughput": 9.322008624313455,
      "update": 11,
      "cumulative_wall_time": 122.22222222222224
    },
    {
      "timestep": 1111,
      "throughput": 9.50470607373141,
      "update": 12,
      "cumulative_wall_time": 133.33333333333334
    },
    {
      "timestep": 1212,
      "throughput": 9.97474611885775,
      "update": 13,
      "cumulative_wall_time": 144.44444444444446
    },
    {
      "timestep": 1313,
      "throughput": 9.948421846831412,
      "update": 14,
      "cumulative_wall_time": 155.55555555555557
    },
    {
      "timestep": 1414,
      "throughput": 7.760097568838619,
      "update": 15,
      "cumulative_wall_time": 166.66666666666669
    },
    {
      "timestep": 1515,
      "throughput": 8.155957464076389,
      "update": 16,
      "cumulative_wall_time": 177.7777777777778
    },
    {
      "timestep": 1616,
      "throughput": 9.463531740487793,
      "update": 17,
      "cumulative_wall_time": 188.8888888888889
    },
    {
      "timestep": 1717,
      "throughput": 9.462407355820988,
      "update": 18,
      "cumulative_wall_time": 200.00000000000003
    },
    {
      "timestep": 1818,
      "throughput": 9.463542917675442,
      "update": 19,
      "cumulative_wall_time": 211.11111111111114
    },
    {
      "timestep": 1919,
      "throughput": 12.46745834158925,
      "update": 20,
      "cumulative_wall_time": 222.22222222222226
    },
    {
      "timestep": 2020,
      "throughput": 9.513801459623851,
      "update": 21,
      "cumulative_wall_time": 233.33333333333337
    },
    {
      "timestep": 2121,
      "throughput": 10.022009076162538,
      "update": 22,
      "cumulative_wall_time": 244.44444444444449
    },
    {
      "timestep": 2222,
      "throughput": 9.858601587143882,
      "update": 23,
      "cumulative_wall_time": 255.5555555555556
    },
    {
      "timestep": 2323,
      "throughput": 9.586252126175218,
      "update": 24,
      "cumulative_wall_time": 266.6666666666667
    },
    {
      "timestep": 2424,
      "throughput": 8.716257679823688,
      "update": 25,
      "cumulative_wall_time": 277.77777777777777
    },
    {
      "timestep": 2525,
      "throughput": 9.683072298443943,
      "update": 26,
      "cumulative_wall_time": 288.88888888888886
    },
    {
      "timestep": 2626,
      "throughput": 8.304457306916186,
      "update": 27,
      "cumulative_wall_time": 299.99999999999994
    },
    {
      "timestep": 2727,
      "throughput": 8.786863253933992,
      "update": 28,
      "cumulative_wall_time": 311.11111111111103
    },
    {
      "timestep": 2828,
      "throughput": 8.563172806953807,
      "update": 29,
      "cumulative_wall_time": 322.2222222222221
    },
    {
      "timestep": 2929,
      "throughput": 9.07368672544769,
      "update": 30,
      "cumulative_wall_time": 333.3333333333332
    },
    {
      "timestep": 3030,
      "throughput": 11.083192710006157,
      "update": 31,
      "cumulative_wall_time": 344.4444444444443
    },
    {
      "timestep": 3131,
      "throughput": 7.319461326667427,
      "update": 32,
      "cumulative_wall_time": 355.5555555555554
    },
    {
      "timestep": 3232,
      "throughput": 9.61763417133706,
      "update": 33,
      "cumulative_wall_time": 366.66666666666646
    },
    {
      "timestep": 3333,
      "throughput": 7.5485557159293135,
      "update": 34,
      "cumulative_wall_time": 377.77777777777754
    },
    {
      "timestep": 3434,
      "throughput": 8.57526132078951,
      "update": 35,
      "cumulative_wall_time": 388.88888888888863
    },
    {
      "timestep": 3535,
      "throughput": 9.98005553727063,
      "update": 36,
      "cumulative_wall_time": 399.9999999999997
    },
    {
      "timestep": 3636,
      "throughput": 9.057852017185915,
      "update": 37,
      "cumulative_wall_time": 411.1111111111108
    },
    {
      "timestep": 3737,
      "throughput": 8.030029699863626,
      "update": 38,
      "cumulative_wall_time": 422.2222222222219
    },
    {
      "timestep": 3838,
      "throughput": 8.356226661666028,
      "update": 39,
      "cumulative_wall_time": 433.333333333333
    },
    {
      "timestep": 3939,
      "throughput": 9.611637974041207,
      "update": 40,
      "cumulative_wall_time": 444.44444444444406
    },
    {
      "timestep": 4040,
      "throughput": 8.342670031454578,
      "update": 41,
      "cumulative_wall_time": 455.55555555555515
    },
    {
      "timestep": 4141,
      "throughput": 9.194812730623779,
      "update": 42,
      "cumulative_wall_time": 466.66666666666623
    },
    {
      "timestep": 4242,
      "throughput": 9.041014655913433,
      "update": 43,
      "cumulative_wall_time": 477.7777777777773
    },
    {
      "timestep": 4343,
      "throughput": 8.413559687154764,
      "update": 44,
      "cumulative_wall_time": 488.8888888888884
    },
    {
      "timestep": 4444,
      "throughput": 10.929549680392794,
      "update": 45,
      "cumulative_wall_time": 499.9999999999995
    },
    {
      "timestep": 4545,
      "throughput": 9.57052712008621,
      "update": 46,
      "cumulative_wall_time": 511.1111111111106
    },
    {
      "timestep": 4646,
      "throughput": 7.177371672008154,
      "update": 47,
      "cumulative_wall_time": 522.2222222222217
    },
    {
      "timestep": 4747,
      "throughput": 9.167808883292485,
      "update": 48,
      "cumulative_wall_time": 533.3333333333328
    },
    {
      "timestep": 4848,
      "throughput": 8.40439218170845,
      "update": 49,
      "cumulative_wall_time": 544.4444444444439
    },
    {
      "timestep": 4949,
      "throughput": 9.767190001316601,
      "update": 50,
      "cumulative_wall_time": 555.555555555555
    },
    {
      "timestep": 5050,
      "throughput": 8.28673133541057,
      "update": 51,
      "cumulative_wall_time": 566.6666666666661
    },
    {
      "timestep": 5151,
      "throughput": 8.896737202679791,
      "update": 52,
      "cumulative_wall_time": 577.7777777777771
    },
    {
      "timestep": 5252,
      "throughput": 9.454488551082411,
      "update": 53,
      "cumulative_wall_time": 588.8888888888882
    },
    {
      "timestep": 5353,
      "throughput": 9.77917967475311,
      "update": 54,
      "cumulative_wall_time": 599.9999999999993
    },
    {
      "timestep": 5454,
      "throughput": 7.919733233649801,
      "update": 55,
      "cumulative_wall_time": 611.1111111111104
    },
    {
      "timestep": 5555,
      "throughput": 8.698948887743146,
      "update": 56,
      "cumulative_wall_time": 622.2222222222215
    },
    {
      "timestep": 5656,
      "throughput": 8.572549219955139,
      "update": 57,
      "cumulative_wall_time": 633.3333333333326
    },
    {
      "timestep": 5757,
      "throughput": 8.41200369068366,
      "update": 58,
      "cumulative_wall_time": 644.4444444444437
    },
    {
      "timestep": 5858,
      "throughput": 10.588908816252987,
      "update": 59,
      "cumulative_wall_time": 655.5555555555547
    },
    {
      "timestep": 5959,
      "throughput": 9.36448353986486,
      "update": 60,
      "cumulative_wall_time": 666.6666666666658
    },
    {
      "timestep": 6060,
      "throughput": 7.8652044410984585,
      "update": 61,
      "cumulative_wall_time": 677.7777777777769
    },
    {
      "timestep": 6161,
      "throughput": 9.826075752349299,
      "update": 62,
      "cumulative_wall_time": 688.888888888888
    },
    {
      "timestep": 6262,
      "throughput": 10.90994057731137,
      "update": 63,
      "cumulative_wall_time": 699.9999999999991
    },
    {
      "timestep": 6363,
      "throughput": 9.929218734496033,
      "update": 64,
      "cumulative_wall_time": 711.1111111111102
    },
    {
      "timestep": 6464,
      "throughput": 7.632567030641388,
      "update": 65,
      "cumulative_wall_time": 722.2222222222213
    },
    {
      "timestep": 6565,
      "throughput": 8.564189334420373,
      "update": 66,
      "cumulative_wall_time": 733.3333333333323
    },
    {
      "timestep": 6666,
      "throughput": 10.14022003426796,
      "update": 67,
      "cumulative_wall_time": 744.4444444444434
    },
    {
      "timestep": 6767,
      "throughput": 8.363097480943097,
      "update": 68,
      "cumulative_wall_time": 755.5555555555545
    },
    {
      "timestep": 6868,
      "throughput": 9.399437485331605,
      "update": 69,
      "cumulative_wall_time": 766.6666666666656
    },
    {
      "timestep": 6969,
      "throughput": 9.697170648086404,
      "update": 70,
      "cumulative_wall_time": 777.7777777777767
    },
    {
      "timestep": 7070,
      "throughput": 8.165762575579725,
      "update": 71,
      "cumulative_wall_time": 788.8888888888878
    },
    {
      "timestep": 7171,
      "throughput": 8.94642717954438,
      "update": 72,
      "cumulative_wall_time": 799.9999999999989
    },
    {
      "timestep": 7272,
      "throughput": 6.082859393937834,
      "update": 73,
      "cumulative_wall_time": 811.11111111111
    },
    {
      "timestep": 7373,
      "throughput": 8.078051122799138,
      "update": 74,
      "cumulative_wall_time": 822.222222222221
    },
    {
      "timestep": 7474,
      "throughput": 8.772688663746155,
      "update": 75,
      "cumulative_wall_time": 833.3333333333321
    },
    {
      "timestep": 7575,
      "throughput": 7.876995136231635,
      "update": 76,
      "cumulative_wall_time": 844.4444444444432
    },
    {
      "timestep": 7676,
      "throughput": 10.469170173538473,
      "update": 77,
      "cumulative_wall_time": 855.5555555555543
    },
    {
      "timestep": 7777,
      "throughput": 7.71287275983543,
      "update": 78,
      "cumulative_wall_time": 866.6666666666654
    },
    {
      "timestep": 7878,
      "throughput": 8.603959961972715,
      "update": 79,
      "cumulative_wall_time": 877.7777777777765
    },
    {
      "timestep": 7979,
      "throughput": 9.117666519557481,
      "update": 80,
      "cumulative_wall_time": 888.8888888888875
    },
    {
      "timestep": 8080,
      "throughput": 10.297145960159504,
      "update": 81,
      "cumulative_wall_time": 899.9999999999986
    },
    {
      "timestep": 8181,
      "throughput": 7.707724063938505,
      "update": 82,
      "cumulative_wall_time": 911.1111111111097
    },
    {
      "timestep": 8282,
      "throughput": 10.046847376939462,
      "update": 83,
      "cumulative_wall_time": 922.2222222222208
    },
    {
      "timestep": 8383,
      "throughput": 9.009209754917627,
      "update": 84,
      "cumulative_wall_time": 933.3333333333319
    },
    {
      "timestep": 8484,
      "throughput": 8.116642214056844,
      "update": 85,
      "cumulative_wall_time": 944.444444444443
    },
    {
      "timestep": 8585,
      "throughput": 9.415893126836945,
      "update": 86,
      "cumulative_wall_time": 955.5555555555541
    },
    {
      "timestep": 8686,
      "throughput": 9.179153726016121,
      "update": 87,
      "cumulative_wall_time": 966.6666666666652
    },
    {
      "timestep": 8787,
      "throughput": 8.459804810557085,
      "update": 88,
      "cumulative_wall_time": 977.7777777777762
    },
    {
      "timestep": 8888,
      "throughput": 9.062821876491016,
      "update": 89,
      "cumulative_wall_time": 988.8888888888873
    },
    {
      "timestep": 8989,
      "throughput": 8.653217762824415,
      "update": 90,
      "cumulative_wall_time": 999.9999999999984
    },
    {
      "timestep": 9090,
      "throughput": 9.102165610726123,
      "update": 91,
      "cumulative_wall_time": 1011.1111111111095
    },
    {
      "timestep": 9191,
      "throughput": 9.595917607068941,
      "update": 92,
      "cumulative_wall_time": 1022.2222222222206
    },
    {
      "timestep": 9292,
      "throughput": 10.427415134530817,
      "update": 93,
      "cumulative_wall_time": 1033.3333333333317
    },
    {
      "timestep": 9393,
      "throughput": 7.885966051055837,
      "update": 94,
      "cumulative_wall_time": 1044.4444444444428
    },
    {
      "timestep": 9494,
      "throughput": 10.919730037190641,
      "update": 95,
      "cumulative_wall_time": 1055.5555555555538
    },
    {
      "timestep": 9595,
      "throughput": 7.243120980429748,
      "update": 96,
      "cumulative_wall_time": 1066.666666666665
    },
    {
      "timestep": 9696,
      "throughput": 8.863393414467975,
      "update": 97,
      "cumulative_wall_time": 1077.777777777776
    },
    {
      "timestep": 9797,
      "throughput": 9.529485485836119,
      "update": 98,
      "cumulative_wall_time": 1088.888888888887
    },
    {
      "timestep": 9898,
      "throughput": 9.252892680961528,
      "update": 99,
      "cumulative_wall_time": 1099.9999999999982
    },
    {
      "timestep": 10000,
      "throughput": 8.439570432161466,
      "update": 100,
      "cumulative_wall_time": 1111.1111111111093
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 1500,
        "success_rate": 0.85,
        "mean_reward": 0.7608375549928545,
        "recent_gradient": 0.009013998130682335
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.5732127048611159,
        "recent_gradient": 0.02169920419404205
      },
      "level_3": {
        "num_pulls": 2500,
        "success_rate": 0.45,
        "mean_reward": 0.412140309719301,
        "recent_gradient": 0.028614180809478692
      },
      "level_4": {
        "num_pulls": 2500,
        "success_rate": 0.28,
        "mean_reward": 0.2699919975086651,
        "recent_gradient": 0.02061459904175322
      },
      "level_5": {
        "num_pulls": 1500,
        "success_rate": 0.15,
        "mean_reward": 0.1512572423767792,
        "recent_gradient": 0.011259257683847225
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.5855024945389635
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.719909479901515
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.373646802561631
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.3051851327167325
      }
    }
  },
  "config": {
    "use_async": false,
    "curriculum_strategy": "fixed"
  }
}