{
  "experiment_name": "sync_curriculum_seed456",
  "total_timesteps": 10000,
  "total_time": 1111.111111111111,
  "avg_throughput": 9,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.5703496647219384,
      "difficulty_2_ratio": 0.34593455841067655,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.006336012450983674,
      "difficulty_5_ratio": 0.00019133099735093797
    },
    {
      "timestep": 101,
      "pass_at_1": 0.02348262751661985,
      "avg_reward": 0.04722071440730431,
      "difficulty_1_ratio": 0.545817584309558,
      "difficulty_2_ratio": 0.3592137008263376,
      "difficulty_3_ratio": 0.0869688606806755,
      "difficulty_4_ratio": 0.007746048051242527,
      "difficulty_5_ratio": 0.00025380613218624814
    },
    {
      "timestep": 202,
      "pass_at_1": 0.04923241184774102,
      "avg_reward": 0.12086535611789308,
      "difficulty_1_ratio": 0.5207065136269264,
      "difficulty_2_ratio": 0.3718356202546844,
      "difficulty_3_ratio": 0.09768198799373931,
      "difficulty_4_ratio": 0.009440250235689705,
      "difficulty_5_ratio": 0.00033562788896017117
    },
    {
      "timestep": 303,
      "pass_at_1": 0.03937265756944244,
      "avg_reward": 0.05397228488857338,
      "difficulty_1_ratio": 0.4951092343136047,
      "difficulty_2_ratio": 0.38362916613190773,
      "difficulty_3_ratio": 0.10935225097641152,
      "difficulty_4_ratio": 0.011466987914927423,
      "difficulty_5_ratio": 0.00044236066314863343
    },
    {
      "timestep": 404,
      "pass_at_1": 0.03752822210509249,
      "avg_reward": 0.014261036198458754,
      "difficulty_1_ratio": 0.469130336180388,
      "difficulty_2_ratio": 0.3944179935925989,
      "difficulty_3_ratio": 0.12199033943415045,
      "difficulty_4_ratio": 0.013880326375356456,
      "difficulty_5_ratio": 0.0005810044175062076
    },
    {
      "timestep": 505,
      "pass_at_1": 0.07459880555815715,
      "avg_reward": 0.0031674826133226003,
      "difficulty_1_ratio": 0.4428854101147015,
      "difficulty_2_ratio": 0.40402402094501866,
      "difficulty_3_ratio": 0.13559026749360029,
      "difficulty_4_ratio": 0.0167399966441195,
      "difficulty_5_ratio": 0.0007603048025599198
    },
    {
      "timestep": 606,
      "pass_at_1": 0.09639751631258278,
      "avg_reward": 0.08901056851008081,
      "difficulty_1_ratio": 0.4164998456831705,
      "difficulty_2_ratio": 0.41227145735706794,
      "difficulty_3_ratio": 0.15012644832783253,
      "difficulty_4_ratio": 0.02011113911124073,
      "difficulty_5_ratio": 0.0009911095206882054
    },
    {
      "timestep": 707,
      "pass_at_1": 0.11593440508736777,
      "avg_reward": 0.1899826437305998,
      "difficulty_1_ratio": 0.390107224895361,
      "difficulty_2_ratio": 0.4189913219593774,
      "difficulty_3_ratio": 0.1655509131479823,
      "difficulty_4_ratio": 0.024063769070528613,
      "difficulty_5_ratio": 0.0012867709267507749
    },
    {
      "timestep": 808,
      "pass_at_1": 0.16463926901033826,
      "avg_reward": 0.17772883300022746,
      "difficulty_1_ratio": 0.3638473227132847,
      "difficulty_2_ratio": 0.42402633368046766,
      "difficulty_3_ratio": 0.18179083819928793,
      "difficulty_4_ratio": 0.028671913216506643,
      "difficulty_5_ratio": 0.0016635921904528722
    },
    {
      "timestep": 909,
      "pass_at_1": 0.1490283361602705,
      "avg_reward": 0.17710027082666813,
      "difficulty_1_ratio": 0.337863746670805,
      "difficulty_2_ratio": 0.4272360092470168,
      "difficulty_3_ratio": 0.19874656153923254,
      "difficulty_4_ratio": 0.03401237165049899,
      "difficulty_5_ratio": 0.0021413108924466314
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.13223623241955818,
      "avg_reward": 0.10135140420386865,
      "difficulty_1_ratio": 0.31230127114431194,
      "difficulty_2_ratio": 0.4285017684753959,
      "difficulty_3_ratio": 0.21629028030484038,
      "difficulty_4_ratio": 0.04016307038955698,
      "difficulty_5_ratio": 0.0027436096858948753
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.1190754573558436,
      "avg_reward": 0.07605734127020221,
      "difficulty_1_ratio": 0.2873029447333821,
      "difficulty_2_ratio": 0.4277318152433385,
      "difficulty_3_ratio": 0.23426561605703436,
      "difficulty_4_ratio": 0.04720098526509968,
      "difficulty_5_ratio": 0.0034986387011453407
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.1655313403982423,
      "avg_reward": 0.13924366331993732,
      "difficulty_1_ratio": 0.2630070699260558,
      "difficulty_2_ratio": 0.4248655434002136,
      "difficulty_3_ratio": 0.2524882182255638,
      "difficulty_4_ratio": 0.05519963957750222,
      "difficulty_5_ratio": 0.004439528870664513
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.13970662310492712,
      "avg_reward": 0.09671102413021448,
      "difficulty_1_ratio": 0.23954417068994155,
      "difficulty_2_ratio": 0.41987721294759744,
      "difficulty_3_ratio": 0.2707475422306048,
      "difficulty_4_ratio": 0.06422620455155005,
      "difficulty_5_ratio": 0.005604869580306165
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.15359189101924928,
      "avg_reward": 0.17995525479883026,
      "difficulty_1_ratio": 0.21703407392185683,
      "difficulty_2_ratio": 0.412778655730858,
      "difficulty_3_ratio": 0.2888098894295048,
      "difficulty_4_ratio": 0.07433826251589389,
      "difficulty_5_ratio": 0.0070391184018864465
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.12972250803660393,
      "avg_reward": 0.09005896160882831,
      "difficulty_1_ratio": 0.1955832332539105,
      "difficulty_2_ratio": 0.4036208028084852,
      "difficulty_3_ratio": 0.3064227321494006,
      "difficulty_4_ratio": 0.08558032615731795,
      "difficulty_5_ratio": 0.008792905630886071
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.17776277945915647,
      "avg_reward": 0.07021582036971169,
      "difficulty_1_ratio": 0.17528241761460614,
      "difficulty_2_ratio": 0.39249387697759325,
      "difficulty_3_ratio": 0.3233202719632032,
      "difficulty_4_ratio": 0.09798024091278032,
      "difficulty_5_ratio": 0.010923192531817163
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.19159219656765153,
      "avg_reward": 0.11161850578325241,
      "difficulty_1_ratio": 0.15620487203762,
      "difficulty_2_ratio": 0.3795261610306469,
      "difficulty_3_ratio": 0.3392300979084394,
      "difficulty_4_ratio": 0.11154562879642933,
      "difficulty_5_ratio": 0.013493240226864338
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.1832076955947182,
      "avg_reward": 0.15088348364973195,
      "difficulty_1_ratio": 0.13840503524267814,
      "difficulty_2_ratio": 0.36488133073132456,
      "difficulty_3_ratio": 0.3538807296736819,
      "difficulty_4_ratio": 0.12626055765373156,
      "difficulty_5_ratio": 0.016572346698583963
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.1816804268870372,
      "avg_reward": 0.08471921342469274,
      "difficulty_1_ratio": 0.12191786908589192,
      "difficulty_2_ratio": 0.3487544252621549,
      "difficulty_3_ratio": 0.36700975575577915,
      "difficulty_4_ratio": 0.1420826368959247,
      "difficulty_5_ratio": 0.02023531300024945
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.181837754147497,
      "avg_reward": 0.12752618899238494,
      "difficulty_1_ratio": 0.10675882140395278,
      "difficulty_2_ratio": 0.33136661015926444,
      "difficulty_3_ratio": 0.37837221513402225,
      "difficulty_4_ratio": 0.158940746377412,
      "difficulty_5_ratio": 0.02456160692534847
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.20834773964280265,
      "avg_reward": 0.13962400014388254,
      "difficulty_1_ratio": 0.09292440882580433,
      "difficulty_2_ratio": 0.3129589615253456,
      "difficulty_3_ratio": 0.38774882932075583,
      "difficulty_4_ratio": 0.1767335970180918,
      "difficulty_5_ratio": 0.02963420331000244
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.18909849976997406,
      "avg_reward": 0.13671561545374966,
      "difficulty_1_ratio": 0.08039337269830067,
      "difficulty_2_ratio": 0.29378555928253614,
      "difficulty_3_ratio": 0.3949536745312958,
      "difficulty_4_ratio": 0.19532929872471466,
      "difficulty_5_ratio": 0.03553809476315268
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.20216426338779225,
      "avg_reward": 0.22181295500608247,
      "difficulty_1_ratio": 0.0691283320657602,
      "difficulty_2_ratio": 0.2741062164565189,
      "difficulty_3_ratio": 0.39984089400061734,
      "difficulty_4_ratio": 0.21456607296103805,
      "difficulty_5_ratio": 0.04235848451606555
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.1998126597844999,
      "avg_reward": 0.18212172897485013,
      "difficulty_1_ratio": 0.05907783484757915,
      "difficulty_2_ratio": 0.2541791879471294,
      "difficulty_3_ratio": 0.40231008867116286,
      "difficulty_4_ratio": 0.23425419509772658,
      "difficulty_5_ratio": 0.05017869343640206
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.18403102249781314,
      "avg_reward": 0.15058144602846146,
      "difficulty_1_ratio": 0.050178693436402015,
      "difficulty_2_ratio": 0.2342541950977265,
      "difficulty_3_ratio": 0.40231008867116286,
      "difficulty_4_ratio": 0.2541791879471295,
      "difficulty_5_ratio": 0.059077834847579204
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.18560245163281147,
      "avg_reward": 0.10364112340993728,
      "difficulty_1_ratio": 0.04235848451606552,
      "difficulty_2_ratio": 0.21456607296103797,
      "difficulty_3_ratio": 0.3998408940006174,
      "difficulty_4_ratio": 0.274106216456519,
      "difficulty_5_ratio": 0.06912833206576029
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.24007488453765863,
      "avg_reward": 0.18809616806834584,
      "difficulty_1_ratio": 0.03553809476315264,
      "difficulty_2_ratio": 0.1953292987247146,
      "difficulty_3_ratio": 0.3949536745312958,
      "difficulty_4_ratio": 0.2937855592825363,
      "difficulty_5_ratio": 0.08039337269830077
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.20771695554346414,
      "avg_reward": 0.1668636878050614,
      "difficulty_1_ratio": 0.029634203310002414,
      "difficulty_2_ratio": 0.17673359701809171,
      "difficulty_3_ratio": 0.38774882932075583,
      "difficulty_4_ratio": 0.31295896152534575,
      "difficulty_5_ratio": 0.09292440882580441
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.19786736960307028,
      "avg_reward": 0.24460066550694734,
      "difficulty_1_ratio": 0.02456160692534847,
      "difficulty_2_ratio": 0.158940746377412,
      "difficulty_3_ratio": 0.37837221513402225,
      "difficulty_4_ratio": 0.33136661015926444,
      "difficulty_5_ratio": 0.10675882140395278
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.22137166558771798,
      "avg_reward": 0.18980760825363444,
      "difficulty_1_ratio": 0.020235313000249448,
      "difficulty_2_ratio": 0.14208263689592468,
      "difficulty_3_ratio": 0.3670097557557791,
      "difficulty_4_ratio": 0.34875442526215483,
      "difficulty_5_ratio": 0.12191786908589189
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.23127726239500102,
      "avg_reward": 0.18169422460712295,
      "difficulty_1_ratio": 0.016572346698583963,
      "difficulty_2_ratio": 0.12626055765373156,
      "difficulty_3_ratio": 0.35388072967368184,
      "difficulty_4_ratio": 0.3648813307313245,
      "difficulty_5_ratio": 0.13840503524267814
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.2217496238048055,
      "avg_reward": 0.16109302569701178,
      "difficulty_1_ratio": 0.013493240226864338,
      "difficulty_2_ratio": 0.11154562879642933,
      "difficulty_3_ratio": 0.3392300979084394,
      "difficulty_4_ratio": 0.3795261610306469,
      "difficulty_5_ratio": 0.15620487203762
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.26101270021037537,
      "avg_reward": 0.17712788698908602,
      "difficulty_1_ratio": 0.010923192531817153,
      "difficulty_2_ratio": 0.09798024091278025,
      "difficulty_3_ratio": 0.32332027196320307,
      "difficulty_4_ratio": 0.39249387697759325,
      "difficulty_5_ratio": 0.17528241761460625
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.250391285646469,
      "avg_reward": 0.2909965892281266,
      "difficulty_1_ratio": 0.00879290563088607,
      "difficulty_2_ratio": 0.08558032615731792,
      "difficulty_3_ratio": 0.3064227321494005,
      "difficulty_4_ratio": 0.40362080280848517,
      "difficulty_5_ratio": 0.19558323325391047
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.2602391511204672,
      "avg_reward": 0.16406918565702075,
      "difficulty_1_ratio": 0.007039118401886442,
      "difficulty_2_ratio": 0.07433826251589386,
      "difficulty_3_ratio": 0.2888098894295048,
      "difficulty_4_ratio": 0.41277865573085804,
      "difficulty_5_ratio": 0.21703407392185695
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.2872256879211826,
      "avg_reward": 0.27247746489856567,
      "difficulty_1_ratio": 0.00560486958030616,
      "difficulty_2_ratio": 0.06422620455155001,
      "difficulty_3_ratio": 0.2707475422306047,
      "difficulty_4_ratio": 0.41987721294759744,
      "difficulty_5_ratio": 0.2395441706899417
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.287251931340695,
      "avg_reward": 0.24438569379836006,
      "difficulty_1_ratio": 0.004439528870664501,
      "difficulty_2_ratio": 0.05519963957750214,
      "difficulty_3_ratio": 0.2524882182255636,
      "difficulty_4_ratio": 0.42486554340021365,
      "difficulty_5_ratio": 0.2630070699260561
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.2802622768586879,
      "avg_reward": 0.2934801692522314,
      "difficulty_1_ratio": 0.0034986387011453407,
      "difficulty_2_ratio": 0.04720098526509968,
      "difficulty_3_ratio": 0.23426561605703436,
      "difficulty_4_ratio": 0.4277318152433385,
      "difficulty_5_ratio": 0.2873029447333821
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.27588066901692027,
      "avg_reward": 0.2712232473355583,
      "difficulty_1_ratio": 0.0027436096858948753,
      "difficulty_2_ratio": 0.04016307038955698,
      "difficulty_3_ratio": 0.21629028030484038,
      "difficulty_4_ratio": 0.4285017684753959,
      "difficulty_5_ratio": 0.31230127114431194
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.29252785263435815,
      "avg_reward": 0.2743297863220583,
      "difficulty_1_ratio": 0.0021413108924466314,
      "difficulty_2_ratio": 0.03401237165049899,
      "difficulty_3_ratio": 0.19874656153923254,
      "difficulty_4_ratio": 0.4272360092470168,
      "difficulty_5_ratio": 0.337863746670805
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.2933574043482397,
      "avg_reward": 0.22233708996534216,
      "difficulty_1_ratio": 0.0016635921904528726,
      "difficulty_2_ratio": 0.02867191321650665,
      "difficulty_3_ratio": 0.18179083819928796,
      "difficulty_4_ratio": 0.42402633368046766,
      "difficulty_5_ratio": 0.3638473227132848
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.281982725059386,
      "avg_reward": 0.18250384423912686,
      "difficulty_1_ratio": 0.0012867709267507727,
      "difficulty_2_ratio": 0.02406376907052859,
      "difficulty_3_ratio": 0.16555091314798218,
      "difficulty_4_ratio": 0.41899132195937727,
      "difficulty_5_ratio": 0.3901072248953611
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.32563568204749793,
      "avg_reward": 0.22101245345187126,
      "difficulty_1_ratio": 0.0009911095206882065,
      "difficulty_2_ratio": 0.020111139111240753,
      "difficulty_3_ratio": 0.15012644832783265,
      "difficulty_4_ratio": 0.41227145735706805,
      "difficulty_5_ratio": 0.4164998456831704
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.3194696445678124,
      "avg_reward": 0.2412708178693534,
      "difficulty_1_ratio": 0.0007603048025599186,
      "difficulty_2_ratio": 0.01673999664411949,
      "difficulty_3_ratio": 0.1355902674936002,
      "difficulty_4_ratio": 0.40402402094501866,
      "difficulty_5_ratio": 0.44288541011470167
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.2985598453786472,
      "avg_reward": 0.29357010557482976,
      "difficulty_1_ratio": 0.0005810044175062084,
      "difficulty_2_ratio": 0.013880326375356472,
      "difficulty_3_ratio": 0.12199033943415054,
      "difficulty_4_ratio": 0.3944179935925989,
      "difficulty_5_ratio": 0.4691303361803878
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.351410234396386,
      "avg_reward": 0.18558216466902405,
      "difficulty_1_ratio": 0.00044236066314863197,
      "difficulty_2_ratio": 0.011466987914927403,
      "difficulty_3_ratio": 0.10935225097641141,
      "difficulty_4_ratio": 0.3836291661319077,
      "difficulty_5_ratio": 0.49510923431360493
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.3273062980495641,
      "avg_reward": 0.29315502220511047,
      "difficulty_1_ratio": 0.0003356278889601711,
      "difficulty_2_ratio": 0.009440250235689705,
      "difficulty_3_ratio": 0.09768198799373934,
      "difficulty_4_ratio": 0.3718356202546845,
      "difficulty_5_ratio": 0.5207065136269263
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.3317415846019194,
      "avg_reward": 0.3815252661104421,
      "difficulty_1_ratio": 0.00025380613218624744,
      "difficulty_2_ratio": 0.007746048051242511,
      "difficulty_3_ratio": 0.08696886068067541,
      "difficulty_4_ratio": 0.3592137008263375,
      "difficulty_5_ratio": 0.5458175843095583
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.38108252371106816,
      "avg_reward": 0.32470827337029085,
      "difficulty_1_ratio": 0.00019133099735093795,
      "difficulty_2_ratio": 0.006336012450983673,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.3459345584106765,
      "difficulty_5_ratio": 0.5703496647219383
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.3258523104740148,
      "avg_reward": 0.2180130061145187
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.3050752936873161,
      "avg_reward": 0.3027749919971785
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.33200596818273226,
      "avg_reward": 0.3001305471470981
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.37142583287781306,
      "avg_reward": 0.27353825198505727
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.34538141132002814,
      "avg_reward": 0.2727423551762648
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.36137453498085065,
      "avg_reward": 0.34297827639260653
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.4139225906290834,
      "avg_reward": 0.34874247840976164
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.3947104387080458,
      "avg_reward": 0.25803618210281215
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.4115299053640441,
      "avg_reward": 0.4578519092709691
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.3983159522943561,
      "avg_reward": 0.2784769648720461
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.38720233787820646,
      "avg_reward": 0.2601565080353388
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.3766855029815994,
      "avg_reward": 0.2672025364103293
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.422883051744022,
      "avg_reward": 0.31108156735242437
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.40858153643655315,
      "avg_reward": 0.29377721478322394
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.40342656509231417,
      "avg_reward": 0.2472924396134381
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.39037308788219177,
      "avg_reward": 0.3313965817314421
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.4201571931120556,
      "avg_reward": 0.36541481662701575
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.44781889988627116,
      "avg_reward": 0.4786997949334343
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.42358726825678616,
      "avg_reward": 0.2742157978662279
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.4308840944283878,
      "avg_reward": 0.43702739384604444
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.4174452367488783,
      "avg_reward": 0.2975313699464686
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.4329070590888518,
      "avg_reward": 0.36391860752099225
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.4620529129704223,
      "avg_reward": 0.41386540342143174
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.45472607910876156,
      "avg_reward": 0.2477558603210145
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.44365726688415585,
      "avg_reward": 0.3052858890767022
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.44687488125511615,
      "avg_reward": 0.32933427415208516
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.4506677043817729,
      "avg_reward": 0.4032128374931615
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.4526670888610497,
      "avg_reward": 0.27520943143873666
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.471945822272093,
      "avg_reward": 0.3367554927292204
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.45534723440913033,
      "avg_reward": 0.3487808795416862
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.441945444817889,
      "avg_reward": 0.2698704123975193
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.46933413120288675,
      "avg_reward": 0.4129344112828374
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.48842316815866826,
      "avg_reward": 0.24422966153358608
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.4654815578092525,
      "avg_reward": 0.40922092932219156
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.5164323634563549,
      "avg_reward": 0.4702950342362446
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.45355527768293974,
      "avg_reward": 0.3392680176520867
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.5044533382403235,
      "avg_reward": 0.3636136405204223
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.43915709199197683,
      "avg_reward": 0.3280070623410509
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.4856030028970267,
      "avg_reward": 0.40978911486727987
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.47711587023667,
      "avg_reward": 0.42078427310222755
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.4836563248519632,
      "avg_reward": 0.4158874563174536
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.4930867643515084,
      "avg_reward": 0.3035088195244661
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.4571834920439596,
      "avg_reward": 0.2709598654522586
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.5035615225311548,
      "avg_reward": 0.40469277457846997
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.477437862542462,
      "avg_reward": 0.4110159829435861
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.47896192601346554,
      "avg_reward": 0.29244456273232833
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.5041072904849093,
      "avg_reward": 0.4579016466833591
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.5173343279085374,
      "avg_reward": 0.3716962443395144
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.4705713357304069,
      "avg_reward": 0.3733629021109292
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5364636327797998,
      "avg_reward": 0.4786437173860394
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.5703496647219384,
      "difficulty_2_ratio": 0.34593455841067655,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.006336012450983674,
      "difficulty_5_ratio": 0.00019133099735093797
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5364636327797998,
      "avg_reward": 0.4786437173860394
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 4.5,
      "update": 1,
      "cumulative_wall_time": 11.11111111111111
    },
    {
      "timestep": 101,
      "throughput": 4.95,
      "update": 2,
      "cumulative_wall_time": 22.22222222222222
    },
    {
      "timestep": 202,
      "throughput": 5.3999999999999995,
      "update": 3,
      "cumulative_wall_time": 33.33333333333333
    },
    {
      "timestep": 303,
      "throughput": 5.8500000000000005,
      "update": 4,
      "cumulative_wall_time": 44.44444444444444
    },
    {
      "timestep": 404,
      "throughput": 6.3,
      "update": 5,
      "cumulative_wall_time": 55.55555555555556
    },
    {
      "timestep": 505,
      "throughput": 6.75,
      "update": 6,
      "cumulative_wall_time": 66.66666666666667
    },
    {
      "timestep": 606,
      "throughput": 7.2,
      "update": 7,
      "cumulative_wall_time": 77.77777777777779
    },
    {
      "timestep": 707,
      "throughput": 7.6499999999999995,
      "update": 8,
      "cumulative_wall_time": 88.8888888888889
    },
    {
      "timestep": 808,
      "throughput": 8.1,
      "update": 9,
      "cumulative_wall_time": 100.00000000000001
    },
    {
      "timestep": 909,
      "throughput": 8.549999999999999,
      "update": 10,
      "cumulative_wall_time": 111.11111111111113
    },
    {
      "timestep": 1010,
      "throughput": 9.458166074168386,
      "update": 11,
      "cumulative_wall_time": 122.22222222222224
    },
    {
      "timestep": 1111,
      "throughput": 8.19349619516126,
      "update": 12,
      "cumulative_wall_time": 133.33333333333334
    },
    {
      "timestep": 1212,
      "throughput": 7.949628842952026,
      "update": 13,
      "cumulative_wall_time": 144.44444444444446
    },
    {
      "timestep": 1313,
      "throughput": 9.619867034111556,
      "update": 14,
      "cumulative_wall_time": 155.55555555555557
    },
    {
      "timestep": 1414,
      "throughput": 7.7051680243870155,
      "update": 15,
      "cumulative_wall_time": 166.66666666666669
    },
    {
      "timestep": 1515,
      "throughput": 10.769362443982445,
      "update": 16,
      "cumulative_wall_time": 177.7777777777778
    },
    {
      "timestep": 1616,
      "throughput": 9.824452465261905,
      "update": 17,
      "cumulative_wall_time": 188.8888888888889
    },
    {
      "timestep": 1717,
      "throughput": 8.180688793514411,
      "update": 18,
      "cumulative_wall_time": 200.00000000000003
    },
    {
      "timestep": 1818,
      "throughput": 8.901993958205686,
      "update": 19,
      "cumulative_wall_time": 211.11111111111114
    },
    {
      "timestep": 1919,
      "throughput": 7.566197521560534,
      "update": 20,
      "cumulative_wall_time": 222.22222222222226
    },
    {
      "timestep": 2020,
      "throughput": 8.704994841568393,
      "update": 21,
      "cumulative_wall_time": 233.33333333333337
    },
    {
      "timestep": 2121,
      "throughput": 10.128506388784302,
      "update": 22,
      "cumulative_wall_time": 244.44444444444449
    },
    {
      "timestep": 2222,
      "throughput": 10.661965133870277,
      "update": 23,
      "cumulative_wall_time": 255.5555555555556
    },
    {
      "timestep": 2323,
      "throughput": 9.61819647326678,
      "update": 24,
      "cumulative_wall_time": 266.6666666666667
    },
    {
      "timestep": 2424,
      "throughput": 6.871757289980189,
      "update": 25,
      "cumulative_wall_time": 277.77777777777777
    },
    {
      "timestep": 2525,
      "throughput": 9.437195666968318,
      "update": 26,
      "cumulative_wall_time": 288.88888888888886
    },
    {
      "timestep": 2626,
      "throughput": 9.442877961589863,
      "update": 27,
      "cumulative_wall_time": 299.99999999999994
    },
    {
      "timestep": 2727,
      "throughput": 8.620838119125466,
      "update": 28,
      "cumulative_wall_time": 311.11111111111103
    },
    {
      "timestep": 2828,
      "throughput": 9.817948963225726,
      "update": 29,
      "cumulative_wall_time": 322.2222222222221
    },
    {
      "timestep": 2929,
      "throughput": 7.938096185794429,
      "update": 30,
      "cumulative_wall_time": 333.3333333333332
    },
    {
      "timestep": 3030,
      "throughput": 9.600592617653694,
      "update": 31,
      "cumulative_wall_time": 344.4444444444443
    },
    {
      "timestep": 3131,
      "throughput": 8.894832371142655,
      "update": 32,
      "cumulative_wall_time": 355.5555555555554
    },
    {
      "timestep": 3232,
      "throughput": 9.46118096491869,
      "update": 33,
      "cumulative_wall_time": 366.66666666666646
    },
    {
      "timestep": 3333,
      "throughput": 11.106858671092665,
      "update": 34,
      "cumulative_wall_time": 377.77777777777754
    },
    {
      "timestep": 3434,
      "throughput": 9.311128688389227,
      "update": 35,
      "cumulative_wall_time": 388.88888888888863
    },
    {
      "timestep": 3535,
      "throughput": 8.572218231484321,
      "update": 36,
      "cumulative_wall_time": 399.9999999999997
    },
    {
      "timestep": 3636,
      "throughput": 8.173278629056462,
      "update": 37,
      "cumulative_wall_time": 411.1111111111108
    },
    {
      "timestep": 3737,
      "throughput": 8.753203269020961,
      "update": 38,
      "cumulative_wall_time": 422.2222222222219
    },
    {
      "timestep": 3838,
      "throughput": 9.017246385877806,
      "update": 39,
      "cumulative_wall_time": 433.333333333333
    },
    {
      "timestep": 3939,
      "throughput": 8.498960296372195,
      "update": 40,
      "cumulative_wall_time": 444.44444444444406
    },
    {
      "timestep": 4040,
      "throughput": 10.744576412121685,
      "update": 41,
      "cumulative_wall_time": 455.55555555555515
    },
    {
      "timestep": 4141,
      "throughput": 9.517654720118726,
      "update": 42,
      "cumulative_wall_time": 466.66666666666623
    },
    {
      "timestep": 4242,
      "throughput": 8.643397237087534,
      "update": 43,
      "cumulative_wall_time": 477.7777777777773
    },
    {
      "timestep": 4343,
      "throughput": 10.270278797437852,
      "update": 44,
      "cumulative_wall_time": 488.8888888888884
    },
    {
      "timestep": 4444,
      "throughput": 7.502140723567295,
      "update": 45,
      "cumulative_wall_time": 499.9999999999995
    },
    {
      "timestep": 4545,
      "throughput": 10.188965267561514,
      "update": 46,
      "cumulative_wall_time": 511.1111111111106
    },
    {
      "timestep": 4646,
      "throughput": 10.135410323330458,
      "update": 47,
      "cumulative_wall_time": 522.2222222222217
    },
    {
      "timestep": 4747,
      "throughput": 10.848581561408611,
      "update": 48,
      "cumulative_wall_time": 533.3333333333328
    },
    {
      "timestep": 4848,
      "throughput": 9.174536475181482,
      "update": 49,
      "cumulative_wall_time": 544.4444444444439
    },
    {
      "timestep": 4949,
      "throughput": 10.014610963099742,
      "update": 50,
      "cumulative_wall_time": 555.555555555555
    },
    {
      "timestep": 5050,
      "throughput": 9.424457662696945,
      "update": 51,
      "cumulative_wall_time": 566.6666666666661
    },
    {
      "timestep": 5151,
      "throughput": 9.557865494048263,
      "update": 52,
      "cumulative_wall_time": 577.7777777777771
    },
    {
      "timestep": 5252,
      "throughput": 8.102230860634144,
      "update": 53,
      "cumulative_wall_time": 588.8888888888882
    },
    {
      "timestep": 5353,
      "throughput": 10.354610495977763,
      "update": 54,
      "cumulative_wall_time": 599.9999999999993
    },
    {
      "timestep": 5454,
      "throughput": 9.306994279191434,
      "update": 55,
      "cumulative_wall_time": 611.1111111111104
    },
    {
      "timestep": 5555,
      "throughput": 7.86723874363094,
      "update": 56,
      "cumulative_wall_time": 622.2222222222215
    },
    {
      "timestep": 5656,
      "throughput": 8.906180426515359,
      "update": 57,
      "cumulative_wall_time": 633.3333333333326
    },
    {
      "timestep": 5757,
      "throughput": 7.302348992226713,
      "update": 58,
      "cumulative_wall_time": 644.4444444444437
    },
    {
      "timestep": 5858,
      "throughput": 7.419554460310852,
      "update": 59,
      "cumulative_wall_time": 655.5555555555547
    },
    {
      "timestep": 5959,
      "throughput": 8.146555360785705,
      "update": 60,
      "cumulative_wall_time": 666.6666666666658
    },
    {
      "timestep": 6060,
      "throughput": 9.652310826342775,
      "update": 61,
      "cumulative_wall_time": 677.7777777777769
    },
    {
      "timestep": 6161,
      "throughput": 10.16801237542276,
      "update": 62,
      "cumulative_wall_time": 688.888888888888
    },
    {
      "timestep": 6262,
      "throughput": 8.216827093704147,
      "update": 63,
      "cumulative_wall_time": 699.9999999999991
    },
    {
      "timestep": 6363,
      "throughput": 8.67427369027643,
      "update": 64,
      "cumulative_wall_time": 711.1111111111102
    },
    {
      "timestep": 6464,
      "throughput": 9.172469033780747,
      "update": 65,
      "cumulative_wall_time": 722.2222222222213
    },
    {
      "timestep": 6565,
      "throughput": 8.940237402670055,
      "update": 66,
      "cumulative_wall_time": 733.3333333333323
    },
    {
      "timestep": 6666,
      "throughput": 9.17654920595371,
      "update": 67,
      "cumulative_wall_time": 744.4444444444434
    },
    {
      "timestep": 6767,
      "throughput": 7.906449964687578,
      "update": 68,
      "cumulative_wall_time": 755.5555555555545
    },
    {
      "timestep": 6868,
      "throughput": 9.492945856044365,
      "update": 69,
      "cumulative_wall_time": 766.6666666666656
    },
    {
      "timestep": 6969,
      "throughput": 8.81220195005616,
      "update": 70,
      "cumulative_wall_time": 777.7777777777767
    },
    {
      "timestep": 7070,
      "throughput": 8.58933374280677,
      "update": 71,
      "cumulative_wall_time": 788.8888888888878
    },
    {
      "timestep": 7171,
      "throughput": 9.568906777993396,
      "update": 72,
      "cumulative_wall_time": 799.9999999999989
    },
    {
      "timestep": 7272,
      "throughput": 9.232899458959334,
      "update": 73,
      "cumulative_wall_time": 811.11111111111
    },
    {
      "timestep": 7373,
      "throughput": 9.413921130174726,
      "update": 74,
      "cumulative_wall_time": 822.222222222221
    },
    {
      "timestep": 7474,
      "throughput": 8.836592022614603,
      "update": 75,
      "cumulative_wall_time": 833.3333333333321
    },
    {
      "timestep": 7575,
      "throughput": 10.329702270116849,
      "update": 76,
      "cumulative_wall_time": 844.4444444444432
    },
    {
      "timestep": 7676,
      "throughput": 8.704340759341383,
      "update": 77,
      "cumulative_wall_time": 855.5555555555543
    },
    {
      "timestep": 7777,
      "throughput": 10.241495370027996,
      "update": 78,
      "cumulative_wall_time": 866.6666666666654
    },
    {
      "timestep": 7878,
      "throughput": 8.725072746939372,
      "update": 79,
      "cumulative_wall_time": 877.7777777777765
    },
    {
      "timestep": 7979,
      "throughput": 9.610843282124044,
      "update": 80,
      "cumulative_wall_time": 888.8888888888875
    },
    {
      "timestep": 8080,
      "throughput": 8.080048703188222,
      "update": 81,
      "cumulative_wall_time": 899.9999999999986
    },
    {
      "timestep": 8181,
      "throughput": 7.316265271507338,
      "update": 82,
      "cumulative_wall_time": 911.1111111111097
    },
    {
      "timestep": 8282,
      "throughput": 9.866175664984715,
      "update": 83,
      "cumulative_wall_time": 922.2222222222208
    },
    {
      "timestep": 8383,
      "throughput": 8.620867487714225,
      "update": 84,
      "cumulative_wall_time": 933.3333333333319
    },
    {
      "timestep": 8484,
      "throughput": 9.725982414990678,
      "update": 85,
      "cumulative_wall_time": 944.444444444443
    },
    {
      "timestep": 8585,
      "throughput": 10.242482043417962,
      "update": 86,
      "cumulative_wall_time": 955.5555555555541
    },
    {
      "timestep": 8686,
      "throughput": 8.32666364423022,
      "update": 87,
      "cumulative_wall_time": 966.6666666666652
    },
    {
      "timestep": 8787,
      "throughput": 8.452146762608734,
      "update": 88,
      "cumulative_wall_time": 977.7777777777762
    },
    {
      "timestep": 8888,
      "throughput": 9.12431004147869,
      "update": 89,
      "cumulative_wall_time": 988.8888888888873
    },
    {
      "timestep": 8989,
      "throughput": 8.78057653600994,
      "update": 90,
      "cumulative_wall_time": 999.9999999999984
    },
    {
      "timestep": 9090,
      "throughput": 9.09701008509604,
      "update": 91,
      "cumulative_wall_time": 1011.1111111111095
    },
    {
      "timestep": 9191,
      "throughput": 9.831075959420293,
      "update": 92,
      "cumulative_wall_time": 1022.2222222222206
    },
    {
      "timestep": 9292,
      "throughput": 8.135635651962339,
      "update": 93,
      "cumulative_wall_time": 1033.3333333333317
    },
    {
      "timestep": 9393,
      "throughput": 8.909201458037742,
      "update": 94,
      "cumulative_wall_time": 1044.4444444444428
    },
    {
      "timestep": 9494,
      "throughput": 10.120516836641407,
      "update": 95,
      "cumulative_wall_time": 1055.5555555555538
    },
    {
      "timestep": 9595,
      "throughput": 9.830590592402872,
      "update": 96,
      "cumulative_wall_time": 1066.666666666665
    },
    {
      "timestep": 9696,
      "throughput": 9.860366010868873,
      "update": 97,
      "cumulative_wall_time": 1077.777777777776
    },
    {
      "timestep": 9797,
      "throughput": 8.421294134918318,
      "update": 98,
      "cumulative_wall_time": 1088.888888888887
    },
    {
      "timestep": 9898,
      "throughput": 9.13817434311648,
      "update": 99,
      "cumulative_wall_time": 1099.9999999999982
    },
    {
      "timestep": 10000,
      "throughput": 9.499500715046606,
      "update": 100,
      "cumulative_wall_time": 1111.1111111111093
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 1500,
        "success_rate": 0.85,
        "mean_reward": 0.774535753066723,
        "recent_gradient": 0.00880228815501225
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6076855357527491,
        "recent_gradient": 0.021498278466352168
      },
      "level_3": {
        "num_pulls": 2500,
        "success_rate": 0.45,
        "mean_reward": 0.3831754599108145,
        "recent_gradient": 0.03149706388174175
      },
      "level_4": {
        "num_pulls": 2500,
        "success_rate": 0.28,
        "mean_reward": 0.28015326432172166,
        "recent_gradient": 0.019275276932362185
      },
      "level_5": {
        "num_pulls": 1500,
        "success_rate": 0.15,
        "mean_reward": 0.13334041455555007,
        "recent_gradient": 0.012821048819579189
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.269411344381984
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.280264511263108
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.37398672115195
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 4.826192872277722
      }
    }
  },
  "config": {
    "use_async": false,
    "curriculum_strategy": "fixed"
  }
}