{
  "experiment_name": "sync_curriculum_seed123",
  "total_timesteps": 10000,
  "total_time": 1111.111111111111,
  "avg_throughput": 9,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.5703496647219384,
      "difficulty_2_ratio": 0.34593455841067655,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.006336012450983674,
      "difficulty_5_ratio": 0.00019133099735093797
    },
    {
      "timestep": 101,
      "pass_at_1": 0.016770681072150954,
      "avg_reward": -0.06189819083818384,
      "difficulty_1_ratio": 0.545817584309558,
      "difficulty_2_ratio": 0.3592137008263376,
      "difficulty_3_ratio": 0.0869688606806755,
      "difficulty_4_ratio": 0.007746048051242527,
      "difficulty_5_ratio": 0.00025380613218624814
    },
    {
      "timestep": 202,
      "pass_at_1": 0.0106502171828515,
      "avg_reward": 0.09109200060113876,
      "difficulty_1_ratio": 0.5207065136269264,
      "difficulty_2_ratio": 0.3718356202546844,
      "difficulty_3_ratio": 0.09768198799373931,
      "difficulty_4_ratio": 0.009440250235689705,
      "difficulty_5_ratio": 0.00033562788896017117
    },
    {
      "timestep": 303,
      "pass_at_1": 0.0,
      "avg_reward": -0.021445631442808866,
      "difficulty_1_ratio": 0.4951092343136047,
      "difficulty_2_ratio": 0.38362916613190773,
      "difficulty_3_ratio": 0.10935225097641152,
      "difficulty_4_ratio": 0.011466987914927423,
      "difficulty_5_ratio": 0.00044236066314863343
    },
    {
      "timestep": 404,
      "pass_at_1": 0.06976316961855514,
      "avg_reward": 0.012473515581589024,
      "difficulty_1_ratio": 0.469130336180388,
      "difficulty_2_ratio": 0.3944179935925989,
      "difficulty_3_ratio": 0.12199033943415045,
      "difficulty_4_ratio": 0.013880326375356456,
      "difficulty_5_ratio": 0.0005810044175062076
    },
    {
      "timestep": 505,
      "pass_at_1": 0.10134050943549208,
      "avg_reward": 0.07633695910154913,
      "difficulty_1_ratio": 0.4428854101147015,
      "difficulty_2_ratio": 0.40402402094501866,
      "difficulty_3_ratio": 0.13559026749360029,
      "difficulty_4_ratio": 0.0167399966441195,
      "difficulty_5_ratio": 0.0007603048025599198
    },
    {
      "timestep": 606,
      "pass_at_1": 0.14846223014890725,
      "avg_reward": 0.08682468428489326,
      "difficulty_1_ratio": 0.4164998456831705,
      "difficulty_2_ratio": 0.41227145735706794,
      "difficulty_3_ratio": 0.15012644832783253,
      "difficulty_4_ratio": 0.02011113911124073,
      "difficulty_5_ratio": 0.0009911095206882054
    },
    {
      "timestep": 707,
      "pass_at_1": 0.11355735923230188,
      "avg_reward": 0.06912832360491564,
      "difficulty_1_ratio": 0.390107224895361,
      "difficulty_2_ratio": 0.4189913219593774,
      "difficulty_3_ratio": 0.1655509131479823,
      "difficulty_4_ratio": 0.024063769070528613,
      "difficulty_5_ratio": 0.0012867709267507749
    },
    {
      "timestep": 808,
      "pass_at_1": 0.17044435003181208,
      "avg_reward": 0.245694784474139,
      "difficulty_1_ratio": 0.3638473227132847,
      "difficulty_2_ratio": 0.42402633368046766,
      "difficulty_3_ratio": 0.18179083819928793,
      "difficulty_4_ratio": 0.028671913216506643,
      "difficulty_5_ratio": 0.0016635921904528722
    },
    {
      "timestep": 909,
      "pass_at_1": 0.15038144749347523,
      "avg_reward": 0.139614477953523,
      "difficulty_1_ratio": 0.337863746670805,
      "difficulty_2_ratio": 0.4272360092470168,
      "difficulty_3_ratio": 0.19874656153923254,
      "difficulty_4_ratio": 0.03401237165049899,
      "difficulty_5_ratio": 0.0021413108924466314
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.14910775806460144,
      "avg_reward": 0.19382280785922112,
      "difficulty_1_ratio": 0.31230127114431194,
      "difficulty_2_ratio": 0.4285017684753959,
      "difficulty_3_ratio": 0.21629028030484038,
      "difficulty_4_ratio": 0.04016307038955698,
      "difficulty_5_ratio": 0.0027436096858948753
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.11978848371057804,
      "avg_reward": 0.15462223920756762,
      "difficulty_1_ratio": 0.2873029447333821,
      "difficulty_2_ratio": 0.4277318152433385,
      "difficulty_3_ratio": 0.23426561605703436,
      "difficulty_4_ratio": 0.04720098526509968,
      "difficulty_5_ratio": 0.0034986387011453407
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.11765627333679067,
      "avg_reward": 0.06223744354676203,
      "difficulty_1_ratio": 0.2630070699260558,
      "difficulty_2_ratio": 0.4248655434002136,
      "difficulty_3_ratio": 0.2524882182255638,
      "difficulty_4_ratio": 0.05519963957750222,
      "difficulty_5_ratio": 0.004439528870664513
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.16518768811622583,
      "avg_reward": 0.06071611548168222,
      "difficulty_1_ratio": 0.23954417068994155,
      "difficulty_2_ratio": 0.41987721294759744,
      "difficulty_3_ratio": 0.2707475422306048,
      "difficulty_4_ratio": 0.06422620455155005,
      "difficulty_5_ratio": 0.005604869580306165
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.14863772318500362,
      "avg_reward": 0.07582243375501863,
      "difficulty_1_ratio": 0.21703407392185683,
      "difficulty_2_ratio": 0.412778655730858,
      "difficulty_3_ratio": 0.2888098894295048,
      "difficulty_4_ratio": 0.07433826251589389,
      "difficulty_5_ratio": 0.0070391184018864465
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.15080070312987126,
      "avg_reward": -0.0192888927691392,
      "difficulty_1_ratio": 0.1955832332539105,
      "difficulty_2_ratio": 0.4036208028084852,
      "difficulty_3_ratio": 0.3064227321494006,
      "difficulty_4_ratio": 0.08558032615731795,
      "difficulty_5_ratio": 0.008792905630886071
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.12503538154065233,
      "avg_reward": 0.06503444350262601,
      "difficulty_1_ratio": 0.17528241761460614,
      "difficulty_2_ratio": 0.39249387697759325,
      "difficulty_3_ratio": 0.3233202719632032,
      "difficulty_4_ratio": 0.09798024091278032,
      "difficulty_5_ratio": 0.010923192531817163
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.1836455008774001,
      "avg_reward": 0.1382346165624093,
      "difficulty_1_ratio": 0.15620487203762,
      "difficulty_2_ratio": 0.3795261610306469,
      "difficulty_3_ratio": 0.3392300979084394,
      "difficulty_4_ratio": 0.11154562879642933,
      "difficulty_5_ratio": 0.013493240226864338
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.16985874356663314,
      "avg_reward": 0.17029813040842076,
      "difficulty_1_ratio": 0.13840503524267814,
      "difficulty_2_ratio": 0.36488133073132456,
      "difficulty_3_ratio": 0.3538807296736819,
      "difficulty_4_ratio": 0.12626055765373156,
      "difficulty_5_ratio": 0.016572346698583963
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.15698995765778329,
      "avg_reward": 0.1397733323165912,
      "difficulty_1_ratio": 0.12191786908589192,
      "difficulty_2_ratio": 0.3487544252621549,
      "difficulty_3_ratio": 0.36700975575577915,
      "difficulty_4_ratio": 0.1420826368959247,
      "difficulty_5_ratio": 0.02023531300024945
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.1633232349109094,
      "avg_reward": 0.04427511322269714,
      "difficulty_1_ratio": 0.10675882140395278,
      "difficulty_2_ratio": 0.33136661015926444,
      "difficulty_3_ratio": 0.37837221513402225,
      "difficulty_4_ratio": 0.158940746377412,
      "difficulty_5_ratio": 0.02456160692534847
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.1765310214693564,
      "avg_reward": 0.16991511029573803,
      "difficulty_1_ratio": 0.09292440882580433,
      "difficulty_2_ratio": 0.3129589615253456,
      "difficulty_3_ratio": 0.38774882932075583,
      "difficulty_4_ratio": 0.1767335970180918,
      "difficulty_5_ratio": 0.02963420331000244
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.19610518838067056,
      "avg_reward": 0.15629262598059546,
      "difficulty_1_ratio": 0.08039337269830067,
      "difficulty_2_ratio": 0.29378555928253614,
      "difficulty_3_ratio": 0.3949536745312958,
      "difficulty_4_ratio": 0.19532929872471466,
      "difficulty_5_ratio": 0.03553809476315268
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.24222822719037382,
      "avg_reward": 0.214428189767738,
      "difficulty_1_ratio": 0.0691283320657602,
      "difficulty_2_ratio": 0.2741062164565189,
      "difficulty_3_ratio": 0.39984089400061734,
      "difficulty_4_ratio": 0.21456607296103805,
      "difficulty_5_ratio": 0.04235848451606555
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.2190632915690014,
      "avg_reward": 0.2871578001800988,
      "difficulty_1_ratio": 0.05907783484757915,
      "difficulty_2_ratio": 0.2541791879471294,
      "difficulty_3_ratio": 0.40231008867116286,
      "difficulty_4_ratio": 0.23425419509772658,
      "difficulty_5_ratio": 0.05017869343640206
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.17877148929992426,
      "avg_reward": 0.09107778092969174,
      "difficulty_1_ratio": 0.050178693436402015,
      "difficulty_2_ratio": 0.2342541950977265,
      "difficulty_3_ratio": 0.40231008867116286,
      "difficulty_4_ratio": 0.2541791879471295,
      "difficulty_5_ratio": 0.059077834847579204
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.24474571411799562,
      "avg_reward": 0.1558934345323434,
      "difficulty_1_ratio": 0.04235848451606552,
      "difficulty_2_ratio": 0.21456607296103797,
      "difficulty_3_ratio": 0.3998408940006174,
      "difficulty_4_ratio": 0.274106216456519,
      "difficulty_5_ratio": 0.06912833206576029
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.21573357456698505,
      "avg_reward": 0.2260526581248055,
      "difficulty_1_ratio": 0.03553809476315264,
      "difficulty_2_ratio": 0.1953292987247146,
      "difficulty_3_ratio": 0.3949536745312958,
      "difficulty_4_ratio": 0.2937855592825363,
      "difficulty_5_ratio": 0.08039337269830077
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.2382690116828348,
      "avg_reward": 0.27835951844532336,
      "difficulty_1_ratio": 0.029634203310002414,
      "difficulty_2_ratio": 0.17673359701809171,
      "difficulty_3_ratio": 0.38774882932075583,
      "difficulty_4_ratio": 0.31295896152534575,
      "difficulty_5_ratio": 0.09292440882580441
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.2557255000809335,
      "avg_reward": 0.25805003355003364,
      "difficulty_1_ratio": 0.02456160692534847,
      "difficulty_2_ratio": 0.158940746377412,
      "difficulty_3_ratio": 0.37837221513402225,
      "difficulty_4_ratio": 0.33136661015926444,
      "difficulty_5_ratio": 0.10675882140395278
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.21575503089804346,
      "avg_reward": 0.21234715810809568,
      "difficulty_1_ratio": 0.020235313000249448,
      "difficulty_2_ratio": 0.14208263689592468,
      "difficulty_3_ratio": 0.3670097557557791,
      "difficulty_4_ratio": 0.34875442526215483,
      "difficulty_5_ratio": 0.12191786908589189
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.24292606137589706,
      "avg_reward": 0.12802757610369486,
      "difficulty_1_ratio": 0.016572346698583963,
      "difficulty_2_ratio": 0.12626055765373156,
      "difficulty_3_ratio": 0.35388072967368184,
      "difficulty_4_ratio": 0.3648813307313245,
      "difficulty_5_ratio": 0.13840503524267814
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.2704487119811966,
      "avg_reward": 0.25672079631388556,
      "difficulty_1_ratio": 0.013493240226864338,
      "difficulty_2_ratio": 0.11154562879642933,
      "difficulty_3_ratio": 0.3392300979084394,
      "difficulty_4_ratio": 0.3795261610306469,
      "difficulty_5_ratio": 0.15620487203762
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.24850110309075915,
      "avg_reward": 0.18714627942338666,
      "difficulty_1_ratio": 0.010923192531817153,
      "difficulty_2_ratio": 0.09798024091278025,
      "difficulty_3_ratio": 0.32332027196320307,
      "difficulty_4_ratio": 0.39249387697759325,
      "difficulty_5_ratio": 0.17528241761460625
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.2291359930014873,
      "avg_reward": 0.19328499807912147,
      "difficulty_1_ratio": 0.00879290563088607,
      "difficulty_2_ratio": 0.08558032615731792,
      "difficulty_3_ratio": 0.3064227321494005,
      "difficulty_4_ratio": 0.40362080280848517,
      "difficulty_5_ratio": 0.19558323325391047
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.2679992686623077,
      "avg_reward": 0.17284166571768222,
      "difficulty_1_ratio": 0.007039118401886442,
      "difficulty_2_ratio": 0.07433826251589386,
      "difficulty_3_ratio": 0.2888098894295048,
      "difficulty_4_ratio": 0.41277865573085804,
      "difficulty_5_ratio": 0.21703407392185695
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.2874163481921268,
      "avg_reward": 0.17507292622954973,
      "difficulty_1_ratio": 0.00560486958030616,
      "difficulty_2_ratio": 0.06422620455155001,
      "difficulty_3_ratio": 0.2707475422306047,
      "difficulty_4_ratio": 0.41987721294759744,
      "difficulty_5_ratio": 0.2395441706899417
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.2272608631134631,
      "avg_reward": 0.23379504503540555,
      "difficulty_1_ratio": 0.004439528870664501,
      "difficulty_2_ratio": 0.05519963957750214,
      "difficulty_3_ratio": 0.2524882182255636,
      "difficulty_4_ratio": 0.42486554340021365,
      "difficulty_5_ratio": 0.2630070699260561
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.2672104569212631,
      "avg_reward": 0.20746688627135976,
      "difficulty_1_ratio": 0.0034986387011453407,
      "difficulty_2_ratio": 0.04720098526509968,
      "difficulty_3_ratio": 0.23426561605703436,
      "difficulty_4_ratio": 0.4277318152433385,
      "difficulty_5_ratio": 0.2873029447333821
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.26408212412354815,
      "avg_reward": 0.13096756126296838,
      "difficulty_1_ratio": 0.0027436096858948753,
      "difficulty_2_ratio": 0.04016307038955698,
      "difficulty_3_ratio": 0.21629028030484038,
      "difficulty_4_ratio": 0.4285017684753959,
      "difficulty_5_ratio": 0.31230127114431194
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.31148712970138487,
      "avg_reward": 0.21474625456876184,
      "difficulty_1_ratio": 0.0021413108924466314,
      "difficulty_2_ratio": 0.03401237165049899,
      "difficulty_3_ratio": 0.19874656153923254,
      "difficulty_4_ratio": 0.4272360092470168,
      "difficulty_5_ratio": 0.337863746670805
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.3251420832373518,
      "avg_reward": 0.3004790759004179,
      "difficulty_1_ratio": 0.0016635921904528726,
      "difficulty_2_ratio": 0.02867191321650665,
      "difficulty_3_ratio": 0.18179083819928796,
      "difficulty_4_ratio": 0.42402633368046766,
      "difficulty_5_ratio": 0.3638473227132848
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.29115476452833744,
      "avg_reward": 0.17862869156632663,
      "difficulty_1_ratio": 0.0012867709267507727,
      "difficulty_2_ratio": 0.02406376907052859,
      "difficulty_3_ratio": 0.16555091314798218,
      "difficulty_4_ratio": 0.41899132195937727,
      "difficulty_5_ratio": 0.3901072248953611
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.2883093841403951,
      "avg_reward": 0.17002135075755762,
      "difficulty_1_ratio": 0.0009911095206882065,
      "difficulty_2_ratio": 0.020111139111240753,
      "difficulty_3_ratio": 0.15012644832783265,
      "difficulty_4_ratio": 0.41227145735706805,
      "difficulty_5_ratio": 0.4164998456831704
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.35018700837496686,
      "avg_reward": 0.28837166821146476,
      "difficulty_1_ratio": 0.0007603048025599186,
      "difficulty_2_ratio": 0.01673999664411949,
      "difficulty_3_ratio": 0.1355902674936002,
      "difficulty_4_ratio": 0.40402402094501866,
      "difficulty_5_ratio": 0.44288541011470167
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.3369080812257743,
      "avg_reward": 0.20615886253010807,
      "difficulty_1_ratio": 0.0005810044175062084,
      "difficulty_2_ratio": 0.013880326375356472,
      "difficulty_3_ratio": 0.12199033943415054,
      "difficulty_4_ratio": 0.3944179935925989,
      "difficulty_5_ratio": 0.4691303361803878
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.32295279079651673,
      "avg_reward": 0.31725532957764235,
      "difficulty_1_ratio": 0.00044236066314863197,
      "difficulty_2_ratio": 0.011466987914927403,
      "difficulty_3_ratio": 0.10935225097641141,
      "difficulty_4_ratio": 0.3836291661319077,
      "difficulty_5_ratio": 0.49510923431360493
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.31802475463375507,
      "avg_reward": 0.3059755266530912,
      "difficulty_1_ratio": 0.0003356278889601711,
      "difficulty_2_ratio": 0.009440250235689705,
      "difficulty_3_ratio": 0.09768198799373934,
      "difficulty_4_ratio": 0.3718356202546845,
      "difficulty_5_ratio": 0.5207065136269263
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.30838724280660795,
      "avg_reward": 0.17853621701435718,
      "difficulty_1_ratio": 0.00025380613218624744,
      "difficulty_2_ratio": 0.007746048051242511,
      "difficulty_3_ratio": 0.08696886068067541,
      "difficulty_4_ratio": 0.3592137008263375,
      "difficulty_5_ratio": 0.5458175843095583
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.34297710140440973,
      "avg_reward": 0.25542285939490017,
      "difficulty_1_ratio": 0.00019133099735093795,
      "difficulty_2_ratio": 0.006336012450983673,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.3459345584106765,
      "difficulty_5_ratio": 0.5703496647219383
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.3534937677200722,
      "avg_reward": 0.1839006176000353
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.3601110297342999,
      "avg_reward": 0.41800402015090565
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.3505322912010663,
      "avg_reward": 0.28213293940634515
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.359717576033566,
      "avg_reward": 0.19467527528726344
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.36969085285318903,
      "avg_reward": 0.215482195081753
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.3575922479816157,
      "avg_reward": 0.3482172758654794
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.3563532112628318,
      "avg_reward": 0.31014501848863546
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.39615521728232556,
      "avg_reward": 0.3308612166306605
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.3532530962864896,
      "avg_reward": 0.265978713261621
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.4245584195333936,
      "avg_reward": 0.23839444747684138
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.3844770374841988,
      "avg_reward": 0.27997622641295367
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.39695283573915163,
      "avg_reward": 0.3549730494506828
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.43117771816706985,
      "avg_reward": 0.331430554933198
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.4196361143417238,
      "avg_reward": 0.3606958987166377
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.4171796830922257,
      "avg_reward": 0.30554754989745697
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.39196667944343677,
      "avg_reward": 0.2585711879237146
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.40092069688873994,
      "avg_reward": 0.3368208863043033
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.4353199323588746,
      "avg_reward": 0.3644293882799445
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.4130878953590698,
      "avg_reward": 0.42076882178387964
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.45832445255312154,
      "avg_reward": 0.3489595564049886
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.4152724422417249,
      "avg_reward": 0.33872870150127843
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.4607946093458528,
      "avg_reward": 0.38527393633938817
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.45020080529550366,
      "avg_reward": 0.34955663812262167
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.45173020337908676,
      "avg_reward": 0.43861138527607635
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.4412603857282662,
      "avg_reward": 0.36017369520800663
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.4544934747598231,
      "avg_reward": 0.37778104759641035
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.42445766322638717,
      "avg_reward": 0.245722697787415
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.4354961603454899,
      "avg_reward": 0.35679404304647533
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.47007644853136704,
      "avg_reward": 0.34952743083641247
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.4895715936843908,
      "avg_reward": 0.3844984762312033
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.4653778400929494,
      "avg_reward": 0.36260407854672644
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.4705160733362397,
      "avg_reward": 0.41163656237117197
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.4839326240514834,
      "avg_reward": 0.34222495221070726
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.5037979768815343,
      "avg_reward": 0.34828705863388154
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.4775367058204775,
      "avg_reward": 0.3683095359802644
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.457523359986286,
      "avg_reward": 0.36226265859033724
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.4661628052601809,
      "avg_reward": 0.37657560637194737
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.49144288558687743,
      "avg_reward": 0.4667507769181655
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.49185851228462857,
      "avg_reward": 0.36292554281246164
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.4801370794765594,
      "avg_reward": 0.3911085688869757
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.49202776432221906,
      "avg_reward": 0.4666016748691963
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.5201865635129175,
      "avg_reward": 0.39820245449822095
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.48336098379404,
      "avg_reward": 0.2588360568318391
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.48534459677844477,
      "avg_reward": 0.33937279211854166
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.49115205459436506,
      "avg_reward": 0.41250085579299767
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.5036557978001631,
      "avg_reward": 0.4014262378877534
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.5059063807327144,
      "avg_reward": 0.398419215924622
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.5075987944023898,
      "avg_reward": 0.2445262851259462
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.4999586191833364,
      "avg_reward": 0.39442435929401876
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5001492229773872,
      "avg_reward": 0.3892220652767627
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.5703496647219384,
      "difficulty_2_ratio": 0.34593455841067655,
      "difficulty_3_ratio": 0.0771884334190506,
      "difficulty_4_ratio": 0.006336012450983674,
      "difficulty_5_ratio": 0.00019133099735093797
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5001492229773872,
      "avg_reward": 0.3892220652767627
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 4.5,
      "update": 1,
      "cumulative_wall_time": 11.11111111111111
    },
    {
      "timestep": 101,
      "throughput": 4.95,
      "update": 2,
      "cumulative_wall_time": 22.22222222222222
    },
    {
      "timestep": 202,
      "throughput": 5.3999999999999995,
      "update": 3,
      "cumulative_wall_time": 33.33333333333333
    },
    {
      "timestep": 303,
      "throughput": 5.8500000000000005,
      "update": 4,
      "cumulative_wall_time": 44.44444444444444
    },
    {
      "timestep": 404,
      "throughput": 6.3,
      "update": 5,
      "cumulative_wall_time": 55.55555555555556
    },
    {
      "timestep": 505,
      "throughput": 6.75,
      "update": 6,
      "cumulative_wall_time": 66.66666666666667
    },
    {
      "timestep": 606,
      "throughput": 7.2,
      "update": 7,
      "cumulative_wall_time": 77.77777777777779
    },
    {
      "timestep": 707,
      "throughput": 7.6499999999999995,
      "update": 8,
      "cumulative_wall_time": 88.8888888888889
    },
    {
      "timestep": 808,
      "throughput": 8.1,
      "update": 9,
      "cumulative_wall_time": 100.00000000000001
    },
    {
      "timestep": 909,
      "throughput": 8.549999999999999,
      "update": 10,
      "cumulative_wall_time": 111.11111111111113
    },
    {
      "timestep": 1010,
      "throughput": 9.632979106026058,
      "update": 11,
      "cumulative_wall_time": 122.22222222222224
    },
    {
      "timestep": 1111,
      "throughput": 8.461705201793256,
      "update": 12,
      "cumulative_wall_time": 133.33333333333334
    },
    {
      "timestep": 1212,
      "throughput": 10.980631889295417,
      "update": 13,
      "cumulative_wall_time": 144.44444444444446
    },
    {
      "timestep": 1313,
      "throughput": 9.61946723719988,
      "update": 14,
      "cumulative_wall_time": 155.55555555555557
    },
    {
      "timestep": 1414,
      "throughput": 8.994323474177515,
      "update": 15,
      "cumulative_wall_time": 166.66666666666669
    },
    {
      "timestep": 1515,
      "throughput": 8.81400392712219,
      "update": 16,
      "cumulative_wall_time": 177.7777777777778
    },
    {
      "timestep": 1616,
      "throughput": 8.92212994225608,
      "update": 17,
      "cumulative_wall_time": 188.8888888888889
    },
    {
      "timestep": 1717,
      "throughput": 8.176223637050418,
      "update": 18,
      "cumulative_wall_time": 200.00000000000003
    },
    {
      "timestep": 1818,
      "throughput": 8.914317714667792,
      "update": 19,
      "cumulative_wall_time": 211.11111111111114
    },
    {
      "timestep": 1919,
      "throughput": 9.250815165054348,
      "update": 20,
      "cumulative_wall_time": 222.22222222222226
    },
    {
      "timestep": 2020,
      "throughput": 9.521587454015906,
      "update": 21,
      "cumulative_wall_time": 233.33333333333337
    },
    {
      "timestep": 2121,
      "throughput": 9.5217208012299,
      "update": 22,
      "cumulative_wall_time": 244.44444444444449
    },
    {
      "timestep": 2222,
      "throughput": 8.752610208090658,
      "update": 23,
      "cumulative_wall_time": 255.5555555555556
    },
    {
      "timestep": 2323,
      "throughput": 7.725525972730262,
      "update": 24,
      "cumulative_wall_time": 266.6666666666667
    },
    {
      "timestep": 2424,
      "throughput": 8.3978076363899,
      "update": 25,
      "cumulative_wall_time": 277.77777777777777
    },
    {
      "timestep": 2525,
      "throughput": 10.45097373853115,
      "update": 26,
      "cumulative_wall_time": 288.88888888888886
    },
    {
      "timestep": 2626,
      "throughput": 9.806452482068954,
      "update": 27,
      "cumulative_wall_time": 299.99999999999994
    },
    {
      "timestep": 2727,
      "throughput": 9.332657627673758,
      "update": 28,
      "cumulative_wall_time": 311.11111111111103
    },
    {
      "timestep": 2828,
      "throughput": 8.314835179715889,
      "update": 29,
      "cumulative_wall_time": 322.2222222222221
    },
    {
      "timestep": 2929,
      "throughput": 9.0032806394764,
      "update": 30,
      "cumulative_wall_time": 333.3333333333332
    },
    {
      "timestep": 3030,
      "throughput": 7.869898182903766,
      "update": 31,
      "cumulative_wall_time": 344.4444444444443
    },
    {
      "timestep": 3131,
      "throughput": 8.503256811873534,
      "update": 32,
      "cumulative_wall_time": 355.5555555555554
    },
    {
      "timestep": 3232,
      "throughput": 8.779316992483324,
      "update": 33,
      "cumulative_wall_time": 366.66666666666646
    },
    {
      "timestep": 3333,
      "throughput": 8.674524061321309,
      "update": 34,
      "cumulative_wall_time": 377.77777777777754
    },
    {
      "timestep": 3434,
      "throughput": 9.86094173795041,
      "update": 35,
      "cumulative_wall_time": 388.88888888888863
    },
    {
      "timestep": 3535,
      "throughput": 7.723146677368093,
      "update": 36,
      "cumulative_wall_time": 399.9999999999997
    },
    {
      "timestep": 3636,
      "throughput": 8.22111095563636,
      "update": 37,
      "cumulative_wall_time": 411.1111111111108
    },
    {
      "timestep": 3737,
      "throughput": 7.762780826080003,
      "update": 38,
      "cumulative_wall_time": 422.2222222222219
    },
    {
      "timestep": 3838,
      "throughput": 7.886382108580931,
      "update": 39,
      "cumulative_wall_time": 433.333333333333
    },
    {
      "timestep": 3939,
      "throughput": 9.111650306801984,
      "update": 40,
      "cumulative_wall_time": 444.44444444444406
    },
    {
      "timestep": 4040,
      "throughput": 7.559603520249355,
      "update": 41,
      "cumulative_wall_time": 455.55555555555515
    },
    {
      "timestep": 4141,
      "throughput": 9.678481900953873,
      "update": 42,
      "cumulative_wall_time": 466.66666666666623
    },
    {
      "timestep": 4242,
      "throughput": 8.777865800753032,
      "update": 43,
      "cumulative_wall_time": 477.7777777777773
    },
    {
      "timestep": 4343,
      "throughput": 9.06190949927338,
      "update": 44,
      "cumulative_wall_time": 488.8888888888884
    },
    {
      "timestep": 4444,
      "throughput": 9.290319064197483,
      "update": 45,
      "cumulative_wall_time": 499.9999999999995
    },
    {
      "timestep": 4545,
      "throughput": 8.609250131773567,
      "update": 46,
      "cumulative_wall_time": 511.1111111111106
    },
    {
      "timestep": 4646,
      "throughput": 9.92923174417804,
      "update": 47,
      "cumulative_wall_time": 522.2222222222217
    },
    {
      "timestep": 4747,
      "throughput": 8.825091545945128,
      "update": 48,
      "cumulative_wall_time": 533.3333333333328
    },
    {
      "timestep": 4848,
      "throughput": 9.534663229715163,
      "update": 49,
      "cumulative_wall_time": 544.4444444444439
    },
    {
      "timestep": 4949,
      "throughput": 8.820798855518472,
      "update": 50,
      "cumulative_wall_time": 555.555555555555
    },
    {
      "timestep": 5050,
      "throughput": 9.261786948682431,
      "update": 51,
      "cumulative_wall_time": 566.6666666666661
    },
    {
      "timestep": 5151,
      "throughput": 9.251696403142164,
      "update": 52,
      "cumulative_wall_time": 577.7777777777771
    },
    {
      "timestep": 5252,
      "throughput": 9.224972945509979,
      "update": 53,
      "cumulative_wall_time": 588.8888888888882
    },
    {
      "timestep": 5353,
      "throughput": 8.123122935341172,
      "update": 54,
      "cumulative_wall_time": 599.9999999999993
    },
    {
      "timestep": 5454,
      "throughput": 9.392288193492696,
      "update": 55,
      "cumulative_wall_time": 611.1111111111104
    },
    {
      "timestep": 5555,
      "throughput": 8.712938709810365,
      "update": 56,
      "cumulative_wall_time": 622.2222222222215
    },
    {
      "timestep": 5656,
      "throughput": 9.567439227440925,
      "update": 57,
      "cumulative_wall_time": 633.3333333333326
    },
    {
      "timestep": 5757,
      "throughput": 7.062755900028926,
      "update": 58,
      "cumulative_wall_time": 644.4444444444437
    },
    {
      "timestep": 5858,
      "throughput": 7.681395400150544,
      "update": 59,
      "cumulative_wall_time": 655.5555555555547
    },
    {
      "timestep": 5959,
      "throughput": 9.327101005921527,
      "update": 60,
      "cumulative_wall_time": 666.6666666666658
    },
    {
      "timestep": 6060,
      "throughput": 10.676634826594707,
      "update": 61,
      "cumulative_wall_time": 677.7777777777769
    },
    {
      "timestep": 6161,
      "throughput": 9.751552872130112,
      "update": 62,
      "cumulative_wall_time": 688.888888888888
    },
    {
      "timestep": 6262,
      "throughput": 8.385794159220017,
      "update": 63,
      "cumulative_wall_time": 699.9999999999991
    },
    {
      "timestep": 6363,
      "throughput": 7.4771528261598394,
      "update": 64,
      "cumulative_wall_time": 711.1111111111102
    },
    {
      "timestep": 6464,
      "throughput": 9.668417599045457,
      "update": 65,
      "cumulative_wall_time": 722.2222222222213
    },
    {
      "timestep": 6565,
      "throughput": 8.927475100161345,
      "update": 66,
      "cumulative_wall_time": 733.3333333333323
    },
    {
      "timestep": 6666,
      "throughput": 9.531633796104947,
      "update": 67,
      "cumulative_wall_time": 744.4444444444434
    },
    {
      "timestep": 6767,
      "throughput": 9.103768849989711,
      "update": 68,
      "cumulative_wall_time": 755.5555555555545
    },
    {
      "timestep": 6868,
      "throughput": 9.026678632608444,
      "update": 69,
      "cumulative_wall_time": 766.6666666666656
    },
    {
      "timestep": 6969,
      "throughput": 11.662762901303859,
      "update": 70,
      "cumulative_wall_time": 777.7777777777767
    },
    {
      "timestep": 7070,
      "throughput": 8.994483035058979,
      "update": 71,
      "cumulative_wall_time": 788.8888888888878
    },
    {
      "timestep": 7171,
      "throughput": 8.856679311672062,
      "update": 72,
      "cumulative_wall_time": 799.9999999999989
    },
    {
      "timestep": 7272,
      "throughput": 8.89069619213638,
      "update": 73,
      "cumulative_wall_time": 811.11111111111
    },
    {
      "timestep": 7373,
      "throughput": 8.474816954963108,
      "update": 74,
      "cumulative_wall_time": 822.222222222221
    },
    {
      "timestep": 7474,
      "throughput": 9.89111960524378,
      "update": 75,
      "cumulative_wall_time": 833.3333333333321
    },
    {
      "timestep": 7575,
      "throughput": 8.681621099596786,
      "update": 76,
      "cumulative_wall_time": 844.4444444444432
    },
    {
      "timestep": 7676,
      "throughput": 9.57234843508013,
      "update": 77,
      "cumulative_wall_time": 855.5555555555543
    },
    {
      "timestep": 7777,
      "throughput": 9.256142726832202,
      "update": 78,
      "cumulative_wall_time": 866.6666666666654
    },
    {
      "timestep": 7878,
      "throughput": 10.097087275919185,
      "update": 79,
      "cumulative_wall_time": 877.7777777777765
    },
    {
      "timestep": 7979,
      "throughput": 9.378161637289525,
      "update": 80,
      "cumulative_wall_time": 888.8888888888875
    },
    {
      "timestep": 8080,
      "throughput": 7.907953697147118,
      "update": 81,
      "cumulative_wall_time": 899.9999999999986
    },
    {
      "timestep": 8181,
      "throughput": 7.806160993451454,
      "update": 82,
      "cumulative_wall_time": 911.1111111111097
    },
    {
      "timestep": 8282,
      "throughput": 10.267532231469211,
      "update": 83,
      "cumulative_wall_time": 922.2222222222208
    },
    {
      "timestep": 8383,
      "throughput": 8.452160277062003,
      "update": 84,
      "cumulative_wall_time": 933.3333333333319
    },
    {
      "timestep": 8484,
      "throughput": 7.811457678189313,
      "update": 85,
      "cumulative_wall_time": 944.444444444443
    },
    {
      "timestep": 8585,
      "throughput": 8.397343260117218,
      "update": 86,
      "cumulative_wall_time": 955.5555555555541
    },
    {
      "timestep": 8686,
      "throughput": 10.138162758271205,
      "update": 87,
      "cumulative_wall_time": 966.6666666666652
    },
    {
      "timestep": 8787,
      "throughput": 7.721808300946339,
      "update": 88,
      "cumulative_wall_time": 977.7777777777762
    },
    {
      "timestep": 8888,
      "throughput": 8.220154316616352,
      "update": 89,
      "cumulative_wall_time": 988.8888888888873
    },
    {
      "timestep": 8989,
      "throughput": 8.399873242083132,
      "update": 90,
      "cumulative_wall_time": 999.9999999999984
    },
    {
      "timestep": 9090,
      "throughput": 7.873929113874125,
      "update": 91,
      "cumulative_wall_time": 1011.1111111111095
    },
    {
      "timestep": 9191,
      "throughput": 7.934105395339502,
      "update": 92,
      "cumulative_wall_time": 1022.2222222222206
    },
    {
      "timestep": 9292,
      "throughput": 7.633702822262707,
      "update": 93,
      "cumulative_wall_time": 1033.3333333333317
    },
    {
      "timestep": 9393,
      "throughput": 8.58493132817695,
      "update": 94,
      "cumulative_wall_time": 1044.4444444444428
    },
    {
      "timestep": 9494,
      "throughput": 8.680582051433923,
      "update": 95,
      "cumulative_wall_time": 1055.5555555555538
    },
    {
      "timestep": 9595,
      "throughput": 8.385715661217025,
      "update": 96,
      "cumulative_wall_time": 1066.666666666665
    },
    {
      "timestep": 9696,
      "throughput": 7.511671944929122,
      "update": 97,
      "cumulative_wall_time": 1077.777777777776
    },
    {
      "timestep": 9797,
      "throughput": 10.128002352170396,
      "update": 98,
      "cumulative_wall_time": 1088.888888888887
    },
    {
      "timestep": 9898,
      "throughput": 7.803829053745055,
      "update": 99,
      "cumulative_wall_time": 1099.9999999999982
    },
    {
      "timestep": 10000,
      "throughput": 9.250230340820584,
      "update": 100,
      "cumulative_wall_time": 1111.1111111111093
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 1500,
        "success_rate": 0.85,
        "mean_reward": 0.7435046681376225,
        "recent_gradient": 0.011336633733483056
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6041166471033433,
        "recent_gradient": 0.01824477282674469
      },
      "level_3": {
        "num_pulls": 2500,
        "success_rate": 0.45,
        "mean_reward": 0.3665256854060575,
        "recent_gradient": 0.03139157463827921
      },
      "level_4": {
        "num_pulls": 2500,
        "success_rate": 0.28,
        "mean_reward": 0.28951601093427276,
        "recent_gradient": 0.02083138907978487
      },
      "level_5": {
        "num_pulls": 1500,
        "success_rate": 0.15,
        "mean_reward": 0.13821088842959436,
        "recent_gradient": 0.011639521219220378
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 5.382527422998509
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.585505583119495
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 4.670424344651676
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.305561775027956
      }
    }
  },
  "config": {
    "use_async": false,
    "curriculum_strategy": "fixed"
  }
}