{
  "experiment_name": "async_staleness_seed123",
  "total_timesteps": 10000,
  "total_time": 454.54545454545456,
  "avg_throughput": 22,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.015356539658009538,
      "avg_reward": -0.06302950396949697,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.007821934354568667,
      "avg_reward": 0.0888293743385125,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.0,
      "avg_reward": -0.021445631442808866,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.06410660396198947,
      "avg_reward": 0.007948263056336488,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.1319618328851947,
      "avg_reward": 0.10083401786131121,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.1779408818001168,
      "avg_reward": 0.11040760560586091,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.1418319845009276,
      "avg_reward": 0.09174802381981623,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.19745328643809756,
      "avg_reward": 0.26730193359916743,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.1760628513411191,
      "avg_reward": 0.1601596010316381,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.1733997372039804,
      "avg_reward": 0.21325639117072426,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.14262923605588324,
      "avg_reward": 0.17289484108381176,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.13898423074953808,
      "avg_reward": 0.07929980947695996,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.18494166520972874,
      "avg_reward": 0.07651929715648455,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.16675707054660263,
      "avg_reward": 0.09031791164429784,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.16722546440065142,
      "avg_reward": -0.006149083752515078,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.13970645373673213,
      "avg_reward": 0.07677130125948985,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.19650479728337616,
      "avg_reward": 0.14852205368719015,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.18084935848116174,
      "avg_reward": 0.17909062234004364,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.1660563322243386,
      "avg_reward": 0.14702643196983545,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.17041132322424624,
      "avg_reward": 0.049945583873366645,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.18158845611087987,
      "avg_reward": 0.1739610580089568,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.1990814445045048,
      "avg_reward": 0.15867363087966285,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.2430747842571201,
      "avg_reward": 0.21510543542113503,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.21773379180661695,
      "avg_reward": 0.28609420037019123,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.17522189196140142,
      "avg_reward": 0.08823810305887347,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.23893444460406382,
      "avg_reward": 0.15124441892119794,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.20762166748927138,
      "avg_reward": 0.21956313246263456,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.22782024695908282,
      "avg_reward": 0.27000050666632175,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.24290653117914554,
      "avg_reward": 0.24779485842860327,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.20053550438080223,
      "avg_reward": 0.2001715368943027,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.2252787269395251,
      "avg_reward": 0.11390970855459728,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.2503495222365827,
      "avg_reward": 0.2406414445181945,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.22592930239321893,
      "avg_reward": 0.16908883886535447,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.20407419470541555,
      "avg_reward": 0.1732355594422641,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.2404335202519514,
      "avg_reward": 0.15078906698939717,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.2573361838217902,
      "avg_reward": 0.15100879473328044,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.19465934317794584,
      "avg_reward": 0.2077138290869917,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.23208419436934388,
      "avg_reward": 0.17936587622982436,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.22643129732278508,
      "avg_reward": 0.10084689982235794,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.27131548176027753,
      "avg_reward": 0.18260893621587596,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.28245690778981775,
      "avg_reward": 0.2663309355423906,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.24596687808430898,
      "avg_reward": 0.14247838241110386,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.24063308520393192,
      "avg_reward": 0.13188031160838706,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.3000400236264481,
      "avg_reward": 0.24825408041264974,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.28431149915633697,
      "avg_reward": 0.1640815968745582,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.26793098326989284,
      "avg_reward": 0.2732378835563432,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.2606052869320364,
      "avg_reward": 0.26003995249171624,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.2486007727913557,
      "avg_reward": 0.13070704100215536,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.2808572684921577,
      "avg_reward": 0.20572699306509856,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.2890770724309974,
      "avg_reward": 0.13236726136877547
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.29343670462414023,
      "avg_reward": 0.3646645600627779
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.281642164028878,
      "avg_reward": 0.22702083766859446
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.2886559260513927,
      "avg_reward": 0.13782595530152478
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.2965042611280694,
      "avg_reward": 0.15693292170165726
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.2823294426756101,
      "avg_reward": 0.2880070316206749
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.2790649088030897,
      "avg_reward": 0.24831437652084176
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.31689396035090006,
      "avg_reward": 0.2674522110855201
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.2720730895490583,
      "avg_reward": 0.20103470787167596
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.34151536400772864,
      "avg_reward": 0.17196000305630935
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.29962796442374057,
      "avg_reward": 0.21209696796458707
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.3103559408750053,
      "avg_reward": 0.2856955335593658
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.34289219711386654,
      "avg_reward": 0.26080213809063535
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.32972199992979956,
      "avg_reward": 0.2887646071870983
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.3256976853412282,
      "avg_reward": 0.23236195169665894
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.29897802884154495,
      "avg_reward": 0.18418026744220112
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.30648699158792997,
      "avg_reward": 0.2612739220636553
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.3395029898408498,
      "avg_reward": 0.2877758342655246
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.3159496090693001,
      "avg_reward": 0.34305819275206384
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.3599266539426116,
      "avg_reward": 0.2702413175165806
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.31567676859828164,
      "avg_reward": 0.2590521625865238
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.36006237773935645,
      "avg_reward": 0.30468815105419106
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.34839289290553566,
      "avg_reward": 0.2681103082106473
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.34890693441872034,
      "avg_reward": 0.3563527701077832
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.33748142512529833,
      "avg_reward": 0.2771505267256323
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.3498177287065867,
      "avg_reward": 0.29404045075382124
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.3189431866618278,
      "avg_reward": 0.16131111653576752
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.3292000713886666,
      "avg_reward": 0.2717571718810167
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.363054849844128,
      "avg_reward": 0.2639101518866212
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.3818795007028122,
      "avg_reward": 0.2983448018459404
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.35706911603229596,
      "avg_reward": 0.27595709929820367
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.36164337084274134,
      "avg_reward": 0.32453840037637327
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.3745473333461186,
      "avg_reward": 0.2547167196464154
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.39395018021623107,
      "avg_reward": 0.260408821301639
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.3672751380456015,
      "avg_reward": 0.28010028176036356
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.34689537500989004,
      "avg_reward": 0.2737602706092205
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.3552143481641079,
      "avg_reward": 0.28781684069508895
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.380218470152293,
      "avg_reward": 0.377771244570498
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.3804012036697566,
      "avg_reward": 0.27375969592056404
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.36848848178212007,
      "avg_reward": 0.30178969073142425
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.38022801277515184,
      "avg_reward": 0.3771618736315425
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.4082743209962248,
      "avg_reward": 0.3086726604848668
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.37137344144981804,
      "avg_reward": 0.16924602295646154
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.37331747841219465,
      "avg_reward": 0.24975109742554155
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.37911962461131726,
      "avg_reward": 0.3228749118065594
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.39165087240841234,
      "avg_reward": 0.31182229757435276
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.3939603421532881,
      "avg_reward": 0.30886238506108094
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.3957416078327876,
      "avg_reward": 0.1550405358702645
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.3882188522684267,
      "avg_reward": 0.305032545762091
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3885540675496769,
      "avg_reward": 0.2999459409345945
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3885540675496769,
      "avg_reward": 0.2999459409345945
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 11.0,
      "update": 1,
      "cumulative_wall_time": 4.545454545454546
    },
    {
      "timestep": 101,
      "throughput": 12.100000000000001,
      "update": 2,
      "cumulative_wall_time": 9.090909090909092
    },
    {
      "timestep": 202,
      "throughput": 13.2,
      "update": 3,
      "cumulative_wall_time": 13.636363636363637
    },
    {
      "timestep": 303,
      "throughput": 14.3,
      "update": 4,
      "cumulative_wall_time": 18.181818181818183
    },
    {
      "timestep": 404,
      "throughput": 15.399999999999999,
      "update": 5,
      "cumulative_wall_time": 22.72727272727273
    },
    {
      "timestep": 505,
      "throughput": 16.5,
      "update": 6,
      "cumulative_wall_time": 27.272727272727277
    },
    {
      "timestep": 606,
      "throughput": 17.6,
      "update": 7,
      "cumulative_wall_time": 31.818181818181824
    },
    {
      "timestep": 707,
      "throughput": 18.7,
      "update": 8,
      "cumulative_wall_time": 36.36363636363637
    },
    {
      "timestep": 808,
      "throughput": 19.8,
      "update": 9,
      "cumulative_wall_time": 40.909090909090914
    },
    {
      "timestep": 909,
      "throughput": 20.9,
      "update": 10,
      "cumulative_wall_time": 45.45454545454546
    },
    {
      "timestep": 1010,
      "throughput": 23.547282259174807,
      "update": 11,
      "cumulative_wall_time": 50.00000000000001
    },
    {
      "timestep": 1111,
      "throughput": 20.684168271050183,
      "update": 12,
      "cumulative_wall_time": 54.545454545454554
    },
    {
      "timestep": 1212,
      "throughput": 26.841544618277684,
      "update": 13,
      "cumulative_wall_time": 59.0909090909091
    },
    {
      "timestep": 1313,
      "throughput": 23.514253246488593,
      "update": 14,
      "cumulative_wall_time": 63.63636363636365
    },
    {
      "timestep": 1414,
      "throughput": 21.98612404798948,
      "update": 15,
      "cumulative_wall_time": 68.18181818181819
    },
    {
      "timestep": 1515,
      "throughput": 21.545342932965355,
      "update": 16,
      "cumulative_wall_time": 72.72727272727273
    },
    {
      "timestep": 1616,
      "throughput": 21.809650969959304,
      "update": 17,
      "cumulative_wall_time": 77.27272727272728
    },
    {
      "timestep": 1717,
      "throughput": 19.986324446123245,
      "update": 18,
      "cumulative_wall_time": 81.81818181818183
    },
    {
      "timestep": 1818,
      "throughput": 21.79055441363238,
      "update": 19,
      "cumulative_wall_time": 86.36363636363637
    },
    {
      "timestep": 1919,
      "throughput": 22.61310373679952,
      "update": 20,
      "cumulative_wall_time": 90.90909090909092
    },
    {
      "timestep": 2020,
      "throughput": 23.274991554261103,
      "update": 21,
      "cumulative_wall_time": 95.45454545454547
    },
    {
      "timestep": 2121,
      "throughput": 23.275317514117535,
      "update": 22,
      "cumulative_wall_time": 100.00000000000001
    },
    {
      "timestep": 2222,
      "throughput": 21.395269397554944,
      "update": 23,
      "cumulative_wall_time": 104.54545454545456
    },
    {
      "timestep": 2323,
      "throughput": 18.884619044451753,
      "update": 24,
      "cumulative_wall_time": 109.09090909090911
    },
    {
      "timestep": 2424,
      "throughput": 20.52797422228642,
      "update": 25,
      "cumulative_wall_time": 113.63636363636365
    },
    {
      "timestep": 2525,
      "throughput": 25.546824694187254,
      "update": 26,
      "cumulative_wall_time": 118.1818181818182
    },
    {
      "timestep": 2626,
      "throughput": 23.971328289501887,
      "update": 27,
      "cumulative_wall_time": 122.72727272727275
    },
    {
      "timestep": 2727,
      "throughput": 22.813163089869185,
      "update": 28,
      "cumulative_wall_time": 127.2727272727273
    },
    {
      "timestep": 2828,
      "throughput": 20.325152661527724,
      "update": 29,
      "cumulative_wall_time": 131.81818181818184
    },
    {
      "timestep": 2929,
      "throughput": 22.008019340942308,
      "update": 30,
      "cumulative_wall_time": 136.36363636363637
    },
    {
      "timestep": 3030,
      "throughput": 19.23752889154254,
      "update": 31,
      "cumulative_wall_time": 140.9090909090909
    },
    {
      "timestep": 3131,
      "throughput": 20.785738873468638,
      "update": 32,
      "cumulative_wall_time": 145.45454545454544
    },
    {
      "timestep": 3232,
      "throughput": 21.46055264829257,
      "update": 33,
      "cumulative_wall_time": 149.99999999999997
    },
    {
      "timestep": 3333,
      "throughput": 21.20439214989653,
      "update": 34,
      "cumulative_wall_time": 154.5454545454545
    },
    {
      "timestep": 3434,
      "throughput": 24.104524248323226,
      "update": 35,
      "cumulative_wall_time": 159.09090909090904
    },
    {
      "timestep": 3535,
      "throughput": 18.878802989122004,
      "update": 36,
      "cumulative_wall_time": 163.63636363636357
    },
    {
      "timestep": 3636,
      "throughput": 20.09604900266666,
      "update": 37,
      "cumulative_wall_time": 168.1818181818181
    },
    {
      "timestep": 3737,
      "throughput": 18.975686463751117,
      "update": 38,
      "cumulative_wall_time": 172.72727272727263
    },
    {
      "timestep": 3838,
      "throughput": 19.27782293208672,
      "update": 39,
      "cumulative_wall_time": 177.27272727272717
    },
    {
      "timestep": 3939,
      "throughput": 22.272922972182627,
      "update": 40,
      "cumulative_wall_time": 181.8181818181817
    },
    {
      "timestep": 4040,
      "throughput": 18.4790308272762,
      "update": 41,
      "cumulative_wall_time": 186.36363636363623
    },
    {
      "timestep": 4141,
      "throughput": 23.6585113134428,
      "update": 42,
      "cumulative_wall_time": 190.90909090909076
    },
    {
      "timestep": 4242,
      "throughput": 21.457005290729636,
      "update": 43,
      "cumulative_wall_time": 195.4545454545453
    },
    {
      "timestep": 4343,
      "throughput": 22.151334331557152,
      "update": 44,
      "cumulative_wall_time": 199.99999999999983
    },
    {
      "timestep": 4444,
      "throughput": 22.70966882359385,
      "update": 45,
      "cumulative_wall_time": 204.54545454545436
    },
    {
      "timestep": 4545,
      "throughput": 21.0448336554465,
      "update": 46,
      "cumulative_wall_time": 209.0909090909089
    },
    {
      "timestep": 4646,
      "throughput": 24.27145537465743,
      "update": 47,
      "cumulative_wall_time": 213.63636363636343
    },
    {
      "timestep": 4747,
      "throughput": 21.572446001199204,
      "update": 48,
      "cumulative_wall_time": 218.18181818181796
    },
    {
      "timestep": 4848,
      "throughput": 23.306954561525952,
      "update": 49,
      "cumulative_wall_time": 222.7272727272725
    },
    {
      "timestep": 4949,
      "throughput": 21.561952757934044,
      "update": 50,
      "cumulative_wall_time": 227.27272727272702
    },
    {
      "timestep": 5050,
      "throughput": 22.639923652334833,
      "update": 51,
      "cumulative_wall_time": 231.81818181818156
    },
    {
      "timestep": 5151,
      "throughput": 22.615257874347513,
      "update": 52,
      "cumulative_wall_time": 236.3636363636361
    },
    {
      "timestep": 5252,
      "throughput": 22.54993386680217,
      "update": 53,
      "cumulative_wall_time": 240.90909090909062
    },
    {
      "timestep": 5353,
      "throughput": 19.85652273083398,
      "update": 54,
      "cumulative_wall_time": 245.45454545454515
    },
    {
      "timestep": 5454,
      "throughput": 22.95892669520437,
      "update": 55,
      "cumulative_wall_time": 249.9999999999997
    },
    {
      "timestep": 5555,
      "throughput": 21.29829462398089,
      "update": 56,
      "cumulative_wall_time": 254.54545454545422
    },
    {
      "timestep": 5656,
      "throughput": 23.387073667077818,
      "update": 57,
      "cumulative_wall_time": 259.0909090909088
    },
    {
      "timestep": 5757,
      "throughput": 17.26451442229293,
      "update": 58,
      "cumulative_wall_time": 263.63636363636334
    },
    {
      "timestep": 5858,
      "throughput": 18.77674431147911,
      "update": 59,
      "cumulative_wall_time": 268.1818181818179
    },
    {
      "timestep": 5959,
      "throughput": 22.799580236697064,
      "update": 60,
      "cumulative_wall_time": 272.72727272727246
    },
    {
      "timestep": 6060,
      "throughput": 26.098440687231506,
      "update": 61,
      "cumulative_wall_time": 277.272727272727
    },
    {
      "timestep": 6161,
      "throughput": 23.837129242984723,
      "update": 62,
      "cumulative_wall_time": 281.8181818181816
    },
    {
      "timestep": 6262,
      "throughput": 20.498607944760042,
      "update": 63,
      "cumulative_wall_time": 286.36363636363615
    },
    {
      "timestep": 6363,
      "throughput": 18.277484686168496,
      "update": 64,
      "cumulative_wall_time": 290.9090909090907
    },
    {
      "timestep": 6464,
      "throughput": 23.633909686555562,
      "update": 65,
      "cumulative_wall_time": 295.45454545454527
    },
    {
      "timestep": 6565,
      "throughput": 21.82271691150551,
      "update": 66,
      "cumulative_wall_time": 299.99999999999983
    },
    {
      "timestep": 6666,
      "throughput": 23.299549279367646,
      "update": 67,
      "cumulative_wall_time": 304.5454545454544
    },
    {
      "timestep": 6767,
      "throughput": 22.253657188863738,
      "update": 68,
      "cumulative_wall_time": 309.09090909090895
    },
    {
      "timestep": 6868,
      "throughput": 22.065214435265087,
      "update": 69,
      "cumulative_wall_time": 313.6363636363635
    },
    {
      "timestep": 6969,
      "throughput": 28.50897598096499,
      "update": 70,
      "cumulative_wall_time": 318.1818181818181
    },
    {
      "timestep": 7070,
      "throughput": 21.986514085699728,
      "update": 71,
      "cumulative_wall_time": 322.72727272727263
    },
    {
      "timestep": 7171,
      "throughput": 21.649660539642817,
      "update": 72,
      "cumulative_wall_time": 327.2727272727272
    },
    {
      "timestep": 7272,
      "throughput": 21.73281291411115,
      "update": 73,
      "cumulative_wall_time": 331.81818181818176
    },
    {
      "timestep": 7373,
      "throughput": 20.716219223243154,
      "update": 74,
      "cumulative_wall_time": 336.3636363636363
    },
    {
      "timestep": 7474,
      "throughput": 24.178292368373686,
      "update": 75,
      "cumulative_wall_time": 340.9090909090909
    },
    {
      "timestep": 7575,
      "throughput": 21.221740465681034,
      "update": 76,
      "cumulative_wall_time": 345.45454545454544
    },
    {
      "timestep": 7676,
      "throughput": 23.3990739524181,
      "update": 77,
      "cumulative_wall_time": 350.0
    },
    {
      "timestep": 7777,
      "throughput": 22.626126665589826,
      "update": 78,
      "cumulative_wall_time": 354.54545454545456
    },
    {
      "timestep": 7878,
      "throughput": 24.681768896691338,
      "update": 79,
      "cumulative_wall_time": 359.0909090909091
    },
    {
      "timestep": 7979,
      "throughput": 22.924395113374395,
      "update": 80,
      "cumulative_wall_time": 363.6363636363637
    },
    {
      "timestep": 8080,
      "throughput": 19.330553481915175,
      "update": 81,
      "cumulative_wall_time": 368.18181818181824
    },
    {
      "timestep": 8181,
      "throughput": 19.081726872881333,
      "update": 82,
      "cumulative_wall_time": 372.7272727272728
    },
    {
      "timestep": 8282,
      "throughput": 25.098412121369186,
      "update": 83,
      "cumulative_wall_time": 377.27272727272737
    },
    {
      "timestep": 8383,
      "throughput": 20.660836232818227,
      "update": 84,
      "cumulative_wall_time": 381.8181818181819
    },
    {
      "timestep": 8484,
      "throughput": 19.094674324462765,
      "update": 85,
      "cumulative_wall_time": 386.3636363636365
    },
    {
      "timestep": 8585,
      "throughput": 20.526839080286532,
      "update": 86,
      "cumulative_wall_time": 390.90909090909105
    },
    {
      "timestep": 8686,
      "throughput": 24.782175631329615,
      "update": 87,
      "cumulative_wall_time": 395.4545454545456
    },
    {
      "timestep": 8787,
      "throughput": 18.87553140231327,
      "update": 88,
      "cumulative_wall_time": 400.00000000000017
    },
    {
      "timestep": 8888,
      "throughput": 20.093710551728858,
      "update": 89,
      "cumulative_wall_time": 404.54545454545473
    },
    {
      "timestep": 8989,
      "throughput": 20.533023480647657,
      "update": 90,
      "cumulative_wall_time": 409.0909090909093
    },
    {
      "timestep": 9090,
      "throughput": 19.24738227835897,
      "update": 91,
      "cumulative_wall_time": 413.63636363636385
    },
    {
      "timestep": 9191,
      "throughput": 19.39447985527434,
      "update": 92,
      "cumulative_wall_time": 418.1818181818184
    },
    {
      "timestep": 9292,
      "throughput": 18.66016245441995,
      "update": 93,
      "cumulative_wall_time": 422.727272727273
    },
    {
      "timestep": 9393,
      "throughput": 20.985387691099213,
      "update": 94,
      "cumulative_wall_time": 427.27272727272754
    },
    {
      "timestep": 9494,
      "throughput": 21.219200570171814,
      "update": 95,
      "cumulative_wall_time": 431.8181818181821
    },
    {
      "timestep": 9595,
      "throughput": 20.498416060752728,
      "update": 96,
      "cumulative_wall_time": 436.36363636363666
    },
    {
      "timestep": 9696,
      "throughput": 18.36186475427119,
      "update": 97,
      "cumulative_wall_time": 440.9090909090912
    },
    {
      "timestep": 9797,
      "throughput": 24.757339083083192,
      "update": 98,
      "cumulative_wall_time": 445.4545454545458
    },
    {
      "timestep": 9898,
      "throughput": 19.076026575821246,
      "update": 99,
      "cumulative_wall_time": 450.00000000000034
    },
    {
      "timestep": 10000,
      "throughput": 22.611674166450317,
      "update": 100,
      "cumulative_wall_time": 454.5454545454549
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.7435046681376225,
        "recent_gradient": 0.011336633733483056
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6041166471033433,
        "recent_gradient": 0.01824477282674469
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.3665256854060575,
        "recent_gradient": 0.03139157463827921
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.28951601093427276,
        "recent_gradient": 0.02083138907978487
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.13821088842959436,
        "recent_gradient": 0.011639521219220378
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 5.382527422998509
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.585505583119495
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 4.670424344651676
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.305561775027956
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "uniform",
    "use_csc": true
  }
}