{
  "experiment_name": "sync_seed123",
  "total_timesteps": 10000,
  "total_time": 1000.0,
  "avg_throughput": 10,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.014750479051948933,
      "avg_reward": -0.06351435245434546,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.0066098131424474574,
      "avg_reward": 0.08785967736881553,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.0,
      "avg_reward": -0.021445631442808866,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.061682361537747046,
      "avg_reward": 0.006008869116942553,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.10758001709633026,
      "avg_reward": 0.08132856523021967,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.15368716624122186,
      "avg_reward": 0.09100463315874495,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.11771841828426219,
      "avg_reward": 0.0724571708464839,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.1734918773785151,
      "avg_reward": 0.24813280635150142,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.15226554290289535,
      "avg_reward": 0.14112175428105908,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.14977838499609872,
      "avg_reward": 0.19435930940441892,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.1191955839428877,
      "avg_reward": 0.15414791939341535,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.11574988664922246,
      "avg_reward": 0.06071233419670746,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.1619180766528427,
      "avg_reward": 0.058100426310975714,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.14395550007738644,
      "avg_reward": 0.07207665526892489,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.14465696490032093,
      "avg_reward": -0.024203883352779468,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.1173818437549844,
      "avg_reward": 0.058911613274091654,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.174434636465544,
      "avg_reward": 0.1308659250329244,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.15904392318077126,
      "avg_reward": 0.16164627409973126,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.1445255913924914,
      "avg_reward": 0.12980183930435768,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.14916491466842577,
      "avg_reward": 0.03294845702871026,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.16063566321644288,
      "avg_reward": 0.1571988236934072,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.17843117351224733,
      "avg_reward": 0.14215341408585686,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.22273554218987685,
      "avg_reward": 0.19883404176734043,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.19771366513685784,
      "avg_reward": 0.27007809903438396,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.15552852611021567,
      "avg_reward": 0.07248341037792486,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.21957502435976844,
      "avg_reward": 0.13575688272576164,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.18860289843114927,
      "avg_reward": 0.20434811721613685,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.20914833796845023,
      "avg_reward": 0.2550629794738157,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.22458717811608572,
      "avg_reward": 0.23313937597815543,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.1825738750004939,
      "avg_reward": 0.18580223339005603,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.2076794471171704,
      "avg_reward": 0.09983028469671354,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.23311666356452024,
      "avg_reward": 0.22685515758054453,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.20906637120793464,
      "avg_reward": 0.15559849391712705,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.18758412259586799,
      "avg_reward": 0.160043501754626,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.2243186560939571,
      "avg_reward": 0.13789717566300172,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.24159828737621075,
      "avg_reward": 0.1384184775768169,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.17929958028313553,
      "avg_reward": 0.19542601877114346,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.21710313375080323,
      "avg_reward": 0.16738102773499183,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.2118289090352829,
      "avg_reward": 0.08916498919235617,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.2570911372699033,
      "avg_reward": 0.17122946062357658,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.26860938169557186,
      "avg_reward": 0.25525291466699396,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.23249435147098435,
      "avg_reward": 0.13170036112044417,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.2275331506102504,
      "avg_reward": 0.12140036393344186,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.28730969160474634,
      "avg_reward": 0.23806981479528833,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.2719472063926036,
      "avg_reward": 0.15419016266357152,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.25592860222570074,
      "avg_reward": 0.26363597872098954,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.2489601369629424,
      "avg_reward": 0.25072383251644104,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.23730763268970348,
      "avg_reward": 0.12167252892083356,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.2699103903959644,
      "avg_reward": 0.1969694905881439,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.2784701970347749,
      "avg_reward": 0.12388176105179746
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.2831630776221318,
      "avg_reward": 0.35644565846117116
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.2716945537163168,
      "avg_reward": 0.2190627494185455
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.2790266420050351,
      "avg_reward": 0.13012252806443872
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.2871851738834458,
      "avg_reward": 0.14947765190595838
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.27331200431519054,
      "avg_reward": 0.2807930809323393
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.27034017436688496,
      "avg_reward": 0.24133458897187798
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.30845260997892504,
      "avg_reward": 0.26069913078794005
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.26390545126356835,
      "avg_reward": 0.194500597243284
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.3336114370422007,
      "avg_reward": 0.16563686148388704
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.2919774430051999,
      "avg_reward": 0.20597655082975455
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.3029482383664768,
      "avg_reward": 0.27976937155254294
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.3357164704244478,
      "avg_reward": 0.25506155673910036
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.32276717410107875,
      "avg_reward": 0.28320074652412164
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.3189524782204846,
      "avg_reward": 0.2269657860000641
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.2924309757543417,
      "avg_reward": 0.17894262497243849
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.3001264699253054,
      "avg_reward": 0.25618550473355567
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.33331724347930225,
      "avg_reward": 0.28282723717628655
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.3099267725451034,
      "avg_reward": 0.3382399235327065
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.35405477630565857,
      "avg_reward": 0.2655438154070182
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.30994383687459426,
      "avg_reward": 0.2544658172075739
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.35445633993557757,
      "avg_reward": 0.30020332081116796
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.34290168049309905,
      "avg_reward": 0.263717338280698
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.34351848423993536,
      "avg_reward": 0.3520420099647552
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.3321837006682515,
      "avg_reward": 0.2729123471599948
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.3445987407005113,
      "avg_reward": 0.2898652603489609
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.31379101294939526,
      "avg_reward": 0.15718937756582152
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.32410287603646776,
      "avg_reward": 0.2676794155992576
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.35800090145741276,
      "avg_reward": 0.25986699317724904
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.37685718991530703,
      "avg_reward": 0.29432695321593627
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.3520669721465943,
      "avg_reward": 0.2719553841896423
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.3566500776013344,
      "avg_reward": 0.3205437657832477
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.3695517438175818,
      "avg_reward": 0.25072024802358595
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.38894133078538157,
      "avg_reward": 0.2564017417569594
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.36224226150057287,
      "avg_reward": 0.2760739805243407
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.34182791272302443,
      "avg_reward": 0.26970630077972796
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.35010196136731764,
      "avg_reward": 0.28372693125765674
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.3750510503110916,
      "avg_reward": 0.37363730869753686
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.37516888196348713,
      "avg_reward": 0.26957383855554845
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.3631816377010145,
      "avg_reward": 0.2975442154665398
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.37483728184773174,
      "avg_reward": 0.37284928888960644
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.4027906016631978,
      "avg_reward": 0.3042856850184452
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.3657879011030372,
      "avg_reward": 0.16477759067903688
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.3676215586194285,
      "avg_reward": 0.24519436159132865
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.3733050455495306,
      "avg_reward": 0.3182232485571301
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.38570963652998225,
      "avg_reward": 0.30706930887160866
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.38788473711109045,
      "avg_reward": 0.30400190102732283
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.38952420869137777,
      "avg_reward": 0.1500666165571366
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.38185252302962747,
      "avg_reward": 0.2999394823710516
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.38203196202177586,
      "avg_reward": 0.29472825651227363
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.38203196202177586,
      "avg_reward": 0.29472825651227363
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 5.0,
      "update": 1,
      "cumulative_wall_time": 10.0
    },
    {
      "timestep": 101,
      "throughput": 5.5,
      "update": 2,
      "cumulative_wall_time": 20.0
    },
    {
      "timestep": 202,
      "throughput": 6.0,
      "update": 3,
      "cumulative_wall_time": 30.0
    },
    {
      "timestep": 303,
      "throughput": 6.5,
      "update": 4,
      "cumulative_wall_time": 40.0
    },
    {
      "timestep": 404,
      "throughput": 7.0,
      "update": 5,
      "cumulative_wall_time": 50.0
    },
    {
      "timestep": 505,
      "throughput": 7.5,
      "update": 6,
      "cumulative_wall_time": 60.0
    },
    {
      "timestep": 606,
      "throughput": 8.0,
      "update": 7,
      "cumulative_wall_time": 70.0
    },
    {
      "timestep": 707,
      "throughput": 8.5,
      "update": 8,
      "cumulative_wall_time": 80.0
    },
    {
      "timestep": 808,
      "throughput": 9.0,
      "update": 9,
      "cumulative_wall_time": 90.0
    },
    {
      "timestep": 909,
      "throughput": 9.5,
      "update": 10,
      "cumulative_wall_time": 100.0
    },
    {
      "timestep": 1010,
      "throughput": 10.70331011780673,
      "update": 11,
      "cumulative_wall_time": 110.0
    },
    {
      "timestep": 1111,
      "throughput": 9.401894668659175,
      "update": 12,
      "cumulative_wall_time": 120.0
    },
    {
      "timestep": 1212,
      "throughput": 12.200702099217128,
      "update": 13,
      "cumulative_wall_time": 130.0
    },
    {
      "timestep": 1313,
      "throughput": 10.688296930222087,
      "update": 14,
      "cumulative_wall_time": 140.0
    },
    {
      "timestep": 1414,
      "throughput": 9.993692749086128,
      "update": 15,
      "cumulative_wall_time": 150.0
    },
    {
      "timestep": 1515,
      "throughput": 9.793337696802434,
      "update": 16,
      "cumulative_wall_time": 160.0
    },
    {
      "timestep": 1616,
      "throughput": 9.913477713617866,
      "update": 17,
      "cumulative_wall_time": 170.0
    },
    {
      "timestep": 1717,
      "throughput": 9.08469293005602,
      "update": 18,
      "cumulative_wall_time": 180.0
    },
    {
      "timestep": 1818,
      "throughput": 9.90479746074199,
      "update": 19,
      "cumulative_wall_time": 190.0
    },
    {
      "timestep": 1919,
      "throughput": 10.278683516727053,
      "update": 20,
      "cumulative_wall_time": 200.0
    },
    {
      "timestep": 2020,
      "throughput": 10.579541615573229,
      "update": 21,
      "cumulative_wall_time": 210.0
    },
    {
      "timestep": 2121,
      "throughput": 10.579689779144335,
      "update": 22,
      "cumulative_wall_time": 220.0
    },
    {
      "timestep": 2222,
      "throughput": 9.725122453434064,
      "update": 23,
      "cumulative_wall_time": 230.0
    },
    {
      "timestep": 2323,
      "throughput": 8.583917747478068,
      "update": 24,
      "cumulative_wall_time": 240.0
    },
    {
      "timestep": 2424,
      "throughput": 9.330897373766554,
      "update": 25,
      "cumulative_wall_time": 250.0
    },
    {
      "timestep": 2525,
      "throughput": 11.61219304281239,
      "update": 26,
      "cumulative_wall_time": 260.0
    },
    {
      "timestep": 2626,
      "throughput": 10.896058313409949,
      "update": 27,
      "cumulative_wall_time": 270.0
    },
    {
      "timestep": 2727,
      "throughput": 10.369619586304175,
      "update": 28,
      "cumulative_wall_time": 280.0
    },
    {
      "timestep": 2828,
      "throughput": 9.238705755239875,
      "update": 29,
      "cumulative_wall_time": 290.0
    },
    {
      "timestep": 2929,
      "throughput": 10.003645154973777,
      "update": 30,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 3030,
      "throughput": 8.744331314337519,
      "update": 31,
      "cumulative_wall_time": 310.0
    },
    {
      "timestep": 3131,
      "throughput": 9.448063124303927,
      "update": 32,
      "cumulative_wall_time": 320.0
    },
    {
      "timestep": 3232,
      "throughput": 9.754796658314804,
      "update": 33,
      "cumulative_wall_time": 330.0
    },
    {
      "timestep": 3333,
      "throughput": 9.638360068134787,
      "update": 34,
      "cumulative_wall_time": 340.0
    },
    {
      "timestep": 3434,
      "throughput": 10.956601931056012,
      "update": 35,
      "cumulative_wall_time": 350.0
    },
    {
      "timestep": 3535,
      "throughput": 8.581274085964548,
      "update": 36,
      "cumulative_wall_time": 360.0
    },
    {
      "timestep": 3636,
      "throughput": 9.134567728484846,
      "update": 37,
      "cumulative_wall_time": 370.0
    },
    {
      "timestep": 3737,
      "throughput": 8.625312028977781,
      "update": 38,
      "cumulative_wall_time": 380.0
    },
    {
      "timestep": 3838,
      "throughput": 8.762646787312146,
      "update": 39,
      "cumulative_wall_time": 390.0
    },
    {
      "timestep": 3939,
      "throughput": 10.124055896446649,
      "update": 40,
      "cumulative_wall_time": 400.0
    },
    {
      "timestep": 4040,
      "throughput": 8.399559466943728,
      "update": 41,
      "cumulative_wall_time": 410.0
    },
    {
      "timestep": 4141,
      "throughput": 10.753868778837637,
      "update": 42,
      "cumulative_wall_time": 420.0
    },
    {
      "timestep": 4242,
      "throughput": 9.753184223058925,
      "update": 43,
      "cumulative_wall_time": 430.0
    },
    {
      "timestep": 4343,
      "throughput": 10.068788332525978,
      "update": 44,
      "cumulative_wall_time": 440.0
    },
    {
      "timestep": 4444,
      "throughput": 10.322576737997204,
      "update": 45,
      "cumulative_wall_time": 450.0
    },
    {
      "timestep": 4545,
      "throughput": 9.56583347974841,
      "update": 46,
      "cumulative_wall_time": 460.0
    },
    {
      "timestep": 4646,
      "throughput": 11.032479715753379,
      "update": 47,
      "cumulative_wall_time": 470.0
    },
    {
      "timestep": 4747,
      "throughput": 9.805657273272365,
      "update": 48,
      "cumulative_wall_time": 480.0
    },
    {
      "timestep": 4848,
      "throughput": 10.59407025523907,
      "update": 49,
      "cumulative_wall_time": 490.0
    },
    {
      "timestep": 4949,
      "throughput": 9.800887617242747,
      "update": 50,
      "cumulative_wall_time": 500.0
    },
    {
      "timestep": 5050,
      "throughput": 10.290874387424925,
      "update": 51,
      "cumulative_wall_time": 510.0
    },
    {
      "timestep": 5151,
      "throughput": 10.279662670157961,
      "update": 52,
      "cumulative_wall_time": 520.0
    },
    {
      "timestep": 5252,
      "throughput": 10.249969939455532,
      "update": 53,
      "cumulative_wall_time": 530.0
    },
    {
      "timestep": 5353,
      "throughput": 9.025692150379081,
      "update": 54,
      "cumulative_wall_time": 540.0
    },
    {
      "timestep": 5454,
      "throughput": 10.43587577054744,
      "update": 55,
      "cumulative_wall_time": 550.0
    },
    {
      "timestep": 5555,
      "throughput": 9.681043010900405,
      "update": 56,
      "cumulative_wall_time": 560.0
    },
    {
      "timestep": 5656,
      "throughput": 10.630488030489918,
      "update": 57,
      "cumulative_wall_time": 570.0
    },
    {
      "timestep": 5757,
      "throughput": 7.847506555587696,
      "update": 58,
      "cumulative_wall_time": 580.0
    },
    {
      "timestep": 5858,
      "throughput": 8.53488377794505,
      "update": 59,
      "cumulative_wall_time": 590.0
    },
    {
      "timestep": 5959,
      "throughput": 10.36344556213503,
      "update": 60,
      "cumulative_wall_time": 600.0
    },
    {
      "timestep": 6060,
      "throughput": 11.86292758510523,
      "update": 61,
      "cumulative_wall_time": 610.0
    },
    {
      "timestep": 6161,
      "throughput": 10.835058746811237,
      "update": 62,
      "cumulative_wall_time": 620.0
    },
    {
      "timestep": 6262,
      "throughput": 9.31754906580002,
      "update": 63,
      "cumulative_wall_time": 630.0
    },
    {
      "timestep": 6363,
      "throughput": 8.307947584622044,
      "update": 64,
      "cumulative_wall_time": 640.0
    },
    {
      "timestep": 6464,
      "throughput": 10.74268622116162,
      "update": 65,
      "cumulative_wall_time": 650.0
    },
    {
      "timestep": 6565,
      "throughput": 9.91941677795705,
      "update": 66,
      "cumulative_wall_time": 660.0
    },
    {
      "timestep": 6666,
      "throughput": 10.590704217894384,
      "update": 67,
      "cumulative_wall_time": 670.0
    },
    {
      "timestep": 6767,
      "throughput": 10.11529872221079,
      "update": 68,
      "cumulative_wall_time": 680.0
    },
    {
      "timestep": 6868,
      "throughput": 10.029642925120495,
      "update": 69,
      "cumulative_wall_time": 690.0
    },
    {
      "timestep": 6969,
      "throughput": 12.958625445893176,
      "update": 70,
      "cumulative_wall_time": 700.0
    },
    {
      "timestep": 7070,
      "throughput": 9.993870038954421,
      "update": 71,
      "cumulative_wall_time": 710.0
    },
    {
      "timestep": 7171,
      "throughput": 9.840754790746736,
      "update": 72,
      "cumulative_wall_time": 720.0
    },
    {
      "timestep": 7272,
      "throughput": 9.878551324595978,
      "update": 73,
      "cumulative_wall_time": 730.0
    },
    {
      "timestep": 7373,
      "throughput": 9.416463283292343,
      "update": 74,
      "cumulative_wall_time": 740.0
    },
    {
      "timestep": 7474,
      "throughput": 10.990132894715313,
      "update": 75,
      "cumulative_wall_time": 750.0
    },
    {
      "timestep": 7575,
      "throughput": 9.64624566621865,
      "update": 76,
      "cumulative_wall_time": 760.0
    },
    {
      "timestep": 7676,
      "throughput": 10.63594270564459,
      "update": 77,
      "cumulative_wall_time": 770.0
    },
    {
      "timestep": 7777,
      "throughput": 10.284603029813557,
      "update": 78,
      "cumulative_wall_time": 780.0
    },
    {
      "timestep": 7878,
      "throughput": 11.218985862132428,
      "update": 79,
      "cumulative_wall_time": 790.0
    },
    {
      "timestep": 7979,
      "throughput": 10.420179596988362,
      "update": 80,
      "cumulative_wall_time": 800.0
    },
    {
      "timestep": 8080,
      "throughput": 8.786615219052353,
      "update": 81,
      "cumulative_wall_time": 810.0
    },
    {
      "timestep": 8181,
      "throughput": 8.67351221494606,
      "update": 82,
      "cumulative_wall_time": 820.0
    },
    {
      "timestep": 8282,
      "throughput": 11.408369146076902,
      "update": 83,
      "cumulative_wall_time": 830.0
    },
    {
      "timestep": 8383,
      "throughput": 9.391289196735558,
      "update": 84,
      "cumulative_wall_time": 840.0
    },
    {
      "timestep": 8484,
      "throughput": 8.679397420210348,
      "update": 85,
      "cumulative_wall_time": 850.0
    },
    {
      "timestep": 8585,
      "throughput": 9.330381400130243,
      "update": 86,
      "cumulative_wall_time": 860.0
    },
    {
      "timestep": 8686,
      "throughput": 11.264625286968005,
      "update": 87,
      "cumulative_wall_time": 870.0
    },
    {
      "timestep": 8787,
      "throughput": 8.579787001051487,
      "update": 88,
      "cumulative_wall_time": 880.0
    },
    {
      "timestep": 8888,
      "throughput": 9.133504796240391,
      "update": 89,
      "cumulative_wall_time": 890.0
    },
    {
      "timestep": 8989,
      "throughput": 9.33319249120348,
      "update": 90,
      "cumulative_wall_time": 900.0
    },
    {
      "timestep": 9090,
      "throughput": 8.748810126526806,
      "update": 91,
      "cumulative_wall_time": 910.0
    },
    {
      "timestep": 9191,
      "throughput": 8.815672661488335,
      "update": 92,
      "cumulative_wall_time": 920.0
    },
    {
      "timestep": 9292,
      "throughput": 8.481892024736341,
      "update": 93,
      "cumulative_wall_time": 930.0
    },
    {
      "timestep": 9393,
      "throughput": 9.538812586863278,
      "update": 94,
      "cumulative_wall_time": 940.0
    },
    {
      "timestep": 9494,
      "throughput": 9.645091168259915,
      "update": 95,
      "cumulative_wall_time": 950.0
    },
    {
      "timestep": 9595,
      "throughput": 9.317461845796695,
      "update": 96,
      "cumulative_wall_time": 960.0
    },
    {
      "timestep": 9696,
      "throughput": 8.346302161032359,
      "update": 97,
      "cumulative_wall_time": 970.0
    },
    {
      "timestep": 9797,
      "throughput": 11.253335946855996,
      "update": 98,
      "cumulative_wall_time": 980.0
    },
    {
      "timestep": 9898,
      "throughput": 8.670921170827839,
      "update": 99,
      "cumulative_wall_time": 990.0
    },
    {
      "timestep": 10000,
      "throughput": 10.278033712022872,
      "update": 100,
      "cumulative_wall_time": 1000.0
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.7435046681376225,
        "recent_gradient": 0.011336633733483056
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6041166471033433,
        "recent_gradient": 0.01824477282674469
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.3665256854060575,
        "recent_gradient": 0.03139157463827921
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.28951601093427276,
        "recent_gradient": 0.02083138907978487
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.13821088842959436,
        "recent_gradient": 0.011639521219220378
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 5.382527422998509
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.585505583119495
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 4.670424344651676
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.305561775027956
      }
    }
  },
  "config": {
    "use_async": false,
    "curriculum_strategy": "uniform"
  }
}