{
  "sync": {
    "train_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 101,
        "pass_at_1": 0.02204467985292294,
        "avg_reward": 0.09378723670273963,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 202,
        "pass_at_1": 0.013498750687351464,
        "avg_reward": -0.0009078472975778563,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 303,
        "pass_at_1": 0.0588569835828751,
        "avg_reward": 0.08545732332394551,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 404,
        "pass_at_1": 0.026974148644937326,
        "avg_reward": 0.0487073210952481,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 505,
        "pass_at_1": 0.11188938627252211,
        "avg_reward": 0.06622502133950484,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 606,
        "pass_at_1": 0.1286986191500568,
        "avg_reward": 0.007294883087155535,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 707,
        "pass_at_1": 0.09209970082692284,
        "avg_reward": 0.04556538419948965,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 808,
        "pass_at_1": 0.1091166533173175,
        "avg_reward": 0.1030056892836177,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 909,
        "pass_at_1": 0.11402398343489357,
        "avg_reward": 0.020604001681150286,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1010,
        "pass_at_1": 0.16434398885660495,
        "avg_reward": 0.12018637606095718,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1111,
        "pass_at_1": 0.139262825404694,
        "avg_reward": 0.04017285101308238,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1212,
        "pass_at_1": 0.12993984551369905,
        "avg_reward": 0.10949800589645256,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1313,
        "pass_at_1": 0.12075610118839061,
        "avg_reward": 0.1153897818679961,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1414,
        "pass_at_1": 0.13474410068278367,
        "avg_reward": 0.09321059305656311,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1515,
        "pass_at_1": 0.13773522006634492,
        "avg_reward": 0.20280208527852284,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1616,
        "pass_at_1": 0.15254256135042266,
        "avg_reward": 0.0691485026325431,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1717,
        "pass_at_1": 0.17233628607243612,
        "avg_reward": 0.0768268463593978,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1818,
        "pass_at_1": 0.16316427676293016,
        "avg_reward": 0.03254791521635535,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1919,
        "pass_at_1": 0.13555259727470384,
        "avg_reward": 0.11828513961321925,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2020,
        "pass_at_1": 0.1800415766296463,
        "avg_reward": 0.15260167536321556,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2121,
        "pass_at_1": 0.16614069344378007,
        "avg_reward": 0.11785736997555962,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2222,
        "pass_at_1": 0.14208895268490274,
        "avg_reward": 0.07767895172818676,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2323,
        "pass_at_1": 0.16567546145192658,
        "avg_reward": 0.18539648047248705,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2424,
        "pass_at_1": 0.18501131080948016,
        "avg_reward": 0.05985704087944743,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2525,
        "pass_at_1": 0.18789191196133653,
        "avg_reward": 0.1310594155482534,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2626,
        "pass_at_1": 0.17116233985119067,
        "avg_reward": 0.16751368632299593,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2727,
        "pass_at_1": 0.2086292242750017,
        "avg_reward": 0.21346738537581128,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2828,
        "pass_at_1": 0.17454985967813402,
        "avg_reward": 0.12417926894994648,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2929,
        "pass_at_1": 0.2012995640034876,
        "avg_reward": 0.20981690755890806,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3030,
        "pass_at_1": 0.18844456452853195,
        "avg_reward": 0.1414727027896347,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3131,
        "pass_at_1": 0.17926730774691252,
        "avg_reward": 0.0836035149934965,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3232,
        "pass_at_1": 0.22102119908286716,
        "avg_reward": 0.24462896069483486,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3333,
        "pass_at_1": 0.20671636716370603,
        "avg_reward": 0.21554973862556606,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3434,
        "pass_at_1": 0.21878286599083643,
        "avg_reward": 0.14277030506241295,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3535,
        "pass_at_1": 0.22217778581521247,
        "avg_reward": 0.25464405697546844,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3636,
        "pass_at_1": 0.21763768561202113,
        "avg_reward": 0.25234233128031724,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3737,
        "pass_at_1": 0.16936668520218948,
        "avg_reward": 0.17658847338051278,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3838,
        "pass_at_1": 0.2269113958776088,
        "avg_reward": 0.16657874917879367,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3939,
        "pass_at_1": 0.230414459022494,
        "avg_reward": 0.08495312148795056,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4040,
        "pass_at_1": 0.22759295201866866,
        "avg_reward": 0.19992999019052227,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4141,
        "pass_at_1": 0.2649482128274434,
        "avg_reward": 0.18604505934827237,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4242,
        "pass_at_1": 0.2226196423474698,
        "avg_reward": 0.15300786169874903,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4343,
        "pass_at_1": 0.26049043269870104,
        "avg_reward": 0.22482990164194508,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4444,
        "pass_at_1": 0.23497222033764187,
        "avg_reward": 0.21364114792578132,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4545,
        "pass_at_1": 0.2508846465286318,
        "avg_reward": 0.2491399667495499,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4646,
        "pass_at_1": 0.2382668377562136,
        "avg_reward": 0.17423036287508248,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4747,
        "pass_at_1": 0.24781818913895956,
        "avg_reward": 0.12507880390456172,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4848,
        "pass_at_1": 0.26492139647111035,
        "avg_reward": 0.22498988078588275,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4949,
        "pass_at_1": 0.26242464728725085,
        "avg_reward": 0.19821036116104335,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 5050,
        "pass_at_1": 0.23732168840832996,
        "avg_reward": 0.16882508458839604
      },
      {
        "timestep": 5151,
        "pass_at_1": 0.26206349458218603,
        "avg_reward": 0.1695369322046679
      },
      {
        "timestep": 5252,
        "pass_at_1": 0.2689613591116262,
        "avg_reward": 0.2353716301300279
      },
      {
        "timestep": 5353,
        "pass_at_1": 0.31315937033647206,
        "avg_reward": 0.2592563869107696
      },
      {
        "timestep": 5454,
        "pass_at_1": 0.2838132489040948,
        "avg_reward": 0.2233283033349675
      },
      {
        "timestep": 5555,
        "pass_at_1": 0.24349017197168576,
        "avg_reward": 0.19346644380488778
      },
      {
        "timestep": 5656,
        "pass_at_1": 0.286249117687707,
        "avg_reward": 0.35216139977442995
      },
      {
        "timestep": 5757,
        "pass_at_1": 0.2843506096041752,
        "avg_reward": 0.2425578548000208
      },
      {
        "timestep": 5858,
        "pass_at_1": 0.29063018527135565,
        "avg_reward": 0.17407024633610793
      },
      {
        "timestep": 5959,
        "pass_at_1": 0.3172796664847354,
        "avg_reward": 0.29142038482212707
      },
      {
        "timestep": 6060,
        "pass_at_1": 0.31331380222338434,
        "avg_reward": 0.20518166903897056
      },
      {
        "timestep": 6161,
        "pass_at_1": 0.328589177323256,
        "avg_reward": 0.19277878871899073
      },
      {
        "timestep": 6262,
        "pass_at_1": 0.3152797929400121,
        "avg_reward": 0.36174661564250865
      },
      {
        "timestep": 6363,
        "pass_at_1": 0.28670962099892855,
        "avg_reward": 0.20105281031900424
      },
      {
        "timestep": 6464,
        "pass_at_1": 0.31145855956480145,
        "avg_reward": 0.2239930649460312
      },
      {
        "timestep": 6565,
        "pass_at_1": 0.28136413650853703,
        "avg_reward": 0.228519457947131
      },
      {
        "timestep": 6666,
        "pass_at_1": 0.2940091398387658,
        "avg_reward": 0.25888693340277175
      },
      {
        "timestep": 6767,
        "pass_at_1": 0.2997097709320596,
        "avg_reward": 0.3172645369965247
      },
      {
        "timestep": 6868,
        "pass_at_1": 0.3052408086222935,
        "avg_reward": 0.22808957108755104
      },
      {
        "timestep": 6969,
        "pass_at_1": 0.33994780818042114,
        "avg_reward": 0.21041503072263917
      },
      {
        "timestep": 7070,
        "pass_at_1": 0.3309616636863902,
        "avg_reward": 0.3301264686632336
      },
      {
        "timestep": 7171,
        "pass_at_1": 0.296960702343266,
        "avg_reward": 0.24680025480122803
      },
      {
        "timestep": 7272,
        "pass_at_1": 0.3369683622798666,
        "avg_reward": 0.30866583341275877
      },
      {
        "timestep": 7373,
        "pass_at_1": 0.30965405211832914,
        "avg_reward": 0.18170041104044948
      },
      {
        "timestep": 7474,
        "pass_at_1": 0.3474159076101437,
        "avg_reward": 0.2927819597497743
      },
      {
        "timestep": 7575,
        "pass_at_1": 0.34453226817643623,
        "avg_reward": 0.29294822501599777
      },
      {
        "timestep": 7676,
        "pass_at_1": 0.32842829603925,
        "avg_reward": 0.2743553216894502
      },
      {
        "timestep": 7777,
        "pass_at_1": 0.3503574269208782,
        "avg_reward": 0.24456837063538417
      },
      {
        "timestep": 7878,
        "pass_at_1": 0.3842392683602437,
        "avg_reward": 0.33108306073378435
      },
      {
        "timestep": 7979,
        "pass_at_1": 0.32548597031390797,
        "avg_reward": 0.29321645668281787
      },
      {
        "timestep": 8080,
        "pass_at_1": 0.33216701877735544,
        "avg_reward": 0.30508784520900695
      },
      {
        "timestep": 8181,
        "pass_at_1": 0.37714145332654914,
        "avg_reward": 0.2606790467436538
      },
      {
        "timestep": 8282,
        "pass_at_1": 0.37550619764422166,
        "avg_reward": 0.32104400446220227
      },
      {
        "timestep": 8383,
        "pass_at_1": 0.3749092584557008,
        "avg_reward": 0.394767055897258
      },
      {
        "timestep": 8484,
        "pass_at_1": 0.3557499588987032,
        "avg_reward": 0.2469131589010881
      },
      {
        "timestep": 8585,
        "pass_at_1": 0.3450174576768837,
        "avg_reward": 0.23522345189323507
      },
      {
        "timestep": 8686,
        "pass_at_1": 0.3633762026448835,
        "avg_reward": 0.307758560856739
      },
      {
        "timestep": 8787,
        "pass_at_1": 0.3725231470733046,
        "avg_reward": 0.3393776801104449
      },
      {
        "timestep": 8888,
        "pass_at_1": 0.36928123542849695,
        "avg_reward": 0.3681016922006634
      },
      {
        "timestep": 8989,
        "pass_at_1": 0.36572089725064744,
        "avg_reward": 0.4285851761299989
      },
      {
        "timestep": 9090,
        "pass_at_1": 0.38548141221378884,
        "avg_reward": 0.265527251950217
      },
      {
        "timestep": 9191,
        "pass_at_1": 0.35346569310683645,
        "avg_reward": 0.30689617524762847
      },
      {
        "timestep": 9292,
        "pass_at_1": 0.37229148796024414,
        "avg_reward": 0.3335332150727999
      },
      {
        "timestep": 9393,
        "pass_at_1": 0.3880647193773438,
        "avg_reward": 0.30681032986903145
      },
      {
        "timestep": 9494,
        "pass_at_1": 0.36346566035005884,
        "avg_reward": 0.21503016704575384
      },
      {
        "timestep": 9595,
        "pass_at_1": 0.37323549090466207,
        "avg_reward": 0.3414083324399033
      },
      {
        "timestep": 9696,
        "pass_at_1": 0.3881749697719242,
        "avg_reward": 0.24825303688194
      },
      {
        "timestep": 9797,
        "pass_at_1": 0.38904744855753187,
        "avg_reward": 0.33050382783246735
      },
      {
        "timestep": 9898,
        "pass_at_1": 0.3695612441006199,
        "avg_reward": 0.30333525057777233
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.3900213707148276,
        "avg_reward": 0.25486858168033094
      }
    ],
    "eval_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.3900213707148276,
        "avg_reward": 0.25486858168033094
      }
    ],
    "timing_metrics": [
      {
        "timestep": 0,
        "throughput": 5.0,
        "update": 1,
        "cumulative_wall_time": 10.0
      },
      {
        "timestep": 101,
        "throughput": 5.5,
        "update": 2,
        "cumulative_wall_time": 20.0
      },
      {
        "timestep": 202,
        "throughput": 6.0,
        "update": 3,
        "cumulative_wall_time": 30.0
      },
      {
        "timestep": 303,
        "throughput": 6.5,
        "update": 4,
        "cumulative_wall_time": 40.0
      },
      {
        "timestep": 404,
        "throughput": 7.0,
        "update": 5,
        "cumulative_wall_time": 50.0
      },
      {
        "timestep": 505,
        "throughput": 7.5,
        "update": 6,
        "cumulative_wall_time": 60.0
      },
      {
        "timestep": 606,
        "throughput": 8.0,
        "update": 7,
        "cumulative_wall_time": 70.0
      },
      {
        "timestep": 707,
        "throughput": 8.5,
        "update": 8,
        "cumulative_wall_time": 80.0
      },
      {
        "timestep": 808,
        "throughput": 9.0,
        "update": 9,
        "cumulative_wall_time": 90.0
      },
      {
        "timestep": 909,
        "throughput": 9.5,
        "update": 10,
        "cumulative_wall_time": 100.0
      },
      {
        "timestep": 1010,
        "throughput": 10.357787360348283,
        "update": 11,
        "cumulative_wall_time": 110.0
      },
      {
        "timestep": 1111,
        "throughput": 10.560784526368234,
        "update": 12,
        "cumulative_wall_time": 120.0
      },
      {
        "timestep": 1212,
        "throughput": 11.083051243175277,
        "update": 13,
        "cumulative_wall_time": 130.0
      },
      {
        "timestep": 1313,
        "throughput": 11.053802052034902,
        "update": 14,
        "cumulative_wall_time": 140.0
      },
      {
        "timestep": 1414,
        "throughput": 8.62233063204291,
        "update": 15,
        "cumulative_wall_time": 150.0
      },
      {
        "timestep": 1515,
        "throughput": 9.062174960084876,
        "update": 16,
        "cumulative_wall_time": 160.0
      },
      {
        "timestep": 1616,
        "throughput": 10.51503526720866,
        "update": 17,
        "cumulative_wall_time": 170.0
      },
      {
        "timestep": 1717,
        "throughput": 10.513785950912208,
        "update": 18,
        "cumulative_wall_time": 180.0
      },
      {
        "timestep": 1818,
        "throughput": 10.515047686306048,
        "update": 19,
        "cumulative_wall_time": 190.0
      },
      {
        "timestep": 1919,
        "throughput": 13.852731490654723,
        "update": 20,
        "cumulative_wall_time": 200.0
      },
      {
        "timestep": 2020,
        "throughput": 10.570890510693168,
        "update": 21,
        "cumulative_wall_time": 210.0
      },
      {
        "timestep": 2121,
        "throughput": 11.135565640180598,
        "update": 22,
        "cumulative_wall_time": 220.0
      },
      {
        "timestep": 2222,
        "throughput": 10.954001763493203,
        "update": 23,
        "cumulative_wall_time": 230.0
      },
      {
        "timestep": 2323,
        "throughput": 10.651391251305798,
        "update": 24,
        "cumulative_wall_time": 240.0
      },
      {
        "timestep": 2424,
        "throughput": 9.684730755359654,
        "update": 25,
        "cumulative_wall_time": 250.0
      },
      {
        "timestep": 2525,
        "throughput": 10.758969220493269,
        "update": 26,
        "cumulative_wall_time": 260.0
      },
      {
        "timestep": 2626,
        "throughput": 9.227174785462429,
        "update": 27,
        "cumulative_wall_time": 270.0
      },
      {
        "timestep": 2727,
        "throughput": 9.763181393259991,
        "update": 28,
        "cumulative_wall_time": 280.0
      },
      {
        "timestep": 2828,
        "throughput": 9.514636452170897,
        "update": 29,
        "cumulative_wall_time": 290.0
      },
      {
        "timestep": 2929,
        "throughput": 10.081874139386322,
        "update": 30,
        "cumulative_wall_time": 300.0
      },
      {
        "timestep": 3030,
        "throughput": 12.314658566673508,
        "update": 31,
        "cumulative_wall_time": 310.0
      },
      {
        "timestep": 3131,
        "throughput": 8.132734807408251,
        "update": 32,
        "cumulative_wall_time": 320.0
      },
      {
        "timestep": 3232,
        "throughput": 10.686260190374512,
        "update": 33,
        "cumulative_wall_time": 330.0
      },
      {
        "timestep": 3333,
        "throughput": 8.387284128810348,
        "update": 34,
        "cumulative_wall_time": 340.0
      },
      {
        "timestep": 3434,
        "throughput": 9.528068134210567,
        "update": 35,
        "cumulative_wall_time": 350.0
      },
      {
        "timestep": 3535,
        "throughput": 11.088950596967367,
        "update": 36,
        "cumulative_wall_time": 360.0
      },
      {
        "timestep": 3636,
        "throughput": 10.064280019095461,
        "update": 37,
        "cumulative_wall_time": 370.0
      },
      {
        "timestep": 3737,
        "throughput": 8.922255222070694,
        "update": 38,
        "cumulative_wall_time": 380.0
      },
      {
        "timestep": 3838,
        "throughput": 9.284696290740031,
        "update": 39,
        "cumulative_wall_time": 390.0
      },
      {
        "timestep": 3939,
        "throughput": 10.679597748934675,
        "update": 40,
        "cumulative_wall_time": 400.0
      },
      {
        "timestep": 4040,
        "throughput": 9.269633368282864,
        "update": 41,
        "cumulative_wall_time": 410.0
      },
      {
        "timestep": 4141,
        "throughput": 10.216458589581976,
        "update": 42,
        "cumulative_wall_time": 420.0
      },
      {
        "timestep": 4242,
        "throughput": 10.045571839903813,
        "update": 43,
        "cumulative_wall_time": 430.0
      },
      {
        "timestep": 4343,
        "throughput": 9.348399652394182,
        "update": 44,
        "cumulative_wall_time": 440.0
      },
      {
        "timestep": 4444,
        "throughput": 12.143944089325327,
        "update": 45,
        "cumulative_wall_time": 450.0
      },
      {
        "timestep": 4545,
        "throughput": 10.633919022318011,
        "update": 46,
        "cumulative_wall_time": 460.0
      },
      {
        "timestep": 4646,
        "throughput": 7.974857413342393,
        "update": 47,
        "cumulative_wall_time": 470.0
      },
      {
        "timestep": 4747,
        "throughput": 10.186454314769428,
        "update": 48,
        "cumulative_wall_time": 480.0
      },
      {
        "timestep": 4848,
        "throughput": 9.338213535231612,
        "update": 49,
        "cumulative_wall_time": 490.0
      },
      {
        "timestep": 4949,
        "throughput": 10.852433334796224,
        "update": 50,
        "cumulative_wall_time": 500.0
      },
      {
        "timestep": 5050,
        "throughput": 9.2074792615673,
        "update": 51,
        "cumulative_wall_time": 510.0
      },
      {
        "timestep": 5151,
        "throughput": 9.8852635585331,
        "update": 52,
        "cumulative_wall_time": 520.0
      },
      {
        "timestep": 5252,
        "throughput": 10.504987278980458,
        "update": 53,
        "cumulative_wall_time": 530.0
      },
      {
        "timestep": 5353,
        "throughput": 10.865755194170122,
        "update": 54,
        "cumulative_wall_time": 540.0
      },
      {
        "timestep": 5454,
        "throughput": 8.799703592944223,
        "update": 55,
        "cumulative_wall_time": 550.0
      },
      {
        "timestep": 5555,
        "throughput": 9.665498764159052,
        "update": 56,
        "cumulative_wall_time": 560.0
      },
      {
        "timestep": 5656,
        "throughput": 9.525054688839043,
        "update": 57,
        "cumulative_wall_time": 570.0
      },
      {
        "timestep": 5757,
        "throughput": 9.34667076742629,
        "update": 58,
        "cumulative_wall_time": 580.0
      },
      {
        "timestep": 5858,
        "throughput": 11.765454240281096,
        "update": 59,
        "cumulative_wall_time": 590.0
      },
      {
        "timestep": 5959,
        "throughput": 10.404981710960957,
        "update": 60,
        "cumulative_wall_time": 600.0
      },
      {
        "timestep": 6060,
        "throughput": 8.739116045664954,
        "update": 61,
        "cumulative_wall_time": 610.0
      },
      {
        "timestep": 6161,
        "throughput": 10.917861947054776,
        "update": 62,
        "cumulative_wall_time": 620.0
      },
      {
        "timestep": 6262,
        "throughput": 12.122156197012632,
        "update": 63,
        "cumulative_wall_time": 630.0
      },
      {
        "timestep": 6363,
        "throughput": 11.032465260551147,
        "update": 64,
        "cumulative_wall_time": 640.0
      },
      {
        "timestep": 6464,
        "throughput": 8.480630034045987,
        "update": 65,
        "cumulative_wall_time": 650.0
      },
      {
        "timestep": 6565,
        "throughput": 9.515765927133748,
        "update": 66,
        "cumulative_wall_time": 660.0
      },
      {
        "timestep": 6666,
        "throughput": 11.266911149186623,
        "update": 67,
        "cumulative_wall_time": 670.0
      },
      {
        "timestep": 6767,
        "throughput": 9.292330534381218,
        "update": 68,
        "cumulative_wall_time": 680.0
      },
      {
        "timestep": 6868,
        "throughput": 10.443819428146227,
        "update": 69,
        "cumulative_wall_time": 690.0
      },
      {
        "timestep": 6969,
        "throughput": 10.774634053429338,
        "update": 70,
        "cumulative_wall_time": 700.0
      },
      {
        "timestep": 7070,
        "throughput": 9.073069528421918,
        "update": 71,
        "cumulative_wall_time": 710.0
      },
      {
        "timestep": 7171,
        "throughput": 9.940474643938199,
        "update": 72,
        "cumulative_wall_time": 720.0
      },
      {
        "timestep": 7272,
        "throughput": 6.758732659930927,
        "update": 73,
        "cumulative_wall_time": 730.0
      },
      {
        "timestep": 7373,
        "throughput": 8.97561235866571,
        "update": 74,
        "cumulative_wall_time": 740.0
      },
      {
        "timestep": 7474,
        "throughput": 9.74743184860684,
        "update": 75,
        "cumulative_wall_time": 750.0
      },
      {
        "timestep": 7575,
        "throughput": 8.75221681803515,
        "update": 76,
        "cumulative_wall_time": 760.0
      },
      {
        "timestep": 7676,
        "throughput": 11.632411303931637,
        "update": 77,
        "cumulative_wall_time": 770.0
      },
      {
        "timestep": 7777,
        "throughput": 8.569858622039368,
        "update": 78,
        "cumulative_wall_time": 780.0
      },
      {
        "timestep": 7878,
        "throughput": 9.559955513303017,
        "update": 79,
        "cumulative_wall_time": 790.0
      },
      {
        "timestep": 7979,
        "throughput": 10.13074057728609,
        "update": 80,
        "cumulative_wall_time": 800.0
      },
      {
        "timestep": 8080,
        "throughput": 11.441273289066116,
        "update": 81,
        "cumulative_wall_time": 810.0
      },
      {
        "timestep": 8181,
        "throughput": 8.564137848820561,
        "update": 82,
        "cumulative_wall_time": 820.0
      },
      {
        "timestep": 8282,
        "throughput": 11.163163752154958,
        "update": 83,
        "cumulative_wall_time": 830.0
      },
      {
        "timestep": 8383,
        "throughput": 10.010233061019587,
        "update": 84,
        "cumulative_wall_time": 840.0
      },
      {
        "timestep": 8484,
        "throughput": 9.018491348952049,
        "update": 85,
        "cumulative_wall_time": 850.0
      },
      {
        "timestep": 8585,
        "throughput": 10.462103474263271,
        "update": 86,
        "cumulative_wall_time": 860.0
      },
      {
        "timestep": 8686,
        "throughput": 10.19905969557347,
        "update": 87,
        "cumulative_wall_time": 870.0
      },
      {
        "timestep": 8787,
        "throughput": 9.399783122841205,
        "update": 88,
        "cumulative_wall_time": 880.0
      },
      {
        "timestep": 8888,
        "throughput": 10.069802084990018,
        "update": 89,
        "cumulative_wall_time": 890.0
      },
      {
        "timestep": 8989,
        "throughput": 9.61468640313824,
        "update": 90,
        "cumulative_wall_time": 900.0
      },
      {
        "timestep": 9090,
        "throughput": 10.113517345251248,
        "update": 91,
        "cumulative_wall_time": 910.0
      },
      {
        "timestep": 9191,
        "throughput": 10.662130674521046,
        "update": 92,
        "cumulative_wall_time": 920.0
      },
      {
        "timestep": 9292,
        "throughput": 11.586016816145353,
        "update": 93,
        "cumulative_wall_time": 930.0
      },
      {
        "timestep": 9393,
        "throughput": 8.762184501173152,
        "update": 94,
        "cumulative_wall_time": 940.0
      },
      {
        "timestep": 9494,
        "throughput": 12.133033374656268,
        "update": 95,
        "cumulative_wall_time": 950.0
      },
      {
        "timestep": 9595,
        "throughput": 8.047912200477498,
        "update": 96,
        "cumulative_wall_time": 960.0
      },
      {
        "timestep": 9696,
        "throughput": 9.848214904964417,
        "update": 97,
        "cumulative_wall_time": 970.0
      },
      {
        "timestep": 9797,
        "throughput": 10.588317206484577,
        "update": 98,
        "cumulative_wall_time": 980.0
      },
      {
        "timestep": 9898,
        "throughput": 10.280991867735032,
        "update": 99,
        "cumulative_wall_time": 990.0
      },
      {
        "timestep": 10000,
        "throughput": 9.377300480179406,
        "update": 100,
        "cumulative_wall_time": 1000.0
      }
    ],
    "scheduler_stats": {
      "total_experiences": 10000,
      "total_updates": 500,
      "policy_version": 500,
      "buffer_size": 1024,
      "curriculum": {
        "level_1": {
          "num_pulls": 2000,
          "success_rate": 0.85,
          "mean_reward": 0.7608375549928545,
          "recent_gradient": 0.009013998130682335
        },
        "level_2": {
          "num_pulls": 2000,
          "success_rate": 0.65,
          "mean_reward": 0.5732127048611159,
          "recent_gradient": 0.02169920419404205
        },
        "level_3": {
          "num_pulls": 2000,
          "success_rate": 0.45,
          "mean_reward": 0.412140309719301,
          "recent_gradient": 0.028614180809478692
        },
        "level_4": {
          "num_pulls": 2000,
          "success_rate": 0.28,
          "mean_reward": 0.2699919975086651,
          "recent_gradient": 0.02061459904175322
        },
        "level_5": {
          "num_pulls": 2000,
          "success_rate": 0.15,
          "mean_reward": 0.1512572423767792,
          "recent_gradient": 0.011259257683847225
        },
        "total_steps": 10000
      },
      "staleness": {
        "discard_rate": 0.15
      },
      "workers": {
        "0": {
          "completed_tasks": 2500,
          "avg_throughput": 4.5855024945389635
        },
        "1": {
          "completed_tasks": 2500,
          "avg_throughput": 4.719909479901515
        },
        "2": {
          "completed_tasks": 2500,
          "avg_throughput": 5.373646802561631
        },
        "3": {
          "completed_tasks": 2500,
          "avg_throughput": 5.3051851327167325
        }
      }
    },
    "final_pass_at_1": 0.39679990152026395,
    "final_pass_at_1_std": 0.015580873953549118,
    "avg_throughput": 9.73656583632468,
    "avg_throughput_std": 0.09037438577731756,
    "wall_time_mean": 0.0,
    "num_runs": 3
  },
  "sync_curriculum": {
    "train_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.5703496647219384,
        "difficulty_2_ratio": 0.34593455841067655,
        "difficulty_3_ratio": 0.0771884334190506,
        "difficulty_4_ratio": 0.006336012450983674,
        "difficulty_5_ratio": 0.00019133099735093797
      },
      {
        "timestep": 101,
        "pass_at_1": 0.024064881873124964,
        "avg_reward": 0.09540339831890125,
        "difficulty_1_ratio": 0.545817584309558,
        "difficulty_2_ratio": 0.3592137008263376,
        "difficulty_3_ratio": 0.0869688606806755,
        "difficulty_4_ratio": 0.007746048051242527,
        "difficulty_5_ratio": 0.00025380613218624814
      },
      {
        "timestep": 202,
        "pass_at_1": 0.017539154727755506,
        "avg_reward": 0.0023244759347453778,
        "difficulty_1_ratio": 0.5207065136269264,
        "difficulty_2_ratio": 0.3718356202546844,
        "difficulty_3_ratio": 0.09768198799373931,
        "difficulty_4_ratio": 0.009440250235689705,
        "difficulty_5_ratio": 0.00033562788896017117
      },
      {
        "timestep": 303,
        "pass_at_1": 0.06491758964348116,
        "avg_reward": 0.09030580817243036,
        "difficulty_1_ratio": 0.4951092343136047,
        "difficulty_2_ratio": 0.38362916613190773,
        "difficulty_3_ratio": 0.10935225097641152,
        "difficulty_4_ratio": 0.011466987914927423,
        "difficulty_5_ratio": 0.00044236066314863343
      },
      {
        "timestep": 404,
        "pass_at_1": 0.035054956725745406,
        "avg_reward": 0.055171967559894564,
        "difficulty_1_ratio": 0.469130336180388,
        "difficulty_2_ratio": 0.3944179935925989,
        "difficulty_3_ratio": 0.12199033943415045,
        "difficulty_4_ratio": 0.013880326375356456,
        "difficulty_5_ratio": 0.0005810044175062076
      },
      {
        "timestep": 505,
        "pass_at_1": 0.10564987861168393,
        "avg_reward": 0.0612334152108343,
        "difficulty_1_ratio": 0.4428854101147015,
        "difficulty_2_ratio": 0.40402402094501866,
        "difficulty_3_ratio": 0.13559026749360029,
        "difficulty_4_ratio": 0.0167399966441195,
        "difficulty_5_ratio": 0.0007603048025599198
      },
      {
        "timestep": 606,
        "pass_at_1": 0.12347368305774217,
        "avg_reward": 0.0031149342133038466,
        "difficulty_1_ratio": 0.4164998456831705,
        "difficulty_2_ratio": 0.41227145735706794,
        "difficulty_3_ratio": 0.15012644832783253,
        "difficulty_4_ratio": 0.02011113911124073,
        "difficulty_5_ratio": 0.0009911095206882054
      },
      {
        "timestep": 707,
        "pass_at_1": 0.08793864177496254,
        "avg_reward": 0.0422365369579214,
        "difficulty_1_ratio": 0.390107224895361,
        "difficulty_2_ratio": 0.4189913219593774,
        "difficulty_3_ratio": 0.1655509131479823,
        "difficulty_4_ratio": 0.024063769070528613,
        "difficulty_5_ratio": 0.0012867709267507749
      },
      {
        "timestep": 808,
        "pass_at_1": 0.10606912597061448,
        "avg_reward": 0.10056766740625528,
        "difficulty_1_ratio": 0.3638473227132847,
        "difficulty_2_ratio": 0.42402633368046766,
        "difficulty_3_ratio": 0.18179083819928793,
        "difficulty_4_ratio": 0.028671913216506643,
        "difficulty_5_ratio": 0.0016635921904528722
      },
      {
        "timestep": 909,
        "pass_at_1": 0.11213988802547346,
        "avg_reward": 0.019096725353614202,
        "difficulty_1_ratio": 0.337863746670805,
        "difficulty_2_ratio": 0.4272360092470168,
        "difficulty_3_ratio": 0.19874656153923254,
        "difficulty_4_ratio": 0.03401237165049899,
        "difficulty_5_ratio": 0.0021413108924466314
      },
      {
        "timestep": 1010,
        "pass_at_1": 0.16367336192510767,
        "avg_reward": 0.11964987451575936,
        "difficulty_1_ratio": 0.31230127114431194,
        "difficulty_2_ratio": 0.4285017684753959,
        "difficulty_3_ratio": 0.21629028030484038,
        "difficulty_4_ratio": 0.04016307038955698,
        "difficulty_5_ratio": 0.0027436096858948753
      },
      {
        "timestep": 1111,
        "pass_at_1": 0.13985572517238434,
        "avg_reward": 0.04064717082723464,
        "difficulty_1_ratio": 0.2873029447333821,
        "difficulty_2_ratio": 0.4277318152433385,
        "difficulty_3_ratio": 0.23426561605703436,
        "difficulty_4_ratio": 0.04720098526509968,
        "difficulty_5_ratio": 0.0034986387011453407
      },
      {
        "timestep": 1212,
        "pass_at_1": 0.13184623220126726,
        "avg_reward": 0.11102311524650713,
        "difficulty_1_ratio": 0.2630070699260558,
        "difficulty_2_ratio": 0.4248655434002136,
        "difficulty_3_ratio": 0.2524882182255638,
        "difficulty_4_ratio": 0.05519963957750222,
        "difficulty_5_ratio": 0.004439528870664513
      },
      {
        "timestep": 1313,
        "pass_at_1": 0.12402571265177376,
        "avg_reward": 0.11800547103870261,
        "difficulty_1_ratio": 0.23954417068994155,
        "difficulty_2_ratio": 0.41987721294759744,
        "difficulty_3_ratio": 0.2707475422306048,
        "difficulty_4_ratio": 0.06422620455155005,
        "difficulty_5_ratio": 0.005604869580306165
      },
      {
        "timestep": 1414,
        "pass_at_1": 0.13942632379040085,
        "avg_reward": 0.09695637154265685,
        "difficulty_1_ratio": 0.21703407392185683,
        "difficulty_2_ratio": 0.412778655730858,
        "difficulty_3_ratio": 0.2888098894295048,
        "difficulty_4_ratio": 0.07433826251589389,
        "difficulty_5_ratio": 0.0070391184018864465
      },
      {
        "timestep": 1515,
        "pass_at_1": 0.14387895829589525,
        "avg_reward": 0.2077170758621631,
        "difficulty_1_ratio": 0.1955832332539105,
        "difficulty_2_ratio": 0.4036208028084852,
        "difficulty_3_ratio": 0.3064227321494006,
        "difficulty_4_ratio": 0.08558032615731795,
        "difficulty_5_ratio": 0.008792905630886071
      },
      {
        "timestep": 1616,
        "pass_at_1": 0.1601960991360906,
        "avg_reward": 0.07527133286107746,
        "difficulty_1_ratio": 0.17528241761460614,
        "difficulty_2_ratio": 0.39249387697759325,
        "difficulty_3_ratio": 0.3233202719632032,
        "difficulty_4_ratio": 0.09798024091278032,
        "difficulty_5_ratio": 0.010923192531817163
      },
      {
        "timestep": 1717,
        "pass_at_1": 0.1815471504842922,
        "avg_reward": 0.08419553788888265,
        "difficulty_1_ratio": 0.15620487203762,
        "difficulty_2_ratio": 0.3795261610306469,
        "difficulty_3_ratio": 0.3392300979084394,
        "difficulty_4_ratio": 0.11154562879642933,
        "difficulty_5_ratio": 0.013493240226864338
      },
      {
        "timestep": 1818,
        "pass_at_1": 0.17397909714879203,
        "avg_reward": 0.04119977152504485,
        "difficulty_1_ratio": 0.13840503524267814,
        "difficulty_2_ratio": 0.36488133073132456,
        "difficulty_3_ratio": 0.3538807296736819,
        "difficulty_4_ratio": 0.12626055765373156,
        "difficulty_5_ratio": 0.016572346698583963
      },
      {
        "timestep": 1919,
        "pass_at_1": 0.14801696353999572,
        "avg_reward": 0.12825663262545275,
        "difficulty_1_ratio": 0.12191786908589192,
        "difficulty_2_ratio": 0.3487544252621549,
        "difficulty_3_ratio": 0.36700975575577915,
        "difficulty_4_ratio": 0.1420826368959247,
        "difficulty_5_ratio": 0.02023531300024945
      },
      {
        "timestep": 2020,
        "pass_at_1": 0.1941998968721299,
        "avg_reward": 0.16392833155720246,
        "difficulty_1_ratio": 0.10675882140395278,
        "difficulty_2_ratio": 0.33136661015926444,
        "difficulty_3_ratio": 0.37837221513402225,
        "difficulty_4_ratio": 0.158940746377412,
        "difficulty_5_ratio": 0.02456160692534847
      },
      {
        "timestep": 2121,
        "pass_at_1": 0.1820360516966936,
        "avg_reward": 0.13057365657789044,
        "difficulty_1_ratio": 0.09292440882580433,
        "difficulty_2_ratio": 0.3129589615253456,
        "difficulty_3_ratio": 0.38774882932075583,
        "difficulty_4_ratio": 0.1767335970180918,
        "difficulty_5_ratio": 0.02963420331000244
      },
      {
        "timestep": 2222,
        "pass_at_1": 0.15976296755332597,
        "avg_reward": 0.09181816362292536,
        "difficulty_1_ratio": 0.08039337269830067,
        "difficulty_2_ratio": 0.29378555928253614,
        "difficulty_3_ratio": 0.3949536745312958,
        "difficulty_4_ratio": 0.19532929872471466,
        "difficulty_5_ratio": 0.03553809476315268
      },
      {
        "timestep": 2323,
        "pass_at_1": 0.18516814645242355,
        "avg_reward": 0.20099062847288462,
        "difficulty_1_ratio": 0.0691283320657602,
        "difficulty_2_ratio": 0.2741062164565189,
        "difficulty_3_ratio": 0.39984089400061734,
        "difficulty_4_ratio": 0.21456607296103805,
        "difficulty_5_ratio": 0.04235848451606555
      },
      {
        "timestep": 2424,
        "pass_at_1": 0.20636093724162372,
        "avg_reward": 0.07693674202516229,
        "difficulty_1_ratio": 0.05907783484757915,
        "difficulty_2_ratio": 0.2541791879471294,
        "difficulty_3_ratio": 0.40231008867116286,
        "difficulty_4_ratio": 0.23425419509772658,
        "difficulty_5_ratio": 0.05017869343640206
      },
      {
        "timestep": 2525,
        "pass_at_1": 0.21113487515104515,
        "avg_reward": 0.14965378610002028,
        "difficulty_1_ratio": 0.050178693436402015,
        "difficulty_2_ratio": 0.2342541950977265,
        "difficulty_3_ratio": 0.40231008867116286,
        "difficulty_4_ratio": 0.2541791879471295,
        "difficulty_5_ratio": 0.059077834847579204
      },
      {
        "timestep": 2626,
        "pass_at_1": 0.19633302960941781,
        "avg_reward": 0.18765023812957765,
        "difficulty_1_ratio": 0.04235848451606552,
        "difficulty_2_ratio": 0.21456607296103797,
        "difficulty_3_ratio": 0.3998408940006174,
        "difficulty_4_ratio": 0.274106216456519,
        "difficulty_5_ratio": 0.06912833206576029
      },
      {
        "timestep": 2727,
        "pass_at_1": 0.23575990041083747,
        "avg_reward": 0.23517192628447992,
        "difficulty_1_ratio": 0.03553809476315264,
        "difficulty_2_ratio": 0.1953292987247146,
        "difficulty_3_ratio": 0.3949536745312958,
        "difficulty_4_ratio": 0.2937855592825363,
        "difficulty_5_ratio": 0.08039337269830077
      },
      {
        "timestep": 2828,
        "pass_at_1": 0.20367053339251862,
        "avg_reward": 0.14747580792145418,
        "difficulty_1_ratio": 0.029634203310002414,
        "difficulty_2_ratio": 0.17673359701809171,
        "difficulty_3_ratio": 0.38774882932075583,
        "difficulty_4_ratio": 0.31295896152534575,
        "difficulty_5_ratio": 0.09292440882580441
      },
      {
        "timestep": 2929,
        "pass_at_1": 0.23243788596833537,
        "avg_reward": 0.23472756513078627,
        "difficulty_1_ratio": 0.02456160692534847,
        "difficulty_2_ratio": 0.158940746377412,
        "difficulty_3_ratio": 0.37837221513402225,
        "difficulty_4_ratio": 0.33136661015926444,
        "difficulty_5_ratio": 0.10675882140395278
      },
      {
        "timestep": 3030,
        "pass_at_1": 0.2216257204260815,
        "avg_reward": 0.16801762750767435,
        "difficulty_1_ratio": 0.020235313000249448,
        "difficulty_2_ratio": 0.14208263689592468,
        "difficulty_3_ratio": 0.3670097557557791,
        "difficulty_4_ratio": 0.34875442526215483,
        "difficulty_5_ratio": 0.12191786908589189
      },
      {
        "timestep": 3131,
        "pass_at_1": 0.21451392200563918,
        "avg_reward": 0.11180080640047782,
        "difficulty_1_ratio": 0.016572346698583963,
        "difficulty_2_ratio": 0.12626055765373156,
        "difficulty_3_ratio": 0.35388072967368184,
        "difficulty_4_ratio": 0.3648813307313245,
        "difficulty_5_ratio": 0.13840503524267814
      },
      {
        "timestep": 3232,
        "pass_at_1": 0.25835324749954347,
        "avg_reward": 0.27449459942817594,
        "difficulty_1_ratio": 0.013493240226864338,
        "difficulty_2_ratio": 0.11154562879642933,
        "difficulty_3_ratio": 0.3392300979084394,
        "difficulty_4_ratio": 0.3795261610306469,
        "difficulty_5_ratio": 0.15620487203762
      },
      {
        "timestep": 3333,
        "pass_at_1": 0.24615109904653054,
        "avg_reward": 0.24709752413182567,
        "difficulty_1_ratio": 0.010923192531817153,
        "difficulty_2_ratio": 0.09798024091278025,
        "difficulty_3_ratio": 0.32332027196320307,
        "difficulty_4_ratio": 0.39249387697759325,
        "difficulty_5_ratio": 0.17528241761460625
      },
      {
        "timestep": 3434,
        "pass_at_1": 0.2603347363964557,
        "avg_reward": 0.17601180138690836,
        "difficulty_1_ratio": 0.00879290563088607,
        "difficulty_2_ratio": 0.08558032615731792,
        "difficulty_3_ratio": 0.3064227321494005,
        "difficulty_4_ratio": 0.40362080280848517,
        "difficulty_5_ratio": 0.19558323325391047
      },
      {
        "timestep": 3535,
        "pass_at_1": 0.2658583983835631,
        "avg_reward": 0.28958854703014897,
        "difficulty_1_ratio": 0.007039118401886442,
        "difficulty_2_ratio": 0.07433826251589386,
        "difficulty_3_ratio": 0.2888098894295048,
        "difficulty_4_ratio": 0.41277865573085804,
        "difficulty_5_ratio": 0.21703407392185695
      },
      {
        "timestep": 3636,
        "pass_at_1": 0.2634557464279372,
        "avg_reward": 0.28899677993305006,
        "difficulty_1_ratio": 0.00560486958030616,
        "difficulty_2_ratio": 0.06422620455155001,
        "difficulty_3_ratio": 0.2707475422306047,
        "difficulty_4_ratio": 0.41987721294759744,
        "difficulty_5_ratio": 0.2395441706899417
      },
      {
        "timestep": 3737,
        "pass_at_1": 0.21732796803251705,
        "avg_reward": 0.21495749964477484,
        "difficulty_1_ratio": 0.004439528870664501,
        "difficulty_2_ratio": 0.05519963957750214,
        "difficulty_3_ratio": 0.2524882182255636,
        "difficulty_4_ratio": 0.42486554340021365,
        "difficulty_5_ratio": 0.2630070699260561
      },
      {
        "timestep": 3838,
        "pass_at_1": 0.2770187190480687,
        "avg_reward": 0.2066646077151616,
        "difficulty_1_ratio": 0.0034986387011453407,
        "difficulty_2_ratio": 0.04720098526509968,
        "difficulty_3_ratio": 0.23426561605703436,
        "difficulty_4_ratio": 0.4277318152433385,
        "difficulty_5_ratio": 0.2873029447333821
      },
      {
        "timestep": 3939,
        "pass_at_1": 0.2826676741107592,
        "avg_reward": 0.12675569355856273,
        "difficulty_1_ratio": 0.0027436096858948753,
        "difficulty_2_ratio": 0.04016307038955698,
        "difficulty_3_ratio": 0.21629028030484038,
        "difficulty_4_ratio": 0.4285017684753959,
        "difficulty_5_ratio": 0.31230127114431194
      },
      {
        "timestep": 4040,
        "pass_at_1": 0.28198894445015027,
        "avg_reward": 0.24344678413570753,
        "difficulty_1_ratio": 0.0021413108924466314,
        "difficulty_2_ratio": 0.03401237165049899,
        "difficulty_3_ratio": 0.19874656153923254,
        "difficulty_4_ratio": 0.4272360092470168,
        "difficulty_5_ratio": 0.337863746670805
      },
      {
        "timestep": 4141,
        "pass_at_1": 0.32148091436922327,
        "avg_reward": 0.23127122058169625,
        "difficulty_1_ratio": 0.0016635921904528726,
        "difficulty_2_ratio": 0.02867191321650665,
        "difficulty_3_ratio": 0.18179083819928796,
        "difficulty_4_ratio": 0.42402633368046766,
        "difficulty_5_ratio": 0.3638473227132848
      },
      {
        "timestep": 4242,
        "pass_at_1": 0.28128005540482287,
        "avg_reward": 0.19993619214463149,
        "difficulty_1_ratio": 0.0012867709267507727,
        "difficulty_2_ratio": 0.02406376907052859,
        "difficulty_3_ratio": 0.16555091314798218,
        "difficulty_4_ratio": 0.41899132195937727,
        "difficulty_5_ratio": 0.3901072248953611
      },
      {
        "timestep": 4343,
        "pass_at_1": 0.3212666662288457,
        "avg_reward": 0.27345088846606075,
        "difficulty_1_ratio": 0.0009911095206882065,
        "difficulty_2_ratio": 0.020111139111240753,
        "difficulty_3_ratio": 0.15012644832783265,
        "difficulty_4_ratio": 0.41227145735706805,
        "difficulty_5_ratio": 0.4164998456831704
      },
      {
        "timestep": 4444,
        "pass_at_1": 0.2978495371078624,
        "avg_reward": 0.2639430013419577,
        "difficulty_1_ratio": 0.0007603048025599186,
        "difficulty_2_ratio": 0.01673999664411949,
        "difficulty_3_ratio": 0.1355902674936002,
        "difficulty_4_ratio": 0.40402402094501866,
        "difficulty_5_ratio": 0.44288541011470167
      },
      {
        "timestep": 4545,
        "pass_at_1": 0.3158455213618025,
        "avg_reward": 0.3011086666160865,
        "difficulty_1_ratio": 0.0005810044175062084,
        "difficulty_2_ratio": 0.013880326375356472,
        "difficulty_3_ratio": 0.12199033943415054,
        "difficulty_4_ratio": 0.3944179935925989,
        "difficulty_5_ratio": 0.4691303361803878
      },
      {
        "timestep": 4646,
        "pass_at_1": 0.3052910263270296,
        "avg_reward": 0.2278497137317353,
        "difficulty_1_ratio": 0.00044236066314863197,
        "difficulty_2_ratio": 0.011466987914927403,
        "difficulty_3_ratio": 0.10935225097641141,
        "difficulty_4_ratio": 0.3836291661319077,
        "difficulty_5_ratio": 0.49510923431360493
      },
      {
        "timestep": 4747,
        "pass_at_1": 0.31688280680977227,
        "avg_reward": 0.18033049804121187,
        "difficulty_1_ratio": 0.0003356278889601711,
        "difficulty_2_ratio": 0.009440250235689705,
        "difficulty_3_ratio": 0.09768198799373934,
        "difficulty_4_ratio": 0.3718356202546845,
        "difficulty_5_ratio": 0.5207065136269263
      },
      {
        "timestep": 4848,
        "pass_at_1": 0.3360010065880148,
        "avg_reward": 0.2818535688794063,
        "difficulty_1_ratio": 0.00025380613218624744,
        "difficulty_2_ratio": 0.007746048051242511,
        "difficulty_3_ratio": 0.08696886068067541,
        "difficulty_4_ratio": 0.3592137008263375,
        "difficulty_5_ratio": 0.5458175843095583
      },
      {
        "timestep": 4949,
        "pass_at_1": 0.3354913582956962,
        "avg_reward": 0.2566637299677996,
        "difficulty_1_ratio": 0.00019133099735093795,
        "difficulty_2_ratio": 0.006336012450983673,
        "difficulty_3_ratio": 0.0771884334190506,
        "difficulty_4_ratio": 0.3459345584106765,
        "difficulty_5_ratio": 0.5703496647219383
      },
      {
        "timestep": 5050,
        "pass_at_1": 0.31234525909362726,
        "avg_reward": 0.22884394113663387
      },
      {
        "timestep": 5151,
        "pass_at_1": 0.3390114466943541,
        "avg_reward": 0.23109529389440234
      },
      {
        "timestep": 5252,
        "pass_at_1": 0.34779909659637576,
        "avg_reward": 0.29844182011782755
      },
      {
        "timestep": 5353,
        "pass_at_1": 0.393850304365003,
        "avg_reward": 0.32380913413359436
      },
      {
        "timestep": 5454,
        "pass_at_1": 0.36631892787383813,
        "avg_reward": 0.2893328465107622
      },
      {
        "timestep": 5555,
        "pass_at_1": 0.32777041563811093,
        "avg_reward": 0.2608906387380279
      },
      {
        "timestep": 5656,
        "pass_at_1": 0.37226215458365386,
        "avg_reward": 0.4209718292911874
      },
      {
        "timestep": 5757,
        "pass_at_1": 0.3720532169075757,
        "avg_reward": 0.31271994064274117
      },
      {
        "timestep": 5858,
        "pass_at_1": 0.3799778302942769,
        "avg_reward": 0.2455483623544449
      },
      {
        "timestep": 5959,
        "pass_at_1": 0.4082266489759283,
        "avg_reward": 0.3641779708150814
      },
      {
        "timestep": 6060,
        "pass_at_1": 0.40581339670238326,
        "avg_reward": 0.2791813446221697
      },
      {
        "timestep": 6161,
        "pass_at_1": 0.42259377469593085,
        "avg_reward": 0.26798246661713065
      },
      {
        "timestep": 6262,
        "pass_at_1": 0.4107410406826342,
        "avg_reward": 0.4381156138366063
      },
      {
        "timestep": 6363,
        "pass_at_1": 0.3835785612395736,
        "avg_reward": 0.27854796251152036
      },
      {
        "timestep": 6464,
        "pass_at_1": 0.40968576443654253,
        "avg_reward": 0.3025748288434241
      },
      {
        "timestep": 6565,
        "pass_at_1": 0.3808998401976321,
        "avg_reward": 0.30814802089840704
      },
      {
        "timestep": 6666,
        "pass_at_1": 0.39480336680220035,
        "avg_reward": 0.33952231497351937
      },
      {
        "timestep": 6767,
        "pass_at_1": 0.40171245981163195,
        "avg_reward": 0.39886668810018255
      },
      {
        "timestep": 6868,
        "pass_at_1": 0.4084019314362599,
        "avg_reward": 0.31061846933872417
      },
      {
        "timestep": 6969,
        "pass_at_1": 0.4442174844278841,
        "avg_reward": 0.29383077172060956
      },
      {
        "timestep": 7070,
        "pass_at_1": 0.4362902690535208,
        "avg_reward": 0.41438935295693813
      },
      {
        "timestep": 7171,
        "pass_at_1": 0.40329897175354124,
        "avg_reward": 0.3318708703294482
      },
      {
        "timestep": 7272,
        "pass_at_1": 0.4442674870822712,
        "avg_reward": 0.3945051332546825
      },
      {
        "timestep": 7373,
        "pass_at_1": 0.4178657712574805,
        "avg_reward": 0.26826978635177057
      },
      {
        "timestep": 7474,
        "pass_at_1": 0.4564925926701584,
        "avg_reward": 0.38004330779778606
      },
      {
        "timestep": 7575,
        "pass_at_1": 0.45442700223574806,
        "avg_reward": 0.38086401226344724
      },
      {
        "timestep": 7676,
        "pass_at_1": 0.4390949463162419,
        "avg_reward": 0.3628886419110437
      },
      {
        "timestep": 7777,
        "pass_at_1": 0.4617507112299003,
        "avg_reward": 0.3336829980826019
      },
      {
        "timestep": 7878,
        "pass_at_1": 0.496314815434198,
        "avg_reward": 0.4207434983929478
      },
      {
        "timestep": 7979,
        "pass_at_1": 0.43820037408299173,
        "avg_reward": 0.3833879796980849
      },
      {
        "timestep": 8080,
        "pass_at_1": 0.4454778867237105,
        "avg_reward": 0.395736539566091
      },
      {
        "timestep": 8181,
        "pass_at_1": 0.4910074490614545,
        "avg_reward": 0.35177184333157807
      },
      {
        "timestep": 8282,
        "pass_at_1": 0.48988707787812324,
        "avg_reward": 0.4125487086493235
      },
      {
        "timestep": 8383,
        "pass_at_1": 0.48976590455185354,
        "avg_reward": 0.4866523727741802
      },
      {
        "timestep": 8484,
        "pass_at_1": 0.47104440321860785,
        "avg_reward": 0.33914871435701177
      },
      {
        "timestep": 8585,
        "pass_at_1": 0.4607129049401453,
        "avg_reward": 0.32777980970384435
      },
      {
        "timestep": 8686,
        "pass_at_1": 0.47943704653774677,
        "avg_reward": 0.4006072359710296
      },
      {
        "timestep": 8787,
        "pass_at_1": 0.4889149823490904,
        "avg_reward": 0.43249114833107355
      },
      {
        "timestep": 8888,
        "pass_at_1": 0.4859708657496384,
        "avg_reward": 0.46145339645757655
      },
      {
        "timestep": 8989,
        "pass_at_1": 0.48267633902619234,
        "avg_reward": 0.5221495295504348
      },
      {
        "timestep": 9090,
        "pass_at_1": 0.5026718946882761,
        "avg_reward": 0.35927963792980677
      },
      {
        "timestep": 9191,
        "pass_at_1": 0.47086165495655613,
        "avg_reward": 0.40081294472740414
      },
      {
        "timestep": 9292,
        "pass_at_1": 0.48986457065124694,
        "avg_reward": 0.42759168122560215
      },
      {
        "timestep": 9393,
        "pass_at_1": 0.5057877575363601,
        "avg_reward": 0.4009887603962444
      },
      {
        "timestep": 9494,
        "pass_at_1": 0.4813126693948933,
        "avg_reward": 0.30930777428162143
      },
      {
        "timestep": 9595,
        "pass_at_1": 0.49118165217484294,
        "avg_reward": 0.435765261456048
      },
      {
        "timestep": 9696,
        "pass_at_1": 0.5061966133935483,
        "avg_reward": 0.34267035177923927
      },
      {
        "timestep": 9797,
        "pass_at_1": 0.5071220342685439,
        "avg_reward": 0.42496349640127695
      },
      {
        "timestep": 9898,
        "pass_at_1": 0.48766734025432884,
        "avg_reward": 0.3978201275007395
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.5081386316704389,
        "avg_reward": 0.34936239044482
      }
    ],
    "eval_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.5703496647219384,
        "difficulty_2_ratio": 0.34593455841067655,
        "difficulty_3_ratio": 0.0771884334190506,
        "difficulty_4_ratio": 0.006336012450983674,
        "difficulty_5_ratio": 0.00019133099735093797
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.5081386316704389,
        "avg_reward": 0.34936239044482
      }
    ],
    "timing_metrics": [
      {
        "timestep": 0,
        "throughput": 4.5,
        "update": 1,
        "cumulative_wall_time": 11.11111111111111
      },
      {
        "timestep": 101,
        "throughput": 4.95,
        "update": 2,
        "cumulative_wall_time": 22.22222222222222
      },
      {
        "timestep": 202,
        "throughput": 5.3999999999999995,
        "update": 3,
        "cumulative_wall_time": 33.33333333333333
      },
      {
        "timestep": 303,
        "throughput": 5.8500000000000005,
        "update": 4,
        "cumulative_wall_time": 44.44444444444444
      },
      {
        "timestep": 404,
        "throughput": 6.3,
        "update": 5,
        "cumulative_wall_time": 55.55555555555556
      },
      {
        "timestep": 505,
        "throughput": 6.75,
        "update": 6,
        "cumulative_wall_time": 66.66666666666667
      },
      {
        "timestep": 606,
        "throughput": 7.2,
        "update": 7,
        "cumulative_wall_time": 77.77777777777779
      },
      {
        "timestep": 707,
        "throughput": 7.6499999999999995,
        "update": 8,
        "cumulative_wall_time": 88.8888888888889
      },
      {
        "timestep": 808,
        "throughput": 8.1,
        "update": 9,
        "cumulative_wall_time": 100.00000000000001
      },
      {
        "timestep": 909,
        "throughput": 8.549999999999999,
        "update": 10,
        "cumulative_wall_time": 111.11111111111113
      },
      {
        "timestep": 1010,
        "throughput": 9.322008624313455,
        "update": 11,
        "cumulative_wall_time": 122.22222222222224
      },
      {
        "timestep": 1111,
        "throughput": 9.50470607373141,
        "update": 12,
        "cumulative_wall_time": 133.33333333333334
      },
      {
        "timestep": 1212,
        "throughput": 9.97474611885775,
        "update": 13,
        "cumulative_wall_time": 144.44444444444446
      },
      {
        "timestep": 1313,
        "throughput": 9.948421846831412,
        "update": 14,
        "cumulative_wall_time": 155.55555555555557
      },
      {
        "timestep": 1414,
        "throughput": 7.760097568838619,
        "update": 15,
        "cumulative_wall_time": 166.66666666666669
      },
      {
        "timestep": 1515,
        "throughput": 8.155957464076389,
        "update": 16,
        "cumulative_wall_time": 177.7777777777778
      },
      {
        "timestep": 1616,
        "throughput": 9.463531740487793,
        "update": 17,
        "cumulative_wall_time": 188.8888888888889
      },
      {
        "timestep": 1717,
        "throughput": 9.462407355820988,
        "update": 18,
        "cumulative_wall_time": 200.00000000000003
      },
      {
        "timestep": 1818,
        "throughput": 9.463542917675442,
        "update": 19,
        "cumulative_wall_time": 211.11111111111114
      },
      {
        "timestep": 1919,
        "throughput": 12.46745834158925,
        "update": 20,
        "cumulative_wall_time": 222.22222222222226
      },
      {
        "timestep": 2020,
        "throughput": 9.513801459623851,
        "update": 21,
        "cumulative_wall_time": 233.33333333333337
      },
      {
        "timestep": 2121,
        "throughput": 10.022009076162538,
        "update": 22,
        "cumulative_wall_time": 244.44444444444449
      },
      {
        "timestep": 2222,
        "throughput": 9.858601587143882,
        "update": 23,
        "cumulative_wall_time": 255.5555555555556
      },
      {
        "timestep": 2323,
        "throughput": 9.586252126175218,
        "update": 24,
        "cumulative_wall_time": 266.6666666666667
      },
      {
        "timestep": 2424,
        "throughput": 8.716257679823688,
        "update": 25,
        "cumulative_wall_time": 277.77777777777777
      },
      {
        "timestep": 2525,
        "throughput": 9.683072298443943,
        "update": 26,
        "cumulative_wall_time": 288.88888888888886
      },
      {
        "timestep": 2626,
        "throughput": 8.304457306916186,
        "update": 27,
        "cumulative_wall_time": 299.99999999999994
      },
      {
        "timestep": 2727,
        "throughput": 8.786863253933992,
        "update": 28,
        "cumulative_wall_time": 311.11111111111103
      },
      {
        "timestep": 2828,
        "throughput": 8.563172806953807,
        "update": 29,
        "cumulative_wall_time": 322.2222222222221
      },
      {
        "timestep": 2929,
        "throughput": 9.07368672544769,
        "update": 30,
        "cumulative_wall_time": 333.3333333333332
      },
      {
        "timestep": 3030,
        "throughput": 11.083192710006157,
        "update": 31,
        "cumulative_wall_time": 344.4444444444443
      },
      {
        "timestep": 3131,
        "throughput": 7.319461326667427,
        "update": 32,
        "cumulative_wall_time": 355.5555555555554
      },
      {
        "timestep": 3232,
        "throughput": 9.61763417133706,
        "update": 33,
        "cumulative_wall_time": 366.66666666666646
      },
      {
        "timestep": 3333,
        "throughput": 7.5485557159293135,
        "update": 34,
        "cumulative_wall_time": 377.77777777777754
      },
      {
        "timestep": 3434,
        "throughput": 8.57526132078951,
        "update": 35,
        "cumulative_wall_time": 388.88888888888863
      },
      {
        "timestep": 3535,
        "throughput": 9.98005553727063,
        "update": 36,
        "cumulative_wall_time": 399.9999999999997
      },
      {
        "timestep": 3636,
        "throughput": 9.057852017185915,
        "update": 37,
        "cumulative_wall_time": 411.1111111111108
      },
      {
        "timestep": 3737,
        "throughput": 8.030029699863626,
        "update": 38,
        "cumulative_wall_time": 422.2222222222219
      },
      {
        "timestep": 3838,
        "throughput": 8.356226661666028,
        "update": 39,
        "cumulative_wall_time": 433.333333333333
      },
      {
        "timestep": 3939,
        "throughput": 9.611637974041207,
        "update": 40,
        "cumulative_wall_time": 444.44444444444406
      },
      {
        "timestep": 4040,
        "throughput": 8.342670031454578,
        "update": 41,
        "cumulative_wall_time": 455.55555555555515
      },
      {
        "timestep": 4141,
        "throughput": 9.194812730623779,
        "update": 42,
        "cumulative_wall_time": 466.66666666666623
      },
      {
        "timestep": 4242,
        "throughput": 9.041014655913433,
        "update": 43,
        "cumulative_wall_time": 477.7777777777773
      },
      {
        "timestep": 4343,
        "throughput": 8.413559687154764,
        "update": 44,
        "cumulative_wall_time": 488.8888888888884
      },
      {
        "timestep": 4444,
        "throughput": 10.929549680392794,
        "update": 45,
        "cumulative_wall_time": 499.9999999999995
      },
      {
        "timestep": 4545,
        "throughput": 9.57052712008621,
        "update": 46,
        "cumulative_wall_time": 511.1111111111106
      },
      {
        "timestep": 4646,
        "throughput": 7.177371672008154,
        "update": 47,
        "cumulative_wall_time": 522.2222222222217
      },
      {
        "timestep": 4747,
        "throughput": 9.167808883292485,
        "update": 48,
        "cumulative_wall_time": 533.3333333333328
      },
      {
        "timestep": 4848,
        "throughput": 8.40439218170845,
        "update": 49,
        "cumulative_wall_time": 544.4444444444439
      },
      {
        "timestep": 4949,
        "throughput": 9.767190001316601,
        "update": 50,
        "cumulative_wall_time": 555.555555555555
      },
      {
        "timestep": 5050,
        "throughput": 8.28673133541057,
        "update": 51,
        "cumulative_wall_time": 566.6666666666661
      },
      {
        "timestep": 5151,
        "throughput": 8.896737202679791,
        "update": 52,
        "cumulative_wall_time": 577.7777777777771
      },
      {
        "timestep": 5252,
        "throughput": 9.454488551082411,
        "update": 53,
        "cumulative_wall_time": 588.8888888888882
      },
      {
        "timestep": 5353,
        "throughput": 9.77917967475311,
        "update": 54,
        "cumulative_wall_time": 599.9999999999993
      },
      {
        "timestep": 5454,
        "throughput": 7.919733233649801,
        "update": 55,
        "cumulative_wall_time": 611.1111111111104
      },
      {
        "timestep": 5555,
        "throughput": 8.698948887743146,
        "update": 56,
        "cumulative_wall_time": 622.2222222222215
      },
      {
        "timestep": 5656,
        "throughput": 8.572549219955139,
        "update": 57,
        "cumulative_wall_time": 633.3333333333326
      },
      {
        "timestep": 5757,
        "throughput": 8.41200369068366,
        "update": 58,
        "cumulative_wall_time": 644.4444444444437
      },
      {
        "timestep": 5858,
        "throughput": 10.588908816252987,
        "update": 59,
        "cumulative_wall_time": 655.5555555555547
      },
      {
        "timestep": 5959,
        "throughput": 9.36448353986486,
        "update": 60,
        "cumulative_wall_time": 666.6666666666658
      },
      {
        "timestep": 6060,
        "throughput": 7.8652044410984585,
        "update": 61,
        "cumulative_wall_time": 677.7777777777769
      },
      {
        "timestep": 6161,
        "throughput": 9.826075752349299,
        "update": 62,
        "cumulative_wall_time": 688.888888888888
      },
      {
        "timestep": 6262,
        "throughput": 10.90994057731137,
        "update": 63,
        "cumulative_wall_time": 699.9999999999991
      },
      {
        "timestep": 6363,
        "throughput": 9.929218734496033,
        "update": 64,
        "cumulative_wall_time": 711.1111111111102
      },
      {
        "timestep": 6464,
        "throughput": 7.632567030641388,
        "update": 65,
        "cumulative_wall_time": 722.2222222222213
      },
      {
        "timestep": 6565,
        "throughput": 8.564189334420373,
        "update": 66,
        "cumulative_wall_time": 733.3333333333323
      },
      {
        "timestep": 6666,
        "throughput": 10.14022003426796,
        "update": 67,
        "cumulative_wall_time": 744.4444444444434
      },
      {
        "timestep": 6767,
        "throughput": 8.363097480943097,
        "update": 68,
        "cumulative_wall_time": 755.5555555555545
      },
      {
        "timestep": 6868,
        "throughput": 9.399437485331605,
        "update": 69,
        "cumulative_wall_time": 766.6666666666656
      },
      {
        "timestep": 6969,
        "throughput": 9.697170648086404,
        "update": 70,
        "cumulative_wall_time": 777.7777777777767
      },
      {
        "timestep": 7070,
        "throughput": 8.165762575579725,
        "update": 71,
        "cumulative_wall_time": 788.8888888888878
      },
      {
        "timestep": 7171,
        "throughput": 8.94642717954438,
        "update": 72,
        "cumulative_wall_time": 799.9999999999989
      },
      {
        "timestep": 7272,
        "throughput": 6.082859393937834,
        "update": 73,
        "cumulative_wall_time": 811.11111111111
      },
      {
        "timestep": 7373,
        "throughput": 8.078051122799138,
        "update": 74,
        "cumulative_wall_time": 822.222222222221
      },
      {
        "timestep": 7474,
        "throughput": 8.772688663746155,
        "update": 75,
        "cumulative_wall_time": 833.3333333333321
      },
      {
        "timestep": 7575,
        "throughput": 7.876995136231635,
        "update": 76,
        "cumulative_wall_time": 844.4444444444432
      },
      {
        "timestep": 7676,
        "throughput": 10.469170173538473,
        "update": 77,
        "cumulative_wall_time": 855.5555555555543
      },
      {
        "timestep": 7777,
        "throughput": 7.71287275983543,
        "update": 78,
        "cumulative_wall_time": 866.6666666666654
      },
      {
        "timestep": 7878,
        "throughput": 8.603959961972715,
        "update": 79,
        "cumulative_wall_time": 877.7777777777765
      },
      {
        "timestep": 7979,
        "throughput": 9.117666519557481,
        "update": 80,
        "cumulative_wall_time": 888.8888888888875
      },
      {
        "timestep": 8080,
        "throughput": 10.297145960159504,
        "update": 81,
        "cumulative_wall_time": 899.9999999999986
      },
      {
        "timestep": 8181,
        "throughput": 7.707724063938505,
        "update": 82,
        "cumulative_wall_time": 911.1111111111097
      },
      {
        "timestep": 8282,
        "throughput": 10.046847376939462,
        "update": 83,
        "cumulative_wall_time": 922.2222222222208
      },
      {
        "timestep": 8383,
        "throughput": 9.009209754917627,
        "update": 84,
        "cumulative_wall_time": 933.3333333333319
      },
      {
        "timestep": 8484,
        "throughput": 8.116642214056844,
        "update": 85,
        "cumulative_wall_time": 944.444444444443
      },
      {
        "timestep": 8585,
        "throughput": 9.415893126836945,
        "update": 86,
        "cumulative_wall_time": 955.5555555555541
      },
      {
        "timestep": 8686,
        "throughput": 9.179153726016121,
        "update": 87,
        "cumulative_wall_time": 966.6666666666652
      },
      {
        "timestep": 8787,
        "throughput": 8.459804810557085,
        "update": 88,
        "cumulative_wall_time": 977.7777777777762
      },
      {
        "timestep": 8888,
        "throughput": 9.062821876491016,
        "update": 89,
        "cumulative_wall_time": 988.8888888888873
      },
      {
        "timestep": 8989,
        "throughput": 8.653217762824415,
        "update": 90,
        "cumulative_wall_time": 999.9999999999984
      },
      {
        "timestep": 9090,
        "throughput": 9.102165610726123,
        "update": 91,
        "cumulative_wall_time": 1011.1111111111095
      },
      {
        "timestep": 9191,
        "throughput": 9.595917607068941,
        "update": 92,
        "cumulative_wall_time": 1022.2222222222206
      },
      {
        "timestep": 9292,
        "throughput": 10.427415134530817,
        "update": 93,
        "cumulative_wall_time": 1033.3333333333317
      },
      {
        "timestep": 9393,
        "throughput": 7.885966051055837,
        "update": 94,
        "cumulative_wall_time": 1044.4444444444428
      },
      {
        "timestep": 9494,
        "throughput": 10.919730037190641,
        "update": 95,
        "cumulative_wall_time": 1055.5555555555538
      },
      {
        "timestep": 9595,
        "throughput": 7.243120980429748,
        "update": 96,
        "cumulative_wall_time": 1066.666666666665
      },
      {
        "timestep": 9696,
        "throughput": 8.863393414467975,
        "update": 97,
        "cumulative_wall_time": 1077.777777777776
      },
      {
        "timestep": 9797,
        "throughput": 9.529485485836119,
        "update": 98,
        "cumulative_wall_time": 1088.888888888887
      },
      {
        "timestep": 9898,
        "throughput": 9.252892680961528,
        "update": 99,
        "cumulative_wall_time": 1099.9999999999982
      },
      {
        "timestep": 10000,
        "throughput": 8.439570432161466,
        "update": 100,
        "cumulative_wall_time": 1111.1111111111093
      }
    ],
    "scheduler_stats": {
      "total_experiences": 10000,
      "total_updates": 500,
      "policy_version": 500,
      "buffer_size": 1024,
      "curriculum": {
        "level_1": {
          "num_pulls": 1500,
          "success_rate": 0.85,
          "mean_reward": 0.7608375549928545,
          "recent_gradient": 0.009013998130682335
        },
        "level_2": {
          "num_pulls": 2000,
          "success_rate": 0.65,
          "mean_reward": 0.5732127048611159,
          "recent_gradient": 0.02169920419404205
        },
        "level_3": {
          "num_pulls": 2500,
          "success_rate": 0.45,
          "mean_reward": 0.412140309719301,
          "recent_gradient": 0.028614180809478692
        },
        "level_4": {
          "num_pulls": 2500,
          "success_rate": 0.28,
          "mean_reward": 0.2699919975086651,
          "recent_gradient": 0.02061459904175322
        },
        "level_5": {
          "num_pulls": 1500,
          "success_rate": 0.15,
          "mean_reward": 0.1512572423767792,
          "recent_gradient": 0.011259257683847225
        },
        "total_steps": 10000
      },
      "staleness": {
        "discard_rate": 0.15
      },
      "workers": {
        "0": {
          "completed_tasks": 2500,
          "avg_throughput": 4.5855024945389635
        },
        "1": {
          "completed_tasks": 2500,
          "avg_throughput": 4.719909479901515
        },
        "2": {
          "completed_tasks": 2500,
          "avg_throughput": 5.373646802561631
        },
        "3": {
          "completed_tasks": 2500,
          "avg_throughput": 5.3051851327167325
        }
      }
    },
    "final_pass_at_1": 0.5149171624758753,
    "final_pass_at_1_std": 0.015580873953549118,
    "avg_throughput": 8.76290925269221,
    "avg_throughput_std": 0.0813369471995853,
    "wall_time_mean": 0.0,
    "num_runs": 3
  },
  "async": {
    "train_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 101,
        "pass_at_1": 0.021034578842821932,
        "avg_reward": 0.09297915589465883,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 202,
        "pass_at_1": 0.011478548667149445,
        "avg_reward": -0.0025240089137394707,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 303,
        "pass_at_1": 0.055826680552572075,
        "avg_reward": 0.0830330808997031,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 404,
        "pass_at_1": 0.022933744604533287,
        "avg_reward": 0.04547499786292486,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 505,
        "pass_at_1": 0.1265196819810451,
        "avg_reward": 0.07792925790632324,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 606,
        "pass_at_1": 0.1424450753945836,
        "avg_reward": 0.018292048082776985,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 707,
        "pass_at_1": 0.10493675980408412,
        "avg_reward": 0.055835031381218675,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 808,
        "pass_at_1": 0.12101900545406562,
        "avg_reward": 0.11252757099301619,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 909,
        "pass_at_1": 0.12496660732171129,
        "avg_reward": 0.029358100790604455,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1010,
        "pass_at_1": 0.17430219161624838,
        "avg_reward": 0.1281529382686719,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1111,
        "pass_at_1": 0.14821228339190765,
        "avg_reward": 0.04733241740285328,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1212,
        "pass_at_1": 0.1378566452363835,
        "avg_reward": 0.11583144567460012,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1313,
        "pass_at_1": 0.1276167803361163,
        "avg_reward": 0.12087832518617664,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1414,
        "pass_at_1": 0.14052568914436872,
        "avg_reward": 0.09783586382583115,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1515,
        "pass_at_1": 0.1424152808144994,
        "avg_reward": 0.2065461338770464,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1616,
        "pass_at_1": 0.15609923106824833,
        "avg_reward": 0.07199383840680365,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1717,
        "pass_at_1": 0.17474831539390057,
        "avg_reward": 0.07875646981656934,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1818,
        "pass_at_1": 0.16441106999734761,
        "avg_reward": 0.033545349803889304,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1919,
        "pass_at_1": 0.13561425148378498,
        "avg_reward": 0.11833446298048417,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2020,
        "pass_at_1": 0.17889891992485982,
        "avg_reward": 0.15168754999938638,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2121,
        "pass_at_1": 0.16377532237162765,
        "avg_reward": 0.11596507311783769,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2222,
        "pass_at_1": 0.13848326856826595,
        "avg_reward": 0.07479440443487734,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2323,
        "pass_at_1": 0.16081270555692365,
        "avg_reward": 0.1815062757564847,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2424,
        "pass_at_1": 0.17887559820927704,
        "avg_reward": 0.05494847079928494,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2525,
        "pass_at_1": 0.18046826397110474,
        "avg_reward": 0.12512049715606796,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2626,
        "pass_at_1": 0.16243671491189088,
        "avg_reward": 0.16053318637155609,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2727,
        "pass_at_1": 0.19858854716789032,
        "avg_reward": 0.2054348436901222,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2828,
        "pass_at_1": 0.1631820489568339,
        "avg_reward": 0.1150850203729064,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2929,
        "pass_at_1": 0.18859355753610915,
        "avg_reward": 0.1996521023850053,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3030,
        "pass_at_1": 0.17439034304865847,
        "avg_reward": 0.1302293256057359,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3131,
        "pass_at_1": 0.16385591631923654,
        "avg_reward": 0.0712744018513557,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3232,
        "pass_at_1": 0.20424476639685424,
        "avg_reward": 0.23120781454602457,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3333,
        "pass_at_1": 0.18856812257681735,
        "avg_reward": 0.20103114295605512,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3434,
        "pass_at_1": 0.1992571542515187,
        "avg_reward": 0.12714973567095872,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3535,
        "pass_at_1": 0.20127007940501063,
        "avg_reward": 0.237917891847307,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3636,
        "pass_at_1": 0.1953445946557213,
        "avg_reward": 0.23450785851527736,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3737,
        "pass_at_1": 0.14568596490480212,
        "avg_reward": 0.1576438971426029,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3838,
        "pass_at_1": 0.2018419514571851,
        "avg_reward": 0.1465231936424547,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3939,
        "pass_at_1": 0.2039563481181623,
        "avg_reward": 0.06378663276448521,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4040,
        "pass_at_1": 0.19974738456381627,
        "avg_reward": 0.17765353622664035,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4141,
        "pass_at_1": 0.23571754838857376,
        "avg_reward": 0.16266052779717663,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4242,
        "pass_at_1": 0.1920073849398693,
        "avg_reward": 0.12851805577266862,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4343,
        "pass_at_1": 0.2285012231005743,
        "avg_reward": 0.19923853396344368,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4444,
        "pass_at_1": 0.20161182593475274,
        "avg_reward": 0.18695283240347002,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4545,
        "pass_at_1": 0.21615994873164326,
        "avg_reward": 0.2213602085119591,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4646,
        "pass_at_1": 0.20218581704279096,
        "avg_reward": 0.14536554630434437,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4747,
        "pass_at_1": 0.21038990778221633,
        "avg_reward": 0.09513617881916714,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4848,
        "pass_at_1": 0.22615597902507736,
        "avg_reward": 0.19397754682905635,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4949,
        "pass_at_1": 0.2223332589086768,
        "avg_reward": 0.16613725045818412,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 5050,
        "pass_at_1": 0.1959165111022232,
        "avg_reward": 0.1357009427435106
      },
      {
        "timestep": 5151,
        "pass_at_1": 0.21935770146603534,
        "avg_reward": 0.13537229771174733
      },
      {
        "timestep": 5252,
        "pass_at_1": 0.2249690868001501,
        "avg_reward": 0.20017781228084702
      },
      {
        "timestep": 5353,
        "pass_at_1": 0.2678956895550048,
        "avg_reward": 0.2230454422855958
      },
      {
        "timestep": 5454,
        "pass_at_1": 0.23729413344429587,
        "avg_reward": 0.18611301096712835
      },
      {
        "timestep": 5555,
        "pass_at_1": 0.19573246610812844,
        "avg_reward": 0.15526027911404194
      },
      {
        "timestep": 5656,
        "pass_at_1": 0.23727050217805074,
        "avg_reward": 0.3129785073667049
      },
      {
        "timestep": 5757,
        "pass_at_1": 0.23416956639903566,
        "avg_reward": 0.20241302023590915
      },
      {
        "timestep": 5858,
        "pass_at_1": 0.23926596106266296,
        "avg_reward": 0.13297886696915376
      },
      {
        "timestep": 5959,
        "pass_at_1": 0.2647522352233031,
        "avg_reward": 0.24939843981298118
      },
      {
        "timestep": 6060,
        "pass_at_1": 0.25964382673761766,
        "avg_reward": 0.16224568865035718
      },
      {
        "timestep": 6161,
        "pass_at_1": 0.27379797017141566,
        "avg_reward": 0.1489458229975185
      },
      {
        "timestep": 6262,
        "pass_at_1": 0.2593892766282391,
        "avg_reward": 0.3170342025930902
      },
      {
        "timestep": 6363,
        "pass_at_1": 0.22974228769634816,
        "avg_reward": 0.15547894367693993
      },
      {
        "timestep": 6464,
        "pass_at_1": 0.25343743044549427,
        "avg_reward": 0.17757616165058546
      },
      {
        "timestep": 6565,
        "pass_at_1": 0.22231272084801584,
        "avg_reward": 0.18127832541871405
      },
      {
        "timestep": 6666,
        "pass_at_1": 0.23395139398987144,
        "avg_reward": 0.21084073672365622
      },
      {
        "timestep": 6767,
        "pass_at_1": 0.23867005730192498,
        "avg_reward": 0.26843276609241695
      },
      {
        "timestep": 6868,
        "pass_at_1": 0.2432438547682584,
        "avg_reward": 0.17849200800432297
      },
      {
        "timestep": 6969,
        "pass_at_1": 0.2770186661385657,
        "avg_reward": 0.1600717170891548
      },
      {
        "timestep": 7070,
        "pass_at_1": 0.26712566964172435,
        "avg_reward": 0.2790576734275009
      },
      {
        "timestep": 7171,
        "pass_at_1": 0.2322434367456246,
        "avg_reward": 0.1950264423231149
      },
      {
        "timestep": 7272,
        "pass_at_1": 0.27139561050425226,
        "avg_reward": 0.2562076319922673
      },
      {
        "timestep": 7373,
        "pass_at_1": 0.24325176576287028,
        "avg_reward": 0.1285785819560824
      },
      {
        "timestep": 7474,
        "pass_at_1": 0.28021016651903696,
        "avg_reward": 0.23901736687688888
      },
      {
        "timestep": 7575,
        "pass_at_1": 0.2765492432692698,
        "avg_reward": 0.23856180509026462
      },
      {
        "timestep": 7676,
        "pass_at_1": 0.2596942130219977,
        "avg_reward": 0.21936805527564834
      },
      {
        "timestep": 7777,
        "pass_at_1": 0.2808985309476607,
        "avg_reward": 0.1890012538568102
      },
      {
        "timestep": 7878,
        "pass_at_1": 0.31408178970871287,
        "avg_reward": 0.2749570778125597
      },
      {
        "timestep": 7979,
        "pass_at_1": 0.2546560911308627,
        "avg_reward": 0.23655255333638164
      },
      {
        "timestep": 8080,
        "pass_at_1": 0.2606908409449796,
        "avg_reward": 0.24790690294310627
      },
      {
        "timestep": 8181,
        "pass_at_1": 0.3050449674935109,
        "avg_reward": 0.2030018580772232
      },
      {
        "timestep": 8282,
        "pass_at_1": 0.3028152534598183,
        "avg_reward": 0.26289124911467954
      },
      {
        "timestep": 8383,
        "pass_at_1": 0.3016495360393043,
        "avg_reward": 0.3361592779641408
      },
      {
        "timestep": 8484,
        "pass_at_1": 0.2819469415709908,
        "avg_reward": 0.18787074503891818
      },
      {
        "timestep": 8585,
        "pass_at_1": 0.2706964059737401,
        "avg_reward": 0.17576661053072018
      },
      {
        "timestep": 8686,
        "pass_at_1": 0.28856212962946537,
        "avg_reward": 0.2479073024444045
      },
      {
        "timestep": 8787,
        "pass_at_1": 0.29724079495657996,
        "avg_reward": 0.27915179841706517
      },
      {
        "timestep": 8888,
        "pass_at_1": 0.2935550535036287,
        "avg_reward": 0.3075207466607688
      },
      {
        "timestep": 8989,
        "pass_at_1": 0.2895750211418895,
        "avg_reward": 0.3676684752429925
      },
      {
        "timestep": 9090,
        "pass_at_1": 0.308939644436126,
        "avg_reward": 0.20429383772808668
      },
      {
        "timestep": 9191,
        "pass_at_1": 0.2765514849284203,
        "avg_reward": 0.24536480870489552
      },
      {
        "timestep": 9292,
        "pass_at_1": 0.29502792255577653,
        "avg_reward": 0.27172236274922584
      },
      {
        "timestep": 9393,
        "pass_at_1": 0.310474496256928,
        "avg_reward": 0.2447381513726988
      },
      {
        "timestep": 9494,
        "pass_at_1": 0.28557108104468437,
        "avg_reward": 0.15271450360145428
      },
      {
        "timestep": 9595,
        "pass_at_1": 0.2950584458864134,
        "avg_reward": 0.2788666964253044
      },
      {
        "timestep": 9696,
        "pass_at_1": 0.3097369265841966,
        "avg_reward": 0.18550260233175792
      },
      {
        "timestep": 9797,
        "pass_at_1": 0.31036944112800485,
        "avg_reward": 0.26756142188884574
      },
      {
        "timestep": 9898,
        "pass_at_1": 0.29066386320746745,
        "avg_reward": 0.2402173458632504
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.31092475557463145,
        "avg_reward": 0.191591289568174
      }
    ],
    "eval_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.31092475557463145,
        "avg_reward": 0.191591289568174
      }
    ],
    "timing_metrics": [
      {
        "timestep": 0,
        "throughput": 12.5,
        "update": 1,
        "cumulative_wall_time": 4.0
      },
      {
        "timestep": 101,
        "throughput": 13.750000000000002,
        "update": 2,
        "cumulative_wall_time": 8.0
      },
      {
        "timestep": 202,
        "throughput": 15.0,
        "update": 3,
        "cumulative_wall_time": 12.0
      },
      {
        "timestep": 303,
        "throughput": 16.25,
        "update": 4,
        "cumulative_wall_time": 16.0
      },
      {
        "timestep": 404,
        "throughput": 17.5,
        "update": 5,
        "cumulative_wall_time": 20.0
      },
      {
        "timestep": 505,
        "throughput": 18.75,
        "update": 6,
        "cumulative_wall_time": 24.0
      },
      {
        "timestep": 606,
        "throughput": 20.0,
        "update": 7,
        "cumulative_wall_time": 28.0
      },
      {
        "timestep": 707,
        "throughput": 21.25,
        "update": 8,
        "cumulative_wall_time": 32.0
      },
      {
        "timestep": 808,
        "throughput": 22.5,
        "update": 9,
        "cumulative_wall_time": 36.0
      },
      {
        "timestep": 909,
        "throughput": 23.75,
        "update": 10,
        "cumulative_wall_time": 40.0
      },
      {
        "timestep": 1010,
        "throughput": 25.894468400870707,
        "update": 11,
        "cumulative_wall_time": 44.0
      },
      {
        "timestep": 1111,
        "throughput": 26.401961315920587,
        "update": 12,
        "cumulative_wall_time": 48.0
      },
      {
        "timestep": 1212,
        "throughput": 27.70762810793819,
        "update": 13,
        "cumulative_wall_time": 52.0
      },
      {
        "timestep": 1313,
        "throughput": 27.634505130087256,
        "update": 14,
        "cumulative_wall_time": 56.0
      },
      {
        "timestep": 1414,
        "throughput": 21.555826580107272,
        "update": 15,
        "cumulative_wall_time": 60.0
      },
      {
        "timestep": 1515,
        "throughput": 22.655437400212193,
        "update": 16,
        "cumulative_wall_time": 64.0
      },
      {
        "timestep": 1616,
        "throughput": 26.287588168021646,
        "update": 17,
        "cumulative_wall_time": 68.0
      },
      {
        "timestep": 1717,
        "throughput": 26.284464877280524,
        "update": 18,
        "cumulative_wall_time": 72.0
      },
      {
        "timestep": 1818,
        "throughput": 26.28761921576512,
        "update": 19,
        "cumulative_wall_time": 76.0
      },
      {
        "timestep": 1919,
        "throughput": 34.631828726636805,
        "update": 20,
        "cumulative_wall_time": 80.0
      },
      {
        "timestep": 2020,
        "throughput": 26.427226276732917,
        "update": 21,
        "cumulative_wall_time": 84.0
      },
      {
        "timestep": 2121,
        "throughput": 27.838914100451497,
        "update": 22,
        "cumulative_wall_time": 88.0
      },
      {
        "timestep": 2222,
        "throughput": 27.385004408733003,
        "update": 23,
        "cumulative_wall_time": 92.0
      },
      {
        "timestep": 2323,
        "throughput": 26.628478128264494,
        "update": 24,
        "cumulative_wall_time": 96.0
      },
      {
        "timestep": 2424,
        "throughput": 24.211826888399134,
        "update": 25,
        "cumulative_wall_time": 100.0
      },
      {
        "timestep": 2525,
        "throughput": 26.897423051233172,
        "update": 26,
        "cumulative_wall_time": 104.0
      },
      {
        "timestep": 2626,
        "throughput": 23.06793696365607,
        "update": 27,
        "cumulative_wall_time": 108.0
      },
      {
        "timestep": 2727,
        "throughput": 24.407953483149978,
        "update": 28,
        "cumulative_wall_time": 112.0
      },
      {
        "timestep": 2828,
        "throughput": 23.786591130427244,
        "update": 29,
        "cumulative_wall_time": 116.0
      },
      {
        "timestep": 2929,
        "throughput": 25.204685348465805,
        "update": 30,
        "cumulative_wall_time": 120.0
      },
      {
        "timestep": 3030,
        "throughput": 30.786646416683773,
        "update": 31,
        "cumulative_wall_time": 124.0
      },
      {
        "timestep": 3131,
        "throughput": 20.33183701852063,
        "update": 32,
        "cumulative_wall_time": 128.0
      },
      {
        "timestep": 3232,
        "throughput": 26.715650475936283,
        "update": 33,
        "cumulative_wall_time": 132.0
      },
      {
        "timestep": 3333,
        "throughput": 20.96821032202587,
        "update": 34,
        "cumulative_wall_time": 136.0
      },
      {
        "timestep": 3434,
        "throughput": 23.820170335526416,
        "update": 35,
        "cumulative_wall_time": 140.0
      },
      {
        "timestep": 3535,
        "throughput": 27.722376492418416,
        "update": 36,
        "cumulative_wall_time": 144.0
      },
      {
        "timestep": 3636,
        "throughput": 25.160700047738654,
        "update": 37,
        "cumulative_wall_time": 148.0
      },
      {
        "timestep": 3737,
        "throughput": 22.305638055176736,
        "update": 38,
        "cumulative_wall_time": 152.0
      },
      {
        "timestep": 3838,
        "throughput": 23.21174072685008,
        "update": 39,
        "cumulative_wall_time": 156.0
      },
      {
        "timestep": 3939,
        "throughput": 26.69899437233669,
        "update": 40,
        "cumulative_wall_time": 160.0
      },
      {
        "timestep": 4040,
        "throughput": 23.17408342070716,
        "update": 41,
        "cumulative_wall_time": 164.0
      },
      {
        "timestep": 4141,
        "throughput": 25.54114647395494,
        "update": 42,
        "cumulative_wall_time": 168.0
      },
      {
        "timestep": 4242,
        "throughput": 25.113929599759533,
        "update": 43,
        "cumulative_wall_time": 172.0
      },
      {
        "timestep": 4343,
        "throughput": 23.370999130985457,
        "update": 44,
        "cumulative_wall_time": 176.0
      },
      {
        "timestep": 4444,
        "throughput": 30.35986022331332,
        "update": 45,
        "cumulative_wall_time": 180.0
      },
      {
        "timestep": 4545,
        "throughput": 26.584797555795024,
        "update": 46,
        "cumulative_wall_time": 184.0
      },
      {
        "timestep": 4646,
        "throughput": 19.937143533355982,
        "update": 47,
        "cumulative_wall_time": 188.0
      },
      {
        "timestep": 4747,
        "throughput": 25.466135786923573,
        "update": 48,
        "cumulative_wall_time": 192.0
      },
      {
        "timestep": 4848,
        "throughput": 23.34553383807903,
        "update": 49,
        "cumulative_wall_time": 196.0
      },
      {
        "timestep": 4949,
        "throughput": 27.131083336990557,
        "update": 50,
        "cumulative_wall_time": 200.0
      },
      {
        "timestep": 5050,
        "throughput": 23.018698153918248,
        "update": 51,
        "cumulative_wall_time": 204.0
      },
      {
        "timestep": 5151,
        "throughput": 24.71315889633275,
        "update": 52,
        "cumulative_wall_time": 208.0
      },
      {
        "timestep": 5252,
        "throughput": 26.262468197451145,
        "update": 53,
        "cumulative_wall_time": 212.0
      },
      {
        "timestep": 5353,
        "throughput": 27.164387985425304,
        "update": 54,
        "cumulative_wall_time": 216.0
      },
      {
        "timestep": 5454,
        "throughput": 21.99925898236056,
        "update": 55,
        "cumulative_wall_time": 220.0
      },
      {
        "timestep": 5555,
        "throughput": 24.16374691039763,
        "update": 56,
        "cumulative_wall_time": 224.0
      },
      {
        "timestep": 5656,
        "throughput": 23.81263672209761,
        "update": 57,
        "cumulative_wall_time": 228.0
      },
      {
        "timestep": 5757,
        "throughput": 23.36667691856572,
        "update": 58,
        "cumulative_wall_time": 232.0
      },
      {
        "timestep": 5858,
        "throughput": 29.413635600702744,
        "update": 59,
        "cumulative_wall_time": 236.0
      },
      {
        "timestep": 5959,
        "throughput": 26.01245427740239,
        "update": 60,
        "cumulative_wall_time": 240.0
      },
      {
        "timestep": 6060,
        "throughput": 21.847790114162386,
        "update": 61,
        "cumulative_wall_time": 244.0
      },
      {
        "timestep": 6161,
        "throughput": 27.294654867636943,
        "update": 62,
        "cumulative_wall_time": 248.0
      },
      {
        "timestep": 6262,
        "throughput": 30.30539049253158,
        "update": 63,
        "cumulative_wall_time": 252.0
      },
      {
        "timestep": 6363,
        "throughput": 27.58116315137787,
        "update": 64,
        "cumulative_wall_time": 256.0
      },
      {
        "timestep": 6464,
        "throughput": 21.201575085114964,
        "update": 65,
        "cumulative_wall_time": 260.0
      },
      {
        "timestep": 6565,
        "throughput": 23.78941481783437,
        "update": 66,
        "cumulative_wall_time": 264.0
      },
      {
        "timestep": 6666,
        "throughput": 28.167277872966558,
        "update": 67,
        "cumulative_wall_time": 268.0
      },
      {
        "timestep": 6767,
        "throughput": 23.230826335953047,
        "update": 68,
        "cumulative_wall_time": 272.0
      },
      {
        "timestep": 6868,
        "throughput": 26.109548570365572,
        "update": 69,
        "cumulative_wall_time": 276.0
      },
      {
        "timestep": 6969,
        "throughput": 26.93658513357334,
        "update": 70,
        "cumulative_wall_time": 280.0
      },
      {
        "timestep": 7070,
        "throughput": 22.682673821054795,
        "update": 71,
        "cumulative_wall_time": 284.0
      },
      {
        "timestep": 7171,
        "throughput": 24.8511866098455,
        "update": 72,
        "cumulative_wall_time": 288.0
      },
      {
        "timestep": 7272,
        "throughput": 16.89683164982732,
        "update": 73,
        "cumulative_wall_time": 292.0
      },
      {
        "timestep": 7373,
        "throughput": 22.439030896664274,
        "update": 74,
        "cumulative_wall_time": 296.0
      },
      {
        "timestep": 7474,
        "throughput": 24.3685796215171,
        "update": 75,
        "cumulative_wall_time": 300.0
      },
      {
        "timestep": 7575,
        "throughput": 21.880542045087875,
        "update": 76,
        "cumulative_wall_time": 304.0
      },
      {
        "timestep": 7676,
        "throughput": 29.08102825982909,
        "update": 77,
        "cumulative_wall_time": 308.0
      },
      {
        "timestep": 7777,
        "throughput": 21.424646555098416,
        "update": 78,
        "cumulative_wall_time": 312.0
      },
      {
        "timestep": 7878,
        "throughput": 23.899888783257538,
        "update": 79,
        "cumulative_wall_time": 316.0
      },
      {
        "timestep": 7979,
        "throughput": 25.326851443215226,
        "update": 80,
        "cumulative_wall_time": 320.0
      },
      {
        "timestep": 8080,
        "throughput": 28.60318322266529,
        "update": 81,
        "cumulative_wall_time": 324.0
      },
      {
        "timestep": 8181,
        "throughput": 21.410344622051404,
        "update": 82,
        "cumulative_wall_time": 328.0
      },
      {
        "timestep": 8282,
        "throughput": 27.907909380387398,
        "update": 83,
        "cumulative_wall_time": 332.0
      },
      {
        "timestep": 8383,
        "throughput": 25.025582652548966,
        "update": 84,
        "cumulative_wall_time": 336.0
      },
      {
        "timestep": 8484,
        "throughput": 22.546228372380124,
        "update": 85,
        "cumulative_wall_time": 340.0
      },
      {
        "timestep": 8585,
        "throughput": 26.15525868565818,
        "update": 86,
        "cumulative_wall_time": 344.0
      },
      {
        "timestep": 8686,
        "throughput": 25.497649238933672,
        "update": 87,
        "cumulative_wall_time": 348.0
      },
      {
        "timestep": 8787,
        "throughput": 23.499457807103013,
        "update": 88,
        "cumulative_wall_time": 352.0
      },
      {
        "timestep": 8888,
        "throughput": 25.174505212475047,
        "update": 89,
        "cumulative_wall_time": 356.0
      },
      {
        "timestep": 8989,
        "throughput": 24.036716007845598,
        "update": 90,
        "cumulative_wall_time": 360.0
      },
      {
        "timestep": 9090,
        "throughput": 25.283793363128122,
        "update": 91,
        "cumulative_wall_time": 364.0
      },
      {
        "timestep": 9191,
        "throughput": 26.655326686302615,
        "update": 92,
        "cumulative_wall_time": 368.0
      },
      {
        "timestep": 9292,
        "throughput": 28.965042040363382,
        "update": 93,
        "cumulative_wall_time": 372.0
      },
      {
        "timestep": 9393,
        "throughput": 21.905461252932877,
        "update": 94,
        "cumulative_wall_time": 376.0
      },
      {
        "timestep": 9494,
        "throughput": 30.332583436640668,
        "update": 95,
        "cumulative_wall_time": 380.0
      },
      {
        "timestep": 9595,
        "throughput": 20.119780501193745,
        "update": 96,
        "cumulative_wall_time": 384.0
      },
      {
        "timestep": 9696,
        "throughput": 24.62053726241104,
        "update": 97,
        "cumulative_wall_time": 388.0
      },
      {
        "timestep": 9797,
        "throughput": 26.47079301621144,
        "update": 98,
        "cumulative_wall_time": 392.0
      },
      {
        "timestep": 9898,
        "throughput": 25.70247966933758,
        "update": 99,
        "cumulative_wall_time": 396.0
      },
      {
        "timestep": 10000,
        "throughput": 23.443251200448515,
        "update": 100,
        "cumulative_wall_time": 400.0
      }
    ],
    "scheduler_stats": {
      "total_experiences": 10000,
      "total_updates": 500,
      "policy_version": 500,
      "buffer_size": 1024,
      "curriculum": {
        "level_1": {
          "num_pulls": 2000,
          "success_rate": 0.85,
          "mean_reward": 0.7608375549928545,
          "recent_gradient": 0.009013998130682335
        },
        "level_2": {
          "num_pulls": 2000,
          "success_rate": 0.65,
          "mean_reward": 0.5732127048611159,
          "recent_gradient": 0.02169920419404205
        },
        "level_3": {
          "num_pulls": 2000,
          "success_rate": 0.45,
          "mean_reward": 0.412140309719301,
          "recent_gradient": 0.028614180809478692
        },
        "level_4": {
          "num_pulls": 2000,
          "success_rate": 0.28,
          "mean_reward": 0.2699919975086651,
          "recent_gradient": 0.02061459904175322
        },
        "level_5": {
          "num_pulls": 2000,
          "success_rate": 0.15,
          "mean_reward": 0.1512572423767792,
          "recent_gradient": 0.011259257683847225
        },
        "total_steps": 10000
      },
      "staleness": {
        "discard_rate": 0.15
      },
      "workers": {
        "0": {
          "completed_tasks": 2500,
          "avg_throughput": 4.5855024945389635
        },
        "1": {
          "completed_tasks": 2500,
          "avg_throughput": 4.719909479901515
        },
        "2": {
          "completed_tasks": 2500,
          "avg_throughput": 5.373646802561631
        },
        "3": {
          "completed_tasks": 2500,
          "avg_throughput": 5.3051851327167325
        }
      }
    },
    "final_pass_at_1": 0.3177032863800678,
    "final_pass_at_1_std": 0.015580873953549118,
    "avg_throughput": 24.341414590811695,
    "avg_throughput_std": 0.22593596444329203,
    "wall_time_mean": 0.0,
    "num_runs": 3
  },
  "async_staleness": {
    "train_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 101,
        "pass_at_1": 0.022650740458983548,
        "avg_reward": 0.09427208518758812,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 202,
        "pass_at_1": 0.014710871899472674,
        "avg_reward": 6.184967211911134e-05,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 303,
        "pass_at_1": 0.06067516540105691,
        "avg_reward": 0.08691186877849097,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 404,
        "pass_at_1": 0.029398391069179745,
        "avg_reward": 0.050646715034642034,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 505,
        "pass_at_1": 0.13627120206138654,
        "avg_reward": 0.08573047397059638,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 606,
        "pass_at_1": 0.15295233470895173,
        "avg_reward": 0.026697855534271495,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 707,
        "pass_at_1": 0.11621326704358825,
        "avg_reward": 0.06485623717282198,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 808,
        "pass_at_1": 0.13307806237689995,
        "avg_reward": 0.12217481653128366,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 909,
        "pass_at_1": 0.13782129187311734,
        "avg_reward": 0.0396418484317293,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1010,
        "pass_at_1": 0.18796534106448662,
        "avg_reward": 0.1390834578272625,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1111,
        "pass_at_1": 0.16269647751768954,
        "avg_reward": 0.0589197727034788,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1212,
        "pass_at_1": 0.15317418961401466,
        "avg_reward": 0.12808548117670504,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1313,
        "pass_at_1": 0.14377968974527666,
        "avg_reward": 0.13380865271350492,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1414,
        "pass_at_1": 0.15754567115199986,
        "avg_reward": 0.11145184943193605,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1515,
        "pass_at_1": 0.1603037195666754,
        "avg_reward": 0.22085688487878724,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1616,
        "pass_at_1": 0.1748671713321704,
        "avg_reward": 0.0870081906179413,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1717,
        "pass_at_1": 0.1944064468902683,
        "avg_reward": 0.09448297501366351,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1818,
        "pass_at_1": 0.18496971206332063,
        "avg_reward": 0.049992263456667727,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 1919,
        "pass_at_1": 0.15708333810655103,
        "avg_reward": 0.135509732278697,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2020,
        "pass_at_1": 0.20128798518546676,
        "avg_reward": 0.16959880220787193,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2121,
        "pass_at_1": 0.18709348633821707,
        "avg_reward": 0.13461960429110922,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2222,
        "pass_at_1": 0.1627392236771602,
        "avg_reward": 0.09419916852199273,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2323,
        "pass_at_1": 0.18601470351916982,
        "avg_reward": 0.20166787412628165,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2424,
        "pass_at_1": 0.20503143747923927,
        "avg_reward": 0.07587314221525474,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2525,
        "pass_at_1": 0.20758527781252228,
        "avg_reward": 0.146814108229202,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2626,
        "pass_at_1": 0.19052176009548602,
        "avg_reward": 0.1830012225184322,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2727,
        "pass_at_1": 0.2276479933331238,
        "avg_reward": 0.22868240062230896,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2828,
        "pass_at_1": 0.1932217686687666,
        "avg_reward": 0.1391167961424526,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 2929,
        "pass_at_1": 0.21961891706654743,
        "avg_reward": 0.22447239000935593,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3030,
        "pass_at_1": 0.20640619390884027,
        "avg_reward": 0.15584200629388137,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3131,
        "pass_at_1": 0.19686658756926723,
        "avg_reward": 0.09768293885138027,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3232,
        "pass_at_1": 0.23825405775492958,
        "avg_reward": 0.2584152476324848,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3333,
        "pass_at_1": 0.22357929834899032,
        "avg_reward": 0.2290400835737935,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3434,
        "pass_at_1": 0.23527293810038397,
        "avg_reward": 0.155962362750051,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3535,
        "pass_at_1": 0.23829264997320676,
        "avg_reward": 0.2675359483018639,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3636,
        "pass_at_1": 0.23337558205760056,
        "avg_reward": 0.26493264843678077,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3737,
        "pass_at_1": 0.18472644809699978,
        "avg_reward": 0.18887628369636103,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3838,
        "pass_at_1": 0.24189245649614946,
        "avg_reward": 0.1785635976736262,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 3939,
        "pass_at_1": 0.24501684730999618,
        "avg_reward": 0.0966350321179523,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4040,
        "pass_at_1": 0.2418172965090429,
        "avg_reward": 0.21130946578282164,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4141,
        "pass_at_1": 0.27879573892168924,
        "avg_reward": 0.19712308022366903,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4242,
        "pass_at_1": 0.23609216896079444,
        "avg_reward": 0.16378588298940874,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4343,
        "pass_at_1": 0.27359036729238256,
        "avg_reward": 0.23530984931689028,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4444,
        "pass_at_1": 0.2477025523593436,
        "avg_reward": 0.2238254135431427,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4545,
        "pass_at_1": 0.26324893929236515,
        "avg_reward": 0.25903140096053656,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4646,
        "pass_at_1": 0.2502692188004057,
        "avg_reward": 0.18383226771043618,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4747,
        "pass_at_1": 0.2594633391080536,
        "avg_reward": 0.13439492387983695,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4848,
        "pass_at_1": 0.27621453657276257,
        "avg_reward": 0.23402439286720453,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 4949,
        "pass_at_1": 0.27337152538344417,
        "avg_reward": 0.206967863637998,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 5050,
        "pass_at_1": 0.24792856380455247,
        "avg_reward": 0.17731058490537405
      },
      {
        "timestep": 5151,
        "pass_at_1": 0.27233712158419443,
        "avg_reward": 0.1777558338062746
      },
      {
        "timestep": 5252,
        "pass_at_1": 0.2789089694241874,
        "avg_reward": 0.24332971838007686
      },
      {
        "timestep": 5353,
        "pass_at_1": 0.32278865438282967,
        "avg_reward": 0.2669598141478557
      },
      {
        "timestep": 5454,
        "pass_at_1": 0.2931323361487184,
        "avg_reward": 0.2307835731306664
      },
      {
        "timestep": 5555,
        "pass_at_1": 0.25250761033210534,
        "avg_reward": 0.20068039449322345
      },
      {
        "timestep": 5656,
        "pass_at_1": 0.29497385212391175,
        "avg_reward": 0.35914118732339373
      },
      {
        "timestep": 5757,
        "pass_at_1": 0.2927919599761502,
        "avg_reward": 0.2493109350976008
      },
      {
        "timestep": 5858,
        "pass_at_1": 0.2987978235568456,
        "avg_reward": 0.18060435696449986
      },
      {
        "timestep": 5959,
        "pass_at_1": 0.3251835934502633,
        "avg_reward": 0.2977435263945494
      },
      {
        "timestep": 6060,
        "pass_at_1": 0.320964323641925,
        "avg_reward": 0.21130208617380308
      },
      {
        "timestep": 6161,
        "pass_at_1": 0.33599687983178445,
        "avg_reward": 0.1987049507258135
      },
      {
        "timestep": 6262,
        "pass_at_1": 0.32245551962943086,
        "avg_reward": 0.36748719699404364
      },
      {
        "timestep": 6363,
        "pass_at_1": 0.29366444682764936,
        "avg_reward": 0.2066166709819809
      },
      {
        "timestep": 6464,
        "pass_at_1": 0.31820376668554506,
        "avg_reward": 0.2293892306426261
      },
      {
        "timestep": 6565,
        "pass_at_1": 0.2879111895957403,
        "avg_reward": 0.23375710041689363
      },
      {
        "timestep": 6666,
        "pass_at_1": 0.3003696615013904,
        "avg_reward": 0.26397535073287137
      },
      {
        "timestep": 6767,
        "pass_at_1": 0.30589551729360714,
        "avg_reward": 0.3222131340857627
      },
      {
        "timestep": 6868,
        "pass_at_1": 0.3112636451464902,
        "avg_reward": 0.2329078403069084
      },
      {
        "timestep": 6969,
        "pass_at_1": 0.34581968581737416,
        "avg_reward": 0.2151125328322016
      },
      {
        "timestep": 7070,
        "pass_at_1": 0.33669459541007757,
        "avg_reward": 0.33471281404218345
      },
      {
        "timestep": 7171,
        "pass_at_1": 0.3025667401470449,
        "avg_reward": 0.2512850850442511
      },
      {
        "timestep": 7272,
        "pass_at_1": 0.3424595746923032,
        "avg_reward": 0.3130588033427081
      },
      {
        "timestep": 7373,
        "pass_at_1": 0.31504250229711406,
        "avg_reward": 0.18601117118347743
      },
      {
        "timestep": 7474,
        "pass_at_1": 0.35271363206719053,
        "avg_reward": 0.2970201393154117
      },
      {
        "timestep": 7575,
        "pass_at_1": 0.3497512561825116,
        "avg_reward": 0.2971234154208581
      },
      {
        "timestep": 7676,
        "pass_at_1": 0.33358046975168254,
        "avg_reward": 0.2784770606593962
      },
      {
        "timestep": 7777,
        "pass_at_1": 0.355454622273077,
        "avg_reward": 0.24864612691714322
      },
      {
        "timestep": 7878,
        "pass_at_1": 0.38929321674695894,
        "avg_reward": 0.33512621944315657
      },
      {
        "timestep": 7979,
        "pass_at_1": 0.3305082811014131,
        "avg_reward": 0.29723430531282197
      },
      {
        "timestep": 8080,
        "pass_at_1": 0.3371691626630571,
        "avg_reward": 0.30908956031756823
      },
      {
        "timestep": 8181,
        "pass_at_1": 0.3821347465679561,
        "avg_reward": 0.2646736813367794
      },
      {
        "timestep": 8282,
        "pass_at_1": 0.38050178717275845,
        "avg_reward": 0.32504047608503167
      },
      {
        "timestep": 8383,
        "pass_at_1": 0.3799181078865503,
        "avg_reward": 0.3987741354419376
      },
      {
        "timestep": 8484,
        "pass_at_1": 0.36078283544373185,
        "avg_reward": 0.250939460137111
      },
      {
        "timestep": 8585,
        "pass_at_1": 0.3500849199637493,
        "avg_reward": 0.23927742172272753
      },
      {
        "timestep": 8686,
        "pass_at_1": 0.3684885894416738,
        "avg_reward": 0.31184847029417123
      },
      {
        "timestep": 8787,
        "pass_at_1": 0.377690566914506,
        "avg_reward": 0.343511615983406
      },
      {
        "timestep": 8888,
        "pass_at_1": 0.3745135571347664,
        "avg_reward": 0.372287549565679
      },
      {
        "timestep": 8989,
        "pass_at_1": 0.371027741331753,
        "avg_reward": 0.43283065139488336
      },
      {
        "timestep": 9090,
        "pass_at_1": 0.3908721431412089,
        "avg_reward": 0.269839836692153
      },
      {
        "timestep": 9191,
        "pass_at_1": 0.35894941243986345,
        "avg_reward": 0.31128315071405
      },
      {
        "timestep": 9292,
        "pass_at_1": 0.37787702830702496,
        "avg_reward": 0.3380016473502246
      },
      {
        "timestep": 9393,
        "pass_at_1": 0.39376063917010995,
        "avg_reward": 0.31136706570324435
      },
      {
        "timestep": 9494,
        "pass_at_1": 0.3692802394118455,
        "avg_reward": 0.21968183029518318
      },
      {
        "timestep": 9595,
        "pass_at_1": 0.37917672678309217,
        "avg_reward": 0.3461613211426474
      },
      {
        "timestep": 9696,
        "pass_at_1": 0.3942505748141219,
        "avg_reward": 0.25311352091569816
      },
      {
        "timestep": 9797,
        "pass_at_1": 0.3952648476989417,
        "avg_reward": 0.33547774714559525
      },
      {
        "timestep": 9898,
        "pass_at_1": 0.3759275733394191,
        "avg_reward": 0.3084283139688117
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.3965434762427287,
        "avg_reward": 0.2600862661026518
      }
    ],
    "eval_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2,
        "difficulty_2_ratio": 0.2,
        "difficulty_3_ratio": 0.2,
        "difficulty_4_ratio": 0.2,
        "difficulty_5_ratio": 0.2
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.3965434762427287,
        "avg_reward": 0.2600862661026518
      }
    ],
    "timing_metrics": [
      {
        "timestep": 0,
        "throughput": 11.0,
        "update": 1,
        "cumulative_wall_time": 4.545454545454546
      },
      {
        "timestep": 101,
        "throughput": 12.100000000000001,
        "update": 2,
        "cumulative_wall_time": 9.090909090909092
      },
      {
        "timestep": 202,
        "throughput": 13.2,
        "update": 3,
        "cumulative_wall_time": 13.636363636363637
      },
      {
        "timestep": 303,
        "throughput": 14.3,
        "update": 4,
        "cumulative_wall_time": 18.181818181818183
      },
      {
        "timestep": 404,
        "throughput": 15.399999999999999,
        "update": 5,
        "cumulative_wall_time": 22.72727272727273
      },
      {
        "timestep": 505,
        "throughput": 16.5,
        "update": 6,
        "cumulative_wall_time": 27.272727272727277
      },
      {
        "timestep": 606,
        "throughput": 17.6,
        "update": 7,
        "cumulative_wall_time": 31.818181818181824
      },
      {
        "timestep": 707,
        "throughput": 18.7,
        "update": 8,
        "cumulative_wall_time": 36.36363636363637
      },
      {
        "timestep": 808,
        "throughput": 19.8,
        "update": 9,
        "cumulative_wall_time": 40.909090909090914
      },
      {
        "timestep": 909,
        "throughput": 20.9,
        "update": 10,
        "cumulative_wall_time": 45.45454545454546
      },
      {
        "timestep": 1010,
        "throughput": 22.787132192766222,
        "update": 11,
        "cumulative_wall_time": 50.00000000000001
      },
      {
        "timestep": 1111,
        "throughput": 23.233725958010115,
        "update": 12,
        "cumulative_wall_time": 54.545454545454554
      },
      {
        "timestep": 1212,
        "throughput": 24.38271273498561,
        "update": 13,
        "cumulative_wall_time": 59.0909090909091
      },
      {
        "timestep": 1313,
        "throughput": 24.318364514476784,
        "update": 14,
        "cumulative_wall_time": 63.63636363636365
      },
      {
        "timestep": 1414,
        "throughput": 18.9691273904944,
        "update": 15,
        "cumulative_wall_time": 68.18181818181819
      },
      {
        "timestep": 1515,
        "throughput": 19.936784912186727,
        "update": 16,
        "cumulative_wall_time": 72.72727272727273
      },
      {
        "timestep": 1616,
        "throughput": 23.13307758785905,
        "update": 17,
        "cumulative_wall_time": 77.27272727272728
      },
      {
        "timestep": 1717,
        "throughput": 23.13032909200686,
        "update": 18,
        "cumulative_wall_time": 81.81818181818183
      },
      {
        "timestep": 1818,
        "throughput": 23.133104909873303,
        "update": 19,
        "cumulative_wall_time": 86.36363636363637
      },
      {
        "timestep": 1919,
        "throughput": 30.476009279440387,
        "update": 20,
        "cumulative_wall_time": 90.90909090909092
      },
      {
        "timestep": 2020,
        "throughput": 23.255959123524967,
        "update": 21,
        "cumulative_wall_time": 95.45454545454547
      },
      {
        "timestep": 2121,
        "throughput": 24.498244408397316,
        "update": 22,
        "cumulative_wall_time": 100.00000000000001
      },
      {
        "timestep": 2222,
        "throughput": 24.098803879685043,
        "update": 23,
        "cumulative_wall_time": 104.54545454545456
      },
      {
        "timestep": 2323,
        "throughput": 23.433060752872755,
        "update": 24,
        "cumulative_wall_time": 109.09090909090911
      },
      {
        "timestep": 2424,
        "throughput": 21.30640766179124,
        "update": 25,
        "cumulative_wall_time": 113.63636363636365
      },
      {
        "timestep": 2525,
        "throughput": 23.66973228508519,
        "update": 26,
        "cumulative_wall_time": 118.1818181818182
      },
      {
        "timestep": 2626,
        "throughput": 20.299784528017344,
        "update": 27,
        "cumulative_wall_time": 122.72727272727275
      },
      {
        "timestep": 2727,
        "throughput": 21.47899906517198,
        "update": 28,
        "cumulative_wall_time": 127.2727272727273
      },
      {
        "timestep": 2828,
        "throughput": 20.932200194775973,
        "update": 29,
        "cumulative_wall_time": 131.81818181818184
      },
      {
        "timestep": 2929,
        "throughput": 22.18012310664991,
        "update": 30,
        "cumulative_wall_time": 136.36363636363637
      },
      {
        "timestep": 3030,
        "throughput": 27.09224884668172,
        "update": 31,
        "cumulative_wall_time": 140.9090909090909
      },
      {
        "timestep": 3131,
        "throughput": 17.892016576298154,
        "update": 32,
        "cumulative_wall_time": 145.45454545454544
      },
      {
        "timestep": 3232,
        "throughput": 23.50977241882393,
        "update": 33,
        "cumulative_wall_time": 149.99999999999997
      },
      {
        "timestep": 3333,
        "throughput": 18.452025083382765,
        "update": 34,
        "cumulative_wall_time": 154.5454545454545
      },
      {
        "timestep": 3434,
        "throughput": 20.961749895263246,
        "update": 35,
        "cumulative_wall_time": 159.09090909090904
      },
      {
        "timestep": 3535,
        "throughput": 24.395691313328207,
        "update": 36,
        "cumulative_wall_time": 163.63636363636357
      },
      {
        "timestep": 3636,
        "throughput": 22.141416042010015,
        "update": 37,
        "cumulative_wall_time": 168.1818181818181
      },
      {
        "timestep": 3737,
        "throughput": 19.628961488555525,
        "update": 38,
        "cumulative_wall_time": 172.72727272727263
      },
      {
        "timestep": 3838,
        "throughput": 20.42633183962807,
        "update": 39,
        "cumulative_wall_time": 177.27272727272717
      },
      {
        "timestep": 3939,
        "throughput": 23.495115047656284,
        "update": 40,
        "cumulative_wall_time": 181.8181818181817
      },
      {
        "timestep": 4040,
        "throughput": 20.3931934102223,
        "update": 41,
        "cumulative_wall_time": 186.36363636363623
      },
      {
        "timestep": 4141,
        "throughput": 22.476208897080348,
        "update": 42,
        "cumulative_wall_time": 190.90909090909076
      },
      {
        "timestep": 4242,
        "throughput": 22.100258047788387,
        "update": 43,
        "cumulative_wall_time": 195.4545454545453
      },
      {
        "timestep": 4343,
        "throughput": 20.566479235267202,
        "update": 44,
        "cumulative_wall_time": 199.99999999999983
      },
      {
        "timestep": 4444,
        "throughput": 26.71667699651572,
        "update": 45,
        "cumulative_wall_time": 204.54545454545436
      },
      {
        "timestep": 4545,
        "throughput": 23.39462184909962,
        "update": 46,
        "cumulative_wall_time": 209.0909090909089
      },
      {
        "timestep": 4646,
        "throughput": 17.544686309353267,
        "update": 47,
        "cumulative_wall_time": 213.63636363636343
      },
      {
        "timestep": 4747,
        "throughput": 22.410199492492744,
        "update": 48,
        "cumulative_wall_time": 218.18181818181796
      },
      {
        "timestep": 4848,
        "throughput": 20.544069777509545,
        "update": 49,
        "cumulative_wall_time": 222.7272727272725
      },
      {
        "timestep": 4949,
        "throughput": 23.87535333655169,
        "update": 50,
        "cumulative_wall_time": 227.27272727272702
      },
      {
        "timestep": 5050,
        "throughput": 20.256454375448058,
        "update": 51,
        "cumulative_wall_time": 231.81818181818156
      },
      {
        "timestep": 5151,
        "throughput": 21.74757982877282,
        "update": 52,
        "cumulative_wall_time": 236.3636363636361
      },
      {
        "timestep": 5252,
        "throughput": 23.110972013757006,
        "update": 53,
        "cumulative_wall_time": 240.90909090909062
      },
      {
        "timestep": 5353,
        "throughput": 23.90466142717427,
        "update": 54,
        "cumulative_wall_time": 245.45454545454515
      },
      {
        "timestep": 5454,
        "throughput": 19.359347904477293,
        "update": 55,
        "cumulative_wall_time": 249.9999999999997
      },
      {
        "timestep": 5555,
        "throughput": 21.264097281149915,
        "update": 56,
        "cumulative_wall_time": 254.54545454545422
      },
      {
        "timestep": 5656,
        "throughput": 20.955120315445896,
        "update": 57,
        "cumulative_wall_time": 259.0909090909088
      },
      {
        "timestep": 5757,
        "throughput": 20.562675688337833,
        "update": 58,
        "cumulative_wall_time": 263.63636363636334
      },
      {
        "timestep": 5858,
        "throughput": 25.883999328618412,
        "update": 59,
        "cumulative_wall_time": 268.1818181818179
      },
      {
        "timestep": 5959,
        "throughput": 22.890959764114104,
        "update": 60,
        "cumulative_wall_time": 272.72727272727246
      },
      {
        "timestep": 6060,
        "throughput": 19.2260553004629,
        "update": 61,
        "cumulative_wall_time": 277.272727272727
      },
      {
        "timestep": 6161,
        "throughput": 24.019296283520507,
        "update": 62,
        "cumulative_wall_time": 281.8181818181816
      },
      {
        "timestep": 6262,
        "throughput": 26.66874363342779,
        "update": 63,
        "cumulative_wall_time": 286.36363636363615
      },
      {
        "timestep": 6363,
        "throughput": 24.271423573212523,
        "update": 64,
        "cumulative_wall_time": 290.9090909090907
      },
      {
        "timestep": 6464,
        "throughput": 18.65738607490117,
        "update": 65,
        "cumulative_wall_time": 295.45454545454527
      },
      {
        "timestep": 6565,
        "throughput": 20.934685039694244,
        "update": 66,
        "cumulative_wall_time": 299.99999999999983
      },
      {
        "timestep": 6666,
        "throughput": 24.78720452821057,
        "update": 67,
        "cumulative_wall_time": 304.5454545454544
      },
      {
        "timestep": 6767,
        "throughput": 20.443127175638683,
        "update": 68,
        "cumulative_wall_time": 309.09090909090895
      },
      {
        "timestep": 6868,
        "throughput": 22.976402741921703,
        "update": 69,
        "cumulative_wall_time": 313.6363636363635
      },
      {
        "timestep": 6969,
        "throughput": 23.70419491754454,
        "update": 70,
        "cumulative_wall_time": 318.1818181818181
      },
      {
        "timestep": 7070,
        "throughput": 19.96075296252822,
        "update": 71,
        "cumulative_wall_time": 322.72727272727263
      },
      {
        "timestep": 7171,
        "throughput": 21.86904421666404,
        "update": 72,
        "cumulative_wall_time": 327.2727272727272
      },
      {
        "timestep": 7272,
        "throughput": 14.86921185184804,
        "update": 73,
        "cumulative_wall_time": 331.81818181818176
      },
      {
        "timestep": 7373,
        "throughput": 19.74634718906456,
        "update": 74,
        "cumulative_wall_time": 336.3636363636363
      },
      {
        "timestep": 7474,
        "throughput": 21.444350066935048,
        "update": 75,
        "cumulative_wall_time": 340.9090909090909
      },
      {
        "timestep": 7575,
        "throughput": 19.25487699967733,
        "update": 76,
        "cumulative_wall_time": 345.45454545454544
      },
      {
        "timestep": 7676,
        "throughput": 25.591304868649598,
        "update": 77,
        "cumulative_wall_time": 350.0
      },
      {
        "timestep": 7777,
        "throughput": 18.85368896848661,
        "update": 78,
        "cumulative_wall_time": 354.54545454545456
      },
      {
        "timestep": 7878,
        "throughput": 21.031902129266633,
        "update": 79,
        "cumulative_wall_time": 359.0909090909091
      },
      {
        "timestep": 7979,
        "throughput": 22.2876292700294,
        "update": 80,
        "cumulative_wall_time": 363.6363636363637
      },
      {
        "timestep": 8080,
        "throughput": 25.170801235945454,
        "update": 81,
        "cumulative_wall_time": 368.18181818181824
      },
      {
        "timestep": 8181,
        "throughput": 18.841103267405234,
        "update": 82,
        "cumulative_wall_time": 372.7272727272728
      },
      {
        "timestep": 8282,
        "throughput": 24.55896025474091,
        "update": 83,
        "cumulative_wall_time": 377.27272727272737
      },
      {
        "timestep": 8383,
        "throughput": 22.02251273424309,
        "update": 84,
        "cumulative_wall_time": 381.8181818181819
      },
      {
        "timestep": 8484,
        "throughput": 19.840680967694507,
        "update": 85,
        "cumulative_wall_time": 386.3636363636365
      },
      {
        "timestep": 8585,
        "throughput": 23.016627643379195,
        "update": 86,
        "cumulative_wall_time": 390.90909090909105
      },
      {
        "timestep": 8686,
        "throughput": 22.437931330261634,
        "update": 87,
        "cumulative_wall_time": 395.4545454545456
      },
      {
        "timestep": 8787,
        "throughput": 20.67952287025065,
        "update": 88,
        "cumulative_wall_time": 400.00000000000017
      },
      {
        "timestep": 8888,
        "throughput": 22.15356458697804,
        "update": 89,
        "cumulative_wall_time": 404.54545454545473
      },
      {
        "timestep": 8989,
        "throughput": 21.152310086904127,
        "update": 90,
        "cumulative_wall_time": 409.0909090909093
      },
      {
        "timestep": 9090,
        "throughput": 22.249738159552745,
        "update": 91,
        "cumulative_wall_time": 413.63636363636385
      },
      {
        "timestep": 9191,
        "throughput": 23.456687483946304,
        "update": 92,
        "cumulative_wall_time": 418.1818181818184
      },
      {
        "timestep": 9292,
        "throughput": 25.489236995519775,
        "update": 93,
        "cumulative_wall_time": 422.727272727273
      },
      {
        "timestep": 9393,
        "throughput": 19.276805902580932,
        "update": 94,
        "cumulative_wall_time": 427.27272727272754
      },
      {
        "timestep": 9494,
        "throughput": 26.69267342424379,
        "update": 95,
        "cumulative_wall_time": 431.8181818181821
      },
      {
        "timestep": 9595,
        "throughput": 17.705406841050497,
        "update": 96,
        "cumulative_wall_time": 436.36363636363666
      },
      {
        "timestep": 9696,
        "throughput": 21.666072790921717,
        "update": 97,
        "cumulative_wall_time": 440.9090909090912
      },
      {
        "timestep": 9797,
        "throughput": 23.29429785426607,
        "update": 98,
        "cumulative_wall_time": 445.4545454545458
      },
      {
        "timestep": 9898,
        "throughput": 22.61818210901707,
        "update": 99,
        "cumulative_wall_time": 450.00000000000034
      },
      {
        "timestep": 10000,
        "throughput": 20.63006105639469,
        "update": 100,
        "cumulative_wall_time": 454.5454545454549
      }
    ],
    "scheduler_stats": {
      "total_experiences": 10000,
      "total_updates": 500,
      "policy_version": 500,
      "buffer_size": 1024,
      "curriculum": {
        "level_1": {
          "num_pulls": 2000,
          "success_rate": 0.85,
          "mean_reward": 0.7608375549928545,
          "recent_gradient": 0.009013998130682335
        },
        "level_2": {
          "num_pulls": 2000,
          "success_rate": 0.65,
          "mean_reward": 0.5732127048611159,
          "recent_gradient": 0.02169920419404205
        },
        "level_3": {
          "num_pulls": 2000,
          "success_rate": 0.45,
          "mean_reward": 0.412140309719301,
          "recent_gradient": 0.028614180809478692
        },
        "level_4": {
          "num_pulls": 2000,
          "success_rate": 0.28,
          "mean_reward": 0.2699919975086651,
          "recent_gradient": 0.02061459904175322
        },
        "level_5": {
          "num_pulls": 2000,
          "success_rate": 0.15,
          "mean_reward": 0.1512572423767792,
          "recent_gradient": 0.011259257683847225
        },
        "total_steps": 10000
      },
      "staleness": {
        "discard_rate": 0.15
      },
      "workers": {
        "0": {
          "completed_tasks": 2500,
          "avg_throughput": 4.5855024945389635
        },
        "1": {
          "completed_tasks": 2500,
          "avg_throughput": 4.719909479901515
        },
        "2": {
          "completed_tasks": 2500,
          "avg_throughput": 5.373646802561631
        },
        "3": {
          "completed_tasks": 2500,
          "avg_throughput": 5.3051851327167325
        }
      }
    },
    "final_pass_at_1": 0.40332200704816507,
    "final_pass_at_1_std": 0.015580873953549118,
    "avg_throughput": 21.420444839914293,
    "avg_throughput_std": 0.19882364871009708,
    "wall_time_mean": 0.0,
    "num_runs": 3
  },
  "aceas": {
    "train_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 101,
        "pass_at_1": 0.025479023287266374,
        "avg_reward": 0.09653471145021437,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 202,
        "pass_at_1": 0.020367437556038332,
        "avg_reward": 0.004587102197371637,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 303,
        "pass_at_1": 0.0691600138859054,
        "avg_reward": 0.09369974756636976,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 404,
        "pass_at_1": 0.04071152238231106,
        "avg_reward": 0.05969722008514708,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 505,
        "pass_at_1": 0.08943988967981922,
        "avg_reward": 0.04826542406534253,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 606,
        "pass_at_1": 0.10781155124913581,
        "avg_reward": -0.00941477123358124,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 707,
        "pass_at_1": 0.07288426883456268,
        "avg_reward": 0.030193038605601515,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 808,
        "pass_at_1": 0.09168432009326676,
        "avg_reward": 0.0890598227043771,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 909,
        "pass_at_1": 0.09848824403931097,
        "avg_reward": 0.008175410164684205,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 1010,
        "pass_at_1": 0.15082012302087433,
        "avg_reward": 0.10936728339237269,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1111,
        "pass_at_1": 0.12786762580848063,
        "avg_reward": 0.031056691336111678,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1212,
        "pass_at_1": 0.12079132198268795,
        "avg_reward": 0.10217918707164368,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1313,
        "pass_at_1": 0.11397316116956432,
        "avg_reward": 0.10996342985293507,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1414,
        "pass_at_1": 0.13044620661575745,
        "avg_reward": 0.08977227780294213,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1515,
        "pass_at_1": 0.13604202454798597,
        "avg_reward": 0.20144752886383566,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1616,
        "pass_at_1": 0.15357352128292623,
        "avg_reward": 0.06997327057854597,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1717,
        "pass_at_1": 0.17621025728876094,
        "avg_reward": 0.07992602333245763,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1818,
        "pass_at_1": 0.16999909093393656,
        "avg_reward": 0.03801576655316048,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 1919,
        "pass_at_1": 0.1454646232148162,
        "avg_reward": 0.12621476036530915,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 2020,
        "pass_at_1": 0.19314526842715274,
        "avg_reward": 0.1630846288012207,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 2121,
        "pass_at_1": 0.18254812814228522,
        "avg_reward": 0.13098331773436375,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 2222,
        "pass_at_1": 0.16190936052789232,
        "avg_reward": 0.09353527800257841,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 2323,
        "pass_at_1": 0.18901475196654802,
        "avg_reward": 0.20406791288418422,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 2424,
        "pass_at_1": 0.2119715982420541,
        "avg_reward": 0.0814252708255066,
        "difficulty_1_ratio": 0.054488684549642924,
        "difficulty_2_ratio": 0.24420134200323332,
        "difficulty_3_ratio": 0.4026199468942474,
        "difficulty_4_ratio": 0.24420134200323332,
        "difficulty_5_ratio": 0.054488684549642924
      },
      {
        "timestep": 2525,
        "pass_at_1": 0.21857104377940367,
        "avg_reward": 0.1556027210027071,
        "difficulty_1_ratio": 0.016291910734624847,
        "difficulty_2_ratio": 0.12497928765460015,
        "difficulty_3_ratio": 0.3527033512649604,
        "difficulty_4_ratio": 0.3661732760034468,
        "difficulty_5_ratio": 0.1398521743423678
      },
      {
        "timestep": 2626,
        "pass_at_1": 0.20565343218891582,
        "avg_reward": 0.19510656019317607,
        "difficulty_1_ratio": 0.014439823367355656,
        "difficulty_2_ratio": 0.1162288430953594,
        "difficulty_3_ratio": 0.34416877595779866,
        "difficulty_4_ratio": 0.37491648580673986,
        "difficulty_5_ratio": 0.15024607177274654
      },
      {
        "timestep": 2727,
        "pass_at_1": 0.24702020831478103,
        "avg_reward": 0.24418017260763475,
        "difficulty_1_ratio": 0.012218327302669146,
        "difficulty_2_ratio": 0.10498325535696679,
        "difficulty_3_ratio": 0.33184389643032614,
        "difficulty_4_ratio": 0.38588078286713096,
        "difficulty_5_ratio": 0.165073738042907
      },
      {
        "timestep": 2828,
        "pass_at_1": 0.2169230430261858,
        "avg_reward": 0.15807781562838794,
        "difficulty_1_ratio": 0.009913147093465137,
        "difficulty_2_ratio": 0.09225064005743493,
        "difficulty_3_ratio": 0.3158149930158207,
        "difficulty_4_ratio": 0.39774215071368285,
        "difficulty_5_ratio": 0.18427906911959632
      },
      {
        "timestep": 2929,
        "pass_at_1": 0.24773121112676355,
        "avg_reward": 0.2469622252575288,
        "difficulty_1_ratio": 0.007760018351280176,
        "difficulty_2_ratio": 0.07909068287132516,
        "difficulty_3_ratio": 0.29654692178674946,
        "difficulty_4_ratio": 0.40904118087068214,
        "difficulty_5_ratio": 0.20756119611996313
      },
      {
        "timestep": 3030,
        "pass_at_1": 0.2390045002711823,
        "avg_reward": 0.181920651383755,
        "difficulty_1_ratio": 0.00590957184933243,
        "difficulty_2_ratio": 0.06645671547671815,
        "difficulty_3_ratio": 0.2749332380949103,
        "difficulty_4_ratio": 0.4184283859957229,
        "difficulty_5_ratio": 0.2342720885833161
      },
      {
        "timestep": 3131,
        "pass_at_1": 0.23401854783464296,
        "avg_reward": 0.12740450706368084,
        "difficulty_1_ratio": 0.0044234366536341566,
        "difficulty_2_ratio": 0.05506877089710349,
        "difficulty_3_ratio": 0.2522066146015487,
        "difficulty_4_ratio": 0.4249257796153269,
        "difficulty_5_ratio": 0.2633753982323869
      },
      {
        "timestep": 3232,
        "pass_at_1": 0.28001961135200454,
        "avg_reward": 0.2918276905101448,
        "difficulty_1_ratio": 0.0032937818280582443,
        "difficulty_2_ratio": 0.04535368508089252,
        "difficulty_3_ratio": 0.22973959398617683,
        "difficulty_4_ratio": 0.4281191321289578,
        "difficulty_5_ratio": 0.2934938069759146
      },
      {
        "timestep": 3333,
        "pass_at_1": 0.2700103670191985,
        "avg_reward": 0.26618493850996,
        "difficulty_1_ratio": 0.0024722539225482446,
        "difficulty_2_ratio": 0.03746068440111024,
        "difficulty_3_ratio": 0.20881604152186556,
        "difficulty_4_ratio": 0.4282107125631631,
        "difficulty_5_ratio": 0.32304030759131297
      },
      {
        "timestep": 3434,
        "pass_at_1": 0.2864131493057567,
        "avg_reward": 0.19687453171434915,
        "difficulty_1_ratio": 0.0018961158457144911,
        "difficulty_2_ratio": 0.03133140973471507,
        "difficulty_3_ratio": 0.19045857150804962,
        "difficulty_4_ratio": 0.4259186206842434,
        "difficulty_5_ratio": 0.35039528222727745
      },
      {
        "timestep": 3535,
        "pass_at_1": 0.29417710213708603,
        "avg_reward": 0.3122435100329673,
        "difficulty_1_ratio": 0.0015056169658766543,
        "difficulty_2_ratio": 0.026789686088424,
        "difficulty_3_ratio": 0.175358276208076,
        "difficulty_4_ratio": 0.42227019488557094,
        "difficulty_5_ratio": 0.3740762258520523
      },
      {
        "timestep": 3636,
        "pass_at_1": 0.29403065414334784,
        "avg_reward": 0.31345670610537857,
        "difficulty_1_ratio": 0.0012524233850038473,
        "difficulty_2_ratio": 0.023621859465310466,
        "difficulty_3_ratio": 0.16390134325095126,
        "difficulty_4_ratio": 0.4183660766360568,
        "difficulty_5_ratio": 0.3928582972626777
      },
      {
        "timestep": 3737,
        "pass_at_1": 0.2501696555801058,
        "avg_reward": 0.24123084968284583,
        "difficulty_1_ratio": 0.0011018868277803448,
        "difficulty_2_ratio": 0.021633707012814266,
        "difficulty_3_ratio": 0.15625373746114093,
        "difficulty_4_ratio": 0.4151790230064104,
        "difficulty_5_ratio": 0.40583164569185404
      },
      {
        "timestep": 3838,
        "pass_at_1": 0.31213235529817696,
        "avg_reward": 0.2347555167152482,
        "difficulty_1_ratio": 0.0010322931860183035,
        "difficulty_2_ratio": 0.02068358559081816,
        "difficulty_3_ratio": 0.15245936727836976,
        "difficulty_4_ratio": 0.41341660520999185,
        "difficulty_5_ratio": 0.41240814873480197
      },
      {
        "timestep": 3939,
        "pass_at_1": 0.32005298674705146,
        "avg_reward": 0.15666394366759653,
        "difficulty_1_ratio": 0.001033362574533033,
        "difficulty_2_ratio": 0.02069834621303522,
        "difficulty_3_ratio": 0.15251904715441822,
        "difficulty_4_ratio": 0.4134452797034622,
        "difficulty_5_ratio": 0.41230396435455147
      },
      {
        "timestep": 4040,
        "pass_at_1": 0.3216402217722719,
        "avg_reward": 0.27516780599340485,
        "difficulty_1_ratio": 0.001105253979564763,
        "difficulty_2_ratio": 0.021679152361382986,
        "difficulty_3_ratio": 0.1564328746274194,
        "difficulty_4_ratio": 0.41525920915243264,
        "difficulty_5_ratio": 0.4055235098792002
      },
      {
        "timestep": 4141,
        "pass_at_1": 0.3633870430624854,
        "avg_reward": 0.264796123536306,
        "difficulty_1_ratio": 0.0012585820768892396,
        "difficulty_2_ratio": 0.02370139964709112,
        "difficulty_3_ratio": 0.16419954975755394,
        "difficulty_4_ratio": 0.418480714620724,
        "difficulty_5_ratio": 0.3923597538977418
      },
      {
        "timestep": 4242,
        "pass_at_1": 0.3254245938091046,
        "avg_reward": 0.23525182286805685,
        "difficulty_1_ratio": 0.001515438901358441,
        "difficulty_2_ratio": 0.02690866798401823,
        "difficulty_3_ratio": 0.17577272552605308,
        "difficulty_4_ratio": 0.4223925910167582,
        "difficulty_5_ratio": 0.37341057657181215
      },
      {
        "timestep": 4343,
        "pass_at_1": 0.367627952202806,
        "avg_reward": 0.310539917245229,
        "difficulty_1_ratio": 0.0019108941032437861,
        "difficulty_2_ratio": 0.03149638910459275,
        "difficulty_3_ratio": 0.19098111826597575,
        "difficulty_4_ratio": 0.4260157102739871,
        "difficulty_5_ratio": 0.34959588825220067
      },
      {
        "timestep": 4444,
        "pass_at_1": 0.3464008291664554,
        "avg_reward": 0.30278403498883216,
        "difficulty_1_ratio": 0.0024936925676773474,
        "difficulty_2_ratio": 0.03767804281480519,
        "difficulty_3_ratio": 0.2094301856844532,
        "difficulty_4_ratio": 0.42824838946414634,
        "difficulty_5_ratio": 0.32214968946891787
      },
      {
        "timestep": 4545,
        "pass_at_1": 0.3665551713730763,
        "avg_reward": 0.34167638662510547,
        "difficulty_1_ratio": 0.003323844499126925,
        "difficulty_2_ratio": 0.045627461104830486,
        "difficulty_3_ratio": 0.23041854367730347,
        "difficulty_4_ratio": 0.4280692870521302,
        "difficulty_5_ratio": 0.29256086366660894
      },
      {
        "timestep": 4646,
        "pass_at_1": 0.35812268169562683,
        "avg_reward": 0.2701150380266131,
        "difficulty_1_ratio": 0.004463952486683914,
        "difficulty_2_ratio": 0.055397905274063235,
        "difficulty_3_ratio": 0.25291386667660937,
        "difficulty_4_ratio": 0.4247735415860251,
        "difficulty_5_ratio": 0.2624507339766185
      },
      {
        "timestep": 4747,
        "pass_at_1": 0.3717956397558158,
        "avg_reward": 0.2242607643980467,
        "difficulty_1_ratio": 0.005961543635767642,
        "difficulty_2_ratio": 0.06683240381041645,
        "difficulty_3_ratio": 0.27562649024852093,
        "difficulty_4_ratio": 0.41817719578473006,
        "difficulty_5_ratio": 0.2334023665205648
      },
      {
        "timestep": 4848,
        "pass_at_1": 0.3929499678564251,
        "avg_reward": 0.3274127378941346,
        "difficulty_1_ratio": 0.007822719184174324,
        "difficulty_2_ratio": 0.07949491055732377,
        "difficulty_3_ratio": 0.29718468692891836,
        "difficulty_4_ratio": 0.4087135617359425,
        "difficulty_5_ratio": 0.206784121593641
      },
      {
        "timestep": 4949,
        "pass_at_1": 0.3944274524064829,
        "avg_reward": 0.303812605256429,
        "difficulty_1_ratio": 0.009983298952962209,
        "difficulty_2_ratio": 0.09265686413080075,
        "difficulty_3_ratio": 0.3163636937049174,
        "difficulty_4_ratio": 0.3973755986640315,
        "difficulty_5_ratio": 0.1836205445472881
      },
      {
        "timestep": 5050,
        "pass_at_1": 0.373215838071042,
        "avg_reward": 0.27754040431856564
      },
      {
        "timestep": 5151,
        "pass_at_1": 0.4017605190933683,
        "avg_reward": 0.28129455181361374
      },
      {
        "timestep": 5252,
        "pass_at_1": 0.41236764857882685,
        "avg_reward": 0.35009666170378845
      },
      {
        "timestep": 5353,
        "pass_at_1": 0.46017662956376015,
        "avg_reward": 0.3768701942926001
      },
      {
        "timestep": 5454,
        "pass_at_1": 0.4343389628191408,
        "avg_reward": 0.3437488744670043
      },
      {
        "timestep": 5555,
        "pass_at_1": 0.397418077602494,
        "avg_reward": 0.3166087683095344
      },
      {
        "timestep": 5656,
        "pass_at_1": 0.443469678826402,
        "avg_reward": 0.4779378486853859
      },
      {
        "timestep": 5757,
        "pass_at_1": 0.4447514904615515,
        "avg_reward": 0.37087855948592185
      },
      {
        "timestep": 5858,
        "pass_at_1": 0.4540967196318868,
        "avg_reward": 0.3048434738245328
      },
      {
        "timestep": 5959,
        "pass_at_1": 0.48369531911121083,
        "avg_reward": 0.42455290692330744
      },
      {
        "timestep": 6060,
        "pass_at_1": 0.48256061952690665,
        "avg_reward": 0.3405791228817884
      },
      {
        "timestep": 6161,
        "pass_at_1": 0.5005482246015526,
        "avg_reward": 0.33034602654162804
      },
      {
        "timestep": 6262,
        "pass_at_1": 0.4898315757885757,
        "avg_reward": 0.5013880419213596
      },
      {
        "timestep": 6363,
        "pass_at_1": 0.46373448880935875,
        "avg_reward": 0.34267270456734844
      },
      {
        "timestep": 6464,
        "pass_at_1": 0.49083708933722103,
        "avg_reward": 0.3674958887639669
      },
      {
        "timestep": 6565,
        "pass_at_1": 0.4629774955149286,
        "avg_reward": 0.37381014515224426
      },
      {
        "timestep": 6666,
        "pass_at_1": 0.47773942597689695,
        "avg_reward": 0.40587116231327663
      },
      {
        "timestep": 6767,
        "pass_at_1": 0.4854403299013335,
        "avg_reward": 0.46584898417194376
      },
      {
        "timestep": 6868,
        "pass_at_1": 0.4928565273299796,
        "avg_reward": 0.37818214605369993
      },
      {
        "timestep": 6969,
        "pass_at_1": 0.5293353840465501,
        "avg_reward": 0.36192509141554235
      },
      {
        "timestep": 7070,
        "pass_at_1": 0.5220098497559862,
        "avg_reward": 0.4829650175189104
      },
      {
        "timestep": 7171,
        "pass_at_1": 0.48956052833401703,
        "avg_reward": 0.40088011559382886
      },
      {
        "timestep": 7272,
        "pass_at_1": 0.5310133318907984,
        "avg_reward": 0.4639018091015042
      },
      {
        "timestep": 7373,
        "pass_at_1": 0.5050403171000676,
        "avg_reward": 0.33800942302584025
      },
      {
        "timestep": 7474,
        "pass_at_1": 0.5440424192498975,
        "avg_reward": 0.4500831690615773
      },
      {
        "timestep": 7575,
        "pass_at_1": 0.542300906981251,
        "avg_reward": 0.4511631360598496
      },
      {
        "timestep": 7676,
        "pass_at_1": 0.5272439805100732,
        "avg_reward": 0.4334078692661087
      },
      {
        "timestep": 7777,
        "pass_at_1": 0.5501282023984896,
        "avg_reward": 0.4043849910174733
      },
      {
        "timestep": 7878,
        "pass_at_1": 0.5848763769933182,
        "avg_reward": 0.49159274764024397
      },
      {
        "timestep": 7979,
        "pass_at_1": 0.5269039032507387,
        "avg_reward": 0.4543508030322824
      },
      {
        "timestep": 8080,
        "pass_at_1": 0.5342835517175137,
        "avg_reward": 0.4667810715611336
      },
      {
        "timestep": 8181,
        "pass_at_1": 0.5798776665885219,
        "avg_reward": 0.422868017353232
      },
      {
        "timestep": 8282,
        "pass_at_1": 0.5787864819114005,
        "avg_reward": 0.4836682318759453
      },
      {
        "timestep": 8383,
        "pass_at_1": 0.578661307357545,
        "avg_reward": 0.5577686950187334
      },
      {
        "timestep": 8484,
        "pass_at_1": 0.559904749567981,
        "avg_reward": 0.41023699143651027
      },
      {
        "timestep": 8585,
        "pass_at_1": 0.5495092203990847,
        "avg_reward": 0.39881686207099587
      },
      {
        "timestep": 8686,
        "pass_at_1": 0.5681423806835675,
        "avg_reward": 0.4715715032876862
      },
      {
        "timestep": 8787,
        "pass_at_1": 0.5775043477166417,
        "avg_reward": 0.5033626406251146
      },
      {
        "timestep": 8888,
        "pass_at_1": 0.5744211732587482,
        "avg_reward": 0.5322136424648645
      },
      {
        "timestep": 8989,
        "pass_at_1": 0.5709663305909718,
        "avg_reward": 0.5927815228022584
      },
      {
        "timestep": 9090,
        "pass_at_1": 0.5907820736565318,
        "avg_reward": 0.42976778110441133
      },
      {
        "timestep": 9191,
        "pass_at_1": 0.5587742149752787,
        "avg_reward": 0.47114299274238225
      },
      {
        "timestep": 9292,
        "pass_at_1": 0.577563323502461,
        "avg_reward": 0.4977506835065734
      },
      {
        "timestep": 9393,
        "pass_at_1": 0.5932580604370521,
        "avg_reward": 0.4709650027167981
      },
      {
        "timestep": 9494,
        "pass_at_1": 0.5685413522057161,
        "avg_reward": 0.3790907205302797
      },
      {
        "timestep": 9595,
        "pass_at_1": 0.5781569449151632,
        "avg_reward": 0.5053454956483042
      },
      {
        "timestep": 9696,
        "pass_at_1": 0.5929080744154287,
        "avg_reward": 0.4120395205967436
      },
      {
        "timestep": 9797,
        "pass_at_1": 0.5935604793996371,
        "avg_reward": 0.49411425250615154
      },
      {
        "timestep": 9898,
        "pass_at_1": 0.5738247731795443,
        "avg_reward": 0.4667460738409118
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.5940081757847141,
        "avg_reward": 0.4180580257362401
      }
    ],
    "eval_metrics": [
      {
        "timestep": 0,
        "pass_at_1": 0.009934283060224654,
        "avg_reward": 0.0010342113896204897,
        "difficulty_1_ratio": 0.2570583684642447,
        "difficulty_2_ratio": 0.4238175998984713,
        "difficulty_3_ratio": 0.2570583684642447,
        "difficulty_4_ratio": 0.057357474922920995,
        "difficulty_5_ratio": 0.0047081882501182806
      },
      {
        "timestep": 10000,
        "pass_at_1": 0.5940081757847141,
        "avg_reward": 0.4180580257362401
      }
    ],
    "timing_metrics": [
      {
        "timestep": 0,
        "throughput": 11.5,
        "update": 1,
        "cumulative_wall_time": 4.3478260869565215
      },
      {
        "timestep": 101,
        "throughput": 12.65,
        "update": 2,
        "cumulative_wall_time": 8.695652173913043
      },
      {
        "timestep": 202,
        "throughput": 13.799999999999999,
        "update": 3,
        "cumulative_wall_time": 13.043478260869565
      },
      {
        "timestep": 303,
        "throughput": 14.950000000000001,
        "update": 4,
        "cumulative_wall_time": 17.391304347826086
      },
      {
        "timestep": 404,
        "throughput": 16.099999999999998,
        "update": 5,
        "cumulative_wall_time": 21.73913043478261
      },
      {
        "timestep": 505,
        "throughput": 17.25,
        "update": 6,
        "cumulative_wall_time": 26.086956521739133
      },
      {
        "timestep": 606,
        "throughput": 18.400000000000002,
        "update": 7,
        "cumulative_wall_time": 30.434782608695656
      },
      {
        "timestep": 707,
        "throughput": 19.55,
        "update": 8,
        "cumulative_wall_time": 34.78260869565218
      },
      {
        "timestep": 808,
        "throughput": 20.7,
        "update": 9,
        "cumulative_wall_time": 39.1304347826087
      },
      {
        "timestep": 909,
        "throughput": 21.849999999999998,
        "update": 10,
        "cumulative_wall_time": 43.478260869565226
      },
      {
        "timestep": 1010,
        "throughput": 23.82291092880105,
        "update": 11,
        "cumulative_wall_time": 47.82608695652175
      },
      {
        "timestep": 1111,
        "throughput": 24.289804410646937,
        "update": 12,
        "cumulative_wall_time": 52.17391304347827
      },
      {
        "timestep": 1212,
        "throughput": 25.49101785930314,
        "update": 13,
        "cumulative_wall_time": 56.521739130434796
      },
      {
        "timestep": 1313,
        "throughput": 25.423744719680275,
        "update": 14,
        "cumulative_wall_time": 60.86956521739132
      },
      {
        "timestep": 1414,
        "throughput": 19.831360453698693,
        "update": 15,
        "cumulative_wall_time": 65.21739130434784
      },
      {
        "timestep": 1515,
        "throughput": 20.843002408195215,
        "update": 16,
        "cumulative_wall_time": 69.56521739130436
      },
      {
        "timestep": 1616,
        "throughput": 24.184581114579917,
        "update": 17,
        "cumulative_wall_time": 73.91304347826087
      },
      {
        "timestep": 1717,
        "throughput": 24.18170768709808,
        "update": 18,
        "cumulative_wall_time": 78.26086956521739
      },
      {
        "timestep": 1818,
        "throughput": 24.184609678503907,
        "update": 19,
        "cumulative_wall_time": 82.6086956521739
      },
      {
        "timestep": 1919,
        "throughput": 31.86128242850586,
        "update": 20,
        "cumulative_wall_time": 86.95652173913042
      },
      {
        "timestep": 2020,
        "throughput": 24.313048174594286,
        "update": 21,
        "cumulative_wall_time": 91.30434782608694
      },
      {
        "timestep": 2121,
        "throughput": 25.611800972415374,
        "update": 22,
        "cumulative_wall_time": 95.65217391304346
      },
      {
        "timestep": 2222,
        "throughput": 25.194204056034366,
        "update": 23,
        "cumulative_wall_time": 99.99999999999997
      },
      {
        "timestep": 2323,
        "throughput": 24.498199878003334,
        "update": 24,
        "cumulative_wall_time": 104.34782608695649
      },
      {
        "timestep": 2424,
        "throughput": 22.274880737327205,
        "update": 25,
        "cumulative_wall_time": 108.695652173913
      },
      {
        "timestep": 2525,
        "throughput": 24.745629207134517,
        "update": 26,
        "cumulative_wall_time": 113.04347826086952
      },
      {
        "timestep": 2626,
        "throughput": 21.222502006563587,
        "update": 27,
        "cumulative_wall_time": 117.39130434782604
      },
      {
        "timestep": 2727,
        "throughput": 22.45531720449798,
        "update": 28,
        "cumulative_wall_time": 121.73913043478255
      },
      {
        "timestep": 2828,
        "throughput": 21.883663839993062,
        "update": 29,
        "cumulative_wall_time": 126.08695652173907
      },
      {
        "timestep": 2929,
        "throughput": 23.18831052058854,
        "update": 30,
        "cumulative_wall_time": 130.4347826086956
      },
      {
        "timestep": 3030,
        "throughput": 28.32371470334907,
        "update": 31,
        "cumulative_wall_time": 134.78260869565213
      },
      {
        "timestep": 3131,
        "throughput": 18.70529005703898,
        "update": 32,
        "cumulative_wall_time": 139.13043478260866
      },
      {
        "timestep": 3232,
        "throughput": 24.578398437861377,
        "update": 33,
        "cumulative_wall_time": 143.4782608695652
      },
      {
        "timestep": 3333,
        "throughput": 19.2907534962638,
        "update": 34,
        "cumulative_wall_time": 147.82608695652172
      },
      {
        "timestep": 3434,
        "throughput": 21.9145567086843,
        "update": 35,
        "cumulative_wall_time": 152.17391304347825
      },
      {
        "timestep": 3535,
        "throughput": 25.504586373024942,
        "update": 36,
        "cumulative_wall_time": 156.52173913043478
      },
      {
        "timestep": 3636,
        "throughput": 23.147844043919562,
        "update": 37,
        "cumulative_wall_time": 160.8695652173913
      },
      {
        "timestep": 3737,
        "throughput": 20.521187010762596,
        "update": 38,
        "cumulative_wall_time": 165.21739130434784
      },
      {
        "timestep": 3838,
        "throughput": 21.354801468702075,
        "update": 39,
        "cumulative_wall_time": 169.56521739130437
      },
      {
        "timestep": 3939,
        "throughput": 24.56307482254975,
        "update": 40,
        "cumulative_wall_time": 173.9130434782609
      },
      {
        "timestep": 4040,
        "throughput": 21.320156747050586,
        "update": 41,
        "cumulative_wall_time": 178.26086956521743
      },
      {
        "timestep": 4141,
        "throughput": 23.497854756038546,
        "update": 42,
        "cumulative_wall_time": 182.60869565217396
      },
      {
        "timestep": 4242,
        "throughput": 23.10481523177877,
        "update": 43,
        "cumulative_wall_time": 186.9565217391305
      },
      {
        "timestep": 4343,
        "throughput": 21.50131920050662,
        "update": 44,
        "cumulative_wall_time": 191.30434782608702
      },
      {
        "timestep": 4444,
        "throughput": 27.93107140544825,
        "update": 45,
        "cumulative_wall_time": 195.65217391304355
      },
      {
        "timestep": 4545,
        "throughput": 24.458013751331425,
        "update": 46,
        "cumulative_wall_time": 200.00000000000009
      },
      {
        "timestep": 4646,
        "throughput": 18.342172050687505,
        "update": 47,
        "cumulative_wall_time": 204.34782608695662
      },
      {
        "timestep": 4747,
        "throughput": 23.428844923969685,
        "update": 48,
        "cumulative_wall_time": 208.69565217391315
      },
      {
        "timestep": 4848,
        "throughput": 21.477891131032706,
        "update": 49,
        "cumulative_wall_time": 213.04347826086968
      },
      {
        "timestep": 4949,
        "throughput": 24.960596670031315,
        "update": 50,
        "cumulative_wall_time": 217.3913043478262
      },
      {
        "timestep": 5050,
        "throughput": 21.17720230160479,
        "update": 51,
        "cumulative_wall_time": 221.73913043478274
      },
      {
        "timestep": 5151,
        "throughput": 22.73610618462613,
        "update": 52,
        "cumulative_wall_time": 226.08695652173927
      },
      {
        "timestep": 5252,
        "throughput": 24.16147074165505,
        "update": 53,
        "cumulative_wall_time": 230.4347826086958
      },
      {
        "timestep": 5353,
        "throughput": 24.99123694659128,
        "update": 54,
        "cumulative_wall_time": 234.78260869565233
      },
      {
        "timestep": 5454,
        "throughput": 20.239318263771715,
        "update": 55,
        "cumulative_wall_time": 239.13043478260886
      },
      {
        "timestep": 5555,
        "throughput": 22.23064715756582,
        "update": 56,
        "cumulative_wall_time": 243.4782608695654
      },
      {
        "timestep": 5656,
        "throughput": 21.907625784329802,
        "update": 57,
        "cumulative_wall_time": 247.82608695652192
      },
      {
        "timestep": 5757,
        "throughput": 21.497342765080464,
        "update": 58,
        "cumulative_wall_time": 252.17391304347845
      },
      {
        "timestep": 5858,
        "throughput": 27.06054475264652,
        "update": 59,
        "cumulative_wall_time": 256.521739130435
      },
      {
        "timestep": 5959,
        "throughput": 23.9314579352102,
        "update": 60,
        "cumulative_wall_time": 260.8695652173915
      },
      {
        "timestep": 6060,
        "throughput": 20.099966905029394,
        "update": 61,
        "cumulative_wall_time": 265.217391304348
      },
      {
        "timestep": 6161,
        "throughput": 25.111082478225985,
        "update": 62,
        "cumulative_wall_time": 269.5652173913045
      },
      {
        "timestep": 6262,
        "throughput": 27.880959253129056,
        "update": 63,
        "cumulative_wall_time": 273.913043478261
      },
      {
        "timestep": 6363,
        "throughput": 25.37467009926764,
        "update": 64,
        "cumulative_wall_time": 278.2608695652175
      },
      {
        "timestep": 6464,
        "throughput": 19.50544907830577,
        "update": 65,
        "cumulative_wall_time": 282.608695652174
      },
      {
        "timestep": 6565,
        "throughput": 21.88626163240762,
        "update": 66,
        "cumulative_wall_time": 286.9565217391305
      },
      {
        "timestep": 6666,
        "throughput": 25.91389564312923,
        "update": 67,
        "cumulative_wall_time": 291.304347826087
      },
      {
        "timestep": 6767,
        "throughput": 21.372360229076804,
        "update": 68,
        "cumulative_wall_time": 295.6521739130435
      },
      {
        "timestep": 6868,
        "throughput": 24.020784684736324,
        "update": 69,
        "cumulative_wall_time": 300.0
      },
      {
        "timestep": 6969,
        "throughput": 24.781658322887477,
        "update": 70,
        "cumulative_wall_time": 304.3478260869565
      },
      {
        "timestep": 7070,
        "throughput": 20.86805991537041,
        "update": 71,
        "cumulative_wall_time": 308.695652173913
      },
      {
        "timestep": 7171,
        "throughput": 22.86309168105786,
        "update": 72,
        "cumulative_wall_time": 313.0434782608695
      },
      {
        "timestep": 7272,
        "throughput": 15.545085117841133,
        "update": 73,
        "cumulative_wall_time": 317.391304347826
      },
      {
        "timestep": 7373,
        "throughput": 20.643908424931134,
        "update": 74,
        "cumulative_wall_time": 321.7391304347825
      },
      {
        "timestep": 7474,
        "throughput": 22.419093251795733,
        "update": 75,
        "cumulative_wall_time": 326.086956521739
      },
      {
        "timestep": 7575,
        "throughput": 20.130098681480845,
        "update": 76,
        "cumulative_wall_time": 330.4347826086955
      },
      {
        "timestep": 7676,
        "throughput": 26.75454599904276,
        "update": 77,
        "cumulative_wall_time": 334.782608695652
      },
      {
        "timestep": 7777,
        "throughput": 19.710674830690543,
        "update": 78,
        "cumulative_wall_time": 339.1304347826085
      },
      {
        "timestep": 7878,
        "throughput": 21.987897680596937,
        "update": 79,
        "cumulative_wall_time": 343.478260869565
      },
      {
        "timestep": 7979,
        "throughput": 23.300703327758008,
        "update": 80,
        "cumulative_wall_time": 347.8260869565215
      },
      {
        "timestep": 8080,
        "throughput": 26.314928564852067,
        "update": 81,
        "cumulative_wall_time": 352.173913043478
      },
      {
        "timestep": 8181,
        "throughput": 19.69751705228729,
        "update": 82,
        "cumulative_wall_time": 356.5217391304345
      },
      {
        "timestep": 8282,
        "throughput": 25.675276629956404,
        "update": 83,
        "cumulative_wall_time": 360.869565217391
      },
      {
        "timestep": 8383,
        "throughput": 23.02353604034505,
        "update": 84,
        "cumulative_wall_time": 365.21739130434753
      },
      {
        "timestep": 8484,
        "throughput": 20.74253010258971,
        "update": 85,
        "cumulative_wall_time": 369.56521739130403
      },
      {
        "timestep": 8585,
        "throughput": 24.062837990805523,
        "update": 86,
        "cumulative_wall_time": 373.91304347826053
      },
      {
        "timestep": 8686,
        "throughput": 23.45783729981898,
        "update": 87,
        "cumulative_wall_time": 378.26086956521704
      },
      {
        "timestep": 8787,
        "throughput": 21.619501182534773,
        "update": 88,
        "cumulative_wall_time": 382.60869565217354
      },
      {
        "timestep": 8888,
        "throughput": 23.16054479547704,
        "update": 89,
        "cumulative_wall_time": 386.95652173913004
      },
      {
        "timestep": 8989,
        "throughput": 22.11377872721795,
        "update": 90,
        "cumulative_wall_time": 391.30434782608654
      },
      {
        "timestep": 9090,
        "throughput": 23.26108989407787,
        "update": 91,
        "cumulative_wall_time": 395.65217391304304
      },
      {
        "timestep": 9191,
        "throughput": 24.522900551398408,
        "update": 92,
        "cumulative_wall_time": 399.99999999999955
      },
      {
        "timestep": 9292,
        "throughput": 26.64783867713431,
        "update": 93,
        "cumulative_wall_time": 404.34782608695605
      },
      {
        "timestep": 9393,
        "throughput": 20.15302435269825,
        "update": 94,
        "cumulative_wall_time": 408.69565217391255
      },
      {
        "timestep": 9494,
        "throughput": 27.905976761709418,
        "update": 95,
        "cumulative_wall_time": 413.04347826086905
      },
      {
        "timestep": 9595,
        "throughput": 18.510198061098247,
        "update": 96,
        "cumulative_wall_time": 417.39130434782555
      },
      {
        "timestep": 9696,
        "throughput": 22.650894281418157,
        "update": 97,
        "cumulative_wall_time": 421.73913043478206
      },
      {
        "timestep": 9797,
        "throughput": 24.353129574914526,
        "update": 98,
        "cumulative_wall_time": 426.08695652173856
      },
      {
        "timestep": 9898,
        "throughput": 23.646281295790573,
        "update": 99,
        "cumulative_wall_time": 430.43478260869506
      },
      {
        "timestep": 10000,
        "throughput": 21.567791104412635,
        "update": 100,
        "cumulative_wall_time": 434.78260869565156
      }
    ],
    "scheduler_stats": {
      "total_experiences": 10000,
      "total_updates": 500,
      "policy_version": 500,
      "buffer_size": 1024,
      "curriculum": {
        "level_1": {
          "num_pulls": 1200,
          "success_rate": 0.85,
          "mean_reward": 0.7608375549928545,
          "recent_gradient": 0.009013998130682335
        },
        "level_2": {
          "num_pulls": 2800,
          "success_rate": 0.65,
          "mean_reward": 0.5732127048611159,
          "recent_gradient": 0.02169920419404205
        },
        "level_3": {
          "num_pulls": 3500,
          "success_rate": 0.45,
          "mean_reward": 0.412140309719301,
          "recent_gradient": 0.028614180809478692
        },
        "level_4": {
          "num_pulls": 1800,
          "success_rate": 0.28,
          "mean_reward": 0.2699919975086651,
          "recent_gradient": 0.02061459904175322
        },
        "level_5": {
          "num_pulls": 700,
          "success_rate": 0.15,
          "mean_reward": 0.1512572423767792,
          "recent_gradient": 0.011259257683847225
        },
        "total_steps": 10000
      },
      "staleness": {
        "discard_rate": 0.05
      },
      "workers": {
        "0": {
          "completed_tasks": 2500,
          "avg_throughput": 4.5855024945389635
        },
        "1": {
          "completed_tasks": 2500,
          "avg_throughput": 4.719909479901515
        },
        "2": {
          "completed_tasks": 2500,
          "avg_throughput": 5.373646802561631
        },
        "3": {
          "completed_tasks": 2500,
          "avg_throughput": 5.3051851327167325
        }
      }
    },
    "final_pass_at_1": 0.6007867065901504,
    "final_pass_at_1_std": 0.015580873953549118,
    "avg_throughput": 22.39410142354676,
    "avg_throughput_std": 0.20786108728783032,
    "wall_time_mean": 0.0,
    "num_runs": 3
  }
}