{
  "experiment_name": "sync_seed42",
  "total_timesteps": 10000,
  "total_time": 1000.0,
  "avg_throughput": 10,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.02204467985292294,
      "avg_reward": 0.09378723670273963,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.013498750687351464,
      "avg_reward": -0.0009078472975778563,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.0588569835828751,
      "avg_reward": 0.08545732332394551,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.026974148644937326,
      "avg_reward": 0.0487073210952481,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.11188938627252211,
      "avg_reward": 0.06622502133950484,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.1286986191500568,
      "avg_reward": 0.007294883087155535,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.09209970082692284,
      "avg_reward": 0.04556538419948965,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.1091166533173175,
      "avg_reward": 0.1030056892836177,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.11402398343489357,
      "avg_reward": 0.020604001681150286,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.16434398885660495,
      "avg_reward": 0.12018637606095718,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.139262825404694,
      "avg_reward": 0.04017285101308238,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.12993984551369905,
      "avg_reward": 0.10949800589645256,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.12075610118839061,
      "avg_reward": 0.1153897818679961,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.13474410068278367,
      "avg_reward": 0.09321059305656311,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.13773522006634492,
      "avg_reward": 0.20280208527852284,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.15254256135042266,
      "avg_reward": 0.0691485026325431,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.17233628607243612,
      "avg_reward": 0.0768268463593978,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.16316427676293016,
      "avg_reward": 0.03254791521635535,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.13555259727470384,
      "avg_reward": 0.11828513961321925,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.1800415766296463,
      "avg_reward": 0.15260167536321556,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.16614069344378007,
      "avg_reward": 0.11785736997555962,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.14208895268490274,
      "avg_reward": 0.07767895172818676,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.16567546145192658,
      "avg_reward": 0.18539648047248705,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.18501131080948016,
      "avg_reward": 0.05985704087944743,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.18789191196133653,
      "avg_reward": 0.1310594155482534,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.17116233985119067,
      "avg_reward": 0.16751368632299593,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.2086292242750017,
      "avg_reward": 0.21346738537581128,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.17454985967813402,
      "avg_reward": 0.12417926894994648,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.2012995640034876,
      "avg_reward": 0.20981690755890806,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.18844456452853195,
      "avg_reward": 0.1414727027896347,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.17926730774691252,
      "avg_reward": 0.0836035149934965,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.22102119908286716,
      "avg_reward": 0.24462896069483486,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.20671636716370603,
      "avg_reward": 0.21554973862556606,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.21878286599083643,
      "avg_reward": 0.14277030506241295,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.22217778581521247,
      "avg_reward": 0.25464405697546844,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.21763768561202113,
      "avg_reward": 0.25234233128031724,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.16936668520218948,
      "avg_reward": 0.17658847338051278,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.2269113958776088,
      "avg_reward": 0.16657874917879367,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.230414459022494,
      "avg_reward": 0.08495312148795056,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.22759295201866866,
      "avg_reward": 0.19992999019052227,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.2649482128274434,
      "avg_reward": 0.18604505934827237,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.2226196423474698,
      "avg_reward": 0.15300786169874903,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.26049043269870104,
      "avg_reward": 0.22482990164194508,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.23497222033764187,
      "avg_reward": 0.21364114792578132,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.2508846465286318,
      "avg_reward": 0.2491399667495499,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.2382668377562136,
      "avg_reward": 0.17423036287508248,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.24781818913895956,
      "avg_reward": 0.12507880390456172,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.26492139647111035,
      "avg_reward": 0.22498988078588275,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.26242464728725085,
      "avg_reward": 0.19821036116104335,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.23732168840832996,
      "avg_reward": 0.16882508458839604
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.26206349458218603,
      "avg_reward": 0.1695369322046679
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.2689613591116262,
      "avg_reward": 0.2353716301300279
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.31315937033647206,
      "avg_reward": 0.2592563869107696
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.2838132489040948,
      "avg_reward": 0.2233283033349675
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.24349017197168576,
      "avg_reward": 0.19346644380488778
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.286249117687707,
      "avg_reward": 0.35216139977442995
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.2843506096041752,
      "avg_reward": 0.2425578548000208
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.29063018527135565,
      "avg_reward": 0.17407024633610793
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.3172796664847354,
      "avg_reward": 0.29142038482212707
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.31331380222338434,
      "avg_reward": 0.20518166903897056
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.328589177323256,
      "avg_reward": 0.19277878871899073
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.3152797929400121,
      "avg_reward": 0.36174661564250865
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.28670962099892855,
      "avg_reward": 0.20105281031900424
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.31145855956480145,
      "avg_reward": 0.2239930649460312
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.28136413650853703,
      "avg_reward": 0.228519457947131
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.2940091398387658,
      "avg_reward": 0.25888693340277175
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.2997097709320596,
      "avg_reward": 0.3172645369965247
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.3052408086222935,
      "avg_reward": 0.22808957108755104
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.33994780818042114,
      "avg_reward": 0.21041503072263917
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.3309616636863902,
      "avg_reward": 0.3301264686632336
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.296960702343266,
      "avg_reward": 0.24680025480122803
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.3369683622798666,
      "avg_reward": 0.30866583341275877
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.30965405211832914,
      "avg_reward": 0.18170041104044948
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.3474159076101437,
      "avg_reward": 0.2927819597497743
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.34453226817643623,
      "avg_reward": 0.29294822501599777
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.32842829603925,
      "avg_reward": 0.2743553216894502
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.3503574269208782,
      "avg_reward": 0.24456837063538417
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.3842392683602437,
      "avg_reward": 0.33108306073378435
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.32548597031390797,
      "avg_reward": 0.29321645668281787
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.33216701877735544,
      "avg_reward": 0.30508784520900695
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.37714145332654914,
      "avg_reward": 0.2606790467436538
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.37550619764422166,
      "avg_reward": 0.32104400446220227
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.3749092584557008,
      "avg_reward": 0.394767055897258
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.3557499588987032,
      "avg_reward": 0.2469131589010881
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.3450174576768837,
      "avg_reward": 0.23522345189323507
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.3633762026448835,
      "avg_reward": 0.307758560856739
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.3725231470733046,
      "avg_reward": 0.3393776801104449
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.36928123542849695,
      "avg_reward": 0.3681016922006634
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.36572089725064744,
      "avg_reward": 0.4285851761299989
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.38548141221378884,
      "avg_reward": 0.265527251950217
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.35346569310683645,
      "avg_reward": 0.30689617524762847
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.37229148796024414,
      "avg_reward": 0.3335332150727999
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.3880647193773438,
      "avg_reward": 0.30681032986903145
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.36346566035005884,
      "avg_reward": 0.21503016704575384
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.37323549090466207,
      "avg_reward": 0.3414083324399033
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.3881749697719242,
      "avg_reward": 0.24825303688194
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.38904744855753187,
      "avg_reward": 0.33050382783246735
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.3695612441006199,
      "avg_reward": 0.30333525057777233
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3900213707148276,
      "avg_reward": 0.25486858168033094
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3900213707148276,
      "avg_reward": 0.25486858168033094
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 5.0,
      "update": 1,
      "cumulative_wall_time": 10.0
    },
    {
      "timestep": 101,
      "throughput": 5.5,
      "update": 2,
      "cumulative_wall_time": 20.0
    },
    {
      "timestep": 202,
      "throughput": 6.0,
      "update": 3,
      "cumulative_wall_time": 30.0
    },
    {
      "timestep": 303,
      "throughput": 6.5,
      "update": 4,
      "cumulative_wall_time": 40.0
    },
    {
      "timestep": 404,
      "throughput": 7.0,
      "update": 5,
      "cumulative_wall_time": 50.0
    },
    {
      "timestep": 505,
      "throughput": 7.5,
      "update": 6,
      "cumulative_wall_time": 60.0
    },
    {
      "timestep": 606,
      "throughput": 8.0,
      "update": 7,
      "cumulative_wall_time": 70.0
    },
    {
      "timestep": 707,
      "throughput": 8.5,
      "update": 8,
      "cumulative_wall_time": 80.0
    },
    {
      "timestep": 808,
      "throughput": 9.0,
      "update": 9,
      "cumulative_wall_time": 90.0
    },
    {
      "timestep": 909,
      "throughput": 9.5,
      "update": 10,
      "cumulative_wall_time": 100.0
    },
    {
      "timestep": 1010,
      "throughput": 10.357787360348283,
      "update": 11,
      "cumulative_wall_time": 110.0
    },
    {
      "timestep": 1111,
      "throughput": 10.560784526368234,
      "update": 12,
      "cumulative_wall_time": 120.0
    },
    {
      "timestep": 1212,
      "throughput": 11.083051243175277,
      "update": 13,
      "cumulative_wall_time": 130.0
    },
    {
      "timestep": 1313,
      "throughput": 11.053802052034902,
      "update": 14,
      "cumulative_wall_time": 140.0
    },
    {
      "timestep": 1414,
      "throughput": 8.62233063204291,
      "update": 15,
      "cumulative_wall_time": 150.0
    },
    {
      "timestep": 1515,
      "throughput": 9.062174960084876,
      "update": 16,
      "cumulative_wall_time": 160.0
    },
    {
      "timestep": 1616,
      "throughput": 10.51503526720866,
      "update": 17,
      "cumulative_wall_time": 170.0
    },
    {
      "timestep": 1717,
      "throughput": 10.513785950912208,
      "update": 18,
      "cumulative_wall_time": 180.0
    },
    {
      "timestep": 1818,
      "throughput": 10.515047686306048,
      "update": 19,
      "cumulative_wall_time": 190.0
    },
    {
      "timestep": 1919,
      "throughput": 13.852731490654723,
      "update": 20,
      "cumulative_wall_time": 200.0
    },
    {
      "timestep": 2020,
      "throughput": 10.570890510693168,
      "update": 21,
      "cumulative_wall_time": 210.0
    },
    {
      "timestep": 2121,
      "throughput": 11.135565640180598,
      "update": 22,
      "cumulative_wall_time": 220.0
    },
    {
      "timestep": 2222,
      "throughput": 10.954001763493203,
      "update": 23,
      "cumulative_wall_time": 230.0
    },
    {
      "timestep": 2323,
      "throughput": 10.651391251305798,
      "update": 24,
      "cumulative_wall_time": 240.0
    },
    {
      "timestep": 2424,
      "throughput": 9.684730755359654,
      "update": 25,
      "cumulative_wall_time": 250.0
    },
    {
      "timestep": 2525,
      "throughput": 10.758969220493269,
      "update": 26,
      "cumulative_wall_time": 260.0
    },
    {
      "timestep": 2626,
      "throughput": 9.227174785462429,
      "update": 27,
      "cumulative_wall_time": 270.0
    },
    {
      "timestep": 2727,
      "throughput": 9.763181393259991,
      "update": 28,
      "cumulative_wall_time": 280.0
    },
    {
      "timestep": 2828,
      "throughput": 9.514636452170897,
      "update": 29,
      "cumulative_wall_time": 290.0
    },
    {
      "timestep": 2929,
      "throughput": 10.081874139386322,
      "update": 30,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 3030,
      "throughput": 12.314658566673508,
      "update": 31,
      "cumulative_wall_time": 310.0
    },
    {
      "timestep": 3131,
      "throughput": 8.132734807408251,
      "update": 32,
      "cumulative_wall_time": 320.0
    },
    {
      "timestep": 3232,
      "throughput": 10.686260190374512,
      "update": 33,
      "cumulative_wall_time": 330.0
    },
    {
      "timestep": 3333,
      "throughput": 8.387284128810348,
      "update": 34,
      "cumulative_wall_time": 340.0
    },
    {
      "timestep": 3434,
      "throughput": 9.528068134210567,
      "update": 35,
      "cumulative_wall_time": 350.0
    },
    {
      "timestep": 3535,
      "throughput": 11.088950596967367,
      "update": 36,
      "cumulative_wall_time": 360.0
    },
    {
      "timestep": 3636,
      "throughput": 10.064280019095461,
      "update": 37,
      "cumulative_wall_time": 370.0
    },
    {
      "timestep": 3737,
      "throughput": 8.922255222070694,
      "update": 38,
      "cumulative_wall_time": 380.0
    },
    {
      "timestep": 3838,
      "throughput": 9.284696290740031,
      "update": 39,
      "cumulative_wall_time": 390.0
    },
    {
      "timestep": 3939,
      "throughput": 10.679597748934675,
      "update": 40,
      "cumulative_wall_time": 400.0
    },
    {
      "timestep": 4040,
      "throughput": 9.269633368282864,
      "update": 41,
      "cumulative_wall_time": 410.0
    },
    {
      "timestep": 4141,
      "throughput": 10.216458589581976,
      "update": 42,
      "cumulative_wall_time": 420.0
    },
    {
      "timestep": 4242,
      "throughput": 10.045571839903813,
      "update": 43,
      "cumulative_wall_time": 430.0
    },
    {
      "timestep": 4343,
      "throughput": 9.348399652394182,
      "update": 44,
      "cumulative_wall_time": 440.0
    },
    {
      "timestep": 4444,
      "throughput": 12.143944089325327,
      "update": 45,
      "cumulative_wall_time": 450.0
    },
    {
      "timestep": 4545,
      "throughput": 10.633919022318011,
      "update": 46,
      "cumulative_wall_time": 460.0
    },
    {
      "timestep": 4646,
      "throughput": 7.974857413342393,
      "update": 47,
      "cumulative_wall_time": 470.0
    },
    {
      "timestep": 4747,
      "throughput": 10.186454314769428,
      "update": 48,
      "cumulative_wall_time": 480.0
    },
    {
      "timestep": 4848,
      "throughput": 9.338213535231612,
      "update": 49,
      "cumulative_wall_time": 490.0
    },
    {
      "timestep": 4949,
      "throughput": 10.852433334796224,
      "update": 50,
      "cumulative_wall_time": 500.0
    },
    {
      "timestep": 5050,
      "throughput": 9.2074792615673,
      "update": 51,
      "cumulative_wall_time": 510.0
    },
    {
      "timestep": 5151,
      "throughput": 9.8852635585331,
      "update": 52,
      "cumulative_wall_time": 520.0
    },
    {
      "timestep": 5252,
      "throughput": 10.504987278980458,
      "update": 53,
      "cumulative_wall_time": 530.0
    },
    {
      "timestep": 5353,
      "throughput": 10.865755194170122,
      "update": 54,
      "cumulative_wall_time": 540.0
    },
    {
      "timestep": 5454,
      "throughput": 8.799703592944223,
      "update": 55,
      "cumulative_wall_time": 550.0
    },
    {
      "timestep": 5555,
      "throughput": 9.665498764159052,
      "update": 56,
      "cumulative_wall_time": 560.0
    },
    {
      "timestep": 5656,
      "throughput": 9.525054688839043,
      "update": 57,
      "cumulative_wall_time": 570.0
    },
    {
      "timestep": 5757,
      "throughput": 9.34667076742629,
      "update": 58,
      "cumulative_wall_time": 580.0
    },
    {
      "timestep": 5858,
      "throughput": 11.765454240281096,
      "update": 59,
      "cumulative_wall_time": 590.0
    },
    {
      "timestep": 5959,
      "throughput": 10.404981710960957,
      "update": 60,
      "cumulative_wall_time": 600.0
    },
    {
      "timestep": 6060,
      "throughput": 8.739116045664954,
      "update": 61,
      "cumulative_wall_time": 610.0
    },
    {
      "timestep": 6161,
      "throughput": 10.917861947054776,
      "update": 62,
      "cumulative_wall_time": 620.0
    },
    {
      "timestep": 6262,
      "throughput": 12.122156197012632,
      "update": 63,
      "cumulative_wall_time": 630.0
    },
    {
      "timestep": 6363,
      "throughput": 11.032465260551147,
      "update": 64,
      "cumulative_wall_time": 640.0
    },
    {
      "timestep": 6464,
      "throughput": 8.480630034045987,
      "update": 65,
      "cumulative_wall_time": 650.0
    },
    {
      "timestep": 6565,
      "throughput": 9.515765927133748,
      "update": 66,
      "cumulative_wall_time": 660.0
    },
    {
      "timestep": 6666,
      "throughput": 11.266911149186623,
      "update": 67,
      "cumulative_wall_time": 670.0
    },
    {
      "timestep": 6767,
      "throughput": 9.292330534381218,
      "update": 68,
      "cumulative_wall_time": 680.0
    },
    {
      "timestep": 6868,
      "throughput": 10.443819428146227,
      "update": 69,
      "cumulative_wall_time": 690.0
    },
    {
      "timestep": 6969,
      "throughput": 10.774634053429338,
      "update": 70,
      "cumulative_wall_time": 700.0
    },
    {
      "timestep": 7070,
      "throughput": 9.073069528421918,
      "update": 71,
      "cumulative_wall_time": 710.0
    },
    {
      "timestep": 7171,
      "throughput": 9.940474643938199,
      "update": 72,
      "cumulative_wall_time": 720.0
    },
    {
      "timestep": 7272,
      "throughput": 6.758732659930927,
      "update": 73,
      "cumulative_wall_time": 730.0
    },
    {
      "timestep": 7373,
      "throughput": 8.97561235866571,
      "update": 74,
      "cumulative_wall_time": 740.0
    },
    {
      "timestep": 7474,
      "throughput": 9.74743184860684,
      "update": 75,
      "cumulative_wall_time": 750.0
    },
    {
      "timestep": 7575,
      "throughput": 8.75221681803515,
      "update": 76,
      "cumulative_wall_time": 760.0
    },
    {
      "timestep": 7676,
      "throughput": 11.632411303931637,
      "update": 77,
      "cumulative_wall_time": 770.0
    },
    {
      "timestep": 7777,
      "throughput": 8.569858622039368,
      "update": 78,
      "cumulative_wall_time": 780.0
    },
    {
      "timestep": 7878,
      "throughput": 9.559955513303017,
      "update": 79,
      "cumulative_wall_time": 790.0
    },
    {
      "timestep": 7979,
      "throughput": 10.13074057728609,
      "update": 80,
      "cumulative_wall_time": 800.0
    },
    {
      "timestep": 8080,
      "throughput": 11.441273289066116,
      "update": 81,
      "cumulative_wall_time": 810.0
    },
    {
      "timestep": 8181,
      "throughput": 8.564137848820561,
      "update": 82,
      "cumulative_wall_time": 820.0
    },
    {
      "timestep": 8282,
      "throughput": 11.163163752154958,
      "update": 83,
      "cumulative_wall_time": 830.0
    },
    {
      "timestep": 8383,
      "throughput": 10.010233061019587,
      "update": 84,
      "cumulative_wall_time": 840.0
    },
    {
      "timestep": 8484,
      "throughput": 9.018491348952049,
      "update": 85,
      "cumulative_wall_time": 850.0
    },
    {
      "timestep": 8585,
      "throughput": 10.462103474263271,
      "update": 86,
      "cumulative_wall_time": 860.0
    },
    {
      "timestep": 8686,
      "throughput": 10.19905969557347,
      "update": 87,
      "cumulative_wall_time": 870.0
    },
    {
      "timestep": 8787,
      "throughput": 9.399783122841205,
      "update": 88,
      "cumulative_wall_time": 880.0
    },
    {
      "timestep": 8888,
      "throughput": 10.069802084990018,
      "update": 89,
      "cumulative_wall_time": 890.0
    },
    {
      "timestep": 8989,
      "throughput": 9.61468640313824,
      "update": 90,
      "cumulative_wall_time": 900.0
    },
    {
      "timestep": 9090,
      "throughput": 10.113517345251248,
      "update": 91,
      "cumulative_wall_time": 910.0
    },
    {
      "timestep": 9191,
      "throughput": 10.662130674521046,
      "update": 92,
      "cumulative_wall_time": 920.0
    },
    {
      "timestep": 9292,
      "throughput": 11.586016816145353,
      "update": 93,
      "cumulative_wall_time": 930.0
    },
    {
      "timestep": 9393,
      "throughput": 8.762184501173152,
      "update": 94,
      "cumulative_wall_time": 940.0
    },
    {
      "timestep": 9494,
      "throughput": 12.133033374656268,
      "update": 95,
      "cumulative_wall_time": 950.0
    },
    {
      "timestep": 9595,
      "throughput": 8.047912200477498,
      "update": 96,
      "cumulative_wall_time": 960.0
    },
    {
      "timestep": 9696,
      "throughput": 9.848214904964417,
      "update": 97,
      "cumulative_wall_time": 970.0
    },
    {
      "timestep": 9797,
      "throughput": 10.588317206484577,
      "update": 98,
      "cumulative_wall_time": 980.0
    },
    {
      "timestep": 9898,
      "throughput": 10.280991867735032,
      "update": 99,
      "cumulative_wall_time": 990.0
    },
    {
      "timestep": 10000,
      "throughput": 9.377300480179406,
      "update": 100,
      "cumulative_wall_time": 1000.0
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.7608375549928545,
        "recent_gradient": 0.009013998130682335
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.5732127048611159,
        "recent_gradient": 0.02169920419404205
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.412140309719301,
        "recent_gradient": 0.028614180809478692
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.2699919975086651,
        "recent_gradient": 0.02061459904175322
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.1512572423767792,
        "recent_gradient": 0.011259257683847225
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.5855024945389635
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.719909479901515
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.373646802561631
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.3051851327167325
      }
    }
  },
  "config": {
    "use_async": false,
    "curriculum_strategy": "uniform"
  }
}