{
  "experiment_name": "async_seed456",
  "total_timesteps": 10000,
  "total_time": 400.0,
  "avg_throughput": 25,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 101,
      "pass_at_1": 0.02045232448631682,
      "avg_reward": 0.044796471983061886,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 202,
      "pass_at_1": 0.043171805787134955,
      "avg_reward": 0.11601687126940823,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 303,
      "pass_at_1": 0.03028174847853335,
      "avg_reward": 0.0466995576158461,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 404,
      "pass_at_1": 0.025407009983880367,
      "avg_reward": 0.004564066501489057,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 505,
      "pass_at_1": 0.09546860892751832,
      "avg_reward": 0.019863325308811547,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 606,
      "pass_at_1": 0.11536890864942419,
      "avg_reward": 0.10418768237955393,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 707,
      "pass_at_1": 0.13293252311648934,
      "avg_reward": 0.20358113815389706,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 808,
      "pass_at_1": 0.1795891484937894,
      "avg_reward": 0.18968873658698837,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 909,
      "pass_at_1": 0.16185505545650833,
      "avg_reward": 0.18736164626365837,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.14286506211069888,
      "avg_reward": 0.10985446795678121,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.1274320155753669,
      "avg_reward": 0.08274258784582085,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.17154175343335853,
      "avg_reward": 0.1440519937480303,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.14329769078926965,
      "avg_reward": 0.09958387827768851,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.15469125637321715,
      "avg_reward": 0.18083474708200456,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.12825883055520806,
      "avg_reward": 0.08888801962371162,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.1736659113913142,
      "avg_reward": 0.06693832591543789,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.1847933614772599,
      "avg_reward": 0.1061794377109391,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.17363966844327378,
      "avg_reward": 0.1432290619285764,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.16927771483082646,
      "avg_reward": 0.07479704377972415,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.16653677720022692,
      "avg_reward": 0.11528540743456886,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.1900870103177367,
      "avg_reward": 0.12501541668382976,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.16781880078491404,
      "avg_reward": 0.11969185626570163,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.17780882249229235,
      "avg_reward": 0.20232860228968255,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.17232732075215323,
      "avg_reward": 0.16013345774897278,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.15336441131787273,
      "avg_reward": 0.12604815708450914,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.15170613693528454,
      "avg_reward": 0.07652407165191573,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.20290353129471148,
      "avg_reward": 0.1583590854739881,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.16722847110777944,
      "avg_reward": 0.13447290025651362,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.15402304117084406,
      "avg_reward": 0.20952520276116637,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.17413628821029495,
      "avg_reward": 0.152019306351696,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.18061925670859838,
      "avg_reward": 0.14116782005800085,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.16764114270211627,
      "avg_reward": 0.11780624081486038,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.20342972374066218,
      "avg_reward": 0.13106150581331547,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.18931370350153198,
      "avg_reward": 0.242134523512177,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.1956508321419147,
      "avg_reward": 0.11239853047417875,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.21911453614896673,
      "avg_reward": 0.21798854348079297,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.21560992821298006,
      "avg_reward": 0.18707209129618813,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.20508550926780425,
      "avg_reward": 0.23333875517952452,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.19716934302432335,
      "avg_reward": 0.20825418654148076,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.2102862927480242,
      "avg_reward": 0.20853653841299113,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.20759403836759016,
      "avg_reward": 0.15372639718082254,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.19271005459443244,
      "avg_reward": 0.111085707867164,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.23287023891922654,
      "avg_reward": 0.14680009894925414,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.2232319333947028,
      "avg_reward": 0.16428064893086572,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.198874272748488,
      "avg_reward": 0.21382164747070243,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.24830502511214736,
      "avg_reward": 0.10309799724163314,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.22081339902200822,
      "avg_reward": 0.20796070298306576,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.22189655703898198,
      "avg_reward": 0.29364924406009213,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.2679244243240488,
      "avg_reward": 0.2341817938606753,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.20942356248261074,
      "avg_reward": 0.12487000772139542
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.1854215484589973,
      "avg_reward": 0.20705199581452344
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.2091759583865066,
      "avg_reward": 0.20186653931011755
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.24547121806781483,
      "avg_reward": 0.1727745601370587
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.21635661689048585,
      "avg_reward": 0.16952251963263099
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.22933658545086816,
      "avg_reward": 0.23734791676862052
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.2789309382234802,
      "avg_reward": 0.2407491564852791
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.2568267881995058,
      "avg_reward": 0.14772926169598016
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.2708180361324302,
      "avg_reward": 0.34528241388567793
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.25484153854173097,
      "avg_reward": 0.163697433869946
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.24103276791344086,
      "avg_reward": 0.14322085206352628
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.2278896984570842,
      "avg_reward": 0.14816589279071715
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.2715312876896269,
      "avg_reward": 0.1900001561089083
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.25474526289332766,
      "avg_reward": 0.17070819594864353
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.24717823110126594,
      "avg_reward": 0.12229377242059952
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.23178596853257546,
      "avg_reward": 0.20452688625174908
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.25930522029972675,
      "avg_reward": 0.23673323837715263
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.2847764973765642,
      "avg_reward": 0.3482658729256687
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.2584291915887847,
      "avg_reward": 0.1420893365318267
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.2636852761390694,
      "avg_reward": 0.3032683392145897
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.24828063733708183,
      "avg_reward": 0.16219969041703142
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.26185152408093515,
      "avg_reward": 0.22707417951465894
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.28918103639240333,
      "avg_reward": 0.27556790215901655
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.28011207361415136,
      "avg_reward": 0.10806465592532631
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.2673748407330344,
      "avg_reward": 0.164259948155805
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.26899712228863787,
      "avg_reward": 0.18703206697890254
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.2712669710875287,
      "avg_reward": 0.25969225085776615
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.27181490857881013,
      "avg_reward": 0.13052768721294497
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.28971279654660786,
      "avg_reward": 0.19096907214883233
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.2718029514570013,
      "avg_reward": 0.20194545317998291
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.25715839903915805,
      "avg_reward": 0.12204077577453457
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.28337164963494316,
      "avg_reward": 0.26416442602848256
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.3013513437403633,
      "avg_reward": 0.09457220199894212
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.27736518929670323,
      "avg_reward": 0.2587278345121522
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.3273349018087379,
      "avg_reward": 0.31901706491815096
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.2635387787165346,
      "avg_reward": 0.18725481847896253
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.31357842133204206,
      "avg_reward": 0.21091370699379713
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.24748290459946637,
      "avg_reward": 0.17466771242704254
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.293187190651017,
      "avg_reward": 0.2558564650704721
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.28401455235236717,
      "avg_reward": 0.26630321879478525
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.28992407459981306,
      "avg_reward": 0.26090165611573357
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.29877659432337256,
      "avg_reward": 0.14806068350195745
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.2623468439484892,
      "avg_reward": 0.11509054697588222
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.3082482612517228,
      "avg_reward": 0.2484421655549243
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.28169627419225307,
      "avg_reward": 0.25442271226341895
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.282838719725036,
      "avg_reward": 0.13554599770158465
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.30764760367555766,
      "avg_reward": 0.30073389723587773
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.3205817347679984,
      "avg_reward": 0.21429416982708321
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.2735678586835455,
      "avg_reward": 0.21576012047344006
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3392497566839923,
      "avg_reward": 0.3208726165093934
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2,
      "difficulty_2_ratio": 0.2,
      "difficulty_3_ratio": 0.2,
      "difficulty_4_ratio": 0.2,
      "difficulty_5_ratio": 0.2
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.3392497566839923,
      "avg_reward": 0.3208726165093934
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 12.5,
      "update": 1,
      "cumulative_wall_time": 4.0
    },
    {
      "timestep": 101,
      "throughput": 13.750000000000002,
      "update": 2,
      "cumulative_wall_time": 8.0
    },
    {
      "timestep": 202,
      "throughput": 15.0,
      "update": 3,
      "cumulative_wall_time": 12.0
    },
    {
      "timestep": 303,
      "throughput": 16.25,
      "update": 4,
      "cumulative_wall_time": 16.0
    },
    {
      "timestep": 404,
      "throughput": 17.5,
      "update": 5,
      "cumulative_wall_time": 20.0
    },
    {
      "timestep": 505,
      "throughput": 18.75,
      "update": 6,
      "cumulative_wall_time": 24.0
    },
    {
      "timestep": 606,
      "throughput": 20.0,
      "update": 7,
      "cumulative_wall_time": 28.0
    },
    {
      "timestep": 707,
      "throughput": 21.25,
      "update": 8,
      "cumulative_wall_time": 32.0
    },
    {
      "timestep": 808,
      "throughput": 22.5,
      "update": 9,
      "cumulative_wall_time": 36.0
    },
    {
      "timestep": 909,
      "throughput": 23.75,
      "update": 10,
      "cumulative_wall_time": 40.0
    },
    {
      "timestep": 1010,
      "throughput": 26.272683539356628,
      "update": 11,
      "cumulative_wall_time": 44.0
    },
    {
      "timestep": 1111,
      "throughput": 22.75971165322572,
      "update": 12,
      "cumulative_wall_time": 48.0
    },
    {
      "timestep": 1212,
      "throughput": 22.082302341533406,
      "update": 13,
      "cumulative_wall_time": 52.0
    },
    {
      "timestep": 1313,
      "throughput": 26.721852872532097,
      "update": 14,
      "cumulative_wall_time": 56.0
    },
    {
      "timestep": 1414,
      "throughput": 21.403244512186152,
      "update": 15,
      "cumulative_wall_time": 60.0
    },
    {
      "timestep": 1515,
      "throughput": 29.914895677729014,
      "update": 16,
      "cumulative_wall_time": 64.0
    },
    {
      "timestep": 1616,
      "throughput": 27.29014573683862,
      "update": 17,
      "cumulative_wall_time": 68.0
    },
    {
      "timestep": 1717,
      "throughput": 22.72413553754003,
      "update": 18,
      "cumulative_wall_time": 72.0
    },
    {
      "timestep": 1818,
      "throughput": 24.727760995015792,
      "update": 19,
      "cumulative_wall_time": 76.0
    },
    {
      "timestep": 1919,
      "throughput": 21.017215337668148,
      "update": 20,
      "cumulative_wall_time": 80.0
    },
    {
      "timestep": 2020,
      "throughput": 24.180541226578868,
      "update": 21,
      "cumulative_wall_time": 84.0
    },
    {
      "timestep": 2121,
      "throughput": 28.134739968845285,
      "update": 22,
      "cumulative_wall_time": 88.0
    },
    {
      "timestep": 2222,
      "throughput": 29.616569816306328,
      "update": 23,
      "cumulative_wall_time": 92.0
    },
    {
      "timestep": 2323,
      "throughput": 26.717212425741053,
      "update": 24,
      "cumulative_wall_time": 96.0
    },
    {
      "timestep": 2424,
      "throughput": 19.088214694389414,
      "update": 25,
      "cumulative_wall_time": 100.0
    },
    {
      "timestep": 2525,
      "throughput": 26.214432408245326,
      "update": 26,
      "cumulative_wall_time": 104.0
    },
    {
      "timestep": 2626,
      "throughput": 26.230216559971844,
      "update": 27,
      "cumulative_wall_time": 108.0
    },
    {
      "timestep": 2727,
      "throughput": 23.946772553126294,
      "update": 28,
      "cumulative_wall_time": 112.0
    },
    {
      "timestep": 2828,
      "throughput": 27.272080453404797,
      "update": 29,
      "cumulative_wall_time": 116.0
    },
    {
      "timestep": 2929,
      "throughput": 22.050267182762305,
      "update": 30,
      "cumulative_wall_time": 120.0
    },
    {
      "timestep": 3030,
      "throughput": 26.668312826815814,
      "update": 31,
      "cumulative_wall_time": 124.0
    },
    {
      "timestep": 3131,
      "throughput": 24.707867697618486,
      "update": 32,
      "cumulative_wall_time": 128.0
    },
    {
      "timestep": 3232,
      "throughput": 26.281058235885247,
      "update": 33,
      "cumulative_wall_time": 132.0
    },
    {
      "timestep": 3333,
      "throughput": 30.852385197479627,
      "update": 34,
      "cumulative_wall_time": 136.0
    },
    {
      "timestep": 3434,
      "throughput": 25.864246356636738,
      "update": 35,
      "cumulative_wall_time": 140.0
    },
    {
      "timestep": 3535,
      "throughput": 23.81171730967867,
      "update": 36,
      "cumulative_wall_time": 144.0
    },
    {
      "timestep": 3636,
      "throughput": 22.70355174737906,
      "update": 37,
      "cumulative_wall_time": 148.0
    },
    {
      "timestep": 3737,
      "throughput": 24.314453525058227,
      "update": 38,
      "cumulative_wall_time": 152.0
    },
    {
      "timestep": 3838,
      "throughput": 25.047906627438348,
      "update": 39,
      "cumulative_wall_time": 156.0
    },
    {
      "timestep": 3939,
      "throughput": 23.60822304547832,
      "update": 40,
      "cumulative_wall_time": 160.0
    },
    {
      "timestep": 4040,
      "throughput": 29.8460455892269,
      "update": 41,
      "cumulative_wall_time": 164.0
    },
    {
      "timestep": 4141,
      "throughput": 26.437929778107573,
      "update": 42,
      "cumulative_wall_time": 168.0
    },
    {
      "timestep": 4242,
      "throughput": 24.009436769687593,
      "update": 43,
      "cumulative_wall_time": 172.0
    },
    {
      "timestep": 4343,
      "throughput": 28.528552215105147,
      "update": 44,
      "cumulative_wall_time": 176.0
    },
    {
      "timestep": 4444,
      "throughput": 20.83927978768693,
      "update": 45,
      "cumulative_wall_time": 180.0
    },
    {
      "timestep": 4545,
      "throughput": 28.302681298781984,
      "update": 46,
      "cumulative_wall_time": 184.0
    },
    {
      "timestep": 4646,
      "throughput": 28.15391756480683,
      "update": 47,
      "cumulative_wall_time": 188.0
    },
    {
      "timestep": 4747,
      "throughput": 30.134948781690586,
      "update": 48,
      "cumulative_wall_time": 192.0
    },
    {
      "timestep": 4848,
      "throughput": 25.48482354217078,
      "update": 49,
      "cumulative_wall_time": 196.0
    },
    {
      "timestep": 4949,
      "throughput": 27.818363786388172,
      "update": 50,
      "cumulative_wall_time": 200.0
    },
    {
      "timestep": 5050,
      "throughput": 26.179049063047067,
      "update": 51,
      "cumulative_wall_time": 204.0
    },
    {
      "timestep": 5151,
      "throughput": 26.54962637235629,
      "update": 52,
      "cumulative_wall_time": 208.0
    },
    {
      "timestep": 5252,
      "throughput": 22.506196835094848,
      "update": 53,
      "cumulative_wall_time": 212.0
    },
    {
      "timestep": 5353,
      "throughput": 28.762806933271563,
      "update": 54,
      "cumulative_wall_time": 216.0
    },
    {
      "timestep": 5454,
      "throughput": 25.852761886642874,
      "update": 55,
      "cumulative_wall_time": 220.0
    },
    {
      "timestep": 5555,
      "throughput": 21.85344095453039,
      "update": 56,
      "cumulative_wall_time": 224.0
    },
    {
      "timestep": 5656,
      "throughput": 24.739390073653773,
      "update": 57,
      "cumulative_wall_time": 228.0
    },
    {
      "timestep": 5757,
      "throughput": 20.284302756185312,
      "update": 58,
      "cumulative_wall_time": 232.0
    },
    {
      "timestep": 5858,
      "throughput": 20.60987350086348,
      "update": 59,
      "cumulative_wall_time": 236.0
    },
    {
      "timestep": 5959,
      "throughput": 22.62932044662696,
      "update": 60,
      "cumulative_wall_time": 240.0
    },
    {
      "timestep": 6060,
      "throughput": 26.81197451761882,
      "update": 61,
      "cumulative_wall_time": 244.0
    },
    {
      "timestep": 6161,
      "throughput": 28.24447882061878,
      "update": 62,
      "cumulative_wall_time": 248.0
    },
    {
      "timestep": 6262,
      "throughput": 22.82451970473374,
      "update": 63,
      "cumulative_wall_time": 252.0
    },
    {
      "timestep": 6363,
      "throughput": 24.095204695212303,
      "update": 64,
      "cumulative_wall_time": 256.0
    },
    {
      "timestep": 6464,
      "throughput": 25.479080649390962,
      "update": 65,
      "cumulative_wall_time": 260.0
    },
    {
      "timestep": 6565,
      "throughput": 24.833992785194596,
      "update": 66,
      "cumulative_wall_time": 264.0
    },
    {
      "timestep": 6666,
      "throughput": 25.49041446098253,
      "update": 67,
      "cumulative_wall_time": 268.0
    },
    {
      "timestep": 6767,
      "throughput": 21.962361013021052,
      "update": 68,
      "cumulative_wall_time": 272.0
    },
    {
      "timestep": 6868,
      "throughput": 26.36929404456768,
      "update": 69,
      "cumulative_wall_time": 276.0
    },
    {
      "timestep": 6969,
      "throughput": 24.478338750156002,
      "update": 70,
      "cumulative_wall_time": 280.0
    },
    {
      "timestep": 7070,
      "throughput": 23.859260396685475,
      "update": 71,
      "cumulative_wall_time": 284.0
    },
    {
      "timestep": 7171,
      "throughput": 26.580296605537214,
      "update": 72,
      "cumulative_wall_time": 288.0
    },
    {
      "timestep": 7272,
      "throughput": 25.646942941553707,
      "update": 73,
      "cumulative_wall_time": 292.0
    },
    {
      "timestep": 7373,
      "throughput": 26.149780917152015,
      "update": 74,
      "cumulative_wall_time": 296.0
    },
    {
      "timestep": 7474,
      "throughput": 24.54608895170723,
      "update": 75,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 7575,
      "throughput": 28.693617416991245,
      "update": 76,
      "cumulative_wall_time": 304.0
    },
    {
      "timestep": 7676,
      "throughput": 24.178724331503844,
      "update": 77,
      "cumulative_wall_time": 308.0
    },
    {
      "timestep": 7777,
      "throughput": 28.448598250077765,
      "update": 78,
      "cumulative_wall_time": 312.0
    },
    {
      "timestep": 7878,
      "throughput": 24.2363131859427,
      "update": 79,
      "cumulative_wall_time": 316.0
    },
    {
      "timestep": 7979,
      "throughput": 26.69678689478901,
      "update": 80,
      "cumulative_wall_time": 320.0
    },
    {
      "timestep": 8080,
      "throughput": 22.44457973107839,
      "update": 81,
      "cumulative_wall_time": 324.0
    },
    {
      "timestep": 8181,
      "throughput": 20.322959087520385,
      "update": 82,
      "cumulative_wall_time": 328.0
    },
    {
      "timestep": 8282,
      "throughput": 27.406043513846427,
      "update": 83,
      "cumulative_wall_time": 332.0
    },
    {
      "timestep": 8383,
      "throughput": 23.946854132539517,
      "update": 84,
      "cumulative_wall_time": 336.0
    },
    {
      "timestep": 8484,
      "throughput": 27.016617819418553,
      "update": 85,
      "cumulative_wall_time": 340.0
    },
    {
      "timestep": 8585,
      "throughput": 28.451339009494337,
      "update": 86,
      "cumulative_wall_time": 344.0
    },
    {
      "timestep": 8686,
      "throughput": 23.12962123397283,
      "update": 87,
      "cumulative_wall_time": 348.0
    },
    {
      "timestep": 8787,
      "throughput": 23.478185451690926,
      "update": 88,
      "cumulative_wall_time": 352.0
    },
    {
      "timestep": 8888,
      "throughput": 25.345305670774138,
      "update": 89,
      "cumulative_wall_time": 356.0
    },
    {
      "timestep": 8989,
      "throughput": 24.390490377805392,
      "update": 90,
      "cumulative_wall_time": 360.0
    },
    {
      "timestep": 9090,
      "throughput": 25.269472458600113,
      "update": 91,
      "cumulative_wall_time": 364.0
    },
    {
      "timestep": 9191,
      "throughput": 27.308544331723034,
      "update": 92,
      "cumulative_wall_time": 368.0
    },
    {
      "timestep": 9292,
      "throughput": 22.598987922117608,
      "update": 93,
      "cumulative_wall_time": 372.0
    },
    {
      "timestep": 9393,
      "throughput": 24.747781827882616,
      "update": 94,
      "cumulative_wall_time": 376.0
    },
    {
      "timestep": 9494,
      "throughput": 28.112546768448354,
      "update": 95,
      "cumulative_wall_time": 380.0
    },
    {
      "timestep": 9595,
      "throughput": 27.307196090007977,
      "update": 96,
      "cumulative_wall_time": 384.0
    },
    {
      "timestep": 9696,
      "throughput": 27.38990558574687,
      "update": 97,
      "cumulative_wall_time": 388.0
    },
    {
      "timestep": 9797,
      "throughput": 23.392483708106436,
      "update": 98,
      "cumulative_wall_time": 392.0
    },
    {
      "timestep": 9898,
      "throughput": 25.383817619768003,
      "update": 99,
      "cumulative_wall_time": 396.0
    },
    {
      "timestep": 10000,
      "throughput": 26.387501986240576,
      "update": 100,
      "cumulative_wall_time": 400.0
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 2000,
        "success_rate": 0.85,
        "mean_reward": 0.774535753066723,
        "recent_gradient": 0.00880228815501225
      },
      "level_2": {
        "num_pulls": 2000,
        "success_rate": 0.65,
        "mean_reward": 0.6076855357527491,
        "recent_gradient": 0.021498278466352168
      },
      "level_3": {
        "num_pulls": 2000,
        "success_rate": 0.45,
        "mean_reward": 0.3831754599108145,
        "recent_gradient": 0.03149706388174175
      },
      "level_4": {
        "num_pulls": 2000,
        "success_rate": 0.28,
        "mean_reward": 0.28015326432172166,
        "recent_gradient": 0.019275276932362185
      },
      "level_5": {
        "num_pulls": 2000,
        "success_rate": 0.15,
        "mean_reward": 0.13334041455555007,
        "recent_gradient": 0.012821048819579189
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.15
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.269411344381984
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.280264511263108
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.37398672115195
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 4.826192872277722
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "uniform"
  }
}