{
  "experiment_name": "aceas_seed42",
  "total_timesteps": 10000,
  "total_time": 434.7826086956522,
  "avg_throughput": 23,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 101,
      "pass_at_1": 0.025479023287266374,
      "avg_reward": 0.09653471145021437,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 202,
      "pass_at_1": 0.020367437556038332,
      "avg_reward": 0.004587102197371637,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 303,
      "pass_at_1": 0.0691600138859054,
      "avg_reward": 0.09369974756636976,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 404,
      "pass_at_1": 0.04071152238231106,
      "avg_reward": 0.05969722008514708,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 505,
      "pass_at_1": 0.08943988967981922,
      "avg_reward": 0.04826542406534253,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 606,
      "pass_at_1": 0.10781155124913581,
      "avg_reward": -0.00941477123358124,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 707,
      "pass_at_1": 0.07288426883456268,
      "avg_reward": 0.030193038605601515,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 808,
      "pass_at_1": 0.09168432009326676,
      "avg_reward": 0.0890598227043771,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 909,
      "pass_at_1": 0.09848824403931097,
      "avg_reward": 0.008175410164684205,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.15082012302087433,
      "avg_reward": 0.10936728339237269,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.12786762580848063,
      "avg_reward": 0.031056691336111678,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.12079132198268795,
      "avg_reward": 0.10217918707164368,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.11397316116956432,
      "avg_reward": 0.10996342985293507,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.13044620661575745,
      "avg_reward": 0.08977227780294213,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.13604202454798597,
      "avg_reward": 0.20144752886383566,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.15357352128292623,
      "avg_reward": 0.06997327057854597,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.17621025728876094,
      "avg_reward": 0.07992602333245763,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.16999909093393656,
      "avg_reward": 0.03801576655316048,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.1454646232148162,
      "avg_reward": 0.12621476036530915,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.19314526842715274,
      "avg_reward": 0.1630846288012207,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.18254812814228522,
      "avg_reward": 0.13098331773436375,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.16190936052789232,
      "avg_reward": 0.09353527800257841,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.18901475196654802,
      "avg_reward": 0.20406791288418422,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.2119715982420541,
      "avg_reward": 0.0814252708255066,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.21857104377940367,
      "avg_reward": 0.1556027210027071,
      "difficulty_1_ratio": 0.016291910734624847,
      "difficulty_2_ratio": 0.12497928765460015,
      "difficulty_3_ratio": 0.3527033512649604,
      "difficulty_4_ratio": 0.3661732760034468,
      "difficulty_5_ratio": 0.1398521743423678
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.20565343218891582,
      "avg_reward": 0.19510656019317607,
      "difficulty_1_ratio": 0.014439823367355656,
      "difficulty_2_ratio": 0.1162288430953594,
      "difficulty_3_ratio": 0.34416877595779866,
      "difficulty_4_ratio": 0.37491648580673986,
      "difficulty_5_ratio": 0.15024607177274654
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.24702020831478103,
      "avg_reward": 0.24418017260763475,
      "difficulty_1_ratio": 0.012218327302669146,
      "difficulty_2_ratio": 0.10498325535696679,
      "difficulty_3_ratio": 0.33184389643032614,
      "difficulty_4_ratio": 0.38588078286713096,
      "difficulty_5_ratio": 0.165073738042907
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.2169230430261858,
      "avg_reward": 0.15807781562838794,
      "difficulty_1_ratio": 0.009913147093465137,
      "difficulty_2_ratio": 0.09225064005743493,
      "difficulty_3_ratio": 0.3158149930158207,
      "difficulty_4_ratio": 0.39774215071368285,
      "difficulty_5_ratio": 0.18427906911959632
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.24773121112676355,
      "avg_reward": 0.2469622252575288,
      "difficulty_1_ratio": 0.007760018351280176,
      "difficulty_2_ratio": 0.07909068287132516,
      "difficulty_3_ratio": 0.29654692178674946,
      "difficulty_4_ratio": 0.40904118087068214,
      "difficulty_5_ratio": 0.20756119611996313
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.2390045002711823,
      "avg_reward": 0.181920651383755,
      "difficulty_1_ratio": 0.00590957184933243,
      "difficulty_2_ratio": 0.06645671547671815,
      "difficulty_3_ratio": 0.2749332380949103,
      "difficulty_4_ratio": 0.4184283859957229,
      "difficulty_5_ratio": 0.2342720885833161
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.23401854783464296,
      "avg_reward": 0.12740450706368084,
      "difficulty_1_ratio": 0.0044234366536341566,
      "difficulty_2_ratio": 0.05506877089710349,
      "difficulty_3_ratio": 0.2522066146015487,
      "difficulty_4_ratio": 0.4249257796153269,
      "difficulty_5_ratio": 0.2633753982323869
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.28001961135200454,
      "avg_reward": 0.2918276905101448,
      "difficulty_1_ratio": 0.0032937818280582443,
      "difficulty_2_ratio": 0.04535368508089252,
      "difficulty_3_ratio": 0.22973959398617683,
      "difficulty_4_ratio": 0.4281191321289578,
      "difficulty_5_ratio": 0.2934938069759146
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.2700103670191985,
      "avg_reward": 0.26618493850996,
      "difficulty_1_ratio": 0.0024722539225482446,
      "difficulty_2_ratio": 0.03746068440111024,
      "difficulty_3_ratio": 0.20881604152186556,
      "difficulty_4_ratio": 0.4282107125631631,
      "difficulty_5_ratio": 0.32304030759131297
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.2864131493057567,
      "avg_reward": 0.19687453171434915,
      "difficulty_1_ratio": 0.0018961158457144911,
      "difficulty_2_ratio": 0.03133140973471507,
      "difficulty_3_ratio": 0.19045857150804962,
      "difficulty_4_ratio": 0.4259186206842434,
      "difficulty_5_ratio": 0.35039528222727745
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.29417710213708603,
      "avg_reward": 0.3122435100329673,
      "difficulty_1_ratio": 0.0015056169658766543,
      "difficulty_2_ratio": 0.026789686088424,
      "difficulty_3_ratio": 0.175358276208076,
      "difficulty_4_ratio": 0.42227019488557094,
      "difficulty_5_ratio": 0.3740762258520523
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.29403065414334784,
      "avg_reward": 0.31345670610537857,
      "difficulty_1_ratio": 0.0012524233850038473,
      "difficulty_2_ratio": 0.023621859465310466,
      "difficulty_3_ratio": 0.16390134325095126,
      "difficulty_4_ratio": 0.4183660766360568,
      "difficulty_5_ratio": 0.3928582972626777
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.2501696555801058,
      "avg_reward": 0.24123084968284583,
      "difficulty_1_ratio": 0.0011018868277803448,
      "difficulty_2_ratio": 0.021633707012814266,
      "difficulty_3_ratio": 0.15625373746114093,
      "difficulty_4_ratio": 0.4151790230064104,
      "difficulty_5_ratio": 0.40583164569185404
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.31213235529817696,
      "avg_reward": 0.2347555167152482,
      "difficulty_1_ratio": 0.0010322931860183035,
      "difficulty_2_ratio": 0.02068358559081816,
      "difficulty_3_ratio": 0.15245936727836976,
      "difficulty_4_ratio": 0.41341660520999185,
      "difficulty_5_ratio": 0.41240814873480197
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.32005298674705146,
      "avg_reward": 0.15666394366759653,
      "difficulty_1_ratio": 0.001033362574533033,
      "difficulty_2_ratio": 0.02069834621303522,
      "difficulty_3_ratio": 0.15251904715441822,
      "difficulty_4_ratio": 0.4134452797034622,
      "difficulty_5_ratio": 0.41230396435455147
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.3216402217722719,
      "avg_reward": 0.27516780599340485,
      "difficulty_1_ratio": 0.001105253979564763,
      "difficulty_2_ratio": 0.021679152361382986,
      "difficulty_3_ratio": 0.1564328746274194,
      "difficulty_4_ratio": 0.41525920915243264,
      "difficulty_5_ratio": 0.4055235098792002
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.3633870430624854,
      "avg_reward": 0.264796123536306,
      "difficulty_1_ratio": 0.0012585820768892396,
      "difficulty_2_ratio": 0.02370139964709112,
      "difficulty_3_ratio": 0.16419954975755394,
      "difficulty_4_ratio": 0.418480714620724,
      "difficulty_5_ratio": 0.3923597538977418
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.3254245938091046,
      "avg_reward": 0.23525182286805685,
      "difficulty_1_ratio": 0.001515438901358441,
      "difficulty_2_ratio": 0.02690866798401823,
      "difficulty_3_ratio": 0.17577272552605308,
      "difficulty_4_ratio": 0.4223925910167582,
      "difficulty_5_ratio": 0.37341057657181215
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.367627952202806,
      "avg_reward": 0.310539917245229,
      "difficulty_1_ratio": 0.0019108941032437861,
      "difficulty_2_ratio": 0.03149638910459275,
      "difficulty_3_ratio": 0.19098111826597575,
      "difficulty_4_ratio": 0.4260157102739871,
      "difficulty_5_ratio": 0.34959588825220067
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.3464008291664554,
      "avg_reward": 0.30278403498883216,
      "difficulty_1_ratio": 0.0024936925676773474,
      "difficulty_2_ratio": 0.03767804281480519,
      "difficulty_3_ratio": 0.2094301856844532,
      "difficulty_4_ratio": 0.42824838946414634,
      "difficulty_5_ratio": 0.32214968946891787
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.3665551713730763,
      "avg_reward": 0.34167638662510547,
      "difficulty_1_ratio": 0.003323844499126925,
      "difficulty_2_ratio": 0.045627461104830486,
      "difficulty_3_ratio": 0.23041854367730347,
      "difficulty_4_ratio": 0.4280692870521302,
      "difficulty_5_ratio": 0.29256086366660894
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.35812268169562683,
      "avg_reward": 0.2701150380266131,
      "difficulty_1_ratio": 0.004463952486683914,
      "difficulty_2_ratio": 0.055397905274063235,
      "difficulty_3_ratio": 0.25291386667660937,
      "difficulty_4_ratio": 0.4247735415860251,
      "difficulty_5_ratio": 0.2624507339766185
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.3717956397558158,
      "avg_reward": 0.2242607643980467,
      "difficulty_1_ratio": 0.005961543635767642,
      "difficulty_2_ratio": 0.06683240381041645,
      "difficulty_3_ratio": 0.27562649024852093,
      "difficulty_4_ratio": 0.41817719578473006,
      "difficulty_5_ratio": 0.2334023665205648
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.3929499678564251,
      "avg_reward": 0.3274127378941346,
      "difficulty_1_ratio": 0.007822719184174324,
      "difficulty_2_ratio": 0.07949491055732377,
      "difficulty_3_ratio": 0.29718468692891836,
      "difficulty_4_ratio": 0.4087135617359425,
      "difficulty_5_ratio": 0.206784121593641
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.3944274524064829,
      "avg_reward": 0.303812605256429,
      "difficulty_1_ratio": 0.009983298952962209,
      "difficulty_2_ratio": 0.09265686413080075,
      "difficulty_3_ratio": 0.3163636937049174,
      "difficulty_4_ratio": 0.3973755986640315,
      "difficulty_5_ratio": 0.1836205445472881
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.373215838071042,
      "avg_reward": 0.27754040431856564
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.4017605190933683,
      "avg_reward": 0.28129455181361374
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.41236764857882685,
      "avg_reward": 0.35009666170378845
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.46017662956376015,
      "avg_reward": 0.3768701942926001
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.4343389628191408,
      "avg_reward": 0.3437488744670043
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.397418077602494,
      "avg_reward": 0.3166087683095344
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.443469678826402,
      "avg_reward": 0.4779378486853859
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.4447514904615515,
      "avg_reward": 0.37087855948592185
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.4540967196318868,
      "avg_reward": 0.3048434738245328
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.48369531911121083,
      "avg_reward": 0.42455290692330744
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.48256061952690665,
      "avg_reward": 0.3405791228817884
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.5005482246015526,
      "avg_reward": 0.33034602654162804
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.4898315757885757,
      "avg_reward": 0.5013880419213596
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.46373448880935875,
      "avg_reward": 0.34267270456734844
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.49083708933722103,
      "avg_reward": 0.3674958887639669
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.4629774955149286,
      "avg_reward": 0.37381014515224426
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.47773942597689695,
      "avg_reward": 0.40587116231327663
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.4854403299013335,
      "avg_reward": 0.46584898417194376
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.4928565273299796,
      "avg_reward": 0.37818214605369993
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.5293353840465501,
      "avg_reward": 0.36192509141554235
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.5220098497559862,
      "avg_reward": 0.4829650175189104
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.48956052833401703,
      "avg_reward": 0.40088011559382886
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.5310133318907984,
      "avg_reward": 0.4639018091015042
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.5050403171000676,
      "avg_reward": 0.33800942302584025
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.5440424192498975,
      "avg_reward": 0.4500831690615773
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.542300906981251,
      "avg_reward": 0.4511631360598496
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.5272439805100732,
      "avg_reward": 0.4334078692661087
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.5501282023984896,
      "avg_reward": 0.4043849910174733
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.5848763769933182,
      "avg_reward": 0.49159274764024397
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.5269039032507387,
      "avg_reward": 0.4543508030322824
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.5342835517175137,
      "avg_reward": 0.4667810715611336
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.5798776665885219,
      "avg_reward": 0.422868017353232
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.5787864819114005,
      "avg_reward": 0.4836682318759453
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.578661307357545,
      "avg_reward": 0.5577686950187334
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.559904749567981,
      "avg_reward": 0.41023699143651027
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.5495092203990847,
      "avg_reward": 0.39881686207099587
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.5681423806835675,
      "avg_reward": 0.4715715032876862
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.5775043477166417,
      "avg_reward": 0.5033626406251146
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.5744211732587482,
      "avg_reward": 0.5322136424648645
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.5709663305909718,
      "avg_reward": 0.5927815228022584
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.5907820736565318,
      "avg_reward": 0.42976778110441133
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.5587742149752787,
      "avg_reward": 0.47114299274238225
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.577563323502461,
      "avg_reward": 0.4977506835065734
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.5932580604370521,
      "avg_reward": 0.4709650027167981
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.5685413522057161,
      "avg_reward": 0.3790907205302797
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.5781569449151632,
      "avg_reward": 0.5053454956483042
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.5929080744154287,
      "avg_reward": 0.4120395205967436
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.5935604793996371,
      "avg_reward": 0.49411425250615154
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.5738247731795443,
      "avg_reward": 0.4667460738409118
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5940081757847141,
      "avg_reward": 0.4180580257362401
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.009934283060224654,
      "avg_reward": 0.0010342113896204897,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5940081757847141,
      "avg_reward": 0.4180580257362401
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 11.5,
      "update": 1,
      "cumulative_wall_time": 4.3478260869565215
    },
    {
      "timestep": 101,
      "throughput": 12.65,
      "update": 2,
      "cumulative_wall_time": 8.695652173913043
    },
    {
      "timestep": 202,
      "throughput": 13.799999999999999,
      "update": 3,
      "cumulative_wall_time": 13.043478260869565
    },
    {
      "timestep": 303,
      "throughput": 14.950000000000001,
      "update": 4,
      "cumulative_wall_time": 17.391304347826086
    },
    {
      "timestep": 404,
      "throughput": 16.099999999999998,
      "update": 5,
      "cumulative_wall_time": 21.73913043478261
    },
    {
      "timestep": 505,
      "throughput": 17.25,
      "update": 6,
      "cumulative_wall_time": 26.086956521739133
    },
    {
      "timestep": 606,
      "throughput": 18.400000000000002,
      "update": 7,
      "cumulative_wall_time": 30.434782608695656
    },
    {
      "timestep": 707,
      "throughput": 19.55,
      "update": 8,
      "cumulative_wall_time": 34.78260869565218
    },
    {
      "timestep": 808,
      "throughput": 20.7,
      "update": 9,
      "cumulative_wall_time": 39.1304347826087
    },
    {
      "timestep": 909,
      "throughput": 21.849999999999998,
      "update": 10,
      "cumulative_wall_time": 43.478260869565226
    },
    {
      "timestep": 1010,
      "throughput": 23.82291092880105,
      "update": 11,
      "cumulative_wall_time": 47.82608695652175
    },
    {
      "timestep": 1111,
      "throughput": 24.289804410646937,
      "update": 12,
      "cumulative_wall_time": 52.17391304347827
    },
    {
      "timestep": 1212,
      "throughput": 25.49101785930314,
      "update": 13,
      "cumulative_wall_time": 56.521739130434796
    },
    {
      "timestep": 1313,
      "throughput": 25.423744719680275,
      "update": 14,
      "cumulative_wall_time": 60.86956521739132
    },
    {
      "timestep": 1414,
      "throughput": 19.831360453698693,
      "update": 15,
      "cumulative_wall_time": 65.21739130434784
    },
    {
      "timestep": 1515,
      "throughput": 20.843002408195215,
      "update": 16,
      "cumulative_wall_time": 69.56521739130436
    },
    {
      "timestep": 1616,
      "throughput": 24.184581114579917,
      "update": 17,
      "cumulative_wall_time": 73.91304347826087
    },
    {
      "timestep": 1717,
      "throughput": 24.18170768709808,
      "update": 18,
      "cumulative_wall_time": 78.26086956521739
    },
    {
      "timestep": 1818,
      "throughput": 24.184609678503907,
      "update": 19,
      "cumulative_wall_time": 82.6086956521739
    },
    {
      "timestep": 1919,
      "throughput": 31.86128242850586,
      "update": 20,
      "cumulative_wall_time": 86.95652173913042
    },
    {
      "timestep": 2020,
      "throughput": 24.313048174594286,
      "update": 21,
      "cumulative_wall_time": 91.30434782608694
    },
    {
      "timestep": 2121,
      "throughput": 25.611800972415374,
      "update": 22,
      "cumulative_wall_time": 95.65217391304346
    },
    {
      "timestep": 2222,
      "throughput": 25.194204056034366,
      "update": 23,
      "cumulative_wall_time": 99.99999999999997
    },
    {
      "timestep": 2323,
      "throughput": 24.498199878003334,
      "update": 24,
      "cumulative_wall_time": 104.34782608695649
    },
    {
      "timestep": 2424,
      "throughput": 22.274880737327205,
      "update": 25,
      "cumulative_wall_time": 108.695652173913
    },
    {
      "timestep": 2525,
      "throughput": 24.745629207134517,
      "update": 26,
      "cumulative_wall_time": 113.04347826086952
    },
    {
      "timestep": 2626,
      "throughput": 21.222502006563587,
      "update": 27,
      "cumulative_wall_time": 117.39130434782604
    },
    {
      "timestep": 2727,
      "throughput": 22.45531720449798,
      "update": 28,
      "cumulative_wall_time": 121.73913043478255
    },
    {
      "timestep": 2828,
      "throughput": 21.883663839993062,
      "update": 29,
      "cumulative_wall_time": 126.08695652173907
    },
    {
      "timestep": 2929,
      "throughput": 23.18831052058854,
      "update": 30,
      "cumulative_wall_time": 130.4347826086956
    },
    {
      "timestep": 3030,
      "throughput": 28.32371470334907,
      "update": 31,
      "cumulative_wall_time": 134.78260869565213
    },
    {
      "timestep": 3131,
      "throughput": 18.70529005703898,
      "update": 32,
      "cumulative_wall_time": 139.13043478260866
    },
    {
      "timestep": 3232,
      "throughput": 24.578398437861377,
      "update": 33,
      "cumulative_wall_time": 143.4782608695652
    },
    {
      "timestep": 3333,
      "throughput": 19.2907534962638,
      "update": 34,
      "cumulative_wall_time": 147.82608695652172
    },
    {
      "timestep": 3434,
      "throughput": 21.9145567086843,
      "update": 35,
      "cumulative_wall_time": 152.17391304347825
    },
    {
      "timestep": 3535,
      "throughput": 25.504586373024942,
      "update": 36,
      "cumulative_wall_time": 156.52173913043478
    },
    {
      "timestep": 3636,
      "throughput": 23.147844043919562,
      "update": 37,
      "cumulative_wall_time": 160.8695652173913
    },
    {
      "timestep": 3737,
      "throughput": 20.521187010762596,
      "update": 38,
      "cumulative_wall_time": 165.21739130434784
    },
    {
      "timestep": 3838,
      "throughput": 21.354801468702075,
      "update": 39,
      "cumulative_wall_time": 169.56521739130437
    },
    {
      "timestep": 3939,
      "throughput": 24.56307482254975,
      "update": 40,
      "cumulative_wall_time": 173.9130434782609
    },
    {
      "timestep": 4040,
      "throughput": 21.320156747050586,
      "update": 41,
      "cumulative_wall_time": 178.26086956521743
    },
    {
      "timestep": 4141,
      "throughput": 23.497854756038546,
      "update": 42,
      "cumulative_wall_time": 182.60869565217396
    },
    {
      "timestep": 4242,
      "throughput": 23.10481523177877,
      "update": 43,
      "cumulative_wall_time": 186.9565217391305
    },
    {
      "timestep": 4343,
      "throughput": 21.50131920050662,
      "update": 44,
      "cumulative_wall_time": 191.30434782608702
    },
    {
      "timestep": 4444,
      "throughput": 27.93107140544825,
      "update": 45,
      "cumulative_wall_time": 195.65217391304355
    },
    {
      "timestep": 4545,
      "throughput": 24.458013751331425,
      "update": 46,
      "cumulative_wall_time": 200.00000000000009
    },
    {
      "timestep": 4646,
      "throughput": 18.342172050687505,
      "update": 47,
      "cumulative_wall_time": 204.34782608695662
    },
    {
      "timestep": 4747,
      "throughput": 23.428844923969685,
      "update": 48,
      "cumulative_wall_time": 208.69565217391315
    },
    {
      "timestep": 4848,
      "throughput": 21.477891131032706,
      "update": 49,
      "cumulative_wall_time": 213.04347826086968
    },
    {
      "timestep": 4949,
      "throughput": 24.960596670031315,
      "update": 50,
      "cumulative_wall_time": 217.3913043478262
    },
    {
      "timestep": 5050,
      "throughput": 21.17720230160479,
      "update": 51,
      "cumulative_wall_time": 221.73913043478274
    },
    {
      "timestep": 5151,
      "throughput": 22.73610618462613,
      "update": 52,
      "cumulative_wall_time": 226.08695652173927
    },
    {
      "timestep": 5252,
      "throughput": 24.16147074165505,
      "update": 53,
      "cumulative_wall_time": 230.4347826086958
    },
    {
      "timestep": 5353,
      "throughput": 24.99123694659128,
      "update": 54,
      "cumulative_wall_time": 234.78260869565233
    },
    {
      "timestep": 5454,
      "throughput": 20.239318263771715,
      "update": 55,
      "cumulative_wall_time": 239.13043478260886
    },
    {
      "timestep": 5555,
      "throughput": 22.23064715756582,
      "update": 56,
      "cumulative_wall_time": 243.4782608695654
    },
    {
      "timestep": 5656,
      "throughput": 21.907625784329802,
      "update": 57,
      "cumulative_wall_time": 247.82608695652192
    },
    {
      "timestep": 5757,
      "throughput": 21.497342765080464,
      "update": 58,
      "cumulative_wall_time": 252.17391304347845
    },
    {
      "timestep": 5858,
      "throughput": 27.06054475264652,
      "update": 59,
      "cumulative_wall_time": 256.521739130435
    },
    {
      "timestep": 5959,
      "throughput": 23.9314579352102,
      "update": 60,
      "cumulative_wall_time": 260.8695652173915
    },
    {
      "timestep": 6060,
      "throughput": 20.099966905029394,
      "update": 61,
      "cumulative_wall_time": 265.217391304348
    },
    {
      "timestep": 6161,
      "throughput": 25.111082478225985,
      "update": 62,
      "cumulative_wall_time": 269.5652173913045
    },
    {
      "timestep": 6262,
      "throughput": 27.880959253129056,
      "update": 63,
      "cumulative_wall_time": 273.913043478261
    },
    {
      "timestep": 6363,
      "throughput": 25.37467009926764,
      "update": 64,
      "cumulative_wall_time": 278.2608695652175
    },
    {
      "timestep": 6464,
      "throughput": 19.50544907830577,
      "update": 65,
      "cumulative_wall_time": 282.608695652174
    },
    {
      "timestep": 6565,
      "throughput": 21.88626163240762,
      "update": 66,
      "cumulative_wall_time": 286.9565217391305
    },
    {
      "timestep": 6666,
      "throughput": 25.91389564312923,
      "update": 67,
      "cumulative_wall_time": 291.304347826087
    },
    {
      "timestep": 6767,
      "throughput": 21.372360229076804,
      "update": 68,
      "cumulative_wall_time": 295.6521739130435
    },
    {
      "timestep": 6868,
      "throughput": 24.020784684736324,
      "update": 69,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 6969,
      "throughput": 24.781658322887477,
      "update": 70,
      "cumulative_wall_time": 304.3478260869565
    },
    {
      "timestep": 7070,
      "throughput": 20.86805991537041,
      "update": 71,
      "cumulative_wall_time": 308.695652173913
    },
    {
      "timestep": 7171,
      "throughput": 22.86309168105786,
      "update": 72,
      "cumulative_wall_time": 313.0434782608695
    },
    {
      "timestep": 7272,
      "throughput": 15.545085117841133,
      "update": 73,
      "cumulative_wall_time": 317.391304347826
    },
    {
      "timestep": 7373,
      "throughput": 20.643908424931134,
      "update": 74,
      "cumulative_wall_time": 321.7391304347825
    },
    {
      "timestep": 7474,
      "throughput": 22.419093251795733,
      "update": 75,
      "cumulative_wall_time": 326.086956521739
    },
    {
      "timestep": 7575,
      "throughput": 20.130098681480845,
      "update": 76,
      "cumulative_wall_time": 330.4347826086955
    },
    {
      "timestep": 7676,
      "throughput": 26.75454599904276,
      "update": 77,
      "cumulative_wall_time": 334.782608695652
    },
    {
      "timestep": 7777,
      "throughput": 19.710674830690543,
      "update": 78,
      "cumulative_wall_time": 339.1304347826085
    },
    {
      "timestep": 7878,
      "throughput": 21.987897680596937,
      "update": 79,
      "cumulative_wall_time": 343.478260869565
    },
    {
      "timestep": 7979,
      "throughput": 23.300703327758008,
      "update": 80,
      "cumulative_wall_time": 347.8260869565215
    },
    {
      "timestep": 8080,
      "throughput": 26.314928564852067,
      "update": 81,
      "cumulative_wall_time": 352.173913043478
    },
    {
      "timestep": 8181,
      "throughput": 19.69751705228729,
      "update": 82,
      "cumulative_wall_time": 356.5217391304345
    },
    {
      "timestep": 8282,
      "throughput": 25.675276629956404,
      "update": 83,
      "cumulative_wall_time": 360.869565217391
    },
    {
      "timestep": 8383,
      "throughput": 23.02353604034505,
      "update": 84,
      "cumulative_wall_time": 365.21739130434753
    },
    {
      "timestep": 8484,
      "throughput": 20.74253010258971,
      "update": 85,
      "cumulative_wall_time": 369.56521739130403
    },
    {
      "timestep": 8585,
      "throughput": 24.062837990805523,
      "update": 86,
      "cumulative_wall_time": 373.91304347826053
    },
    {
      "timestep": 8686,
      "throughput": 23.45783729981898,
      "update": 87,
      "cumulative_wall_time": 378.26086956521704
    },
    {
      "timestep": 8787,
      "throughput": 21.619501182534773,
      "update": 88,
      "cumulative_wall_time": 382.60869565217354
    },
    {
      "timestep": 8888,
      "throughput": 23.16054479547704,
      "update": 89,
      "cumulative_wall_time": 386.95652173913004
    },
    {
      "timestep": 8989,
      "throughput": 22.11377872721795,
      "update": 90,
      "cumulative_wall_time": 391.30434782608654
    },
    {
      "timestep": 9090,
      "throughput": 23.26108989407787,
      "update": 91,
      "cumulative_wall_time": 395.65217391304304
    },
    {
      "timestep": 9191,
      "throughput": 24.522900551398408,
      "update": 92,
      "cumulative_wall_time": 399.99999999999955
    },
    {
      "timestep": 9292,
      "throughput": 26.64783867713431,
      "update": 93,
      "cumulative_wall_time": 404.34782608695605
    },
    {
      "timestep": 9393,
      "throughput": 20.15302435269825,
      "update": 94,
      "cumulative_wall_time": 408.69565217391255
    },
    {
      "timestep": 9494,
      "throughput": 27.905976761709418,
      "update": 95,
      "cumulative_wall_time": 413.04347826086905
    },
    {
      "timestep": 9595,
      "throughput": 18.510198061098247,
      "update": 96,
      "cumulative_wall_time": 417.39130434782555
    },
    {
      "timestep": 9696,
      "throughput": 22.650894281418157,
      "update": 97,
      "cumulative_wall_time": 421.73913043478206
    },
    {
      "timestep": 9797,
      "throughput": 24.353129574914526,
      "update": 98,
      "cumulative_wall_time": 426.08695652173856
    },
    {
      "timestep": 9898,
      "throughput": 23.646281295790573,
      "update": 99,
      "cumulative_wall_time": 430.43478260869506
    },
    {
      "timestep": 10000,
      "throughput": 21.567791104412635,
      "update": 100,
      "cumulative_wall_time": 434.78260869565156
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 1200,
        "success_rate": 0.85,
        "mean_reward": 0.7608375549928545,
        "recent_gradient": 0.009013998130682335
      },
      "level_2": {
        "num_pulls": 2800,
        "success_rate": 0.65,
        "mean_reward": 0.5732127048611159,
        "recent_gradient": 0.02169920419404205
      },
      "level_3": {
        "num_pulls": 3500,
        "success_rate": 0.45,
        "mean_reward": 0.412140309719301,
        "recent_gradient": 0.028614180809478692
      },
      "level_4": {
        "num_pulls": 1800,
        "success_rate": 0.28,
        "mean_reward": 0.2699919975086651,
        "recent_gradient": 0.02061459904175322
      },
      "level_5": {
        "num_pulls": 700,
        "success_rate": 0.15,
        "mean_reward": 0.1512572423767792,
        "recent_gradient": 0.011259257683847225
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.05
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.5855024945389635
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.719909479901515
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.373646802561631
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.3051851327167325
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "adaptive",
    "use_csc": true,
    "use_eaas": true
  }
}