{
  "experiment_name": "aceas_seed123",
  "total_timesteps": 10000,
  "total_time": 434.7826086956522,
  "avg_throughput": 23,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 101,
      "pass_at_1": 0.018184822486292367,
      "avg_reward": -0.06076687770687071,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 202,
      "pass_at_1": 0.013478500011134325,
      "avg_reward": 0.09335462686376503,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 303,
      "pass_at_1": 0.0,
      "avg_reward": -0.021445631442808866,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 404,
      "pass_at_1": 0.07541973527512079,
      "avg_reward": 0.016998768106841547,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 505,
      "pass_at_1": 0.08513052050362738,
      "avg_reward": 0.06336896795605736,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 606,
      "pass_at_1": 0.1328000983403009,
      "avg_reward": 0.07429497883800817,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 707,
      "pass_at_1": 0.09850298629190203,
      "avg_reward": 0.05708482525259576,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 808,
      "pass_at_1": 0.15605954415446435,
      "avg_reward": 0.23418693977226082,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 909,
      "pass_at_1": 0.13672980350731273,
      "avg_reward": 0.12869316276459297,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.1362545191603681,
      "avg_reward": 0.18354021673583443,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.10780038434667433,
      "avg_reward": 0.14503175971644464,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.10660136311821135,
      "avg_reward": 0.05339351537189857,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.1551351366340164,
      "avg_reward": 0.05267407429591467,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.13965760601036023,
      "avg_reward": 0.06863834001530392,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.14296376938196198,
      "avg_reward": -0.02555843976746662,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.11841280368748797,
      "avg_reward": 0.05973638122009452,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.17830860768186882,
      "avg_reward": 0.13396510200598427,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.16587873735177766,
      "avg_reward": 0.16711412543653636,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.15443761733260378,
      "avg_reward": 0.13773146005644757,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.16226860646593222,
      "avg_reward": 0.04343141046671542,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.17704309791494802,
      "avg_reward": 0.1703247714522113,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.1982515813552369,
      "avg_reward": 0.15800974036024854,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.2460748327044983,
      "avg_reward": 0.21750547417903757,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.2246739525694318,
      "avg_reward": 0.29164632898044307,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.1862076579282828,
      "avg_reward": 0.0970267158323786,
      "difficulty_1_ratio": 0.016291910734624847,
      "difficulty_2_ratio": 0.12497928765460015,
      "difficulty_3_ratio": 0.3527033512649604,
      "difficulty_4_ratio": 0.3661732760034468,
      "difficulty_5_ratio": 0.1398521743423678
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.2540661166974936,
      "avg_reward": 0.16334975659594178,
      "difficulty_1_ratio": 0.014439823367355656,
      "difficulty_2_ratio": 0.1162288430953594,
      "difficulty_3_ratio": 0.34416877595779866,
      "difficulty_4_ratio": 0.37491648580673986,
      "difficulty_5_ratio": 0.15024607177274654
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.2269938824709286,
      "avg_reward": 0.23506090444796032,
      "difficulty_1_ratio": 0.012218327302669146,
      "difficulty_2_ratio": 0.10498325535696679,
      "difficulty_3_ratio": 0.33184389643032614,
      "difficulty_4_ratio": 0.38588078286713096,
      "difficulty_5_ratio": 0.165073738042907
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.251521521316502,
      "avg_reward": 0.2889615261522571,
      "difficulty_1_ratio": 0.009913147093465137,
      "difficulty_2_ratio": 0.09225064005743493,
      "difficulty_3_ratio": 0.3158149930158207,
      "difficulty_4_ratio": 0.39774215071368285,
      "difficulty_5_ratio": 0.18427906911959632
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.27101882523936166,
      "avg_reward": 0.27028469367677616,
      "difficulty_1_ratio": 0.007760018351280176,
      "difficulty_2_ratio": 0.07909068287132516,
      "difficulty_3_ratio": 0.29654692178674946,
      "difficulty_4_ratio": 0.40904118087068214,
      "difficulty_5_ratio": 0.20756119611996313
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.23313381074314427,
      "avg_reward": 0.22625018198417632,
      "difficulty_1_ratio": 0.00590957184933243,
      "difficulty_2_ratio": 0.06645671547671815,
      "difficulty_3_ratio": 0.2749332380949103,
      "difficulty_4_ratio": 0.4184283859957229,
      "difficulty_5_ratio": 0.2342720885833161
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.26243068720490087,
      "avg_reward": 0.1436312767668979,
      "difficulty_1_ratio": 0.0044234366536341566,
      "difficulty_2_ratio": 0.05506877089710349,
      "difficulty_3_ratio": 0.2522066146015487,
      "difficulty_4_ratio": 0.4249257796153269,
      "difficulty_5_ratio": 0.2633753982323869
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.29211507583365764,
      "avg_reward": 0.27405388739585446,
      "difficulty_1_ratio": 0.0032937818280582443,
      "difficulty_2_ratio": 0.04535368508089252,
      "difficulty_3_ratio": 0.22973959398617683,
      "difficulty_4_ratio": 0.4281191321289578,
      "difficulty_5_ratio": 0.2934938069759146
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.27236037106342714,
      "avg_reward": 0.20623369380152107,
      "difficulty_1_ratio": 0.0024722539225482446,
      "difficulty_2_ratio": 0.03746068440111024,
      "difficulty_3_ratio": 0.20881604152186556,
      "difficulty_4_ratio": 0.4282107125631631,
      "difficulty_5_ratio": 0.32304030759131297
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.25521440591078826,
      "avg_reward": 0.21414772840656227,
      "difficulty_1_ratio": 0.0018961158457144911,
      "difficulty_2_ratio": 0.03133140973471507,
      "difficulty_3_ratio": 0.19045857150804962,
      "difficulty_4_ratio": 0.4259186206842434,
      "difficulty_5_ratio": 0.35039528222727745
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.29631797241583063,
      "avg_reward": 0.19549662872050055,
      "difficulty_1_ratio": 0.0015056169658766543,
      "difficulty_2_ratio": 0.026789686088424,
      "difficulty_3_ratio": 0.175358276208076,
      "difficulty_4_ratio": 0.42227019488557094,
      "difficulty_5_ratio": 0.3740762258520523
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.31799125590753746,
      "avg_reward": 0.1995328524018783,
      "difficulty_1_ratio": 0.0012524233850038473,
      "difficulty_2_ratio": 0.023621859465310466,
      "difficulty_3_ratio": 0.16390134325095126,
      "difficulty_4_ratio": 0.4183660766360568,
      "difficulty_5_ratio": 0.3928582972626777
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.2601025506610518,
      "avg_reward": 0.2600683950734765,
      "difficulty_1_ratio": 0.0011018868277803448,
      "difficulty_2_ratio": 0.021633707012814266,
      "difficulty_3_ratio": 0.15625373746114093,
      "difficulty_4_ratio": 0.4151790230064104,
      "difficulty_5_ratio": 0.40583164569185404
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.3023240931713714,
      "avg_reward": 0.23555779527144635,
      "difficulty_1_ratio": 0.0010322931860183035,
      "difficulty_2_ratio": 0.02068358559081816,
      "difficulty_3_ratio": 0.15245936727836976,
      "difficulty_4_ratio": 0.41341660520999185,
      "difficulty_5_ratio": 0.41240814873480197
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.30146743675984033,
      "avg_reward": 0.16087581137200213,
      "difficulty_1_ratio": 0.001033362574533033,
      "difficulty_2_ratio": 0.02069834621303522,
      "difficulty_3_ratio": 0.15251904715441822,
      "difficulty_4_ratio": 0.4134452797034622,
      "difficulty_5_ratio": 0.41230396435455147
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.3511384070235065,
      "avg_reward": 0.24646727642645913,
      "difficulty_1_ratio": 0.001105253979564763,
      "difficulty_2_ratio": 0.021679152361382986,
      "difficulty_3_ratio": 0.1564328746274194,
      "difficulty_4_ratio": 0.41525920915243264,
      "difficulty_5_ratio": 0.4055235098792002
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.36704821193061393,
      "avg_reward": 0.3340039788550276,
      "difficulty_1_ratio": 0.0012585820768892396,
      "difficulty_2_ratio": 0.02370139964709112,
      "difficulty_3_ratio": 0.16419954975755394,
      "difficulty_4_ratio": 0.418480714620724,
      "difficulty_5_ratio": 0.3923597538977418
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.33529930293261917,
      "avg_reward": 0.21394432228975205,
      "difficulty_1_ratio": 0.001515438901358441,
      "difficulty_2_ratio": 0.02690866798401823,
      "difficulty_3_ratio": 0.17577272552605308,
      "difficulty_4_ratio": 0.4223925910167582,
      "difficulty_5_ratio": 0.37341057657181215
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.33467067011435536,
      "avg_reward": 0.2071103795367258,
      "difficulty_1_ratio": 0.0019108941032437861,
      "difficulty_2_ratio": 0.03149638910459275,
      "difficulty_3_ratio": 0.19098111826597575,
      "difficulty_4_ratio": 0.4260157102739871,
      "difficulty_5_ratio": 0.34959588825220067
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.3987383004335599,
      "avg_reward": 0.32721270185833917,
      "difficulty_1_ratio": 0.0024936925676773474,
      "difficulty_2_ratio": 0.03767804281480519,
      "difficulty_3_ratio": 0.2094301856844532,
      "difficulty_4_ratio": 0.42824838946414634,
      "difficulty_5_ratio": 0.32214968946891787
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.3876177312370481,
      "avg_reward": 0.24672658253912716,
      "difficulty_1_ratio": 0.003323844499126925,
      "difficulty_2_ratio": 0.045627461104830486,
      "difficulty_3_ratio": 0.23041854367730347,
      "difficulty_4_ratio": 0.4280692870521302,
      "difficulty_5_ratio": 0.29256086366660894
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.375784446165114,
      "avg_reward": 0.35952065387252014,
      "difficulty_1_ratio": 0.004463952486683914,
      "difficulty_2_ratio": 0.055397905274063235,
      "difficulty_3_ratio": 0.25291386667660937,
      "difficulty_4_ratio": 0.4247735415860251,
      "difficulty_5_ratio": 0.2624507339766185
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.3729375875797986,
      "avg_reward": 0.349905793009926,
      "difficulty_1_ratio": 0.005961543635767642,
      "difficulty_2_ratio": 0.06683240381041645,
      "difficulty_3_ratio": 0.27562649024852093,
      "difficulty_4_ratio": 0.41817719578473006,
      "difficulty_5_ratio": 0.2334023665205648
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.36533620407501827,
      "avg_reward": 0.2240953860290854,
      "difficulty_1_ratio": 0.007822719184174324,
      "difficulty_2_ratio": 0.07949491055732377,
      "difficulty_3_ratio": 0.29718468692891836,
      "difficulty_4_ratio": 0.4087135617359425,
      "difficulty_5_ratio": 0.206784121593641
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.40191319551519644,
      "avg_reward": 0.30257173468352955,
      "difficulty_1_ratio": 0.009983298952962209,
      "difficulty_2_ratio": 0.09265686413080075,
      "difficulty_3_ratio": 0.3163636937049174,
      "difficulty_4_ratio": 0.3973755986640315,
      "difficulty_5_ratio": 0.1836205445472881
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.41436434669748695,
      "avg_reward": 0.2325970807819671
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.42286010213331404,
      "avg_reward": 0.46820327807011697
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.4151008431835174,
      "avg_reward": 0.33378778099230605
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.42604390123232316,
      "avg_reward": 0.2477363354462692
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.43771088779849177,
      "avg_reward": 0.26989822303799516
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.42723990994599875,
      "avg_reward": 0.40393540543698586
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.42756073550557994,
      "avg_reward": 0.36711103788283395
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.46885349083630135,
      "avg_reward": 0.3890198354738411
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.4273719856240995,
      "avg_reward": 0.32527382473170896
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.5000270896686762,
      "avg_reward": 0.29876938358506744
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.4612242603087222,
      "avg_reward": 0.3413740046725724
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.47490728564477336,
      "avg_reward": 0.4173366093751802
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.5102682532730114,
      "avg_reward": 0.39470298301795126
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.49979204191150894,
      "avg_reward": 0.42482064077246584
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.4983310079929042,
      "avg_reward": 0.3704686098179998
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.47404433476073327,
      "avg_reward": 0.3242333121775518
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.48385675606343653,
      "avg_reward": 0.4031697336440606
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.5190478024485762,
      "avg_reward": 0.4314116843517057
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.4975424912527895,
      "avg_reward": 0.4883324984988554
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.5434423521717875,
      "avg_reward": 0.41705387609992134
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.5009920229441903,
      "avg_reward": 0.40730436606325077
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.5470561659263287,
      "avg_reward": 0.45428318160376885
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.5369466501040308,
      "avg_reward": 0.41895331396944335
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.5389047492216739,
      "avg_reward": 0.508351021950146
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.5288102123080054,
      "avg_reward": 0.430213556471798
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.542367379505326,
      "avg_reward": 0.4480801713928127
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.5126066974202185,
      "avg_reward": 0.31624192514248006
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.5238736515140792,
      "avg_reward": 0.4274960359813468
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.5586380100904873,
      "avg_reward": 0.42037668008370865
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.5782751228521378,
      "avg_reward": 0.4554612995654009
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.5541835050867527,
      "avg_reward": 0.43364861054176906
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.5593862908633072,
      "avg_reward": 0.48273273639282593
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.5728320280847607,
      "avg_reward": 0.4133444754373291
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.5926933796872257,
      "avg_reward": 0.4194033808784347
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.5663970521698506,
      "avg_reward": 0.43939781305976283
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.5463196754452253,
      "avg_reward": 0.4332997109574887
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.5548681394060017,
      "avg_reward": 0.447539873688604
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.5800322509544287,
      "avg_reward": 0.5376222692122066
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.5803088197937384,
      "avg_reward": 0.43368578881974945
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.5684270710413389,
      "avg_reward": 0.4617405621387993
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.5801379432904746,
      "avg_reward": 0.5370898180438007
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.60809912353164,
      "avg_reward": 0.46853250251319895
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.571059736645254,
      "avg_reward": 0.32899505911281035
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.5728148996791368,
      "avg_reward": 0.4093490344390953
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.5783807374051878,
      "avg_reward": 0.48228380204165583
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.5906310905404835,
      "avg_reward": 0.4710064720800097
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.5926178417545949,
      "avg_reward": 0.46778838474212636
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.594037239533483,
      "avg_reward": 0.3136770412308208
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.5861160521085519,
      "avg_reward": 0.46335030563419116
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5860187670916623,
      "avg_reward": 0.4579177005681828
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": 0.04986727232917929,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.5860187670916623,
      "avg_reward": 0.4579177005681828
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 11.5,
      "update": 1,
      "cumulative_wall_time": 4.3478260869565215
    },
    {
      "timestep": 101,
      "throughput": 12.65,
      "update": 2,
      "cumulative_wall_time": 8.695652173913043
    },
    {
      "timestep": 202,
      "throughput": 13.799999999999999,
      "update": 3,
      "cumulative_wall_time": 13.043478260869565
    },
    {
      "timestep": 303,
      "throughput": 14.950000000000001,
      "update": 4,
      "cumulative_wall_time": 17.391304347826086
    },
    {
      "timestep": 404,
      "throughput": 16.099999999999998,
      "update": 5,
      "cumulative_wall_time": 21.73913043478261
    },
    {
      "timestep": 505,
      "throughput": 17.25,
      "update": 6,
      "cumulative_wall_time": 26.086956521739133
    },
    {
      "timestep": 606,
      "throughput": 18.400000000000002,
      "update": 7,
      "cumulative_wall_time": 30.434782608695656
    },
    {
      "timestep": 707,
      "throughput": 19.55,
      "update": 8,
      "cumulative_wall_time": 34.78260869565218
    },
    {
      "timestep": 808,
      "throughput": 20.7,
      "update": 9,
      "cumulative_wall_time": 39.1304347826087
    },
    {
      "timestep": 909,
      "throughput": 21.849999999999998,
      "update": 10,
      "cumulative_wall_time": 43.478260869565226
    },
    {
      "timestep": 1010,
      "throughput": 24.61761327095548,
      "update": 11,
      "cumulative_wall_time": 47.82608695652175
    },
    {
      "timestep": 1111,
      "throughput": 21.6243577379161,
      "update": 12,
      "cumulative_wall_time": 52.17391304347827
    },
    {
      "timestep": 1212,
      "throughput": 28.061614828199396,
      "update": 13,
      "cumulative_wall_time": 56.521739130434796
    },
    {
      "timestep": 1313,
      "throughput": 24.583082939510803,
      "update": 14,
      "cumulative_wall_time": 60.86956521739132
    },
    {
      "timestep": 1414,
      "throughput": 22.985493322898094,
      "update": 15,
      "cumulative_wall_time": 65.21739130434784
    },
    {
      "timestep": 1515,
      "throughput": 22.524676702645596,
      "update": 16,
      "cumulative_wall_time": 69.56521739130436
    },
    {
      "timestep": 1616,
      "throughput": 22.80099874132109,
      "update": 17,
      "cumulative_wall_time": 73.91304347826087
    },
    {
      "timestep": 1717,
      "throughput": 20.894793739128847,
      "update": 18,
      "cumulative_wall_time": 78.26086956521739
    },
    {
      "timestep": 1818,
      "throughput": 22.78103415970658,
      "update": 19,
      "cumulative_wall_time": 82.6086956521739
    },
    {
      "timestep": 1919,
      "throughput": 23.640972088472225,
      "update": 20,
      "cumulative_wall_time": 86.95652173913042
    },
    {
      "timestep": 2020,
      "throughput": 24.332945715818425,
      "update": 21,
      "cumulative_wall_time": 91.30434782608694
    },
    {
      "timestep": 2121,
      "throughput": 24.33328649203197,
      "update": 22,
      "cumulative_wall_time": 95.65217391304346
    },
    {
      "timestep": 2222,
      "throughput": 22.36778164289835,
      "update": 23,
      "cumulative_wall_time": 99.99999999999997
    },
    {
      "timestep": 2323,
      "throughput": 19.743010819199558,
      "update": 24,
      "cumulative_wall_time": 104.34782608695649
    },
    {
      "timestep": 2424,
      "throughput": 21.461063959663075,
      "update": 25,
      "cumulative_wall_time": 108.695652173913
    },
    {
      "timestep": 2525,
      "throughput": 26.708043998468494,
      "update": 26,
      "cumulative_wall_time": 113.04347826086952
    },
    {
      "timestep": 2626,
      "throughput": 25.06093412084288,
      "update": 27,
      "cumulative_wall_time": 117.39130434782604
    },
    {
      "timestep": 2727,
      "throughput": 23.850125048499603,
      "update": 28,
      "cumulative_wall_time": 121.73913043478255
    },
    {
      "timestep": 2828,
      "throughput": 21.249023237051713,
      "update": 29,
      "cumulative_wall_time": 126.08695652173907
    },
    {
      "timestep": 2929,
      "throughput": 23.008383856439686,
      "update": 30,
      "cumulative_wall_time": 130.4347826086956
    },
    {
      "timestep": 3030,
      "throughput": 20.11196202297629,
      "update": 31,
      "cumulative_wall_time": 134.78260869565213
    },
    {
      "timestep": 3131,
      "throughput": 21.73054518589903,
      "update": 32,
      "cumulative_wall_time": 139.13043478260866
    },
    {
      "timestep": 3232,
      "throughput": 22.436032314124052,
      "update": 33,
      "cumulative_wall_time": 143.4782608695652
    },
    {
      "timestep": 3333,
      "throughput": 22.16822815671001,
      "update": 34,
      "cumulative_wall_time": 147.82608695652172
    },
    {
      "timestep": 3434,
      "throughput": 25.200184441428828,
      "update": 35,
      "cumulative_wall_time": 152.17391304347825
    },
    {
      "timestep": 3535,
      "throughput": 19.73693039771846,
      "update": 36,
      "cumulative_wall_time": 156.52173913043478
    },
    {
      "timestep": 3636,
      "throughput": 21.009505775515144,
      "update": 37,
      "cumulative_wall_time": 160.8695652173913
    },
    {
      "timestep": 3737,
      "throughput": 19.838217666648895,
      "update": 38,
      "cumulative_wall_time": 165.21739130434784
    },
    {
      "timestep": 3838,
      "throughput": 20.154087610817935,
      "update": 39,
      "cumulative_wall_time": 169.56521739130437
    },
    {
      "timestep": 3939,
      "throughput": 23.285328561827292,
      "update": 40,
      "cumulative_wall_time": 173.9130434782609
    },
    {
      "timestep": 4040,
      "throughput": 19.318986773970575,
      "update": 41,
      "cumulative_wall_time": 178.26086956521743
    },
    {
      "timestep": 4141,
      "throughput": 24.733898191326563,
      "update": 42,
      "cumulative_wall_time": 182.60869565217396
    },
    {
      "timestep": 4242,
      "throughput": 22.432323713035526,
      "update": 43,
      "cumulative_wall_time": 186.9565217391305
    },
    {
      "timestep": 4343,
      "throughput": 23.158213164809748,
      "update": 44,
      "cumulative_wall_time": 191.30434782608702
    },
    {
      "timestep": 4444,
      "throughput": 23.74192649739357,
      "update": 45,
      "cumulative_wall_time": 195.65217391304355
    },
    {
      "timestep": 4545,
      "throughput": 22.00141700342134,
      "update": 46,
      "cumulative_wall_time": 200.00000000000009
    },
    {
      "timestep": 4646,
      "throughput": 25.37470334623277,
      "update": 47,
      "cumulative_wall_time": 204.34782608695662
    },
    {
      "timestep": 4747,
      "throughput": 22.55301172852644,
      "update": 48,
      "cumulative_wall_time": 208.69565217391315
    },
    {
      "timestep": 4848,
      "throughput": 24.36636158704986,
      "update": 49,
      "cumulative_wall_time": 213.04347826086968
    },
    {
      "timestep": 4949,
      "throughput": 22.54204151965832,
      "update": 50,
      "cumulative_wall_time": 217.3913043478262
    },
    {
      "timestep": 5050,
      "throughput": 23.669011091077326,
      "update": 51,
      "cumulative_wall_time": 221.73913043478274
    },
    {
      "timestep": 5151,
      "throughput": 23.64322414136331,
      "update": 52,
      "cumulative_wall_time": 226.08695652173927
    },
    {
      "timestep": 5252,
      "throughput": 23.574930860747724,
      "update": 53,
      "cumulative_wall_time": 230.4347826086958
    },
    {
      "timestep": 5353,
      "throughput": 20.759091945871887,
      "update": 54,
      "cumulative_wall_time": 234.78260869565233
    },
    {
      "timestep": 5454,
      "throughput": 24.002514272259113,
      "update": 55,
      "cumulative_wall_time": 239.13043478260886
    },
    {
      "timestep": 5555,
      "throughput": 22.26639892507093,
      "update": 56,
      "cumulative_wall_time": 243.4782608695654
    },
    {
      "timestep": 5656,
      "throughput": 24.45012247012681,
      "update": 57,
      "cumulative_wall_time": 247.82608695652192
    },
    {
      "timestep": 5757,
      "throughput": 18.0492650778517,
      "update": 58,
      "cumulative_wall_time": 252.17391304347845
    },
    {
      "timestep": 5858,
      "throughput": 19.630232689273612,
      "update": 59,
      "cumulative_wall_time": 256.521739130435
    },
    {
      "timestep": 5959,
      "throughput": 23.835924792910568,
      "update": 60,
      "cumulative_wall_time": 260.8695652173915
    },
    {
      "timestep": 6060,
      "throughput": 27.284733445742027,
      "update": 61,
      "cumulative_wall_time": 265.217391304348
    },
    {
      "timestep": 6161,
      "throughput": 24.920635117665846,
      "update": 62,
      "cumulative_wall_time": 269.5652173913045
    },
    {
      "timestep": 6262,
      "throughput": 21.430362851340043,
      "update": 63,
      "cumulative_wall_time": 273.913043478261
    },
    {
      "timestep": 6363,
      "throughput": 19.1082794446307,
      "update": 64,
      "cumulative_wall_time": 278.2608695652175
    },
    {
      "timestep": 6464,
      "throughput": 24.708178308671723,
      "update": 65,
      "cumulative_wall_time": 282.608695652174
    },
    {
      "timestep": 6565,
      "throughput": 22.814658589301214,
      "update": 66,
      "cumulative_wall_time": 286.9565217391305
    },
    {
      "timestep": 6666,
      "throughput": 24.358619701157085,
      "update": 67,
      "cumulative_wall_time": 291.304347826087
    },
    {
      "timestep": 6767,
      "throughput": 23.265187061084816,
      "update": 68,
      "cumulative_wall_time": 295.6521739130435
    },
    {
      "timestep": 6868,
      "throughput": 23.068178727777138,
      "update": 69,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 6969,
      "throughput": 29.804838525554306,
      "update": 70,
      "cumulative_wall_time": 304.3478260869565
    },
    {
      "timestep": 7070,
      "throughput": 22.985901089595167,
      "update": 71,
      "cumulative_wall_time": 308.695652173913
    },
    {
      "timestep": 7171,
      "throughput": 22.633736018717492,
      "update": 72,
      "cumulative_wall_time": 313.0434782608695
    },
    {
      "timestep": 7272,
      "throughput": 22.720668046570747,
      "update": 73,
      "cumulative_wall_time": 317.391304347826
    },
    {
      "timestep": 7373,
      "throughput": 21.65786555157239,
      "update": 74,
      "cumulative_wall_time": 321.7391304347825
    },
    {
      "timestep": 7474,
      "throughput": 25.27730565784522,
      "update": 75,
      "cumulative_wall_time": 326.086956521739
    },
    {
      "timestep": 7575,
      "throughput": 22.1863650323029,
      "update": 76,
      "cumulative_wall_time": 330.4347826086955
    },
    {
      "timestep": 7676,
      "throughput": 24.462668222982558,
      "update": 77,
      "cumulative_wall_time": 334.782608695652
    },
    {
      "timestep": 7777,
      "throughput": 23.65458696857118,
      "update": 78,
      "cumulative_wall_time": 339.1304347826085
    },
    {
      "timestep": 7878,
      "throughput": 25.803667482904583,
      "update": 79,
      "cumulative_wall_time": 343.478260869565
    },
    {
      "timestep": 7979,
      "throughput": 23.96641307307323,
      "update": 80,
      "cumulative_wall_time": 347.8260869565215
    },
    {
      "timestep": 8080,
      "throughput": 20.20921500382041,
      "update": 81,
      "cumulative_wall_time": 352.173913043478
    },
    {
      "timestep": 8181,
      "throughput": 19.94907809437594,
      "update": 82,
      "cumulative_wall_time": 356.5217391304345
    },
    {
      "timestep": 8282,
      "throughput": 26.239249035976876,
      "update": 83,
      "cumulative_wall_time": 360.869565217391
    },
    {
      "timestep": 8383,
      "throughput": 21.599965152491784,
      "update": 84,
      "cumulative_wall_time": 365.21739130434753
    },
    {
      "timestep": 8484,
      "throughput": 19.9626140664838,
      "update": 85,
      "cumulative_wall_time": 369.56521739130403
    },
    {
      "timestep": 8585,
      "throughput": 21.459877220299557,
      "update": 86,
      "cumulative_wall_time": 373.91304347826053
    },
    {
      "timestep": 8686,
      "throughput": 25.908638160026413,
      "update": 87,
      "cumulative_wall_time": 378.26086956521704
    },
    {
      "timestep": 8787,
      "throughput": 19.73351010241842,
      "update": 88,
      "cumulative_wall_time": 382.60869565217354
    },
    {
      "timestep": 8888,
      "throughput": 21.007061031352897,
      "update": 89,
      "cumulative_wall_time": 386.95652173913004
    },
    {
      "timestep": 8989,
      "throughput": 21.466342729768005,
      "update": 90,
      "cumulative_wall_time": 391.30434782608654
    },
    {
      "timestep": 9090,
      "throughput": 20.122263291011652,
      "update": 91,
      "cumulative_wall_time": 395.65217391304304
    },
    {
      "timestep": 9191,
      "throughput": 20.276047121423172,
      "update": 92,
      "cumulative_wall_time": 399.99999999999955
    },
    {
      "timestep": 9292,
      "throughput": 19.508351656893584,
      "update": 93,
      "cumulative_wall_time": 404.34782608695605
    },
    {
      "timestep": 9393,
      "throughput": 21.93926894978554,
      "update": 94,
      "cumulative_wall_time": 408.69565217391255
    },
    {
      "timestep": 9494,
      "throughput": 22.183709686997805,
      "update": 95,
      "cumulative_wall_time": 413.04347826086905
    },
    {
      "timestep": 9595,
      "throughput": 21.430162245332397,
      "update": 96,
      "cumulative_wall_time": 417.39130434782555
    },
    {
      "timestep": 9696,
      "throughput": 19.196494970374424,
      "update": 97,
      "cumulative_wall_time": 421.73913043478206
    },
    {
      "timestep": 9797,
      "throughput": 25.88267267776879,
      "update": 98,
      "cumulative_wall_time": 426.08695652173856
    },
    {
      "timestep": 9898,
      "throughput": 19.94311869290403,
      "update": 99,
      "cumulative_wall_time": 430.43478260869506
    },
    {
      "timestep": 10000,
      "throughput": 23.639477537652603,
      "update": 100,
      "cumulative_wall_time": 434.78260869565156
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 1200,
        "success_rate": 0.85,
        "mean_reward": 0.7435046681376225,
        "recent_gradient": 0.011336633733483056
      },
      "level_2": {
        "num_pulls": 2800,
        "success_rate": 0.65,
        "mean_reward": 0.6041166471033433,
        "recent_gradient": 0.01824477282674469
      },
      "level_3": {
        "num_pulls": 3500,
        "success_rate": 0.45,
        "mean_reward": 0.3665256854060575,
        "recent_gradient": 0.03139157463827921
      },
      "level_4": {
        "num_pulls": 1800,
        "success_rate": 0.28,
        "mean_reward": 0.28951601093427276,
        "recent_gradient": 0.02083138907978487
      },
      "level_5": {
        "num_pulls": 700,
        "success_rate": 0.15,
        "mean_reward": 0.13821088842959436,
        "recent_gradient": 0.011639521219220378
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.05
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 5.382527422998509
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.585505583119495
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 4.670424344651676
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 5.305561775027956
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "adaptive",
    "use_csc": true,
    "use_eaas": true
  }
}