{
  "experiment_name": "aceas_seed456",
  "total_timesteps": 10000,
  "total_time": 434.7826086956522,
  "avg_throughput": 23,
  "train_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 101,
      "pass_at_1": 0.024896768930761266,
      "avg_reward": 0.04835202753861745,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 202,
      "pass_at_1": 0.05206069467602384,
      "avg_reward": 0.12312798238051934,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 303,
      "pass_at_1": 0.043615081811866685,
      "avg_reward": 0.05736622428251277,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 404,
      "pass_at_1": 0.04318478776165814,
      "avg_reward": 0.018786288723711277,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 505,
      "pass_at_1": 0.05838881662629244,
      "avg_reward": -0.00980050853216917,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 606,
      "pass_at_1": 0.08073538450397642,
      "avg_reward": 0.07648086306319572,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 707,
      "pass_at_1": 0.10088003214696792,
      "avg_reward": 0.17793914537827993,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 808,
      "pass_at_1": 0.15025446313299054,
      "avg_reward": 0.16622098829834928,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 909,
      "pass_at_1": 0.13537669217410803,
      "avg_reward": 0.16617895563773816,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 1010,
      "pass_at_1": 0.11938299351532485,
      "avg_reward": 0.09106881308048198,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1111,
      "pass_at_1": 0.10708735799193989,
      "avg_reward": 0.06646686177907923,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1212,
      "pass_at_1": 0.15447643017966295,
      "avg_reward": 0.13039973514507383,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1313,
      "pass_at_1": 0.1296540716227177,
      "avg_reward": 0.08866898294444694,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1414,
      "pass_at_1": 0.14461177384460588,
      "avg_reward": 0.17277116105911555,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1515,
      "pass_at_1": 0.12188557428869466,
      "avg_reward": 0.0837894146105009,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1616,
      "pass_at_1": 0.1711402016059921,
      "avg_reward": 0.0649177580871802,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1717,
      "pass_at_1": 0.18625530337212026,
      "avg_reward": 0.1073489912268274,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1818,
      "pass_at_1": 0.17922768937986272,
      "avg_reward": 0.14769947867784758,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 1919,
      "pass_at_1": 0.1791280865618577,
      "avg_reward": 0.08267734116454914,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2020,
      "pass_at_1": 0.18078312570251984,
      "avg_reward": 0.12668248623640319,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2121,
      "pass_at_1": 0.20885981608839427,
      "avg_reward": 0.14003366130035583,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2222,
      "pass_at_1": 0.1912448927445404,
      "avg_reward": 0.13843272983340274,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2323,
      "pass_at_1": 0.20601086890191672,
      "avg_reward": 0.22489023941738207,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2424,
      "pass_at_1": 0.2054233207849303,
      "avg_reward": 0.18661025777519444,
      "difficulty_1_ratio": 0.054488684549642924,
      "difficulty_2_ratio": 0.24420134200323332,
      "difficulty_3_ratio": 0.4026199468942474,
      "difficulty_4_ratio": 0.24420134200323332,
      "difficulty_5_ratio": 0.054488684549642924
    },
    {
      "timestep": 2525,
      "pass_at_1": 0.19146719112617167,
      "avg_reward": 0.1565303809311483,
      "difficulty_1_ratio": 0.016291910734624847,
      "difficulty_2_ratio": 0.12497928765460015,
      "difficulty_3_ratio": 0.3527033512649604,
      "difficulty_4_ratio": 0.3661732760034468,
      "difficulty_5_ratio": 0.1398521743423678
    },
    {
      "timestep": 2626,
      "pass_at_1": 0.19492285421230948,
      "avg_reward": 0.1110974454735357,
      "difficulty_1_ratio": 0.014439823367355656,
      "difficulty_2_ratio": 0.1162288430953594,
      "difficulty_3_ratio": 0.34416877595779866,
      "difficulty_4_ratio": 0.37491648580673986,
      "difficulty_5_ratio": 0.15024607177274654
    },
    {
      "timestep": 2727,
      "pass_at_1": 0.2513351924416022,
      "avg_reward": 0.19710441439150067,
      "difficulty_1_ratio": 0.012218327302669146,
      "difficulty_2_ratio": 0.10498325535696679,
      "difficulty_3_ratio": 0.33184389643032614,
      "difficulty_4_ratio": 0.38588078286713096,
      "difficulty_5_ratio": 0.165073738042907
    },
    {
      "timestep": 2828,
      "pass_at_1": 0.22096946517713137,
      "avg_reward": 0.17746569551199518,
      "difficulty_1_ratio": 0.009913147093465137,
      "difficulty_2_ratio": 0.09225064005743493,
      "difficulty_3_ratio": 0.3158149930158207,
      "difficulty_4_ratio": 0.39774215071368285,
      "difficulty_5_ratio": 0.18427906911959632
    },
    {
      "timestep": 2929,
      "pass_at_1": 0.21316069476149846,
      "avg_reward": 0.25683532563368994,
      "difficulty_1_ratio": 0.007760018351280176,
      "difficulty_2_ratio": 0.07909068287132516,
      "difficulty_3_ratio": 0.29654692178674946,
      "difficulty_4_ratio": 0.40904118087068214,
      "difficulty_5_ratio": 0.20756119611996313
    },
    {
      "timestep": 3030,
      "pass_at_1": 0.2387504454328188,
      "avg_reward": 0.20371063212971507,
      "difficulty_1_ratio": 0.00590957184933243,
      "difficulty_2_ratio": 0.06645671547671815,
      "difficulty_3_ratio": 0.2749332380949103,
      "difficulty_4_ratio": 0.4184283859957229,
      "difficulty_5_ratio": 0.2342720885833161
    },
    {
      "timestep": 3131,
      "pass_at_1": 0.2507818882240048,
      "avg_reward": 0.197297925270326,
      "difficulty_1_ratio": 0.0044234366536341566,
      "difficulty_2_ratio": 0.05506877089710349,
      "difficulty_3_ratio": 0.2522066146015487,
      "difficulty_4_ratio": 0.4249257796153269,
      "difficulty_5_ratio": 0.2633753982323869
    },
    {
      "timestep": 3232,
      "pass_at_1": 0.24341598765726657,
      "avg_reward": 0.17842611677898063,
      "difficulty_1_ratio": 0.0032937818280582443,
      "difficulty_2_ratio": 0.04535368508089252,
      "difficulty_3_ratio": 0.22973959398617683,
      "difficulty_4_ratio": 0.4281191321289578,
      "difficulty_5_ratio": 0.2934938069759146
    },
    {
      "timestep": 3333,
      "pass_at_1": 0.2848719681830434,
      "avg_reward": 0.19621530136722043,
      "difficulty_1_ratio": 0.0024722539225482446,
      "difficulty_2_ratio": 0.03746068440111024,
      "difficulty_3_ratio": 0.20881604152186556,
      "difficulty_4_ratio": 0.4282107125631631,
      "difficulty_5_ratio": 0.32304030759131297
    },
    {
      "timestep": 3434,
      "pass_at_1": 0.27646969855576997,
      "avg_reward": 0.3118593195555674,
      "difficulty_1_ratio": 0.0018961158457144911,
      "difficulty_2_ratio": 0.03133140973471507,
      "difficulty_3_ratio": 0.19045857150804962,
      "difficulty_4_ratio": 0.4259186206842434,
      "difficulty_5_ratio": 0.35039528222727745
    },
    {
      "timestep": 3535,
      "pass_at_1": 0.2885578548739901,
      "avg_reward": 0.18672414865983908,
      "difficulty_1_ratio": 0.0015056169658766543,
      "difficulty_2_ratio": 0.026789686088424,
      "difficulty_3_ratio": 0.175358276208076,
      "difficulty_4_ratio": 0.42227019488557094,
      "difficulty_5_ratio": 0.3740762258520523
    },
    {
      "timestep": 3636,
      "pass_at_1": 0.31780059563659324,
      "avg_reward": 0.29693739107089423,
      "difficulty_1_ratio": 0.0012524233850038473,
      "difficulty_2_ratio": 0.023621859465310466,
      "difficulty_3_ratio": 0.16390134325095126,
      "difficulty_4_ratio": 0.4183660766360568,
      "difficulty_5_ratio": 0.3928582972626777
    },
    {
      "timestep": 3737,
      "pass_at_1": 0.3200936188882837,
      "avg_reward": 0.270659043836431,
      "difficulty_1_ratio": 0.0011018868277803448,
      "difficulty_2_ratio": 0.021633707012814266,
      "difficulty_3_ratio": 0.15625373746114093,
      "difficulty_4_ratio": 0.4151790230064104,
      "difficulty_5_ratio": 0.40583164569185404
    },
    {
      "timestep": 3838,
      "pass_at_1": 0.31537591310879615,
      "avg_reward": 0.321571078252318,
      "difficulty_1_ratio": 0.0010322931860183035,
      "difficulty_2_ratio": 0.02068358559081816,
      "difficulty_3_ratio": 0.15245936727836976,
      "difficulty_4_ratio": 0.41341660520999185,
      "difficulty_5_ratio": 0.41240814873480197
    },
    {
      "timestep": 3939,
      "pass_at_1": 0.3132659816532125,
      "avg_reward": 0.3011314974445921,
      "difficulty_1_ratio": 0.001033362574533033,
      "difficulty_2_ratio": 0.02069834621303522,
      "difficulty_3_ratio": 0.15251904715441822,
      "difficulty_4_ratio": 0.4134452797034622,
      "difficulty_5_ratio": 0.41230396435455147
    },
    {
      "timestep": 4040,
      "pass_at_1": 0.3321791299564798,
      "avg_reward": 0.3060508081797556,
      "difficulty_1_ratio": 0.001105253979564763,
      "difficulty_2_ratio": 0.021679152361382986,
      "difficulty_3_ratio": 0.1564328746274194,
      "difficulty_4_ratio": 0.41525920915243264,
      "difficulty_5_ratio": 0.4055235098792002
    },
    {
      "timestep": 4141,
      "pass_at_1": 0.33526353304150186,
      "avg_reward": 0.2558619929199519,
      "difficulty_1_ratio": 0.0012585820768892396,
      "difficulty_2_ratio": 0.02370139964709112,
      "difficulty_3_ratio": 0.16419954975755394,
      "difficulty_4_ratio": 0.418480714620724,
      "difficulty_5_ratio": 0.3923597538977418
    },
    {
      "timestep": 4242,
      "pass_at_1": 0.3261272634636677,
      "avg_reward": 0.21781947496255222,
      "difficulty_1_ratio": 0.001515438901358441,
      "difficulty_2_ratio": 0.02690866798401823,
      "difficulty_3_ratio": 0.17577272552605308,
      "difficulty_4_ratio": 0.4223925910167582,
      "difficulty_5_ratio": 0.37341057657181215
    },
    {
      "timestep": 4343,
      "pass_at_1": 0.3719969680214582,
      "avg_reward": 0.25810148223103946,
      "difficulty_1_ratio": 0.0019108941032437861,
      "difficulty_2_ratio": 0.03149638910459275,
      "difficulty_3_ratio": 0.19098111826597575,
      "difficulty_4_ratio": 0.4260157102739871,
      "difficulty_5_ratio": 0.34959588825220067
    },
    {
      "timestep": 4444,
      "pass_at_1": 0.36802093662640545,
      "avg_reward": 0.28011185151622786,
      "difficulty_1_ratio": 0.0024936925676773474,
      "difficulty_2_ratio": 0.03767804281480519,
      "difficulty_3_ratio": 0.2094301856844532,
      "difficulty_4_ratio": 0.42824838946414634,
      "difficulty_5_ratio": 0.32214968946891787
    },
    {
      "timestep": 4545,
      "pass_at_1": 0.349269495389921,
      "avg_reward": 0.33413782558384886,
      "difficulty_1_ratio": 0.003323844499126925,
      "difficulty_2_ratio": 0.045627461104830486,
      "difficulty_3_ratio": 0.23041854367730347,
      "difficulty_4_ratio": 0.4280692870521302,
      "difficulty_5_ratio": 0.29256086366660894
    },
    {
      "timestep": 4646,
      "pass_at_1": 0.40424188976498326,
      "avg_reward": 0.22784748896390183,
      "difficulty_1_ratio": 0.004463952486683914,
      "difficulty_2_ratio": 0.055397905274063235,
      "difficulty_3_ratio": 0.25291386667660937,
      "difficulty_4_ratio": 0.4247735415860251,
      "difficulty_5_ratio": 0.2624507339766185
    },
    {
      "timestep": 4747,
      "pass_at_1": 0.38221913099560767,
      "avg_reward": 0.33708528856194536,
      "difficulty_1_ratio": 0.005961543635767642,
      "difficulty_2_ratio": 0.06683240381041645,
      "difficulty_3_ratio": 0.27562649024852093,
      "difficulty_4_ratio": 0.41817719578473006,
      "difficulty_5_ratio": 0.2334023665205648
    },
    {
      "timestep": 4848,
      "pass_at_1": 0.3886905458703297,
      "avg_reward": 0.4270844351251703,
      "difficulty_1_ratio": 0.007822719184174324,
      "difficulty_2_ratio": 0.07949491055732377,
      "difficulty_3_ratio": 0.29718468692891836,
      "difficulty_4_ratio": 0.4087135617359425,
      "difficulty_5_ratio": 0.206784121593641
    },
    {
      "timestep": 4949,
      "pass_at_1": 0.44001861782185486,
      "avg_reward": 0.37185714865892017,
      "difficulty_1_ratio": 0.009983298952962209,
      "difficulty_2_ratio": 0.09265686413080075,
      "difficulty_3_ratio": 0.3163636937049174,
      "difficulty_4_ratio": 0.3973755986640315,
      "difficulty_5_ratio": 0.1836205445472881
    },
    {
      "timestep": 5050,
      "pass_at_1": 0.3867228894514296,
      "avg_reward": 0.26670946929645056
    },
    {
      "timestep": 5151,
      "pass_at_1": 0.36782436608633023,
      "avg_reward": 0.3529742499163898
    },
    {
      "timestep": 5252,
      "pass_at_1": 0.39657452016518335,
      "avg_reward": 0.351785388733059
    },
    {
      "timestep": 5353,
      "pass_at_1": 0.4377521580765702,
      "avg_reward": 0.326599312144063
    },
    {
      "timestep": 5454,
      "pass_at_1": 0.4134014462653308,
      "avg_reward": 0.32715838313250695
    },
    {
      "timestep": 5555,
      "pass_at_1": 0.4310221969452337,
      "avg_reward": 0.398696405964113
    },
    {
      "timestep": 5656,
      "pass_at_1": 0.4851301148718315,
      "avg_reward": 0.4057084978039601
    },
    {
      "timestep": 5757,
      "pass_at_1": 0.4674087122620216,
      "avg_reward": 0.3161948009459928
    },
    {
      "timestep": 5858,
      "pass_at_1": 0.485648794701654,
      "avg_reward": 0.517147020741057
    },
    {
      "timestep": 5959,
      "pass_at_1": 0.47378462242963865,
      "avg_reward": 0.3388519009802722
    },
    {
      "timestep": 6060,
      "pass_at_1": 0.46394956070272986,
      "avg_reward": 0.3215542862949575
    },
    {
      "timestep": 6161,
      "pass_at_1": 0.45463995288722114,
      "avg_reward": 0.3295660963348267
    },
    {
      "timestep": 6262,
      "pass_at_1": 0.5019735868499636,
      "avg_reward": 0.3743539954371776
    },
    {
      "timestep": 6363,
      "pass_at_1": 0.4887374640063383,
      "avg_reward": 0.357901956839052
    },
    {
      "timestep": 6464,
      "pass_at_1": 0.48457788999299267,
      "avg_reward": 0.3122134995339809
    },
    {
      "timestep": 6565,
      "pass_at_1": 0.47245074319948827,
      "avg_reward": 0.3970587059852793
    },
    {
      "timestep": 6666,
      "pass_at_1": 0.5030932522867522,
      "avg_reward": 0.43176366396677296
    },
    {
      "timestep": 6767,
      "pass_at_1": 0.5315467699759727,
      "avg_reward": 0.5456820910051956
    },
    {
      "timestep": 6868,
      "pass_at_1": 0.5080418641505059,
      "avg_reward": 0.34177947458120367
    },
    {
      "timestep": 6969,
      "pass_at_1": 0.5160019940470538,
      "avg_reward": 0.5051217135409772
    },
    {
      "timestep": 7070,
      "pass_at_1": 0.5031648174513437,
      "avg_reward": 0.3661070345084409
    },
    {
      "timestep": 7171,
      "pass_at_1": 0.5191686156693276,
      "avg_reward": 0.4329278527853729
    },
    {
      "timestep": 7272,
      "pass_at_1": 0.5487987577789494,
      "avg_reward": 0.4832620792682534
    },
    {
      "timestep": 7373,
      "pass_at_1": 0.5419006249513487,
      "avg_reward": 0.3174954969950842
    },
    {
      "timestep": 7474,
      "pass_at_1": 0.5312070934638949,
      "avg_reward": 0.3753257503404934
    },
    {
      "timestep": 7575,
      "pass_at_1": 0.534748786000619,
      "avg_reward": 0.3996333979484875
    },
    {
      "timestep": 7676,
      "pass_at_1": 0.5388167385756042,
      "avg_reward": 0.47373206484822655
    },
    {
      "timestep": 7777,
      "pass_at_1": 0.541044580029639,
      "avg_reward": 0.34591142437360806
    },
    {
      "timestep": 7878,
      "pass_at_1": 0.5605073838312131,
      "avg_reward": 0.4076047419765165
    },
    {
      "timestep": 7979,
      "pass_at_1": 0.5440507635768773,
      "avg_reward": 0.4197437028758838
    },
    {
      "timestep": 8080,
      "pass_at_1": 0.5307511098116923,
      "avg_reward": 0.340914944392562
    },
    {
      "timestep": 8181,
      "pass_at_1": 0.5582043487299542,
      "avg_reward": 0.4840305853044914
    },
    {
      "timestep": 8282,
      "pass_at_1": 0.5773225721919456,
      "avg_reward": 0.3153491847602079
    },
    {
      "timestep": 8383,
      "pass_at_1": 0.5543769606149438,
      "avg_reward": 0.4803372515667446
    },
    {
      "timestep": 8484,
      "pass_at_1": 0.605292709805728,
      "avg_reward": 0.5413833113157431
    },
    {
      "timestep": 8585,
      "pass_at_1": 0.5423515931418791,
      "avg_reward": 0.41030507001923816
    },
    {
      "timestep": 8686,
      "pass_at_1": 0.5931586723861442,
      "avg_reward": 0.43457790783707884
    },
    {
      "timestep": 8787,
      "pass_at_1": 0.5277464573595281,
      "avg_reward": 0.3988785546350919
    },
    {
      "timestep": 8888,
      "pass_at_1": 0.5740533104061365,
      "avg_reward": 0.48054936087456773
    },
    {
      "timestep": 8989,
      "pass_at_1": 0.5654058618014495,
      "avg_reward": 0.4914162663540511
    },
    {
      "timestep": 9090,
      "pass_at_1": 0.5717665038202189,
      "avg_reward": 0.4863755994920582
    },
    {
      "timestep": 9191,
      "pass_at_1": 0.5809993243702308,
      "avg_reward": 0.37383886753944406
    },
    {
      "timestep": 9292,
      "pass_at_1": 0.5448822448951737,
      "avg_reward": 0.34111886773322986
    },
    {
      "timestep": 9393,
      "pass_at_1": 0.5910318254318468,
      "avg_reward": 0.4746690168990236
    },
    {
      "timestep": 9494,
      "pass_at_1": 0.5646665453532848,
      "avg_reward": 0.4807989291922443
    },
    {
      "timestep": 9595,
      "pass_at_1": 0.5659372187537859,
      "avg_reward": 0.36202479692458456
    },
    {
      "timestep": 9696,
      "pass_at_1": 0.5908187515067898,
      "avg_reward": 0.5272708155008634
    },
    {
      "timestep": 9797,
      "pass_at_1": 0.6037727730396306,
      "avg_reward": 0.440847000444389
    },
    {
      "timestep": 9898,
      "pass_at_1": 0.5567287686556224,
      "avg_reward": 0.4422888484511016
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.622333176894075,
      "avg_reward": 0.5473393526774596
    }
  ],
  "eval_metrics": [
    {
      "timestep": 0,
      "pass_at_1": 0.0,
      "avg_reward": -0.02491047619505481,
      "difficulty_1_ratio": 0.2570583684642447,
      "difficulty_2_ratio": 0.4238175998984713,
      "difficulty_3_ratio": 0.2570583684642447,
      "difficulty_4_ratio": 0.057357474922920995,
      "difficulty_5_ratio": 0.0047081882501182806
    },
    {
      "timestep": 10000,
      "pass_at_1": 0.622333176894075,
      "avg_reward": 0.5473393526774596
    }
  ],
  "timing_metrics": [
    {
      "timestep": 0,
      "throughput": 11.5,
      "update": 1,
      "cumulative_wall_time": 4.3478260869565215
    },
    {
      "timestep": 101,
      "throughput": 12.65,
      "update": 2,
      "cumulative_wall_time": 8.695652173913043
    },
    {
      "timestep": 202,
      "throughput": 13.799999999999999,
      "update": 3,
      "cumulative_wall_time": 13.043478260869565
    },
    {
      "timestep": 303,
      "throughput": 14.950000000000001,
      "update": 4,
      "cumulative_wall_time": 17.391304347826086
    },
    {
      "timestep": 404,
      "throughput": 16.099999999999998,
      "update": 5,
      "cumulative_wall_time": 21.73913043478261
    },
    {
      "timestep": 505,
      "throughput": 17.25,
      "update": 6,
      "cumulative_wall_time": 26.086956521739133
    },
    {
      "timestep": 606,
      "throughput": 18.400000000000002,
      "update": 7,
      "cumulative_wall_time": 30.434782608695656
    },
    {
      "timestep": 707,
      "throughput": 19.55,
      "update": 8,
      "cumulative_wall_time": 34.78260869565218
    },
    {
      "timestep": 808,
      "throughput": 20.7,
      "update": 9,
      "cumulative_wall_time": 39.1304347826087
    },
    {
      "timestep": 909,
      "throughput": 21.849999999999998,
      "update": 10,
      "cumulative_wall_time": 43.478260869565226
    },
    {
      "timestep": 1010,
      "throughput": 24.1708688562081,
      "update": 11,
      "cumulative_wall_time": 47.82608695652175
    },
    {
      "timestep": 1111,
      "throughput": 20.938934720967666,
      "update": 12,
      "cumulative_wall_time": 52.17391304347827
    },
    {
      "timestep": 1212,
      "throughput": 20.31571815421073,
      "update": 13,
      "cumulative_wall_time": 56.521739130434796
    },
    {
      "timestep": 1313,
      "throughput": 24.58410464272953,
      "update": 14,
      "cumulative_wall_time": 60.86956521739132
    },
    {
      "timestep": 1414,
      "throughput": 19.690984951211263,
      "update": 15,
      "cumulative_wall_time": 65.21739130434784
    },
    {
      "timestep": 1515,
      "throughput": 27.521704023510694,
      "update": 16,
      "cumulative_wall_time": 69.56521739130436
    },
    {
      "timestep": 1616,
      "throughput": 25.106934077891534,
      "update": 17,
      "cumulative_wall_time": 73.91304347826087
    },
    {
      "timestep": 1717,
      "throughput": 20.90620469453683,
      "update": 18,
      "cumulative_wall_time": 78.26086956521739
    },
    {
      "timestep": 1818,
      "throughput": 22.74954011541453,
      "update": 19,
      "cumulative_wall_time": 82.6086956521739
    },
    {
      "timestep": 1919,
      "throughput": 19.3358381106547,
      "update": 20,
      "cumulative_wall_time": 86.95652173913042
    },
    {
      "timestep": 2020,
      "throughput": 22.246097928452556,
      "update": 21,
      "cumulative_wall_time": 91.30434782608694
    },
    {
      "timestep": 2121,
      "throughput": 25.883960771337662,
      "update": 22,
      "cumulative_wall_time": 95.65217391304346
    },
    {
      "timestep": 2222,
      "throughput": 27.24724423100182,
      "update": 23,
      "cumulative_wall_time": 99.99999999999997
    },
    {
      "timestep": 2323,
      "throughput": 24.579835431681772,
      "update": 24,
      "cumulative_wall_time": 104.34782608695649
    },
    {
      "timestep": 2424,
      "throughput": 17.56115751883826,
      "update": 25,
      "cumulative_wall_time": 108.695652173913
    },
    {
      "timestep": 2525,
      "throughput": 24.117277815585698,
      "update": 26,
      "cumulative_wall_time": 113.04347826086952
    },
    {
      "timestep": 2626,
      "throughput": 24.131799235174093,
      "update": 27,
      "cumulative_wall_time": 117.39130434782604
    },
    {
      "timestep": 2727,
      "throughput": 22.03103074887619,
      "update": 28,
      "cumulative_wall_time": 121.73913043478255
    },
    {
      "timestep": 2828,
      "throughput": 25.09031401713241,
      "update": 29,
      "cumulative_wall_time": 126.08695652173907
    },
    {
      "timestep": 2929,
      "throughput": 20.28624580814132,
      "update": 30,
      "cumulative_wall_time": 130.4347826086956
    },
    {
      "timestep": 3030,
      "throughput": 24.53484780067055,
      "update": 31,
      "cumulative_wall_time": 134.78260869565213
    },
    {
      "timestep": 3131,
      "throughput": 22.731238281809006,
      "update": 32,
      "cumulative_wall_time": 139.13043478260866
    },
    {
      "timestep": 3232,
      "throughput": 24.178573577014426,
      "update": 33,
      "cumulative_wall_time": 143.4782608695652
    },
    {
      "timestep": 3333,
      "throughput": 28.384194381681255,
      "update": 34,
      "cumulative_wall_time": 147.82608695652172
    },
    {
      "timestep": 3434,
      "throughput": 23.7951066481058,
      "update": 35,
      "cumulative_wall_time": 152.17391304347825
    },
    {
      "timestep": 3535,
      "throughput": 21.906779924904377,
      "update": 36,
      "cumulative_wall_time": 156.52173913043478
    },
    {
      "timestep": 3636,
      "throughput": 20.887267607588733,
      "update": 37,
      "cumulative_wall_time": 160.8695652173913
    },
    {
      "timestep": 3737,
      "throughput": 22.36929724305357,
      "update": 38,
      "cumulative_wall_time": 165.21739130434784
    },
    {
      "timestep": 3838,
      "throughput": 23.044074097243282,
      "update": 39,
      "cumulative_wall_time": 169.56521739130437
    },
    {
      "timestep": 3939,
      "throughput": 21.71956520184005,
      "update": 40,
      "cumulative_wall_time": 173.9130434782609
    },
    {
      "timestep": 4040,
      "throughput": 27.458361942088747,
      "update": 41,
      "cumulative_wall_time": 178.26086956521743
    },
    {
      "timestep": 4141,
      "throughput": 24.322895395858964,
      "update": 42,
      "cumulative_wall_time": 182.60869565217396
    },
    {
      "timestep": 4242,
      "throughput": 22.088681828112584,
      "update": 43,
      "cumulative_wall_time": 186.9565217391305
    },
    {
      "timestep": 4343,
      "throughput": 26.246268037896733,
      "update": 44,
      "cumulative_wall_time": 191.30434782608702
    },
    {
      "timestep": 4444,
      "throughput": 19.172137404671975,
      "update": 45,
      "cumulative_wall_time": 195.65217391304355
    },
    {
      "timestep": 4545,
      "throughput": 26.038466794879426,
      "update": 46,
      "cumulative_wall_time": 200.00000000000009
    },
    {
      "timestep": 4646,
      "throughput": 25.901604159622284,
      "update": 47,
      "cumulative_wall_time": 204.34782608695662
    },
    {
      "timestep": 4747,
      "throughput": 27.724152879155337,
      "update": 48,
      "cumulative_wall_time": 208.69565217391315
    },
    {
      "timestep": 4848,
      "throughput": 23.44603765879712,
      "update": 49,
      "cumulative_wall_time": 213.04347826086968
    },
    {
      "timestep": 4949,
      "throughput": 25.59289468347712,
      "update": 50,
      "cumulative_wall_time": 217.3913043478262
    },
    {
      "timestep": 5050,
      "throughput": 24.0847251380033,
      "update": 51,
      "cumulative_wall_time": 221.73913043478274
    },
    {
      "timestep": 5151,
      "throughput": 24.425656262567784,
      "update": 52,
      "cumulative_wall_time": 226.08695652173927
    },
    {
      "timestep": 5252,
      "throughput": 20.70570108828726,
      "update": 53,
      "cumulative_wall_time": 230.4347826086958
    },
    {
      "timestep": 5353,
      "throughput": 26.461782378609836,
      "update": 54,
      "cumulative_wall_time": 234.78260869565233
    },
    {
      "timestep": 5454,
      "throughput": 23.78454093571144,
      "update": 55,
      "cumulative_wall_time": 239.13043478260886
    },
    {
      "timestep": 5555,
      "throughput": 20.105165678167957,
      "update": 56,
      "cumulative_wall_time": 243.4782608695654
    },
    {
      "timestep": 5656,
      "throughput": 22.760238867761473,
      "update": 57,
      "cumulative_wall_time": 247.82608695652192
    },
    {
      "timestep": 5757,
      "throughput": 18.66155853569049,
      "update": 58,
      "cumulative_wall_time": 252.17391304347845
    },
    {
      "timestep": 5858,
      "throughput": 18.9610836207944,
      "update": 59,
      "cumulative_wall_time": 256.521739130435
    },
    {
      "timestep": 5959,
      "throughput": 20.8189748108968,
      "update": 60,
      "cumulative_wall_time": 260.8695652173915
    },
    {
      "timestep": 6060,
      "throughput": 24.667016556209315,
      "update": 61,
      "cumulative_wall_time": 265.217391304348
    },
    {
      "timestep": 6161,
      "throughput": 25.984920514969275,
      "update": 62,
      "cumulative_wall_time": 269.5652173913045
    },
    {
      "timestep": 6262,
      "throughput": 20.99855812835504,
      "update": 63,
      "cumulative_wall_time": 273.913043478261
    },
    {
      "timestep": 6363,
      "throughput": 22.167588319595318,
      "update": 64,
      "cumulative_wall_time": 278.2608695652175
    },
    {
      "timestep": 6464,
      "throughput": 23.440754197439684,
      "update": 65,
      "cumulative_wall_time": 282.608695652174
    },
    {
      "timestep": 6565,
      "throughput": 22.84727336237903,
      "update": 66,
      "cumulative_wall_time": 286.9565217391305
    },
    {
      "timestep": 6666,
      "throughput": 23.451181304103926,
      "update": 67,
      "cumulative_wall_time": 291.304347826087
    },
    {
      "timestep": 6767,
      "throughput": 20.205372131979367,
      "update": 68,
      "cumulative_wall_time": 295.6521739130435
    },
    {
      "timestep": 6868,
      "throughput": 24.259750521002267,
      "update": 69,
      "cumulative_wall_time": 300.0
    },
    {
      "timestep": 6969,
      "throughput": 22.52007165014352,
      "update": 70,
      "cumulative_wall_time": 304.3478260869565
    },
    {
      "timestep": 7070,
      "throughput": 21.950519564950635,
      "update": 71,
      "cumulative_wall_time": 308.695652173913
    },
    {
      "timestep": 7171,
      "throughput": 24.453872877094234,
      "update": 72,
      "cumulative_wall_time": 313.0434782608695
    },
    {
      "timestep": 7272,
      "throughput": 23.59518750622941,
      "update": 73,
      "cumulative_wall_time": 317.391304347826
    },
    {
      "timestep": 7373,
      "throughput": 24.057798443779856,
      "update": 74,
      "cumulative_wall_time": 321.7391304347825
    },
    {
      "timestep": 7474,
      "throughput": 22.58240183557065,
      "update": 75,
      "cumulative_wall_time": 326.086956521739
    },
    {
      "timestep": 7575,
      "throughput": 26.398128023631948,
      "update": 76,
      "cumulative_wall_time": 330.4347826086955
    },
    {
      "timestep": 7676,
      "throughput": 22.244426384983534,
      "update": 77,
      "cumulative_wall_time": 334.782608695652
    },
    {
      "timestep": 7777,
      "throughput": 26.172710390071547,
      "update": 78,
      "cumulative_wall_time": 339.1304347826085
    },
    {
      "timestep": 7878,
      "throughput": 22.297408131067282,
      "update": 79,
      "cumulative_wall_time": 343.478260869565
    },
    {
      "timestep": 7979,
      "throughput": 24.56104394320589,
      "update": 80,
      "cumulative_wall_time": 347.8260869565215
    },
    {
      "timestep": 8080,
      "throughput": 20.64901335259212,
      "update": 81,
      "cumulative_wall_time": 352.173913043478
    },
    {
      "timestep": 8181,
      "throughput": 18.697122360518755,
      "update": 82,
      "cumulative_wall_time": 356.5217391304345
    },
    {
      "timestep": 8282,
      "throughput": 25.213560032738716,
      "update": 83,
      "cumulative_wall_time": 360.869565217391
    },
    {
      "timestep": 8383,
      "throughput": 22.031105801936356,
      "update": 84,
      "cumulative_wall_time": 365.21739130434753
    },
    {
      "timestep": 8484,
      "throughput": 24.85528839386507,
      "update": 85,
      "cumulative_wall_time": 369.56521739130403
    },
    {
      "timestep": 8585,
      "throughput": 26.17523188873479,
      "update": 86,
      "cumulative_wall_time": 373.91304347826053
    },
    {
      "timestep": 8686,
      "throughput": 21.279251535255003,
      "update": 87,
      "cumulative_wall_time": 378.26086956521704
    },
    {
      "timestep": 8787,
      "throughput": 21.599930615555653,
      "update": 88,
      "cumulative_wall_time": 382.60869565217354
    },
    {
      "timestep": 8888,
      "throughput": 23.317681217112206,
      "update": 89,
      "cumulative_wall_time": 386.95652173913004
    },
    {
      "timestep": 8989,
      "throughput": 22.439251147580958,
      "update": 90,
      "cumulative_wall_time": 391.30434782608654
    },
    {
      "timestep": 9090,
      "throughput": 23.2479146619121,
      "update": 91,
      "cumulative_wall_time": 395.65217391304304
    },
    {
      "timestep": 9191,
      "throughput": 25.12386078518519,
      "update": 92,
      "cumulative_wall_time": 399.99999999999955
    },
    {
      "timestep": 9292,
      "throughput": 20.7910688883482,
      "update": 93,
      "cumulative_wall_time": 404.34782608695605
    },
    {
      "timestep": 9393,
      "throughput": 22.767959281652008,
      "update": 94,
      "cumulative_wall_time": 408.69565217391255
    },
    {
      "timestep": 9494,
      "throughput": 25.863543026972486,
      "update": 95,
      "cumulative_wall_time": 413.04347826086905
    },
    {
      "timestep": 9595,
      "throughput": 25.122620402807343,
      "update": 96,
      "cumulative_wall_time": 417.39130434782555
    },
    {
      "timestep": 9696,
      "throughput": 25.198713138887122,
      "update": 97,
      "cumulative_wall_time": 421.73913043478206
    },
    {
      "timestep": 9797,
      "throughput": 21.521085011457924,
      "update": 98,
      "cumulative_wall_time": 426.08695652173856
    },
    {
      "timestep": 9898,
      "throughput": 23.35311221018656,
      "update": 99,
      "cumulative_wall_time": 430.43478260869506
    },
    {
      "timestep": 10000,
      "throughput": 24.276501827341328,
      "update": 100,
      "cumulative_wall_time": 434.78260869565156
    }
  ],
  "scheduler_stats": {
    "total_experiences": 10000,
    "total_updates": 500,
    "policy_version": 500,
    "buffer_size": 1024,
    "curriculum": {
      "level_1": {
        "num_pulls": 1200,
        "success_rate": 0.85,
        "mean_reward": 0.774535753066723,
        "recent_gradient": 0.00880228815501225
      },
      "level_2": {
        "num_pulls": 2800,
        "success_rate": 0.65,
        "mean_reward": 0.6076855357527491,
        "recent_gradient": 0.021498278466352168
      },
      "level_3": {
        "num_pulls": 3500,
        "success_rate": 0.45,
        "mean_reward": 0.3831754599108145,
        "recent_gradient": 0.03149706388174175
      },
      "level_4": {
        "num_pulls": 1800,
        "success_rate": 0.28,
        "mean_reward": 0.28015326432172166,
        "recent_gradient": 0.019275276932362185
      },
      "level_5": {
        "num_pulls": 700,
        "success_rate": 0.15,
        "mean_reward": 0.13334041455555007,
        "recent_gradient": 0.012821048819579189
      },
      "total_steps": 10000
    },
    "staleness": {
      "discard_rate": 0.05
    },
    "workers": {
      "0": {
        "completed_tasks": 2500,
        "avg_throughput": 4.269411344381984
      },
      "1": {
        "completed_tasks": 2500,
        "avg_throughput": 4.280264511263108
      },
      "2": {
        "completed_tasks": 2500,
        "avg_throughput": 5.37398672115195
      },
      "3": {
        "completed_tasks": 2500,
        "avg_throughput": 4.826192872277722
      }
    }
  },
  "config": {
    "use_async": true,
    "curriculum_strategy": "adaptive",
    "use_csc": true,
    "use_eaas": true
  }
}