a1->g3
a2->g2
a3->g1

a1 a2 a3 g3 g2 g1

landmark_poses = np.array([[0.9, -0.45],
                   	   [0.55, -0.275],
                           [0.2, -0.1]])

agent_poses = np.array([[-0.9, 0.45],
                        [-0.55, 0.275],
                        [-0.2, 0.1]])
  
EPISODES = 300
STEPS = 100


/home/yu/anaconda3/envs/marl-minigrid/bin/python /home/yu/Music/MARL-ARL/current/simple-gridworld/evaluate_mpe_1a.py
frames: 4756000
step  0 :  [-1.705658824203744]
step  1 :  [-1.6736890423517279]
step  2 :  [-1.6376685077924502]
step  3 :  [-1.6048119594065968]
step  4 :  [-1.5379595029300066]
step  5 :  [-1.4418187912537044]
step  6 :  [-1.3218827497790397]
step  7 :  [-1.1831899583848815]
step  8 :  [-1.029979007645538]
step  9 :  [-0.8656861274327621]
step  10 :  [-0.7173694137845867]
step  11 :  [-0.5623097663199158]
step  12 :  [-0.40609068552492095]
step  13 :  [-0.278025859987007]
step  14 :  [-0.16199071991112268]
step  15 :  [-0.09643206982601842]
step  16 :  [-0.09234282181608525]
step  17 :  [-0.05776949047661396]
step  18 :  [-0.018980830988413456]
step  19 :  [-0.05117150907338788]
step  20 :  [-0.07562535989614501]
step  21 :  [-0.06766587809478884]
step  22 :  [-0.031767028844665306]
step  23 :  [-0.05589416179782239]
step  24 :  [-0.05709188749853961]
episode  0 : steps 25 , return [-16.73]
step  0 :  [-1.8335499934765302]
step  1 :  [-1.7968805759274435]
step  2 :  [-1.75395265909367]
step  3 :  [-1.7119030422179657]
step  4 :  [-1.6769416446616299]
step  5 :  [-1.6098289157053391]
step  6 :  [-1.5142840494996601]
step  7 :  [-1.39533011264301]
step  8 :  [-1.2578019599937693]
step  9 :  [-1.1058796972822287]
step  10 :  [-0.9430383975590495]
step  11 :  [-0.772186623952747]
step  12 :  [-0.5959792618385279]
step  13 :  [-0.4176620095677338]
step  14 :  [-0.2729237581151059]
step  15 :  [-0.11642597192419661]
step  16 :  [-0.06566184558977896]
step  17 :  [-0.09895454787717398]
step  18 :  [-0.10816090999005307]
step  19 :  [-0.06873494566918449]
step  20 :  [-0.019559034622071925]
step  21 :  [-0.03266305509730449]
step  22 :  [-0.03159783052109365]
step  23 :  [-0.05225004990224389]
step  24 :  [-0.056581803828605275]
episode  1 : steps 25 , return [-19.31]
step  0 :  [-1.6117365862710817]
step  1 :  [-1.5673278962927855]
step  2 :  [-1.5144128572230062]
step  3 :  [-1.4612072598305226]
step  4 :  [-1.4151361351599558]
step  5 :  [-1.3414002536274876]
step  6 :  [-1.241658078448397]
step  7 :  [-1.1198666309730454]
step  8 :  [-0.9802805982297476]
step  9 :  [-0.8267452799375805]
step  10 :  [-0.6978790450454071]
step  11 :  [-0.565811730451258]
step  12 :  [-0.43830697139925023]
step  13 :  [-0.33356986564561236]
step  14 :  [-0.22798723344074506]
step  15 :  [-0.1255005016653286]
step  16 :  [-0.08622856291838898]
step  17 :  [-0.027395605787399423]
step  18 :  [-0.04697550108984183]
step  19 :  [-0.0133929092294561]
step  20 :  [-0.03781766245934931]
step  21 :  [-0.006661418126896976]
step  22 :  [-0.03313852894199402]
step  23 :  [-0.005232434079780379]
step  24 :  [-0.03073365611553041]
episode  2 : steps 25 , return [-15.76]
step  0 :  [-1.701389727652194]
step  1 :  [-1.6728773427442973]
step  2 :  [-1.6416066524742323]
step  3 :  [-1.574081794303564]
step  4 :  [-1.476424566223184]
step  5 :  [-1.354755903958633]
step  6 :  [-1.2143793530032376]
step  7 :  [-1.0596270267358132]
step  8 :  [-0.8939427625328155]
step  9 :  [-0.7818724521821724]
step  10 :  [-0.6492237295390434]
step  11 :  [-0.5398310613641194]
step  12 :  [-0.46587217505336675]
step  13 :  [-0.39119279974438925]
step  14 :  [-0.3061882377733083]
step  15 :  [-0.21206484545833915]
step  16 :  [-0.10097150523053382]
step  17 :  [-0.02823456875310827]
step  18 :  [-0.02730525401423218]
step  19 :  [-0.020272939489678746]
step  20 :  [-0.021448208452873527]
step  21 :  [-0.024433346555847422]
step  22 :  [-0.007636664454146142]
step  23 :  [-0.044939331239195815]
step  24 :  [-0.023951936753969845]
episode  3 : steps 25 , return [-16.23]
step  0 :  [-1.5285895798381524]
step  1 :  [-1.4958534341792644]
step  2 :  [-1.459531096792998]
step  3 :  [-1.4275157414766997]
step  4 :  [-1.3621052823431596]
step  5 :  [-1.267528276046181]
step  6 :  [-1.1491489442240213]
step  7 :  [-1.0120258378343285]
step  8 :  [-0.8605128739032666]
step  9 :  [-0.7079200044365987]
step  10 :  [-0.5475602065727379]
step  11 :  [-0.3850278198589578]
step  12 :  [-0.2507080787836407]
step  13 :  [-0.132881157189236]
step  14 :  [-0.06004483478055275]
step  15 :  [-0.03241590180836354]
step  16 :  [-0.04749414495563862]
step  17 :  [-0.028000386289012896]
step  18 :  [-0.05962866913326384]
step  19 :  [-0.0362725410791701]
step  20 :  [-0.04878237148594989]
step  21 :  [-0.035309474082199796]
step  22 :  [-0.052974149952463676]
step  23 :  [-0.03339540735549007]
step  24 :  [-0.03475447537639486]
episode  4 : steps 25 , return [-14.06]
step  0 :  [-1.7946170497852447]
step  1 :  [-1.7590795083342294]
step  2 :  [-1.7178371016664957]
step  3 :  [-1.6780667047221636]
step  4 :  [-1.6060286324483177]
step  5 :  [-1.50595598322669]
step  6 :  [-1.3829815567022448]
step  7 :  [-1.2418799613279556]
step  8 :  [-1.0866892566872965]
step  9 :  [-0.9206754113438529]
step  10 :  [-0.7798586498860294]
step  11 :  [-0.6281952676901983]
step  12 :  [-0.5009489350604686]
step  13 :  [-0.41329110997989327]
step  14 :  [-0.3285361625062201]
step  15 :  [-0.23271721473824114]
step  16 :  [-0.1298355801213804]
step  17 :  [-0.028085643878842884]
step  18 :  [-0.07019856838193882]
step  19 :  [-0.06268837966052287]
step  20 :  [-0.012065762432857046]
step  21 :  [-0.022666500713991514]
step  22 :  [-0.03398551178067347]
step  23 :  [-0.025945645442836122]
step  24 :  [-0.026943986401408014]
episode  5 : steps 25 , return [-17.99]
step  0 :  [-1.7721841556106808]
step  1 :  [-1.7347022424091787]
step  2 :  [-1.6908528227965542]
step  3 :  [-1.6479902513159306]
step  4 :  [-1.6125518753283783]
step  5 :  [-1.5454154587387732]
step  6 :  [-1.4500396005288123]
step  7 :  [-1.3313435459385723]
step  8 :  [-1.1941294463370093]
step  9 :  [-1.0425849443687298]
step  10 :  [-0.8802313124715527]
step  11 :  [-0.7100942531558991]
step  12 :  [-0.5351463185482337]
step  13 :  [-0.3597569169356086]
step  14 :  [-0.21530261622381638]
step  15 :  [-0.06676695082270975]
step  16 :  [-0.03168918040849723]
step  17 :  [-0.02007922226043192]
step  18 :  [-0.03250505667962933]
step  19 :  [-0.02523324890561434]
step  20 :  [-0.029377600653548948]
step  21 :  [-0.01013934106653549]
step  22 :  [-0.04570677560152731]
step  23 :  [-0.023524016881272983]
step  24 :  [-0.057831416144785604]
episode  6 : steps 25 , return [-18.07]
step  0 :  [-1.4650115065857179]
step  1 :  [-1.4244632622161348]
step  2 :  [-1.3775918144779549]
step  3 :  [-1.3330277327868962]
step  4 :  [-1.259139813937631]
step  5 :  [-1.1585123881513262]
step  6 :  [-1.0355420030461275]
step  7 :  [-0.894665461749131]
step  8 :  [-0.7997590644559619]
step  9 :  [-0.6854308377782794]
step  10 :  [-0.5816587093524672]
step  11 :  [-0.49315154352815205]
step  12 :  [-0.42269189313700406]
step  13 :  [-0.34181140927911846]
step  14 :  [-0.2417844610142302]
step  15 :  [-0.12366739103541316]
step  16 :  [-0.029932836041604686]
step  17 :  [-0.05153657300555992]
step  18 :  [-0.05699922765443859]
step  19 :  [-0.030947697374891364]
step  20 :  [-0.03646760283755113]
step  21 :  [-0.029318865476013294]
step  22 :  [-0.027065776371895733]
step  23 :  [-0.032795919535405144]
step  24 :  [-0.053978082340708756]
episode  7 : steps 25 , return [-13.99]
step  0 :  [-1.561533800794617]
step  1 :  [-1.5197712799785934]
step  2 :  [-1.4707636075924515]
step  3 :  [-1.4227963362668745]
step  4 :  [-1.383334975654441]
step  5 :  [-1.3146386803464067]
step  6 :  [-1.2188720282961567]
step  7 :  [-1.100397158451235]
step  8 :  [-0.9638098197072666]
step  9 :  [-0.8133080417395827]
step  10 :  [-0.6554173074914288]
step  11 :  [-0.4926946365895093]
step  12 :  [-0.3328892608119536]
step  13 :  [-0.20068052164060807]
step  14 :  [-0.07490643573268767]
step  15 :  [-0.03612097697292655]
step  16 :  [-0.01543053563084042]
step  17 :  [-0.04778273375983244]
step  18 :  [-0.03257054567321952]
step  19 :  [-0.0706850565212118]
step  20 :  [-0.05234698475915791]
step  21 :  [-0.036358654988263905]
step  22 :  [-0.01807548664029346]
step  23 :  [-0.04377912706742621]
step  24 :  [-0.02159273515410194]
episode  8 : steps 25 , return [-14.9]
step  0 :  [-1.7492501758189423]
step  1 :  [-1.7099030188764428]
step  2 :  [-1.6635497794495278]
step  3 :  [-1.6177145858226674]
step  4 :  [-1.5790259918472682]
step  5 :  [-1.5096920490454864]
step  6 :  [-1.4127386930077221]
step  7 :  [-1.2928324722824058]
step  8 :  [-1.1546155264416589]
step  9 :  [-1.0021588959842325]
step  10 :  [-0.8388772713385888]
step  11 :  [-0.6766571938924911]
step  12 :  [-0.5100718411090496]
step  13 :  [-0.3456327586629478]
step  14 :  [-0.21020484344843005]
step  15 :  [-0.0848681581503889]
step  16 :  [-0.03097357310034173]
step  17 :  [-0.027660984804623312]
step  18 :  [-0.029496719402074177]
step  19 :  [-0.02366209800249547]
step  20 :  [-0.0706583465758784]
step  21 :  [-0.06001122612583756]
step  22 :  [-0.002509586914788289]
step  23 :  [-0.010001024027662942]
step  24 :  [-0.03644270870153542]
episode  9 : steps 25 , return [-17.65]
step  0 :  [-1.4956808508214543]
step  1 :  [-1.4503577892574107]
step  2 :  [-1.3966324818924678]
step  3 :  [-1.343213666359065]
step  4 :  [-1.2980950916743457]
step  5 :  [-1.225873428928126]
step  6 :  [-1.1277481349604634]
step  7 :  [-1.007562454997737]
step  8 :  [-0.8696136611755072]
step  9 :  [-0.7538973763925931]
step  10 :  [-0.624801310791833]
step  11 :  [-0.4885164330844478]
step  12 :  [-0.356475588679647]
step  13 :  [-0.24570180060236088]
step  14 :  [-0.13353094136142618]
step  15 :  [-0.010391000592094758]
step  16 :  [-0.05162107250167953]
step  17 :  [-0.05269051856201355]
step  18 :  [-0.0593195982760379]
step  19 :  [-0.02712749766567422]
step  20 :  [-0.03470896994145281]
step  21 :  [-0.044306892038465814]
step  22 :  [-0.0659265826725342]
step  23 :  [-0.08037020914479691]
step  24 :  [-0.061292917798760276]
episode  10 : steps 25 , return [-14.31]
step  0 :  [-1.5140322544341291]
step  1 :  [-1.4692764053326166]
step  2 :  [-1.4162703356702775]
step  3 :  [-1.3636227416523767]
step  4 :  [-1.3192043387729346]
step  5 :  [-1.2473346616449767]
step  6 :  [-1.1493870477341759]
step  7 :  [-1.0292858137726395]
step  8 :  [-0.8913638018360319]
step  9 :  [-0.7663370405696386]
step  10 :  [-0.6301434246857286]
step  11 :  [-0.488588476332889]
step  12 :  [-0.35267902550884916]
step  13 :  [-0.240328598973045]
step  14 :  [-0.1279729118194745]
step  15 :  [-0.07420456560021378]
step  16 :  [-0.02652586887710202]
step  17 :  [-0.02053480143114911]
step  18 :  [-0.025927606788304074]
step  19 :  [-0.020005820203839703]
step  20 :  [-0.025596610820469105]
step  21 :  [-0.05198153704689213]
step  22 :  [-0.0599525516613832]
step  23 :  [-0.021527126181926964]
step  24 :  [-0.04016039389479281]
episode  11 : steps 25 , return [-14.37]
step  0 :  [-1.3742222085485132]
step  1 :  [-1.3441670726279669]
step  2 :  [-1.276900215789149]
step  3 :  [-1.216078709635895]
step  4 :  [-1.1253322565557242]
step  5 :  [-1.00976911301441]
step  6 :  [-0.8744301973073364]
step  7 :  [-0.8032871654656193]
step  8 :  [-0.7156862992099752]
step  9 :  [-0.6268154023657947]
step  10 :  [-0.5402710987451913]
step  11 :  [-0.4664336004910315]
step  12 :  [-0.3827816594915782]
step  13 :  [-0.2916019647954521]
step  14 :  [-0.18918157483261214]
step  15 :  [-0.07072410390091155]
step  16 :  [-0.02117970533431555]
step  17 :  [-0.028265461341155134]
step  18 :  [-0.03482445141017853]
step  19 :  [-0.03068599707058212]
step  20 :  [-0.05897281942381811]
step  21 :  [-0.05685895559340737]
step  22 :  [-0.043593648998188544]
step  23 :  [-0.0503474100604659]
step  24 :  [-0.056742677276698385]
episode  12 : steps 25 , return [-12.69]
step  0 :  [-1.7566997769594985]
step  1 :  [-1.7285199152407833]
step  2 :  [-1.6974940204164288]
step  3 :  [-1.6299960409678873]
step  4 :  [-1.5322907347387202]
step  5 :  [-1.4105582452547851]
step  6 :  [-1.3144170716402128]
step  7 :  [-1.1953991437103908]
step  8 :  [-1.0580833585021148]
step  9 :  [-0.9065666861390062]
step  10 :  [-0.7444104448346803]
step  11 :  [-0.5766328794806219]
step  12 :  [-0.40696104598594046]
step  13 :  [-0.2689455165895171]
step  14 :  [-0.12152690279850015]
step  15 :  [-0.01095665009375285]
step  16 :  [-0.0705290732517776]
step  17 :  [-0.08318568186615001]
step  18 :  [-0.053077905416056614]
step  19 :  [-0.030183208228111776]
step  20 :  [-0.016219821998959574]
step  21 :  [-0.04036108673871718]
step  22 :  [-0.018016989642854885]
step  23 :  [-0.05041417754949981]
step  24 :  [-0.02540407357602432]
episode  13 : steps 25 , return [-16.75]
step  0 :  [-1.656712092970531]
step  1 :  [-1.6163941564302549]
step  2 :  [-1.5690233334547683]
step  3 :  [-1.522468455627861]
step  4 :  [-1.483730172879167]
step  5 :  [-1.4149058713014446]
step  6 :  [-1.318655009779446]
step  7 :  [-1.199520616603381]
step  8 :  [-1.0621302263235282]
step  9 :  [-0.9106085369505762]
step  10 :  [-0.7485095261434053]
step  11 :  [-0.5797569261078694]
step  12 :  [-0.40808854622025437]
step  13 :  [-0.24315279844712484]
step  14 :  [-0.11141921278518484]
step  15 :  [-0.06011866463914624]
step  16 :  [-0.029833677510412316]
step  17 :  [-0.05963123661933123]
step  18 :  [-0.036438141167749266]
step  19 :  [-0.06375591888343059]
step  20 :  [-0.040380563730145196]
step  21 :  [-0.028692432316904187]
step  22 :  [-0.06159953494653153]
step  23 :  [-0.06125363381020143]
step  24 :  [-0.10765854109247144]
episode  14 : steps 25 , return [-16.39]
step  0 :  [-1.5760287062515224]
step  1 :  [-1.5311188075440116]
step  2 :  [-1.4776389166276065]
step  3 :  [-1.4239571661108967]
step  4 :  [-1.3776757213784212]
step  5 :  [-1.3040328987192307]
step  6 :  [-1.2044977005506556]
step  7 :  [-1.0829557945385173]
step  8 :  [-0.9436437645333531]
step  9 :  [-0.7923016307217827]
step  10 :  [-0.6376057111057198]
step  11 :  [-0.49080617788913616]
step  12 :  [-0.37699882059422174]
step  13 :  [-0.26349478351088473]
step  14 :  [-0.16188268300589326]
step  15 :  [-0.0622476059554705]
step  16 :  [-0.023872275294175363]
step  17 :  [-0.03274650658299389]
step  18 :  [-0.06540926904993652]
step  19 :  [-0.06056682920753899]
step  20 :  [-0.03277947252254888]
step  21 :  [-0.0298062140082994]
step  22 :  [-0.0330597092265635]
step  23 :  [-0.018676327501577574]
step  24 :  [-0.036410725480259656]
episode  15 : steps 25 , return [-15.04]
step  0 :  [-1.494997251544106]
step  1 :  [-1.4640666369040976]
step  2 :  [-1.430396034983655]
step  3 :  [-1.3618537653962983]
step  4 :  [-1.2637904691452209]
step  5 :  [-1.1419850046776352]
step  6 :  [-1.001581874776939]
step  7 :  [-0.8468361419624207]
step  8 :  [-0.7895070006258809]
step  9 :  [-0.6998936501613633]
step  10 :  [-0.6149564264596524]
step  11 :  [-0.5364979748525838]
step  12 :  [-0.4705791749251332]
step  13 :  [-0.39252913888309027]
step  14 :  [-0.309961697537118]
step  15 :  [-0.21437208267490768]
step  16 :  [-0.1028371011786865]
step  17 :  [-0.027270657861749495]
step  18 :  [-0.021538292856790084]
step  19 :  [-0.040098551957906035]
step  20 :  [-0.025313544763755833]
step  21 :  [-0.06309041597594466]
step  22 :  [-0.04244248195166344]
step  23 :  [-0.07688824118487626]
step  24 :  [-0.052819812248122364]
episode  16 : steps 25 , return [-14.49]
step  0 :  [-1.7055157498867595]
step  1 :  [-1.6682455267306118]
step  2 :  [-1.6249221312886792]
step  3 :  [-1.5830896990394177]
step  4 :  [-1.5099629359369673]
step  5 :  [-1.4092947143441665]
step  6 :  [-1.2859856327273749]
step  7 :  [-1.144693588168719]
step  8 :  [-0.9893964512104495]
step  9 :  [-0.8233301402998712]
step  10 :  [-0.7795827973893718]
step  11 :  [-0.7006776227588916]
step  12 :  [-0.6189026270543425]
step  13 :  [-0.5373197860391132]
step  14 :  [-0.46693504978678907]
step  15 :  [-0.38591688609029234]
step  16 :  [-0.2950025931239743]
step  17 :  [-0.1922830331149671]
step  18 :  [-0.07290442927172072]
step  19 :  [-0.0419026415975092]
step  20 :  [-0.05228994953891794]
step  21 :  [-0.02438879220852786]
step  22 :  [-0.05640928582361346]
step  23 :  [-0.034267286510378726]
step  24 :  [-0.0272165700795422]
episode  17 : steps 25 , return [-18.03]
step  0 :  [-1.6336241967700749]
step  1 :  [-1.591968072110414]
step  2 :  [-1.542820154962551]
step  3 :  [-1.4941950286488002]
step  4 :  [-1.4532647785394937]
step  5 :  [-1.3830254853242894]
step  6 :  [-1.2857980538626068]
step  7 :  [-1.1659375660700455]
step  8 :  [-1.0279587482482118]
step  9 :  [-0.8759089169731193]
step  10 :  [-0.7269394225107978]
step  11 :  [-0.5694025475837767]
step  12 :  [-0.40852991473011524]
step  13 :  [-0.2761641750470304]
step  14 :  [-0.16155284394448366]
step  15 :  [-0.08940840434789388]
step  16 :  [-0.08383189570455947]
step  17 :  [-0.03356099279252547]
step  18 :  [-0.041020723391198256]
step  19 :  [-0.017061657067909762]
step  20 :  [-0.019472873770412454]
step  21 :  [-0.02791547721129316]
step  22 :  [-0.013595700402492458]
step  23 :  [-0.02029872235435072]
step  24 :  [-0.031000115133714534]
episode  18 : steps 25 , return [-15.97]
step  0 :  [-1.443742437062619]
step  1 :  [-1.4166535818280437]
step  2 :  [-1.388525476734104]
step  3 :  [-1.3239871446131446]
step  4 :  [-1.2288685265884294]
step  5 :  [-1.1092715297555686]
step  6 :  [-0.9705575879975414]
step  7 :  [-0.8171318959460377]
step  8 :  [-0.6846876135444472]
step  9 :  [-0.5522004411526228]
step  10 :  [-0.4278665315553087]
step  11 :  [-0.32736666953368265]
step  12 :  [-0.22490011020110082]
step  13 :  [-0.13538075391042267]
step  14 :  [-0.08488612963579319]
step  15 :  [-0.08365125744495727]
step  16 :  [-0.06943813204790138]
step  17 :  [-0.04002197454309048]
step  18 :  [-0.02334365299618768]
step  19 :  [-0.04008255060540108]
step  20 :  [-0.08283044457163735]
step  21 :  [-0.08034512488901098]
step  22 :  [-0.07073183694402063]
step  23 :  [-0.058904394853842156]
step  24 :  [-0.033170277598998064]
episode  19 : steps 25 , return [-12.72]
step  0 :  [-1.582127509124514]
step  1 :  [-1.5530834456880576]
step  2 :  [-1.521586738177252]
step  3 :  [-1.4542443303946946]
step  4 :  [-1.3568762473329303]
step  5 :  [-1.2354862427540105]
step  6 :  [-1.0953311416706557]
step  7 :  [-0.940721238525147]
step  8 :  [-0.789246497813972]
step  9 :  [-0.6294958693362426]
step  10 :  [-0.4996755539075119]
step  11 :  [-0.413028800419498]
step  12 :  [-0.33010889291897183]
step  13 :  [-0.23474772644247613]
step  14 :  [-0.13963116530720635]
step  15 :  [-0.05454375026903729]
step  16 :  [-0.0429305281324294]
step  17 :  [-0.048220344595782595]
step  18 :  [-0.015144185561959022]
step  19 :  [-0.021576274303515143]
step  20 :  [-0.025241112366769774]
step  21 :  [-0.0126262546127582]
step  22 :  [-0.041201347055720004]
step  23 :  [-0.03833695124903737]
step  24 :  [-0.05030384817774513]
episode  20 : steps 25 , return [-14.13]
step  0 :  [-1.6080638560571079]
step  1 :  [-1.573964936609754]
step  2 :  [-1.5354061361933233]
step  3 :  [-1.5000686724400956]
step  4 :  [-1.4318946084874775]
step  5 :  [-1.3350179241453346]
step  6 :  [-1.2146571714601386]
step  7 :  [-1.075714443101309]
step  8 :  [-0.9223604037664573]
step  9 :  [-0.7687725294823405]
step  10 :  [-0.6110462010043918]
step  11 :  [-0.4568486799588]
step  12 :  [-0.334578739813681]
step  13 :  [-0.2227768767662178]
step  14 :  [-0.09534361689631303]
step  15 :  [-0.029194619996559153]
step  16 :  [-0.09212318261202211]
step  17 :  [-0.09446639510027423]
step  18 :  [-0.0778697843775342]
step  19 :  [-0.07706701571702013]
step  20 :  [-0.04712518637232826]
step  21 :  [-0.018139439135520952]
step  22 :  [-0.017856418719112265]
step  23 :  [-0.024301028336762974]
step  24 :  [-0.034140255265285406]
episode  21 : steps 25 , return [-15.2]
step  0 :  [-1.6114471222422644]
step  1 :  [-1.5819628836678343]
step  2 :  [-1.5497333446228492]
step  3 :  [-1.4818044362161782]
step  4 :  [-1.3839880161841243]
step  5 :  [-1.2622673104399458]
step  6 :  [-1.1218818427979091]
step  7 :  [-0.9671328647065935]
step  8 :  [-0.8014496025882292]
step  9 :  [-0.7806117888248761]
step  10 :  [-0.7174806909762673]
step  11 :  [-0.6488413184568361]
step  12 :  [-0.5760678340761857]
step  13 :  [-0.5115120823362258]
step  14 :  [-0.4364881456695856]
step  15 :  [-0.3520908518317799]
step  16 :  [-0.24955083053538527]
step  17 :  [-0.1296319254957735]
step  18 :  [-0.03210143687939345]
step  19 :  [-0.04823953287835991]
step  20 :  [-0.05491942392893483]
step  21 :  [-0.028376143639453486]
step  22 :  [-0.03499126383903027]
step  23 :  [-0.027116456763156563]
step  24 :  [-0.0471975941302649]
episode  22 : steps 25 , return [-16.44]
step  0 :  [-1.4787413554562223]
step  1 :  [-1.4369575806509305]
step  2 :  [-1.3882885929061144]
step  3 :  [-1.341364479551945]
step  4 :  [-1.2657787013964161]
step  5 :  [-1.16391512640615]
step  6 :  [-1.0400326679067162]
step  7 :  [-0.8984773558998929]
step  8 :  [-0.8022194329651109]
step  9 :  [-0.832624068883783]
step  10 :  [-0.9138777817132154]
step  11 :  [-0.9400433564390649]
step  12 :  [-0.9118671409133259]
step  13 :  [-0.8426085206991448]
step  14 :  [-0.74287604156495]
step  15 :  [-0.6213347717700567]
step  16 :  [-0.4859392904689564]
step  17 :  [-0.3469791063084388]
step  18 :  [-0.22459419576045866]
step  19 :  [-0.1163002132099985]
step  20 :  [-0.081599698187039]
step  21 :  [-0.10276570704410694]
step  22 :  [-0.0940599579369084]
step  23 :  [-0.06568477891909824]
step  24 :  [-0.03050490314841929]
episode  23 : steps 25 , return [-18.17]
step  0 :  [-1.7348281041542468]
step  1 :  [-1.7032594009392137]
step  2 :  [-1.6676799426316051]
step  3 :  [-1.6351880825616596]
step  4 :  [-1.5684742872632123]
step  5 :  [-1.4723695003193862]
step  6 :  [-1.352420614237406]
step  7 :  [-1.2136894007040837]
step  8 :  [-1.0604222938967875]
step  9 :  [-0.896052889833492]
step  10 :  [-0.7385732056203754]
step  11 :  [-0.5766806104120553]
step  12 :  [-0.4154142591377188]
step  13 :  [-0.28511107761437066]
step  14 :  [-0.16855508411402936]
step  15 :  [-0.08500537042271687]
step  16 :  [-0.03510648249454441]
step  17 :  [-0.023718562656755954]
step  18 :  [-0.044594924829671104]
step  19 :  [-0.023910035597663307]
step  20 :  [-0.02690127076463666]
step  21 :  [-0.03899958496920965]
step  22 :  [-0.028810145483583266]
step  23 :  [-0.03706518579728464]
step  24 :  [-0.023314748732130346]
episode  24 : steps 25 , return [-16.86]
step  0 :  [-1.6565626554059232]
step  1 :  [-1.6227799910493663]
step  2 :  [-1.5844579051309788]
step  3 :  [-1.5490889306773645]
step  4 :  [-1.4806712718971125]
step  5 :  [-1.3834927495227944]
step  6 :  [-1.2628241991774838]
step  7 :  [-1.123578072455618]
step  8 :  [-0.9699137912342802]
step  9 :  [-0.8052090943204937]
step  10 :  [-0.6437998382206208]
step  11 :  [-0.48872955029595144]
step  12 :  [-0.36774333911927826]
step  13 :  [-0.24482966571129852]
step  14 :  [-0.13565004773296893]
step  15 :  [-0.08769998827743188]
step  16 :  [-0.07936408013290165]
step  17 :  [-0.042590283037603406]
step  18 :  [-0.06739456557307115]
step  19 :  [-0.045477821455357614]
step  20 :  [-0.03378129643234306]
step  21 :  [-0.011615734657701543]
step  22 :  [-0.01685958508900692]
step  23 :  [-0.030078905219487376]
step  24 :  [-0.01623900343251285]
episode  25 : steps 25 , return [-15.75]
step  0 :  [-1.7874505061740462]
step  1 :  [-1.750586559201234]
step  2 :  [-1.7075394497046286]
step  3 :  [-1.665584416545744]
step  4 :  [-1.6310730240940647]
step  5 :  [-1.5645199549945716]
step  6 :  [-1.469536726671801]
step  7 :  [-1.3511244261514417]
step  8 :  [-1.21413195961376]
step  9 :  [-1.0627760606786838]
step  10 :  [-0.9005978649556372]
step  11 :  [-0.730636059595451]
step  12 :  [-0.5558571808950479]
step  13 :  [-0.3804957404366738]
step  14 :  [-0.2359921043390127]
step  15 :  [-0.0853799097742509]
step  16 :  [-0.03084171631297558]
step  17 :  [-0.0799001539755319]
step  18 :  [-0.09349996949462094]
step  19 :  [-0.06585387563828635]
step  20 :  [-0.0054900221514919065]
step  21 :  [-0.0075765833921248495]
step  22 :  [-0.015197963864804103]
step  23 :  [-0.029424676390598207]
step  24 :  [-0.012702975561169868]
episode  26 : steps 25 , return [-18.43]
step  0 :  [-1.3503184928234013]
step  1 :  [-1.3209377025583904]
step  2 :  [-1.290214031439629]
step  3 :  [-1.224250971309647]
step  4 :  [-1.1282973207769105]
step  5 :  [-1.0081794365711614]
step  6 :  [-0.8691188976043231]
step  7 :  [-0.7894469227288081]
step  8 :  [-0.6904355756881712]
step  9 :  [-0.5846655629938928]
step  10 :  [-0.47993033503280724]
step  11 :  [-0.3903399205398787]
step  12 :  [-0.303496869377259]
step  13 :  [-0.21658511180493698]
step  14 :  [-0.12253273965732144]
step  15 :  [-0.06051224448030661]
step  16 :  [-0.03101905295330866]
step  17 :  [-0.03851805881162913]
step  18 :  [-0.030296720680030902]
step  19 :  [-0.0344885844812738]
step  20 :  [-0.07390760583013348]
step  21 :  [-0.07265063757212874]
step  22 :  [-0.054752778962559846]
step  23 :  [-0.05350656192835692]
step  24 :  [-0.02272422347535979]
episode  27 : steps 25 , return [-12.24]
step  0 :  [-1.5396456689086218]
step  1 :  [-1.5033733883655747]
step  2 :  [-1.4621088308169372]
step  3 :  [-1.4239272847807378]
step  4 :  [-1.3540872840488907]
step  5 :  [-1.2561713111124968]
step  6 :  [-1.135119307976619]
step  7 :  [-0.9956836346778309]
step  8 :  [-0.8419479038662266]
step  9 :  [-0.7312085135440547]
step  10 :  [-0.6096638564237903]
step  11 :  [-0.48381184295695256]
step  12 :  [-0.3789035336709768]
step  13 :  [-0.26628860202388754]
step  14 :  [-0.15821034740178777]
step  15 :  [-0.04117949671609814]
step  16 :  [-0.031176620071548873]
step  17 :  [-0.03131432488306233]
step  18 :  [-0.018009012273803825]
step  19 :  [-0.006124912978794758]
step  20 :  [-0.04538883258434928]
step  21 :  [-0.08623416539318059]
step  22 :  [-0.10179359520886617]
step  23 :  [-0.06716667339747606]
step  24 :  [-0.05603373077532691]
episode  28 : steps 25 , return [-14.62]
step  0 :  [-1.58077949589678]
step  1 :  [-1.5377451112938]
step  2 :  [-1.4868778149022144]
step  3 :  [-1.4364481671449798]
step  4 :  [-1.3939244193241744]
step  5 :  [-1.3229079024576242]
step  6 :  [-1.225307775336209]
step  7 :  [-1.1052885695771741]
step  8 :  [-0.9672804264109357]
step  9 :  [-0.8153072575765631]
step  10 :  [-0.6639623646423584]
step  11 :  [-0.5109429619155565]
step  12 :  [-0.3656064101878698]
step  13 :  [-0.24778551310731917]
step  14 :  [-0.13271634468368151]
step  15 :  [-0.07342892430077265]
step  16 :  [-0.09131615314550362]
step  17 :  [-0.07176040283475918]
step  18 :  [-0.0286580811749989]
step  19 :  [-0.04432150670275629]
step  20 :  [-0.01381094401535757]
step  21 :  [-0.029606038895190017]
step  22 :  [-0.017730539667005548]
step  23 :  [-0.02310055438305453]
step  24 :  [-0.04761791351360397]
episode  29 : steps 25 , return [-15.23]
step  0 :  [-1.5399775718051045]
step  1 :  [-1.50180300481658]
step  2 :  [-1.4578944005571557]
step  3 :  [-1.416436303098678]
step  4 :  [-1.344305462030687]
step  5 :  [-1.2447259682595242]
step  6 :  [-1.122413038890991]
step  7 :  [-0.9819701279311949]
step  8 :  [-0.8273687350877859]
step  9 :  [-0.7540971487443724]
step  10 :  [-0.665064042235581]
step  11 :  [-0.5673837020373076]
step  12 :  [-0.47072072616482574]
step  13 :  [-0.3852825103890368]
step  14 :  [-0.290322695965814]
step  15 :  [-0.18120071385845807]
step  16 :  [-0.10013778506382434]
step  17 :  [-0.07735357440365832]
step  18 :  [-0.07576498974611791]
step  19 :  [-0.07897730462786468]
step  20 :  [-0.05162396932277874]
step  21 :  [-0.02295011087711628]
step  22 :  [-0.03123590235035614]
step  23 :  [-0.01674947529686368]
step  24 :  [-0.029447274477859366]
episode  30 : steps 25 , return [-15.24]
step  0 :  [-1.5730160522638115]
step  1 :  [-1.547488072868077]
step  2 :  [-1.5208354433482079]
step  3 :  [-1.4568715141555635]
step  4 :  [-1.361928045183518]
step  5 :  [-1.2423214901690574]
step  6 :  [-1.1035055017508366]
step  7 :  [-0.9499185441087913]
step  8 :  [-0.7850755822331235]
step  9 :  [-0.618350957571979]
step  10 :  [-0.4626395720978139]
step  11 :  [-0.34357034561574945]
step  12 :  [-0.2338563207753693]
step  13 :  [-0.11750404548711002]
step  14 :  [-0.07387267126503116]
step  15 :  [-0.008216328306754747]
step  16 :  [-0.033218110444184656]
step  17 :  [-0.003095617306410627]
step  18 :  [-0.028708395478139977]
step  19 :  [-0.004357400856284215]
step  20 :  [-0.024559233600706602]
step  21 :  [-0.010258030870899578]
step  22 :  [-0.03418105607186685]
step  23 :  [-0.006015217073783561]
step  24 :  [-0.029388894436802003]
episode  31 : steps 25 , return [-13.57]
step  0 :  [-1.5301131352982682]
step  1 :  [-1.4854817011906813]
step  2 :  [-1.432581835516468]
step  3 :  [-1.3799508886608596]
step  4 :  [-1.3353773089797103]
step  5 :  [-1.2632744782414318]
step  6 :  [-1.1650788820151552]
step  7 :  [-1.044728246613556]
step  8 :  [-0.9065453035616597]
step  9 :  [-0.7753366257001584]
step  10 :  [-0.6349333602046286]
step  11 :  [-0.4914739248637236]
step  12 :  [-0.3560144321192093]
step  13 :  [-0.24575113263612433]
step  14 :  [-0.1360472501555967]
step  15 :  [-0.08258531968081206]
step  16 :  [-0.03244155290936457]
step  17 :  [-0.03540957077963858]
step  18 :  [-0.008746291454031533]
step  19 :  [-0.014333593090932826]
step  20 :  [-0.0211237881192383]
step  21 :  [-0.011510837939652891]
step  22 :  [-0.030738577909336404]
step  23 :  [-0.05377710127016243]
step  24 :  [-0.09676442399289518]
episode  32 : steps 25 , return [-14.57]
step  0 :  [-1.4867898952511727]
step  1 :  [-1.4485304720478847]
step  2 :  [-1.4047510761933135]
step  3 :  [-1.3638629802751958]
step  4 :  [-1.292408266868164]
step  5 :  [-1.1934672863003624]
step  6 :  [-1.071721929355572]
step  7 :  [-0.9317830242943698]
step  8 :  [-0.7976531482368803]
step  9 :  [-0.6554417694500269]
step  10 :  [-0.5561047658786393]
step  11 :  [-0.4426238362149281]
step  12 :  [-0.3426430809225523]
step  13 :  [-0.22883241339928145]
step  14 :  [-0.1170906442329013]
step  15 :  [-0.03848209523927994]
step  16 :  [-0.008493257514811434]
step  17 :  [-0.025856365515081796]
step  18 :  [-0.008539064131375163]
step  19 :  [-0.01882517475378767]
step  20 :  [-0.03791894171374762]
step  21 :  [-0.002899790656667121]
step  22 :  [-0.025720109694598644]
step  23 :  [-0.00683592728814307]
step  24 :  [-0.018864469894027652]
episode  33 : steps 25 , return [-13.53]
step  0 :  [-1.7864860625898693]
step  1 :  [-1.7474216505221873]
step  2 :  [-1.7013363872919234]
step  3 :  [-1.6556308324991131]
step  4 :  [-1.61680247398387]
step  5 :  [-1.5471691115300776]
step  6 :  [-1.4498770422285951]
step  7 :  [-1.3296300200293203]
step  8 :  [-1.1910718317643954]
step  9 :  [-1.0382548376694418]
step  10 :  [-0.8745523330761544]
step  11 :  [-0.7132516917071342]
step  12 :  [-0.5461325833046321]
step  13 :  [-0.37778638511655155]
step  14 :  [-0.2399895599728751]
step  15 :  [-0.12211919647269258]
step  16 :  [-0.04633407550925919]
step  17 :  [-0.056856446964841156]
step  18 :  [-0.06733510171070327]
step  19 :  [-0.04579090309166996]
step  20 :  [-0.07524496703517433]
step  21 :  [-0.10705669547995934]
step  22 :  [-0.10696105834991261]
step  23 :  [-0.07889469039840942]
step  24 :  [-0.032068954696270136]
episode  34 : steps 25 , return [-18.55]
step  0 :  [-1.5347266600626621]
step  1 :  [-1.4920719292926363]
step  2 :  [-1.4419288897717601]
step  3 :  [-1.392731100393635]
step  4 :  [-1.3521193102757436]
step  5 :  [-1.2828002641263854]
step  6 :  [-1.1866819380145246]
step  7 :  [-1.0680036256593133]
step  8 :  [-0.9313040132198375]
step  9 :  [-0.7807644122171715]
step  10 :  [-0.6224972498271356]
step  11 :  [-0.46062744412272455]
step  12 :  [-0.3288786059951517]
step  13 :  [-0.18546190591218092]
step  14 :  [-0.12608453175684692]
step  15 :  [-0.058489052504519405]
step  16 :  [-0.028295332158284312]
step  17 :  [-0.0306490229437337]
step  18 :  [-0.026712703617591003]
step  19 :  [-0.014715710054775458]
step  20 :  [-0.010044259554530612]
step  21 :  [-0.06577482187710455]
step  22 :  [-0.06574684605081152]
step  23 :  [-0.04980771422436266]
step  24 :  [-0.057230308635751154]
episode  35 : steps 25 , return [-14.59]
step  0 :  [-1.5215006390630745]
step  1 :  [-1.485122717332148]
step  2 :  [-1.4437953276072626]
step  3 :  [-1.405673533635677]
step  4 :  [-1.3359700322469281]
step  5 :  [-1.2382064634454455]
step  6 :  [-1.1173040162880756]
step  7 :  [-0.9780135566304319]
step  8 :  [-0.8244268173721659]
step  9 :  [-0.6982967539781888]
step  10 :  [-0.5688604517743552]
step  11 :  [-0.4436660310458887]
step  12 :  [-0.34079290663204825]
step  13 :  [-0.23667496754789016]
step  14 :  [-0.13383054671590175]
step  15 :  [-0.0934572653095185]
step  16 :  [-0.09512936956833305]
step  17 :  [-0.0907459566391435]
step  18 :  [-0.050082184793621136]
step  19 :  [-0.05706672785143049]
step  20 :  [-0.025293047847785643]
step  21 :  [-0.038406655943730064]
step  22 :  [-0.012717587330207116]
step  23 :  [-0.028200711149881905]
step  24 :  [-0.008612159126963984]
episode  36 : steps 25 , return [-14.27]
step  0 :  [-1.3680605360504234]
step  1 :  [-1.3353901543850533]
step  2 :  [-1.300015756145007]
step  3 :  [-1.2307872910949549]
step  4 :  [-1.1324773288336996]
step  5 :  [-1.0106125284043816]
step  6 :  [-0.8702214925479407]
step  7 :  [-0.8015405090978824]
step  8 :  [-0.7044695064009666]
step  9 :  [-0.6169387244375384]
step  10 :  [-0.5540824539002782]
step  11 :  [-0.47746347983811166]
step  12 :  [-0.39718238402529343]
step  13 :  [-0.3023398222586965]
step  14 :  [-0.20209924819992128]
step  15 :  [-0.13934116007822783]
step  16 :  [-0.13213115995542277]
step  17 :  [-0.13877736140724697]
step  18 :  [-0.11293338801420034]
step  19 :  [-0.08153713657580916]
step  20 :  [-0.05865702570511512]
step  21 :  [-0.038660957568902456]
step  22 :  [-0.0386088377014891]
step  23 :  [-0.026779405261343654]
step  24 :  [-0.053064952661539]
episode  37 : steps 25 , return [-13.12]
step  0 :  [-1.6447501484922298]
step  1 :  [-1.6130258169807412]
step  2 :  [-1.5775829490055167]
step  3 :  [-1.5458180712114353]
step  4 :  [-1.480008457233214]
step  5 :  [-1.3847956467299514]
step  6 :  [-1.265684536262866]
step  7 :  [-1.1277535083038301]
step  8 :  [-0.9752987694512906]
step  9 :  [-0.8118443813741116]
step  10 :  [-0.6469732447624518]
step  11 :  [-0.48044647374672506]
step  12 :  [-0.3208505297904247]
step  13 :  [-0.19174933543784456]
step  14 :  [-0.06925453261909864]
step  15 :  [-0.011761091753371582]
step  16 :  [-0.05461606166701335]
step  17 :  [-0.06492652066625373]
step  18 :  [-0.02937451288822053]
step  19 :  [-0.04666002955258264]
step  20 :  [-0.05490969027180394]
step  21 :  [-0.02469314472352666]
step  22 :  [-0.036453819312194415]
step  23 :  [-0.039239544192767914]
step  24 :  [-0.04396191949958722]
episode  38 : steps 25 , return [-15.54]
step  0 :  [-1.7889478384521285]
step  1 :  [-1.7565836416043488]
step  2 :  [-1.7197211297224246]
step  3 :  [-1.6853538787536892]
step  4 :  [-1.6171052997188458]
step  5 :  [-1.5197583816412323]
step  6 :  [-1.398789555601668]
step  7 :  [-1.2591925517738254]
step  8 :  [-1.1051491580416521]
step  9 :  [-0.9400222664167089]
step  10 :  [-0.7674890737834464]
step  11 :  [-0.5949646625767665]
step  12 :  [-0.46667493094919615]
step  13 :  [-0.3271765525042828]
step  14 :  [-0.20782537262283726]
step  15 :  [-0.14863116827171602]
step  16 :  [-0.08193221266767296]
step  17 :  [-0.045242757274043637]
step  18 :  [-0.026684373194848197]
step  19 :  [-0.03317649987465097]
step  20 :  [-0.010829499117467929]
step  21 :  [-0.046179710650233324]
step  22 :  [-0.02573991671802428]
step  23 :  [-0.05026217405029271]
step  24 :  [-0.05257216705624461]
episode  39 : steps 25 , return [-17.68]
step  0 :  [-1.5533372404967858]
step  1 :  [-1.506654960324154]
step  2 :  [-1.4507697420259518]
step  3 :  [-1.3942040307455446]
step  4 :  [-1.3447595938794203]
step  5 :  [-1.2690527646405088]
step  6 :  [-1.1680920373366377]
step  7 :  [-1.0454990447746988]
step  8 :  [-0.9053473917505432]
step  9 :  [-0.7947612820438459]
step  10 :  [-0.6717753625644439]
step  11 :  [-0.5507723834765602]
step  12 :  [-0.4405710203082266]
step  13 :  [-0.35122981552024923]
step  14 :  [-0.2562342396690995]
step  15 :  [-0.17824696995840894]
step  16 :  [-0.1189831042144957]
step  17 :  [-0.092074923523845]
step  18 :  [-0.04536123626664893]
step  19 :  [-0.04044336885835549]
step  20 :  [-0.012170632899378211]
step  21 :  [-0.02145382680958234]
step  22 :  [-0.0386976775298969]
step  23 :  [-0.0336815146051817]
step  24 :  [-0.041003094422375076]
episode  40 : steps 25 , return [-15.33]
step  0 :  [-1.6701709225598318]
step  1 :  [-1.6282706349400744]
step  2 :  [-1.5786458419000022]
step  3 :  [-1.5291983142338528]
step  4 :  [-1.4869811608618295]
step  5 :  [-1.415598422358344]
step  6 :  [-1.3173839118276207]
step  7 :  [-1.1966528414025002]
step  8 :  [-1.0578612100157416]
step  9 :  [-0.9049783767154597]
step  10 :  [-0.754647282539415]
step  11 :  [-0.598476657312986]
step  12 :  [-0.4416781150135208]
step  13 :  [-0.2969843798039912]
step  14 :  [-0.1842533500018742]
step  15 :  [-0.08393584350366967]
step  16 :  [-0.040212863893252244]
step  17 :  [-0.06133743182212616]
step  18 :  [-0.052020174362984624]
step  19 :  [-0.06566650514462982]
step  20 :  [-0.05057141017746948]
step  21 :  [-0.024923891629584038]
step  22 :  [-0.01567994766274263]
step  23 :  [-0.046263319801374034]
step  24 :  [-0.051774787797181705]
episode  41 : steps 25 , return [-16.55]
step  0 :  [-1.5190631510169876]
step  1 :  [-1.4860981498273076]
step  2 :  [-1.4495056139512847]
step  3 :  [-1.4172326388557348]
step  4 :  [-1.3516897852112417]
step  5 :  [-1.2570427451468984]
step  6 :  [-1.1386267793863531]
step  7 :  [-1.001487318943752]
step  8 :  [-0.849974241401847]
step  9 :  [-0.6986345331272036]
step  10 :  [-0.5401101770308951]
step  11 :  [-0.3806200471797874]
step  12 :  [-0.24847299898964148]
step  13 :  [-0.12853330185398057]
step  14 :  [-0.06058314693323498]
step  15 :  [-0.01781911069955384]
step  16 :  [-0.056152535986557735]
step  17 :  [-0.03696587481661641]
step  18 :  [-0.06507886267943232]
step  19 :  [-0.05349645789412967]
step  20 :  [-0.06630562237234466]
step  21 :  [-0.058325165734580395]
step  22 :  [-0.03927755564561408]
step  23 :  [-0.033713485177368704]
step  24 :  [-0.05550728578879951]
episode  42 : steps 25 , return [-14.01]
step  0 :  [-1.5588832595415607]
step  1 :  [-1.5302188602602966]
step  2 :  [-1.499348929919736]
step  3 :  [-1.4325078544566983]
step  4 :  [-1.335526224319725]
step  5 :  [-1.2144273189156547]
step  6 :  [-1.0744845688261244]
step  7 :  [-0.9200186448336319]
step  8 :  [-0.7879969835010726]
step  9 :  [-0.6439101258461403]
step  10 :  [-0.5184540337004305]
step  11 :  [-0.42897912018379575]
step  12 :  [-0.34239276959976434]
step  13 :  [-0.26053243766169687]
step  14 :  [-0.16661519092577723]
step  15 :  [-0.06596641009154057]
step  16 :  [-0.02996147521011256]
step  17 :  [-0.033606665266923436]
step  18 :  [-0.048242483782390384]
step  19 :  [-0.045813050169581045]
step  20 :  [-0.017739579477783405]
step  21 :  [-0.013233077986993785]
step  22 :  [-0.020472906353194008]
step  23 :  [-0.02210530346189232]
step  24 :  [-0.0030183069479060615]
episode  43 : steps 25 , return [-14.01]
step  0 :  [-1.5846060769678711]
step  1 :  [-1.5584927461162204]
step  2 :  [-1.5309890157619785]
step  3 :  [-1.4663935550230345]
step  4 :  [-1.3709717038220826]
step  5 :  [-1.2509922605444586]
step  6 :  [-1.1118743470799268]
step  7 :  [-0.9580291714341471]
step  8 :  [-0.7929424240610189]
step  9 :  [-0.6258292258442869]
step  10 :  [-0.47346462004159184]
step  11 :  [-0.3594257833739752]
step  12 :  [-0.253810490236282]
step  13 :  [-0.1466058635622167]
step  14 :  [-0.02432096484633366]
step  15 :  [-0.06294905150271345]
step  16 :  [-0.07386265581024001]
step  17 :  [-0.03811900274733809]
step  18 :  [-0.06099159904315106]
step  19 :  [-0.07192541369837438]
step  20 :  [-0.07615036665914791]
step  21 :  [-0.08038120992498196]
step  22 :  [-0.03534484076946516]
step  23 :  [-0.03751047586278029]
step  24 :  [-0.03107771058634234]
episode  44 : steps 25 , return [-14.08]
step  0 :  [-1.7287566681334852]
step  1 :  [-1.6861776569193432]
step  2 :  [-1.635402006397584]
step  3 :  [-1.584176842204717]
step  4 :  [-1.539393363619362]
step  5 :  [-1.4658581707969343]
step  6 :  [-1.3658653301622994]
step  7 :  [-1.2436359134429227]
step  8 :  [-1.1035219532513216]
step  9 :  [-0.9493784796863528]
step  10 :  [-0.7844261922573601]
step  11 :  [-0.6185030557633588]
step  12 :  [-0.4639725620991444]
step  13 :  [-0.3457920752668263]
step  14 :  [-0.23642494420318677]
step  15 :  [-0.12171503643124515]
step  16 :  [-0.035759310512461916]
step  17 :  [-0.055835740349016685]
step  18 :  [-0.06621814643656705]
step  19 :  [-0.029524808945484336]
step  20 :  [-0.056684316184768664]
step  21 :  [-0.06491096927249711]
step  22 :  [-0.022253156347368838]
step  23 :  [-0.03891419687803512]
step  24 :  [-0.004744951057418776]
episode  45 : steps 25 , return [-17.25]
step  0 :  [-1.5945721876447885]
step  1 :  [-1.5657429459475396]
step  2 :  [-1.5344844799628332]
step  3 :  [-1.4672671272266777]
step  4 :  [-1.3699676574697512]
step  5 :  [-1.2486164669589086]
step  6 :  [-1.1084835081702908]
step  7 :  [-0.9538856578078666]
step  8 :  [-0.7895786279622218]
step  9 :  [-0.6202269349830681]
step  10 :  [-0.48482075961837773]
step  11 :  [-0.3963139192114703]
step  12 :  [-0.3132346888247571]
step  13 :  [-0.2173671744011165]
step  14 :  [-0.1055126870125451]
step  15 :  [-0.0635842587509307]
step  16 :  [-0.011344298880289925]
step  17 :  [-0.03274055439850219]
step  18 :  [-0.009088050909761997]
step  19 :  [-0.027081343595069324]
step  20 :  [-0.010732485974413444]
step  21 :  [-0.0785765734147679]
step  22 :  [-0.08322844632275748]
step  23 :  [-0.09511928296300352]
step  24 :  [-0.08687113890368957]
episode  46 : steps 25 , return [-14.27]
step  0 :  [-1.5201028529770317]
step  1 :  [-1.4927950599589415]
step  2 :  [-1.4639679301069863]
step  3 :  [-1.3986645811962375]
step  4 :  [-1.3028427324551095]
step  5 :  [-1.1826261795362158]
step  6 :  [-1.0433613557056107]
step  7 :  [-0.8894209281441067]
step  8 :  [-0.7782349332580181]
step  9 :  [-0.6539577921117665]
step  10 :  [-0.5305137945750933]
step  11 :  [-0.4332992147520096]
step  12 :  [-0.32656584184362575]
step  13 :  [-0.22430410568722237]
step  14 :  [-0.11285297344882304]
step  15 :  [-0.07167034233171968]
step  16 :  [-0.06685965437596332]
step  17 :  [-0.05963242652382878]
step  18 :  [-0.007586639104735733]
step  19 :  [-0.04990618298591485]
step  20 :  [-0.06545777231185002]
step  21 :  [-0.03533901717958459]
step  22 :  [-0.06463552406643401]
step  23 :  [-0.03903069602877793]
step  24 :  [-0.040522328023763814]
episode  47 : steps 25 , return [-13.85]
step  0 :  [-1.7578754216023411]
step  1 :  [-1.729320092009707]
step  2 :  [-1.6977776861767024]
step  3 :  [-1.6299264311752824]
step  4 :  [-1.5319785296879065]
step  5 :  [-1.4100827423888516]
step  6 :  [-1.2695500496907184]
step  7 :  [-1.1147160346729335]
step  8 :  [-0.949032304654549]
step  9 :  [-0.7843176612695775]
step  10 :  [-0.6097742786141226]
step  11 :  [-0.5079983371522804]
step  12 :  [-0.4147328737389612]
step  13 :  [-0.33814873315626715]
step  14 :  [-0.25159784723569334]
step  15 :  [-0.14677505431632]
step  16 :  [-0.06975445271816864]
step  17 :  [-0.05118659867555188]
step  18 :  [-0.024208862042900306]
step  19 :  [-0.010590884164620595]
step  20 :  [-0.030528327956417693]
step  21 :  [-0.034868127915258215]
step  22 :  [-0.050989231756974944]
step  23 :  [-0.05162684336456508]
step  24 :  [-0.06327942117488809]
episode  48 : steps 25 , return [-16.53]
step  0 :  [-1.652136311201275]
step  1 :  [-1.6115606190654497]
step  2 :  [-1.563848282377356]
step  3 :  [-1.5168967509495368]
step  4 :  [-1.4777400305155675]
step  5 :  [-1.4086459103041065]
step  6 :  [-1.3122088743972717]
step  7 :  [-1.192936004366795]
step  8 :  [-1.0554333417764044]
step  9 :  [-0.9038109649251463]
step  10 :  [-0.7416157245436896]
step  11 :  [-0.5731732896762944]
step  12 :  [-0.40224620476762973]
step  13 :  [-0.263064821590849]
step  14 :  [-0.14908208674617623]
step  15 :  [-0.07308747172795602]
step  16 :  [-0.04587092546228849]
step  17 :  [-0.03754791895991455]
step  18 :  [-0.06869488967531667]
step  19 :  [-0.08882612811531121]
step  20 :  [-0.05893715634260222]
step  21 :  [-0.03439753015937645]
step  22 :  [-0.01369635033585372]
step  23 :  [-0.0053054132101418095]
step  24 :  [-0.035302635815545415]
episode  49 : steps 25 , return [-16.29]
step  0 :  [-1.4932577253212742]
step  1 :  [-1.4666794946286008]
step  2 :  [-1.4389852056544776]
step  3 :  [-1.3745654186164642]
step  4 :  [-1.2794345181283404]
step  5 :  [-1.1597695246184714]
step  6 :  [-1.0209611246933237]
step  7 :  [-0.8674211563160187]
step  8 :  [-0.7571492152505125]
step  9 :  [-0.6348163339269431]
step  10 :  [-0.5081844136789402]
step  11 :  [-0.3884727692672805]
step  12 :  [-0.2892665802544947]
step  13 :  [-0.18612842737351334]
step  14 :  [-0.06947128507199175]
step  15 :  [-0.02969522649625258]
step  16 :  [-0.030017866166593337]
step  17 :  [-0.027811446316369247]
step  18 :  [-0.02056768838047086]
step  19 :  [-0.05571863294790479]
step  20 :  [-0.03872525048777163]
step  21 :  [-0.027963492084947302]
step  22 :  [-0.046977264899000885]
step  23 :  [-0.04334224031767662]
step  24 :  [-0.02715772560315289]
episode  50 : steps 25 , return [-13.28]
step  0 :  [-1.6067045714313017]
step  1 :  [-1.5654649436998094]
step  2 :  [-1.5170032086284584]
step  3 :  [-1.4694097540088102]
step  4 :  [-1.42993270128215]
step  5 :  [-1.360907625935578]
step  6 :  [-1.2647001557046968]
step  7 :  [-1.145732983058093]
step  8 :  [-1.0085954035719324]
step  9 :  [-0.8574262598077732]
step  10 :  [-0.7025086797002047]
step  11 :  [-0.5405988200739787]
step  12 :  [-0.37749566558521225]
step  13 :  [-0.2424513796689458]
step  14 :  [-0.12229005000405645]
step  15 :  [-0.050215656727595086]
step  16 :  [-0.04263773434446389]
step  17 :  [-0.08465355657468449]
step  18 :  [-0.06855828615913004]
step  19 :  [-0.013087331021594352]
step  20 :  [-0.013676320886469038]
step  21 :  [-0.03967641863768328]
step  22 :  [-0.025510135567410146]
step  23 :  [-0.05935006407260718]
step  24 :  [-0.04517018117465662]
episode  51 : steps 25 , return [-15.65]
step  0 :  [-1.7574453650439148]
step  1 :  [-1.7238873266812114]
step  2 :  [-1.6854956864933528]
step  3 :  [-1.6494317551256867]
step  4 :  [-1.5801107715858695]
step  5 :  [-1.482049114322798]
step  6 :  [-1.3605798913175902]
step  7 :  [-1.2206150356367003]
step  8 :  [-1.0662860280866662]
step  9 :  [-0.9009211162653915]
step  10 :  [-0.7656975315250504]
step  11 :  [-0.6229261829988778]
step  12 :  [-0.4846973731713714]
step  13 :  [-0.376540685423529]
step  14 :  [-0.27451164273235834]
step  15 :  [-0.17701784521010203]
step  16 :  [-0.12399767228936988]
step  17 :  [-0.04245727508068252]
step  18 :  [-0.027182980964260146]
step  19 :  [-0.030833565127585776]
step  20 :  [-0.024540580398969208]
step  21 :  [-0.03801794862680913]
step  22 :  [-0.03442808829034378]
step  23 :  [-0.03953854843712764]
step  24 :  [-0.03620700101907699]
episode  52 : steps 25 , return [-17.53]
step  0 :  [-1.5109576978801775]
step  1 :  [-1.4737904278371472]
step  2 :  [-1.4314160661923656]
step  3 :  [-1.392080180734683]
step  4 :  [-1.3215805398285283]
step  5 :  [-1.2232642496486819]
step  6 :  [-1.101954002951633]
step  7 :  [-0.9623403543920922]
step  8 :  [-0.8084720393594397]
step  9 :  [-0.6666939478338845]
step  10 :  [-0.5328556347286336]
step  11 :  [-0.43066875204019933]
step  12 :  [-0.32435159769148936]
step  13 :  [-0.2247191677617249]
step  14 :  [-0.11539006659751959]
step  15 :  [-0.060606826918277235]
step  16 :  [-0.06012887695118372]
step  17 :  [-0.02988995592129113]
step  18 :  [-0.031602145335325425]
step  19 :  [-0.04037033330512349]
step  20 :  [-0.06788286499838732]
step  21 :  [-0.06310510180935866]
step  22 :  [-0.06821089324084018]
step  23 :  [-0.07500552977076065]
step  24 :  [-0.054648352334146104]
episode  53 : steps 25 , return [-14.07]
step  0 :  [-1.816557180031067]
step  1 :  [-1.7796225758359279]
step  2 :  [-1.736383052365597]
step  3 :  [-1.694036759228281]
step  4 :  [-1.6201506129646184]
step  5 :  [-1.5187521825017272]
step  6 :  [-1.3948352968565145]
step  7 :  [-1.2530860406726678]
step  8 :  [-1.0974925891227045]
step  9 :  [-0.9313066638218546]
step  10 :  [-0.7840995475036647]
step  11 :  [-0.6234749265488357]
step  12 :  [-0.5310361045495434]
step  13 :  [-0.45800760285399694]
step  14 :  [-0.3678567362043598]
step  15 :  [-0.276699029458709]
step  16 :  [-0.17574699888970893]
step  17 :  [-0.06410905483048912]
step  18 :  [-0.055981165196442015]
step  19 :  [-0.11996331637404398]
step  20 :  [-0.12420266253413943]
step  21 :  [-0.08415509639657194]
step  22 :  [-0.030881276284326204]
step  23 :  [-0.018749764103993937]
step  24 :  [-0.026603162670382784]
episode  54 : steps 25 , return [-18.58]
step  0 :  [-1.5222782659659089]
step  1 :  [-1.4854663948523652]
step  2 :  [-1.4435328989351697]
step  3 :  [-1.404655559551066]
step  4 :  [-1.3344174719951116]
step  5 :  [-1.2362595743552103]
step  6 :  [-1.115051264224122]
step  7 :  [-0.9755076873137486]
step  8 :  [-0.8216914334583234]
step  9 :  [-0.6988300305330597]
step  10 :  [-0.5734860537326797]
step  11 :  [-0.4529767236635849]
step  12 :  [-0.3540584998110705]
step  13 :  [-0.2527380056149192]
step  14 :  [-0.14289025950100556]
step  15 :  [-0.09490632224710599]
step  16 :  [-0.024982831306920673]
step  17 :  [-0.014594749592751383]
step  18 :  [-0.07856897587603152]
step  19 :  [-0.08231458091790828]
step  20 :  [-0.10776877392178348]
step  21 :  [-0.10241999052608453]
step  22 :  [-0.06065568541521122]
step  23 :  [-0.06533529953248518]
step  24 :  [-0.038493241181384134]
episode  55 : steps 25 , return [-14.48]
step  0 :  [-1.5638978268024906]
step  1 :  [-1.5230670093488046]
step  2 :  [-1.4753515609032066]
step  3 :  [-1.428982397984804]
step  4 :  [-1.353352172449426]
step  5 :  [-1.2512448452493474]
step  6 :  [-1.127083816536203]
step  7 :  [-0.9852845705334028]
step  8 :  [-0.8297023200615863]
step  9 :  [-0.7903979916296987]
step  10 :  [-0.7142562735410677]
step  11 :  [-0.6420641973700988]
step  12 :  [-0.5733509247440348]
step  13 :  [-0.5138554386421421]
step  14 :  [-0.44053115436776547]
step  15 :  [-0.3581461879316334]
step  16 :  [-0.26099005276297227]
step  17 :  [-0.1452498783837614]
step  18 :  [-0.013326815295903433]
step  19 :  [-0.04190625380735469]
step  20 :  [-0.05214733535996035]
step  21 :  [-0.018512648247140235]
step  22 :  [-0.04485666297211511]
step  23 :  [-0.019069293968000563]
step  24 :  [-0.06076671503938957]
episode  56 : steps 25 , return [-16.23]
step  0 :  [-1.7477754982437252]
step  1 :  [-1.7158199607395561]
step  2 :  [-1.6796628703248138]
step  3 :  [-1.6463897862647348]
step  4 :  [-1.5790710437250317]
step  5 :  [-1.4824911076868852]
step  6 :  [-1.3621576152194752]
step  7 :  [-1.2231005815394846]
step  8 :  [-1.069538551946644]
step  9 :  [-0.9048754011107139]
step  10 :  [-0.7489203660713353]
step  11 :  [-0.5889895847327176]
step  12 :  [-0.4313177133831203]
step  13 :  [-0.3051294339102847]
step  14 :  [-0.19050723759368665]
step  15 :  [-0.059563611102637]
step  16 :  [-0.007937445596835424]
step  17 :  [-0.037180226081346274]
step  18 :  [-0.03883754821993297]
step  19 :  [-0.027452957381173145]
step  20 :  [-0.031839150794619124]
step  21 :  [-0.02962820745384525]
step  22 :  [-0.058132742738930654]
step  23 :  [-0.0615373856499317]
step  24 :  [-0.026598992415561393]
episode  57 : steps 25 , return [-17.05]
step  0 :  [-1.4822523613078045]
step  1 :  [-1.4550984916890264]
step  2 :  [-1.4266745324695815]
step  3 :  [-1.3617852608241037]
step  4 :  [-1.2663333351922488]
step  5 :  [-1.1464356131160895]
step  6 :  [-1.0074474066191634]
step  7 :  [-0.8537568066207009]
step  8 :  [-0.7531186728635281]
step  9 :  [-0.6393569722254019]
step  10 :  [-0.5200284544547485]
step  11 :  [-0.40620172252148684]
step  12 :  [-0.31029252885685027]
step  13 :  [-0.20875022231365534]
step  14 :  [-0.13813523150831686]
step  15 :  [-0.04574591483773562]
step  16 :  [-0.020314573531746517]
step  17 :  [-0.024859786551203637]
step  18 :  [-0.02997867317666786]
step  19 :  [-0.05207452519940074]
step  20 :  [-0.0470025912979946]
step  21 :  [-0.08117098371761809]
step  22 :  [-0.0668186719692151]
step  23 :  [-0.03833236147858476]
step  24 :  [-0.048235020303409544]
episode  58 : steps 25 , return [-13.43]
step  0 :  [-1.7171478785575638]
step  1 :  [-1.6800598511610112]
step  2 :  [-1.6369462635283059]
step  3 :  [-1.5953043140672238]
step  4 :  [-1.5222631985407284]
step  5 :  [-1.421631997084435]
step  6 :  [-1.2983372411173866]
step  7 :  [-1.1570492349945234]
step  8 :  [-1.0017520245803502]
step  9 :  [-0.8356847626082917]
step  10 :  [-0.7797093636079784]
step  11 :  [-0.6915503159554207]
step  12 :  [-0.6041082720728412]
step  13 :  [-0.5206932580262755]
step  14 :  [-0.45010999468587193]
step  15 :  [-0.3686333185555614]
step  16 :  [-0.27146622862803677]
step  17 :  [-0.16614275898216324]
step  18 :  [-0.04890348373794237]
step  19 :  [-0.03576736538179828]
step  20 :  [-0.01905145566628126]
step  21 :  [-0.06036125942189936]
step  22 :  [-0.044015194941555875]
step  23 :  [-0.029933667286373485]
step  24 :  [-0.032047491300823024]
episode  59 : steps 25 , return [-17.99]
step  0 :  [-1.5306118575679966]
step  1 :  [-1.4891923776768623]
step  2 :  [-1.4407975813823133]
step  3 :  [-1.3938196753655228]
step  4 :  [-1.3558329537312919]
step  5 :  [-1.2884247869118]
step  6 :  [-1.1937832254068406]
step  7 :  [-1.0763392804103062]
step  8 :  [-0.9407802948546307]
step  9 :  [-0.791436151138473]
step  10 :  [-0.6323295189093351]
step  11 :  [-0.4679188869255627]
step  12 :  [-0.3062726558835256]
step  13 :  [-0.17189812035998955]
step  14 :  [-0.04357057390788641]
step  15 :  [-0.03177437161639909]
step  16 :  [-0.02810874676908037]
step  17 :  [-0.031381582666866574]
step  18 :  [-0.017957730481141222]
step  19 :  [-0.035774323924403835]
step  20 :  [-0.015271827064836265]
step  21 :  [-0.03928731859878846]
step  22 :  [-0.015427627672489723]
step  23 :  [-0.04150602129677775]
step  24 :  [-0.01606550114904176]
episode  60 : steps 25 , return [-14.4]
step  0 :  [-1.5917430095224068]
step  1 :  [-1.5454894267462822]
step  2 :  [-1.490058294761463]
step  3 :  [-1.433810731816433]
step  4 :  [-1.3843573935176523]
step  5 :  [-1.3083794232701225]
step  6 :  [-1.2070719234902163]
step  7 :  [-1.0841212990480837]
step  8 :  [-0.9436131226786737]
step  9 :  [-0.7978687798183977]
step  10 :  [-0.6474872151784459]
step  11 :  [-0.5126329314909654]
step  12 :  [-0.4130299137466527]
step  13 :  [-0.317897614912222]
step  14 :  [-0.21585706174873226]
step  15 :  [-0.1123528044837654]
step  16 :  [-0.058574472386605944]
step  17 :  [-0.05879249606892152]
step  18 :  [-0.035422958538569]
step  19 :  [-0.023932624878415687]
step  20 :  [-0.01185357999560715]
step  21 :  [-0.054952068161862315]
step  22 :  [-0.05450689873779718]
step  23 :  [-0.014501489947318832]
step  24 :  [-0.03225213823351054]
episode  61 : steps 25 , return [-15.35]
step  0 :  [-1.7667655196965073]
step  1 :  [-1.7297915990644654]
step  2 :  [-1.6866621283018535]
step  3 :  [-1.6447182208612339]
step  4 :  [-1.5712828890378205]
step  5 :  [-1.4702829668464772]
step  6 :  [-1.3466827118830047]
step  7 :  [-1.2051621418246228]
step  8 :  [-1.049707809823698]
step  9 :  [-0.8835644819698857]
step  10 :  [-0.7815820433751433]
step  11 :  [-0.657297475139611]
step  12 :  [-0.5531399942892177]
step  13 :  [-0.48170191139648805]
step  14 :  [-0.4085664015208525]
step  15 :  [-0.32203321748999625]
step  16 :  [-0.22613028474863817]
step  17 :  [-0.14629492151576864]
step  18 :  [-0.09616963975148382]
step  19 :  [-0.0854366107249199]
step  20 :  [-0.09545429834043344]
step  21 :  [-0.053343788061477104]
step  22 :  [-0.023169381623627465]
step  23 :  [-0.04828345038941705]
step  24 :  [-0.020881780994720524]
episode  62 : steps 25 , return [-18.35]
step  0 :  [-1.7136113929159886]
step  1 :  [-1.6835121020697692]
step  2 :  [-1.6500248247703373]
step  3 :  [-1.5809706606312455]
step  4 :  [-1.4822607777086674]
step  5 :  [-1.3598876884723448]
step  6 :  [-1.2190814726079346]
step  7 :  [-1.0641425287813526]
step  8 :  [-0.8985254661838036]
step  9 :  [-0.8300328590639416]
step  10 :  [-0.8545766272026712]
step  11 :  [-0.8809360847910606]
step  12 :  [-0.8572192968936947]
step  13 :  [-0.7947489898095221]
step  14 :  [-0.7040415367826862]
step  15 :  [-0.5949735045437478]
step  16 :  [-0.4786768718588045]
step  17 :  [-0.37098526046472124]
step  18 :  [-0.25921959433936637]
step  19 :  [-0.14027406097161071]
step  20 :  [-0.018512951809267538]
step  21 :  [-0.0609117131542434]
step  22 :  [-0.060133343457787106]
step  23 :  [-0.026918447827522726]
step  24 :  [-0.03834335276983586]
episode  63 : steps 25 , return [-19.62]
step  0 :  [-1.4462954728091126]
step  1 :  [-1.416229864523525]
step  2 :  [-1.3840037943888934]
step  3 :  [-1.316618432992232]
step  4 :  [-1.2194464823073923]
step  5 :  [-1.0983115416730445]
step  6 :  [-0.9583957875068607]
step  7 :  [-0.80400165190021]
step  8 :  [-0.665744246488616]
step  9 :  [-0.5466204873879474]
step  10 :  [-0.4624125834145488]
step  11 :  [-0.3783671847640442]
step  12 :  [-0.2965814066350603]
step  13 :  [-0.2004039108085354]
step  14 :  [-0.08688557098535599]
step  15 :  [-0.017002130774596072]
step  16 :  [-0.018909723104134656]
step  17 :  [-0.0227495336248372]
step  18 :  [-0.026332096068970506]
step  19 :  [-0.015685018313301772]
step  20 :  [-0.03584731228717932]
step  21 :  [-0.08263084474302726]
step  22 :  [-0.08733371593297014]
step  23 :  [-0.055639547297059826]
step  24 :  [-0.0785131924082674]
episode  64 : steps 25 , return [-12.72]
step  0 :  [-1.7061080262779749]
step  1 :  [-1.6697991221378348]
step  2 :  [-1.6278024090920395]
step  3 :  [-1.5876043586448985]
step  4 :  [-1.51560412349714]
step  5 :  [-1.4157288121670681]
step  6 :  [-1.292985242165529]
step  7 :  [-1.1520961241775702]
step  8 :  [-0.9970776861814994]
step  9 :  [-0.8311842577876623]
step  10 :  [-0.7715259046000517]
step  11 :  [-0.6877769914749707]
step  12 :  [-0.5969608438893267]
step  13 :  [-0.5056038062016597]
step  14 :  [-0.42596572925584025]
step  15 :  [-0.33711934377748737]
step  16 :  [-0.23586509277980694]
step  17 :  [-0.12398816171562078]
step  18 :  [-0.013037150205297523]
step  19 :  [-0.05001601279542331]
step  20 :  [-0.055389975332983864]
step  21 :  [-0.02485679409922126]
step  22 :  [-0.03593354420745377]
step  23 :  [-0.07935018495292713]
step  24 :  [-0.09787123592790223]
episode  65 : steps 25 , return [-17.84]
step  0 :  [-1.6060978792371967]
step  1 :  [-1.5686435514296229]
step  2 :  [-1.5254509979098332]
step  3 :  [-1.4844118087393798]
step  4 :  [-1.412255277832488]
step  5 :  [-1.3124904288807522]
step  6 :  [-1.1899473007384747]
step  7 :  [-1.0492735402413733]
step  8 :  [-0.8944539827777982]
step  9 :  [-0.7866179628878063]
step  10 :  [-0.6626324996653514]
step  11 :  [-0.5461851323904863]
step  12 :  [-0.44511077923341374]
step  13 :  [-0.3655941015700412]
step  14 :  [-0.27868955462275635]
step  15 :  [-0.17431167210808995]
step  16 :  [-0.051363891106485475]
step  17 :  [-0.023510479252601562]
step  18 :  [-0.012029802705310021]
step  19 :  [-0.026518237525450423]
step  20 :  [-0.0465063660221278]
step  21 :  [-0.04890895581964153]
step  22 :  [-0.02438337743609205]
step  23 :  [-0.05823742423144178]
step  24 :  [-0.050790215727925435]
episode  66 : steps 25 , return [-15.64]
step  0 :  [-1.5731616729195947]
step  1 :  [-1.5276165123919756]
step  2 :  [-1.473254630181361]
step  3 :  [-1.4184800221313973]
step  4 :  [-1.3709437080175304]
step  5 :  [-1.296437189018696]
step  6 :  [-1.196276972733634]
step  7 :  [-1.074254238496894]
step  8 :  [-0.9345421602569824]
step  9 :  [-0.7939609810720966]
step  10 :  [-0.6477652350464586]
step  11 :  [-0.5090877218933823]
step  12 :  [-0.4019833903016575]
step  13 :  [-0.2930691911709453]
step  14 :  [-0.19264701238971965]
step  15 :  [-0.08533840539273177]
step  16 :  [-0.0837749293517186]
step  17 :  [-0.07384578549115]
step  18 :  [-0.035584698475210126]
step  19 :  [-0.03527729284184849]
step  20 :  [-0.027729177175780842]
step  21 :  [-0.025372754031802853]
step  22 :  [-0.05709451089621183]
step  23 :  [-0.04317827546036525]
step  24 :  [-0.03584015709221597]
episode  67 : steps 25 , return [-15.21]
step  0 :  [-1.5102258353493574]
step  1 :  [-1.4760549343157818]
step  2 :  [-1.4378389221721815]
step  3 :  [-1.403641080646815]
step  4 :  [-1.336773663449552]
step  5 :  [-1.2411540335641442]
step  6 :  [-1.1219685418222376]
step  7 :  [-0.9841622660461248]
step  8 :  [-0.8320012731086947]
step  9 :  [-0.6867169883090044]
step  10 :  [-0.5363739263799613]
step  11 :  [-0.3887521607912533]
step  12 :  [-0.26702334001920436]
step  13 :  [-0.1495521451040133]
step  14 :  [-0.04611514817817798]
step  15 :  [-0.034258620061300475]
step  16 :  [-0.05164344407385725]
step  17 :  [-0.016985755097360763]
step  18 :  [-0.039900410467432694]
step  19 :  [-0.03849816878331984]
step  20 :  [-0.010176647312382544]
step  21 :  [-0.05750549089112989]
step  22 :  [-0.06566152938032159]
step  23 :  [-0.04192148375702996]
step  24 :  [-0.018702739391838773]
episode  68 : steps 25 , return [-13.79]
step  0 :  [-1.48033963173135]
step  1 :  [-1.4545031564073063]
step  2 :  [-1.4278890454626953]
step  3 :  [-1.3642737728769823]
step  4 :  [-1.2697595235476369]
step  5 :  [-1.150586949795103]
step  6 :  [-1.0121949091813651]
step  7 :  [-0.8590378080222503]
step  8 :  [-0.738069678998078]
step  9 :  [-0.6064997003886012]
step  10 :  [-0.47075013428216933]
step  11 :  [-0.35873620837127457]
step  12 :  [-0.23819292148986965]
step  13 :  [-0.1249730869247338]
step  14 :  [-0.005645020526203964]
step  15 :  [-0.06434382898019224]
step  16 :  [-0.06746346063289758]
step  17 :  [-0.02612717431592575]
step  18 :  [-0.029881239371336014]
step  19 :  [-0.025940932143133894]
step  20 :  [-0.030519103168517834]
step  21 :  [-0.03459304061771559]
step  22 :  [-0.007160519486019604]
step  23 :  [-0.016257335732753585]
step  24 :  [-0.027429313304578595]
episode  69 : steps 25 , return [-12.89]
step  0 :  [-1.4454872160691572]
step  1 :  [-1.414994364612446]
step  2 :  [-1.382184784042838]
step  3 :  [-1.3144031083186023]
step  4 :  [-1.2169539824003277]
step  5 :  [-1.095621222809427]
step  6 :  [-0.9555633619533623]
step  7 :  [-0.8016795974073105]
step  8 :  [-0.6414471471159555]
step  9 :  [-0.5398565200408293]
step  10 :  [-0.4356108857528839]
step  11 :  [-0.3456617781312283]
step  12 :  [-0.249492377608146]
step  13 :  [-0.14801292660767804]
step  14 :  [-0.049255852482938595]
step  15 :  [-0.02513564474238361]
step  16 :  [-0.03176101567344488]
step  17 :  [-0.01330515043174149]
step  18 :  [-0.06590695232118048]
step  19 :  [-0.08966040089591282]
step  20 :  [-0.12725439570707203]
step  21 :  [-0.13534836590066648]
step  22 :  [-0.11357839253927271]
step  23 :  [-0.09781643195017602]
step  24 :  [-0.04863554366242436]
episode  70 : steps 25 , return [-12.78]
step  0 :  [-1.7681063391190013]
step  1 :  [-1.7347824134305991]
step  2 :  [-1.6966749797778076]
step  3 :  [-1.6608992965140117]
step  4 :  [-1.5917397001232558]
step  5 :  [-1.4937731593356278]
step  6 :  [-1.372362728121343]
step  7 :  [-1.2324359183231308]
step  8 :  [-1.078132752945905]
step  9 :  [-0.9127864397221873]
step  10 :  [-0.7675053088924624]
step  11 :  [-0.6165955207956177]
step  12 :  [-0.4728028400635621]
step  13 :  [-0.36140959972341696]
step  14 :  [-0.2503994062229136]
step  15 :  [-0.15154062444228086]
step  16 :  [-0.05899063163617937]
step  17 :  [-0.034114056824060116]
step  18 :  [-0.04184310963248435]
step  19 :  [-0.004831667575490474]
step  20 :  [-0.015161022562360965]
step  21 :  [-0.022272236553482448]
step  22 :  [-0.0010175368325357102]
step  23 :  [-0.016624361307862046]
step  24 :  [-0.020903946144063466]
episode  71 : steps 25 , return [-17.38]
step  0 :  [-1.535402512306167]
step  1 :  [-1.5005989934925568]
step  2 :  [-1.4613886726653857]
step  3 :  [-1.425773017173706]
step  4 :  [-1.357764106872592]
step  5 :  [-1.2612129515047272]
step  6 :  [-1.141234196270056]
step  7 :  [-1.0027032527446007]
step  8 :  [-0.849807462838913]
step  9 :  [-0.7188746092219829]
step  10 :  [-0.5784366516588361]
step  11 :  [-0.4350657846303257]
step  12 :  [-0.31603590250646413]
step  13 :  [-0.19237412544897187]
step  14 :  [-0.08086170906926601]
step  15 :  [-0.029659374705283768]
step  16 :  [-0.027247150493805813]
step  17 :  [-0.030574847144348057]
step  18 :  [-0.05599088248226401]
step  19 :  [-0.06438646875661819]
step  20 :  [-0.0355571477625091]
step  21 :  [-0.06176393213059753]
step  22 :  [-0.05481758989537047]
step  23 :  [-0.01939830916437279]
step  24 :  [-0.046802313209123106]
episode  72 : steps 25 , return [-14.28]
step  0 :  [-1.6273407601553633]
step  1 :  [-1.5844336425433392]
step  2 :  [-1.5335621574979408]
step  3 :  [-1.4828213099144771]
step  4 :  [-1.4394852488086125]
step  5 :  [-1.3675791074174486]
step  6 :  [-1.2691314937477398]
step  7 :  [-1.1483169696510354]
step  8 :  [-1.0095284778396427]
step  9 :  [-0.8567146066015506]
step  10 :  [-0.7227835467501454]
step  11 :  [-0.579336698938724]
step  12 :  [-0.43275351413528695]
step  13 :  [-0.31117410621960445]
step  14 :  [-0.19885202829929582]
step  15 :  [-0.13746131438290132]
step  16 :  [-0.06730555736140664]
step  17 :  [-0.07291724451925816]
step  18 :  [-0.0485246796359949]
step  19 :  [-0.008919700258968679]
step  20 :  [-0.04453250516932768]
step  21 :  [-0.043093958589927435]
step  22 :  [-0.014413545552492793]
step  23 :  [-0.04066751461028761]
step  24 :  [-0.045579020624434315]
episode  73 : steps 25 , return [-16.09]
step  0 :  [-1.4049185975869434]
step  1 :  [-1.3759389736918883]
step  2 :  [-1.3454377833373614]
step  3 :  [-1.279400358022728]
step  4 :  [-1.1832721244474806]
step  5 :  [-1.0629517084640208]
step  6 :  [-0.923682915663843]
step  7 :  [-0.7975771991488383]
step  8 :  [-0.660622011399972]
step  9 :  [-0.5331738075889735]
step  10 :  [-0.4370605357674526]
step  11 :  [-0.3373095016726026]
step  12 :  [-0.24257600178706]
step  13 :  [-0.13662480739528318]
step  14 :  [-0.08200796039359559]
step  15 :  [-0.02394236046987639]
step  16 :  [-0.064129716517781]
step  17 :  [-0.06182127523005848]
step  18 :  [-0.02216941749950317]
step  19 :  [-0.03349344212932923]
step  20 :  [-0.0025785375051036044]
step  21 :  [-0.021818765556291028]
step  22 :  [-0.0557406956065534]
step  23 :  [-0.057481262790692496]
step  24 :  [-0.017345267707486112]
episode  74 : steps 25 , return [-12.16]
step  0 :  [-1.6027707102704891]
step  1 :  [-1.5575555475908343]
step  2 :  [-1.5035426557868743]
step  3 :  [-1.4490130159915262]
step  4 :  [-1.4014741634529766]
step  5 :  [-1.3267650436551355]
step  6 :  [-1.2263420278574315]
step  7 :  [-1.1040442890066886]
step  8 :  [-0.9640527218420903]
step  9 :  [-0.8101588390009565]
step  10 :  [-0.6692463870337112]
step  11 :  [-0.5350727019756266]
step  12 :  [-0.4318917848107696]
step  13 :  [-0.3237719100467231]
step  14 :  [-0.22236839825158214]
step  15 :  [-0.11154879289352118]
step  16 :  [-0.05841294352309319]
step  17 :  [-0.05660004683838228]
step  18 :  [-0.03328404258709786]
step  19 :  [-0.03086474460139418]
step  20 :  [-0.038327500254277606]
step  21 :  [-0.02487404458900542]
step  22 :  [-0.02384137890158594]
step  23 :  [-0.0735962894905342]
step  24 :  [-0.06985622907713875]
episode  75 : steps 25 , return [-15.65]
step  0 :  [-1.6786326843570094]
step  1 :  [-1.6550712165973864]
step  2 :  [-1.591359857954228]
step  3 :  [-1.4956640222868984]
step  4 :  [-1.4162784034522617]
step  5 :  [-1.3096939125705598]
step  6 :  [-1.181350389161807]
step  7 :  [-1.035998771838575]
step  8 :  [-0.8775389369133644]
step  9 :  [-0.758329504910939]
step  10 :  [-0.6287889658616459]
step  11 :  [-0.49721694773380243]
step  12 :  [-0.3908308218771858]
step  13 :  [-0.2756218510534718]
step  14 :  [-0.1667525266552777]
step  15 :  [-0.12039546264264402]
step  16 :  [-0.06156618147695144]
step  17 :  [-0.04009303447264082]
step  18 :  [-0.060604108331052085]
step  19 :  [-0.04341641661026241]
step  20 :  [-0.018734359250242878]
step  21 :  [-0.014683747816394513]
step  22 :  [-0.04060743171456248]
step  23 :  [-0.03243283365903314]
step  24 :  [-0.040415876533485585]
episode  76 : steps 25 , return [-15.43]
step  0 :  [-1.3961357430383299]
step  1 :  [-1.36736485491888]
step  2 :  [-1.3372016853873347]
step  3 :  [-1.2714342673303947]
step  4 :  [-1.17552012722703]
step  5 :  [-1.0553725447349975]
step  6 :  [-0.9162487509998601]
step  7 :  [-0.7962038298700902]
step  8 :  [-0.6643141628815703]
step  9 :  [-0.5383669277016411]
step  10 :  [-0.4417298398817184]
step  11 :  [-0.34909119266413174]
step  12 :  [-0.23954407349091897]
step  13 :  [-0.12866908704746088]
step  14 :  [-0.045537267023052094]
step  15 :  [-0.03668805093773201]
step  16 :  [-0.03846200366080985]
step  17 :  [-0.04625253377634876]
step  18 :  [-0.04049246834061065]
step  19 :  [-0.049011227357060386]
step  20 :  [-0.07846141909889183]
step  21 :  [-0.056605080035954894]
step  22 :  [-0.08626687448085338]
step  23 :  [-0.09677756910436923]
step  24 :  [-0.07032425732388546]
episode  77 : steps 25 , return [-12.32]
step  0 :  [-1.793386377274503]
step  1 :  [-1.755241861285003]
step  2 :  [-1.710406622590093]
step  3 :  [-1.666211519802533]
step  4 :  [-1.6290751723483727]
step  5 :  [-1.5606115970177996]
step  6 :  [-1.4641719819512584]
step  7 :  [-1.3445841112036616]
step  8 :  [-1.206572691007043]
step  9 :  [-1.0542506261224296]
step  10 :  [-0.8910481157669512]
step  11 :  [-0.7198485504166128]
step  12 :  [-0.5438475978276828]
step  13 :  [-0.3664669772386447]
step  14 :  [-0.22222677874205218]
step  15 :  [-0.10954421230352354]
step  16 :  [-0.03918235697277894]
step  17 :  [-0.033369586283846175]
step  18 :  [-0.07193534952292728]
step  19 :  [-0.05646123558354703]
step  20 :  [-0.024780124196721015]
step  21 :  [-0.03146165622569423]
step  22 :  [-0.013570804574505746]
step  23 :  [-0.0037237183587012232]
step  24 :  [-0.05248627158249602]
episode  78 : steps 25 , return [-18.36]
step  0 :  [-1.5810827226764694]
step  1 :  [-1.539434325126422]
step  2 :  [-1.4905051225175596]
step  3 :  [-1.4425002783887835]
step  4 :  [-1.4027969587726627]
step  5 :  [-1.3337875296907278]
step  6 :  [-1.2376984622823584]
step  7 :  [-1.1189008582399265]
step  8 :  [-0.9819741929752273]
step  9 :  [-0.831077079049428]
step  10 :  [-0.6757436609016338]
step  11 :  [-0.5149513904782588]
step  12 :  [-0.35587638509438213]
step  13 :  [-0.22403038551601567]
step  14 :  [-0.10663928499217229]
step  15 :  [-0.08259468520191703]
step  16 :  [-0.1119412515335687]
step  17 :  [-0.10314941793367928]
step  18 :  [-0.07665230844427906]
step  19 :  [-0.08805445142716874]
step  20 :  [-0.06287422736739376]
step  21 :  [-0.045050742954405865]
step  22 :  [-0.08182606475346524]
step  23 :  [-0.06410305426204226]
step  24 :  [-0.05177587308536252]
episode  79 : steps 25 , return [-15.61]
step  0 :  [-1.6711636216546206]
step  1 :  [-1.6452907994909372]
step  2 :  [-1.6177396564858315]
step  3 :  [-1.552852458322554]
step  4 :  [-1.4570866110692395]
step  5 :  [-1.3367778439502633]
step  6 :  [-1.197364565076713]
step  7 :  [-1.0432581833418444]
step  8 :  [-0.8779354065869805]
step  9 :  [-0.7669199373424184]
step  10 :  [-0.6430880385568455]
step  11 :  [-0.5203220171613558]
step  12 :  [-0.42358318601533196]
step  13 :  [-0.3303624382786014]
step  14 :  [-0.21846517230116264]
step  15 :  [-0.10739344508614962]
step  16 :  [-0.058575138407763926]
step  17 :  [-0.019757141832589278]
step  18 :  [-0.05594424570442444]
step  19 :  [-0.03561856374760526]
step  20 :  [-0.03277726321561728]
step  21 :  [-0.07900229820325079]
step  22 :  [-0.10263637350608913]
step  23 :  [-0.08313289881069737]
step  24 :  [-0.0206276370547775]
episode  80 : steps 25 , return [-15.9]
step  0 :  [-1.4979853611821552]
step  1 :  [-1.4627257441844954]
step  2 :  [-1.4230616026384855]
step  3 :  [-1.3871771831378144]
step  4 :  [-1.3191799969494107]
step  5 :  [-1.222752415941657]
step  6 :  [-1.1029450937631622]
step  7 :  [-0.9646159079421203]
step  8 :  [-0.8119626675569295]
step  9 :  [-0.6630604635560675]
step  10 :  [-0.5149187145368492]
step  11 :  [-0.3774365029695679]
step  12 :  [-0.26773077322845334]
step  13 :  [-0.15949204133162284]
step  14 :  [-0.04173861463008082]
step  15 :  [-0.04991002390831729]
step  16 :  [-0.03780020189840299]
step  17 :  [-0.05161255389267136]
step  18 :  [-0.03297264288012077]
step  19 :  [-0.027089784979123677]
step  20 :  [-0.019229670314834902]
step  21 :  [-0.06232286275480661]
step  22 :  [-0.09503548767142972]
step  23 :  [-0.08728905269875956]
step  24 :  [-0.05602965292805007]
episode  81 : steps 25 , return [-13.74]
step  0 :  [-1.7582439093757882]
step  1 :  [-1.7205629206704645]
step  2 :  [-1.6764855457909147]
step  3 :  [-1.6334181268276118]
step  4 :  [-1.597852911794124]
step  5 :  [-1.5307015112477613]
step  6 :  [-1.4353592118281437]
step  7 :  [-1.3167199188652887]
step  8 :  [-1.1795778493389864]
step  9 :  [-1.0281228660465698]
step  10 :  [-0.8658888456049212]
step  11 :  [-0.6959343920897728]
step  12 :  [-0.5213256993263484]
step  13 :  [-0.34678839946994133]
step  14 :  [-0.2026459600538644]
step  15 :  [-0.08151615762556463]
step  16 :  [-0.010991098611602674]
step  17 :  [-0.01919914200155386]
step  18 :  [-0.027868439762545733]
step  19 :  [-0.018271021830575256]
step  20 :  [-0.05794195144772696]
step  21 :  [-0.05624584715868489]
step  22 :  [-0.024579740007800048]
step  23 :  [-0.08586376883406867]
step  24 :  [-0.11631320743013338]
episode  82 : steps 25 , return [-18.01]
step  0 :  [-1.5818273676444015]
step  1 :  [-1.5385096451400584]
step  2 :  [-1.4872411316369605]
step  3 :  [-1.4363010110121825]
step  4 :  [-1.3931709522431952]
step  5 :  [-1.3217166746829088]
step  6 :  [-1.22378453399784]
step  7 :  [-1.103496566792568]
step  8 :  [-0.965251338865537]
step  9 :  [-0.8130435835089804]
step  10 :  [-0.6621138513380725]
step  11 :  [-0.5106329921143562]
step  12 :  [-0.3893146027686496]
step  13 :  [-0.25854248238489563]
step  14 :  [-0.13908250423236226]
step  15 :  [-0.024046331841870577]
step  16 :  [-0.041237419871690655]
step  17 :  [-0.04558296040996047]
step  18 :  [-0.04626378739565668]
step  19 :  [-0.050221120524243795]
step  20 :  [-0.005453554981574742]
step  21 :  [-0.021916711226959065]
step  22 :  [-0.017502284896980372]
step  23 :  [-0.012458184548125587]
step  24 :  [-0.03041490433083488]
episode  83 : steps 25 , return [-15.12]
step  0 :  [-1.6917623106877402]
step  1 :  [-1.6489241454475048]
step  2 :  [-1.5979139541259908]
step  3 :  [-1.5466067698085155]
step  4 :  [-1.502035343532531]
step  5 :  [-1.4288599630431018]
step  6 :  [-1.3292484187568905]
step  7 :  [-1.2073830741084524]
step  8 :  [-1.067613190375802]
step  9 :  [-0.9138094980342271]
step  10 :  [-0.7708497384883163]
step  11 :  [-0.6220621375244796]
step  12 :  [-0.47597398017542214]
step  13 :  [-0.360005317711366]
step  14 :  [-0.25254163321807493]
step  15 :  [-0.128989697254654]
step  16 :  [-0.07915298350726711]
step  17 :  [-0.04178246248325039]
step  18 :  [-0.06107711540366902]
step  19 :  [-0.030921854447174678]
step  20 :  [-0.03869075940826626]
step  21 :  [-0.020105870153678988]
step  22 :  [-0.07074710097902834]
step  23 :  [-0.13061894197287333]
step  24 :  [-0.14520834028309554]
episode  84 : steps 25 , return [-17.16]
step  0 :  [-1.5668148420611465]
step  1 :  [-1.5206640350325304]
step  2 :  [-1.4654745141686258]
step  3 :  [-1.4096973449762045]
step  4 :  [-1.361045111135746]
step  5 :  [-1.2857988615582816]
step  6 :  [-1.1851211579653176]
step  7 :  [-1.062713041437314]
step  8 :  [-0.922690871598683]
step  9 :  [-0.7950854998385838]
step  10 :  [-0.658908035667687]
step  11 :  [-0.5287263967486436]
step  12 :  [-0.4280805136790544]
step  13 :  [-0.32252551511299016]
step  14 :  [-0.22268505148262852]
step  15 :  [-0.11275613340147983]
step  16 :  [-0.05833679168812662]
step  17 :  [-0.015011645580895674]
step  18 :  [-0.04005446953844106]
step  19 :  [-0.015096633404804119]
step  20 :  [-0.04649576118993974]
step  21 :  [-0.035081085116623535]
step  22 :  [-0.07412014595071578]
step  23 :  [-0.05909792216029608]
step  24 :  [-0.03284084334539445]
episode  85 : steps 25 , return [-15.22]
step  0 :  [-1.588084036371382]
step  1 :  [-1.556386911055818]
step  2 :  [-1.521222813385544]
step  3 :  [-1.4901860667435403]
step  4 :  [-1.4251671410273479]
step  5 :  [-1.3307064253246335]
step  6 :  [-1.2123010774343739]
step  7 :  [-1.075060114165976]
step  8 :  [-0.9233385104607565]
step  9 :  [-0.7607663243252122]
step  10 :  [-0.592179265307408]
step  11 :  [-0.42094350242839734]
step  12 :  [-0.2820235258200504]
step  13 :  [-0.13157730727538303]
step  14 :  [-0.012866191790166964]
step  15 :  [-0.07006864969681216]
step  16 :  [-0.07660902486814153]
step  17 :  [-0.050703753498311674]
step  18 :  [-0.013197295108149218]
step  19 :  [-0.014698042555201931]
step  20 :  [-0.023443462264180745]
step  21 :  [-0.005251296507374908]
step  22 :  [-0.04435393394646207]
step  23 :  [-0.07991767972575116]
step  24 :  [-0.07325842574732316]
episode  86 : steps 25 , return [-14.77]
step  0 :  [-1.5578016643318187]
step  1 :  [-1.513894050226832]
step  2 :  [-1.4618958085696552]
step  3 :  [-1.4102038155079712]
step  4 :  [-1.3664383971372394]
step  5 :  [-1.2947039714110387]
step  6 :  [-1.196662913453148]
step  7 :  [-1.0763548881242775]
step  8 :  [-0.9381447479190842]
step  9 :  [-0.7860692475865849]
step  10 :  [-0.629580491805948]
step  11 :  [-0.47518869690764953]
step  12 :  [-0.3349020589967032]
step  13 :  [-0.22588224175878985]
step  14 :  [-0.12302181884728697]
step  15 :  [-0.07129792581687593]
step  16 :  [-0.0726593153813842]
step  17 :  [-0.06616206066248277]
step  18 :  [-0.02086668326997363]
step  19 :  [-0.04096913872078573]
step  20 :  [-0.042754447815956796]
step  21 :  [-0.0407316900190228]
step  22 :  [-0.06475213812002066]
step  23 :  [-0.04212794381867144]
step  24 :  [-0.00961217243947073]
episode  87 : steps 25 , return [-14.86]
step  0 :  [-1.6892138075691734]
step  1 :  [-1.6622164415438416]
step  2 :  [-1.6330606994696768]
step  3 :  [-1.5670148488093245]
step  4 :  [-1.4704018727457713]
step  5 :  [-1.349467692179398]
step  6 :  [-1.2095916378682363]
step  7 :  [-1.0551470523328503]
step  8 :  [-0.8895884560216321]
step  9 :  [-0.7785986898177436]
step  10 :  [-0.6501152170664259]
step  11 :  [-0.5319340455177167]
step  12 :  [-0.43224006216989763]
step  13 :  [-0.35578471327316874]
step  14 :  [-0.2720469938369201]
step  15 :  [-0.17050375165740958]
step  16 :  [-0.0512392432053502]
step  17 :  [-0.04196244900804817]
step  18 :  [-0.01832845450629159]
step  19 :  [-0.026073575539839737]
step  20 :  [-0.05601708200256401]
step  21 :  [-0.05370758304282214]
step  22 :  [-0.0780997946928131]
step  23 :  [-0.07837799427042656]
step  24 :  [-0.10114348423184895]
episode  88 : steps 25 , return [-16.22]
step  0 :  [-1.6143870138215703]
step  1 :  [-1.569059136053908]
step  2 :  [-1.5148439744159823]
step  3 :  [-1.4599850750687975]
step  4 :  [-1.4119488647429512]
step  5 :  [-1.3368145530807953]
step  6 :  [-1.2360379106808084]
step  7 :  [-1.1134419836755043]
step  8 :  [-0.9731875437705062]
step  9 :  [-0.8190423396681504]
step  10 :  [-0.6958210518024017]
step  11 :  [-0.5724900778582628]
step  12 :  [-0.456407358313883]
step  13 :  [-0.36176102101513335]
step  14 :  [-0.26333177994639023]
step  15 :  [-0.1532369777167064]
step  16 :  [-0.045827706954350456]
step  17 :  [-0.020881116179304382]
step  18 :  [-0.041762392259527874]
step  19 :  [-0.038087090837731215]
step  20 :  [-0.05090011142399787]
step  21 :  [-0.017872570382029985]
step  22 :  [-0.04166565033700007]
step  23 :  [-0.02786369070392241]
step  24 :  [-0.04324535032158118]
episode  89 : steps 25 , return [-15.88]
step  0 :  [-1.7739618431647457]
step  1 :  [-1.7335832381480083]
step  2 :  [-1.685717514077967]
step  3 :  [-1.637869997350103]
step  4 :  [-1.5966572340646596]
step  5 :  [-1.5253974513518094]
step  6 :  [-1.4269375701488778]
step  7 :  [-1.3058030352847674]
step  8 :  [-1.1665238143720595]
step  9 :  [-1.0130697841463265]
step  10 :  [-0.8487397905817002]
step  11 :  [-0.7019597840129121]
step  12 :  [-0.5486880260692103]
step  13 :  [-0.39546264027570194]
step  14 :  [-0.2692141914504932]
step  15 :  [-0.15160817425581605]
step  16 :  [-0.09166952837614761]
step  17 :  [-0.018007685406600166]
step  18 :  [-0.042731236820252566]
step  19 :  [-0.06442773603053659]
step  20 :  [-0.05681141738384725]
step  21 :  [-0.02319566785449414]
step  22 :  [-0.04944079933710336]
step  23 :  [-0.051616564192452655]
step  24 :  [-0.029899214026385477]
episode  90 : steps 25 , return [-18.21]
step  0 :  [-1.595947369753485]
step  1 :  [-1.565119323764842]
step  2 :  [-1.5311147114938848]
step  3 :  [-1.462030231624295]
step  4 :  [-1.3634466464149386]
step  5 :  [-1.241220630921996]
step  6 :  [-1.1005236288719848]
step  7 :  [-0.9456273123399561]
step  8 :  [-0.7935874426668649]
step  9 :  [-0.6291466985682255]
step  10 :  [-0.5361330061180308]
step  11 :  [-0.44840453646314027]
step  12 :  [-0.37440154321530883]
step  13 :  [-0.28929950387821046]
step  14 :  [-0.2084755186281925]
step  15 :  [-0.12524548777313604]
step  16 :  [-0.07431476490588493]
step  17 :  [-0.09340119958970744]
step  18 :  [-0.08425107216697136]
step  19 :  [-0.042179532684477564]
step  20 :  [-0.011425098871970836]
step  21 :  [-0.02753941415560453]
step  22 :  [-0.05212935722849698]
step  23 :  [-0.05813063599799044]
step  24 :  [-0.02275412511911387]
episode  91 : steps 25 , return [-14.68]
step  0 :  [-1.7633459222399954]
step  1 :  [-1.7300993471577915]
step  2 :  [-1.6921148419111989]
step  3 :  [-1.6565165415897696]
step  4 :  [-1.5874994589626643]
step  5 :  [-1.489645848657134]
step  6 :  [-1.3683254827828792]
step  7 :  [-1.2284718945124098]
step  8 :  [-1.0742302684618332]
step  9 :  [-0.9089386147405774]
step  10 :  [-0.7654356465901757]
step  11 :  [-0.6160404061636492]
step  12 :  [-0.4724263680249843]
step  13 :  [-0.36039399306658726]
step  14 :  [-0.24753949702118808]
step  15 :  [-0.1464264136175058]
step  16 :  [-0.05143952571697997]
step  17 :  [-0.03488689887013413]
step  18 :  [-0.04156256213099431]
step  19 :  [-0.01401040005841435]
step  20 :  [-0.01711415455660868]
step  21 :  [-0.027359251298208202]
step  22 :  [-0.010935310360663208]
step  23 :  [-0.04221067477228317]
step  24 :  [-0.03817042823427051]
episode  92 : steps 25 , return [-17.39]
step  0 :  [-1.5796013746551862]
step  1 :  [-1.5508896727989199]
step  2 :  [-1.5198594754246626]
step  3 :  [-1.4528438107684025]
step  4 :  [-1.3557075975018786]
step  5 :  [-1.2344825400405868]
step  6 :  [-1.0944424706351397]
step  7 :  [-0.939907027844683]
step  8 :  [-0.7886284858859901]
step  9 :  [-0.6296065809813838]
step  10 :  [-0.4977011344312784]
step  11 :  [-0.40776086253228844]
step  12 :  [-0.3218915492616584]
step  13 :  [-0.22468040091188224]
step  14 :  [-0.11850382153592834]
step  15 :  [-0.07121058665410628]
step  16 :  [-0.03256667311123474]
step  17 :  [-0.0345527944193668]
step  18 :  [-0.009033940632410628]
step  19 :  [-0.012341810401205668]
step  20 :  [-0.03019829768474594]
step  21 :  [-0.018526904684836087]
step  22 :  [-0.04261398618241867]
step  23 :  [-0.02638996408987238]
step  24 :  [-0.04962575845948376]
episode  93 : steps 25 , return [-14.04]
step  0 :  [-1.6273317361168336]
step  1 :  [-1.5895456428898822]
step  2 :  [-1.5458065111162336]
step  3 :  [-1.5039487918061742]
step  4 :  [-1.4311303166814027]
step  5 :  [-1.3308455222728268]
step  6 :  [-1.2078973767100172]
step  7 :  [-1.066908681962586]
step  8 :  [-0.9118447935446686]
step  9 :  [-0.7879867173468186]
step  10 :  [-0.650650883564321]
step  11 :  [-0.5306603069913896]
step  12 :  [-0.44481576983400867]
step  13 :  [-0.3605361131363056]
step  14 :  [-0.2658953501346551]
step  15 :  [-0.16515505624732776]
step  16 :  [-0.04988878063603733]
step  17 :  [-0.042504463179462]
step  18 :  [-0.02250437344585241]
step  19 :  [-0.039256312727197186]
step  20 :  [-0.036847910278146025]
step  21 :  [-0.041560291764145704]
step  22 :  [-0.029396439685064984]
step  23 :  [-0.024868433068100233]
step  24 :  [-0.018828884881557612]
episode  94 : steps 25 , return [-15.73]
step  0 :  [-1.553943541345675]
step  1 :  [-1.506544383916638]
step  2 :  [-1.4496447389320186]
step  3 :  [-1.3917893624745743]
step  4 :  [-1.3408154141554716]
step  5 :  [-1.2640339135161907]
step  6 :  [-1.162287953993853]
step  7 :  [-1.0390915228763438]
step  8 :  [-0.8984438747503705]
step  9 :  [-0.7974622936109301]
step  10 :  [-0.6810149834159447]
step  11 :  [-0.567828694384468]
step  12 :  [-0.46530546157394626]
step  13 :  [-0.38190681505201285]
step  14 :  [-0.2911281663809176]
step  15 :  [-0.18422133587891348]
step  16 :  [-0.09192272777882314]
step  17 :  [-0.051181346190765906]
step  18 :  [-0.010941266750015197]
step  19 :  [-0.04394652803573636]
step  20 :  [-0.04996998455603724]
step  21 :  [-0.029902918968164063]
step  22 :  [-0.015406069322465967]
step  23 :  [-0.0412460836818927]
step  24 :  [-0.0517082024106722]
episode  95 : steps 25 , return [-15.36]
step  0 :  [-1.6113053201065821]
step  1 :  [-1.5743869943894617]
step  2 :  [-1.5319161068254483]
step  3 :  [-1.4917344888107076]
step  4 :  [-1.420149899522555]
step  5 :  [-1.3207817672312219]
step  6 :  [-1.1985238421095024]
step  7 :  [-1.0580621060280844]
step  8 :  [-0.9034058588680559]
step  9 :  [-0.7852788334410512]
step  10 :  [-0.6544074935209794]
step  11 :  [-0.5312683923229405]
step  12 :  [-0.4250796621603174]
step  13 :  [-0.34259003491930695]
step  14 :  [-0.2543138516742995]
step  15 :  [-0.14968797394481045]
step  16 :  [-0.031097821814015606]
step  17 :  [-0.04823375398406422]
step  18 :  [-0.04174886070816711]
step  19 :  [-0.06400975196794574]
step  20 :  [-0.07596643224941269]
step  21 :  [-0.04570531752320121]
step  22 :  [-0.013937911908945621]
step  23 :  [-0.023848899022659114]
step  24 :  [-0.0122944455489332]
episode  96 : steps 25 , return [-15.61]
step  0 :  [-1.8499020462113334]
step  1 :  [-1.811804343872719]
step  2 :  [-1.7668555648493882]
step  3 :  [-1.7222302089284625]
step  4 :  [-1.684185679558235]
step  5 :  [-1.6147914184519567]
step  6 :  [-1.517494823193648]
step  7 :  [-1.3971296383642575]
step  8 :  [-1.2583920514062648]
step  9 :  [-1.1053465841967693]
step  10 :  [-0.9413482314506645]
step  11 :  [-0.7691386787125863]
step  12 :  [-0.5945544192618618]
step  13 :  [-0.4207449409442782]
step  14 :  [-0.2807693649080446]
step  15 :  [-0.1619999034835169]
step  16 :  [-0.08524388373883247]
step  17 :  [-0.036338962436998516]
step  18 :  [-0.02646295599562472]
step  19 :  [-0.008928164593276552]
step  20 :  [-0.05272211671119325]
step  21 :  [-0.03947982883286652]
step  22 :  [-0.03848975723821502]
step  23 :  [-0.04052443905970835]
step  24 :  [-0.027463520069506794]
episode  97 : steps 25 , return [-19.25]
step  0 :  [-1.4674546199029586]
step  1 :  [-1.4370921682806372]
step  2 :  [-1.404344883129579]
step  3 :  [-1.3365263435416657]
step  4 :  [-1.2390120343034077]
step  5 :  [-1.1176128021817773]
step  6 :  [-0.9774975872918636]
step  7 :  [-0.8229339381496299]
step  8 :  [-0.7878399987416032]
step  9 :  [-0.7162476541350487]
step  10 :  [-0.6373408943142105]
step  11 :  [-0.5545848087098021]
step  12 :  [-0.4821481400389586]
step  13 :  [-0.4010971664975091]
step  14 :  [-0.31288316307061587]
step  15 :  [-0.20766210852352665]
step  16 :  [-0.12466574692664169]
step  17 :  [-0.08592692896188993]
step  18 :  [-0.04401270883509965]
step  19 :  [-0.03718028668798749]
step  20 :  [-0.003586763798161764]
step  21 :  [-0.06890303419948261]
step  22 :  [-0.07379658184132275]
step  23 :  [-0.06354395580626603]
step  24 :  [-0.03274513730882053]
episode  98 : steps 25 , return [-14.44]
step  0 :  [-1.6236253966115723]
step  1 :  [-1.5863539122445056]
step  2 :  [-1.5433432645241425]
step  3 :  [-1.5024117167146145]
step  4 :  [-1.4302508275672614]
step  5 :  [-1.330441574528551]
step  6 :  [-1.2078432835691035]
step  7 :  [-1.0671152311350987]
step  8 :  [-0.912246401322825]
step  9 :  [-0.7872048405036743]
step  10 :  [-0.6496450903606444]
step  11 :  [-0.5258430568065469]
step  12 :  [-0.43505257670867586]
step  13 :  [-0.3432289821841986]
step  14 :  [-0.25552577063702103]
step  15 :  [-0.15543619288774382]
step  16 :  [-0.04307233145000043]
step  17 :  [-0.037735808267137516]
step  18 :  [-0.0471031973387575]
step  19 :  [-0.006072656784618665]
step  20 :  [-0.06340165425721356]
step  21 :  [-0.06967274490878177]
step  22 :  [-0.07095408801734482]
step  23 :  [-0.06434465352562246]
step  24 :  [-0.03797359372888911]
episode  99 : steps 25 , return [-15.8]
step  0 :  [-1.7032138647783615]
step  1 :  [-1.666527724247859]
step  2 :  [-1.6240204019624596]
step  3 :  [-1.583209631754975]
step  4 :  [-1.5107969772327166]
step  5 :  [-1.4106358284557907]
step  6 :  [-1.2876899247224565]
step  7 :  [-1.1466563034997332]
step  8 :  [-0.9915359163026611]
step  9 :  [-0.8255749178903987]
step  10 :  [-0.7774652378112764]
step  11 :  [-0.6982960494433831]
step  12 :  [-0.6125037883697904]
step  13 :  [-0.5249588890970427]
step  14 :  [-0.44888581004430766]
step  15 :  [-0.36803717194977054]
step  16 :  [-0.2810080091616072]
step  17 :  [-0.1773092785513069]
step  18 :  [-0.05743776591293894]
step  19 :  [-0.028084653921074346]
step  20 :  [-0.043135226301157216]
step  21 :  [-0.020690581700369325]
step  22 :  [-0.03871323146569191]
step  23 :  [-0.05284882807526366]
step  24 :  [-0.019046000784570825]
episode  100 : steps 25 , return [-17.9]
step  0 :  [-1.616402757826464]
step  1 :  [-1.5926166034249194]
step  2 :  [-1.5288484268545675]
step  3 :  [-1.4331511920862992]
step  4 :  [-1.3126387587636177]
step  5 :  [-1.173163542940202]
step  6 :  [-1.060707125469366]
step  7 :  [-0.928514730639109]
step  8 :  [-0.8063325981388971]
step  9 :  [-0.6957044543636798]
step  10 :  [-0.5914825795661148]
step  11 :  [-0.5132227133507529]
step  12 :  [-0.42383273685839845]
step  13 :  [-0.33430370568878687]
step  14 :  [-0.23242957353719854]
step  15 :  [-0.13018583553741883]
step  16 :  [-0.04112483126824658]
step  17 :  [-0.05328198512445243]
step  18 :  [-0.05852645155467466]
step  19 :  [-0.04875101427010646]
step  20 :  [-0.05144158285607687]
step  21 :  [-0.013947696697949695]
step  22 :  [-0.027762587887317156]
step  23 :  [-0.03345890509652043]
step  24 :  [-0.030439020353047772]
episode  101 : steps 25 , return [-14.73]
step  0 :  [-1.5476596993682934]
step  1 :  [-1.5178459191831812]
step  2 :  [-1.4854533008895607]
step  3 :  [-1.4176071901878498]
step  4 :  [-1.3199415677813482]
step  5 :  [-1.198370114346462]
step  6 :  [-1.058104137783168]
step  7 :  [-0.9034311597780587]
step  8 :  [-0.7894327323147644]
step  9 :  [-0.6574924890627065]
step  10 :  [-0.5453252187304612]
step  11 :  [-0.4589821741322366]
step  12 :  [-0.3956838419850896]
step  13 :  [-0.3223636704217151]
step  14 :  [-0.2287117053982084]
step  15 :  [-0.11535566990160966]
step  16 :  [-0.03801124892298454]
step  17 :  [-0.03368956874073882]
step  18 :  [-0.03526141528047886]
step  19 :  [-0.04787267105340194]
step  20 :  [-0.07515705911969521]
step  21 :  [-0.07206350747447587]
step  22 :  [-0.04592725415397111]
step  23 :  [-0.06237107739314525]
step  24 :  [-0.0357402063287178]
episode  102 : steps 25 , return [-14.41]
step  0 :  [-1.5718878396184288]
step  1 :  [-1.536883252221212]
step  2 :  [-1.497229758911704]
step  3 :  [-1.4607993931320988]
step  4 :  [-1.3920290167862446]
step  5 :  [-1.2948095011287635]
step  6 :  [-1.1742418005467605]
step  7 :  [-1.035168538344657]
step  8 :  [-0.8817297394609854]
step  9 :  [-0.7560579985377875]
step  10 :  [-0.6207158848426161]
step  11 :  [-0.48250691186467337]
step  12 :  [-0.3699533078007208]
step  13 :  [-0.2485931837910266]
step  14 :  [-0.1352177875528339]
step  15 :  [-0.085918371779589]
step  16 :  [-0.0326879677037239]
step  17 :  [-0.01651832011404691]
step  18 :  [-0.03416935192748162]
step  19 :  [-0.02901037875662898]
step  20 :  [-0.019385555317953867]
step  21 :  [-0.0020039060886189817]
step  22 :  [-0.03390866909455609]
step  23 :  [-0.01479054471441012]
step  24 :  [-0.03625736678387238]
episode  103 : steps 25 , return [-14.76]
step  0 :  [-1.6417732901360997]
step  1 :  [-1.6141777470073575]
step  2 :  [-1.5844008700748917]
step  3 :  [-1.5180601986668008]
step  4 :  [-1.4213057742377808]
step  5 :  [-1.3003047059705364]
step  6 :  [-1.160398539851263]
step  7 :  [-1.0059417237280246]
step  8 :  [-0.8403790585589432]
step  9 :  [-0.7755798970499218]
step  10 :  [-0.6850157036178526]
step  11 :  [-0.590380483179158]
step  12 :  [-0.4976135128490286]
step  13 :  [-0.4183861978472997]
step  14 :  [-0.33021389056214784]
step  15 :  [-0.2375034869782429]
step  16 :  [-0.13626734946589844]
step  17 :  [-0.07881096464143778]
step  18 :  [-0.049828933709408205]
step  19 :  [-0.031145556826212166]
step  20 :  [-0.038714226898348594]
step  21 :  [-0.023549400612787808]
step  22 :  [-0.03260123584265392]
step  23 :  [-0.019673193728048207]
step  24 :  [-0.04191272336406965]
episode  104 : steps 25 , return [-16.07]
step  0 :  [-1.4687945205170343]
step  1 :  [-1.4305581481032488]
step  2 :  [-1.386898846086976]
step  3 :  [-1.346305923377848]
step  4 :  [-1.275157642722717]
step  5 :  [-1.1764945559493]
step  6 :  [-1.0549944306807015]
step  7 :  [-0.915277036052206]
step  8 :  [-0.7958414395439178]
step  9 :  [-0.6652899809350092]
step  10 :  [-0.539962413493417]
step  11 :  [-0.42907318683143303]
step  12 :  [-0.3413776272687076]
step  13 :  [-0.24866036263471974]
step  14 :  [-0.14037404865961217]
step  15 :  [-0.015816932443577066]
step  16 :  [-0.045194460619396824]
step  17 :  [-0.05148251338082696]
step  18 :  [-0.01840993441885659]
step  19 :  [-0.05740528104269443]
step  20 :  [-0.05740491395944163]
step  21 :  [-0.09763214227496257]
step  22 :  [-0.09385044647487402]
step  23 :  [-0.054561908527068256]
step  24 :  [-0.046933404216772404]
episode  105 : steps 25 , return [-13.75]
step  0 :  [-1.767092428740826]
step  1 :  [-1.7287268889447907]
step  2 :  [-1.683672863866387]
step  3 :  [-1.639348803872578]
step  4 :  [-1.5642846318017383]
step  5 :  [-1.4621610894961246]
step  6 :  [-1.3377934585024667]
step  7 :  [-1.195774776044696]
step  8 :  [-1.040048289283936]
step  9 :  [-0.8738555483625677]
step  10 :  [-0.8292398501678213]
step  11 :  [-0.8630644023384215]
step  12 :  [-0.8630620833762433]
step  13 :  [-0.8213024519509254]
step  14 :  [-0.7480462344992228]
step  15 :  [-0.6535688081557356]
step  16 :  [-0.5490136767931353]
step  17 :  [-0.44953632031439483]
step  18 :  [-0.3553217282945073]
step  19 :  [-0.25017695586098715]
step  20 :  [-0.1794140657197321]
step  21 :  [-0.14105509855809695]
step  22 :  [-0.12807499162875755]
step  23 :  [-0.09496940443403759]
step  24 :  [-0.06374380095853045]
episode  106 : steps 25 , return [-21.28]
step  0 :  [-1.6847883897713682]
step  1 :  [-1.658694128151382]
step  2 :  [-1.6307861810197664]
step  3 :  [-1.5656136220738524]
step  4 :  [-1.469624684674927]
step  5 :  [-1.349142496875942]
step  6 :  [-1.2095944940389252]
step  7 :  [-1.0553835922034176]
step  8 :  [-0.8899803555816463]
step  9 :  [-0.7730442865657555]
step  10 :  [-0.6432004906239434]
step  11 :  [-0.5186228200875095]
step  12 :  [-0.4227924120372693]
step  13 :  [-0.3208181585645459]
step  14 :  [-0.22344692145514086]
step  15 :  [-0.11506598521615452]
step  16 :  [-0.06299464868094622]
step  17 :  [-0.06271741472387656]
step  18 :  [-0.05190644673983486]
step  19 :  [-0.05344619845554518]
step  20 :  [-0.071901251312339]
step  21 :  [-0.063610432245217]
step  22 :  [-0.01676163475723489]
step  23 :  [-0.02229499842010008]
step  24 :  [-0.01834662304686443]
episode  107 : steps 25 , return [-15.95]
step  0 :  [-1.5671238450765148]
step  1 :  [-1.5418916818433113]
step  2 :  [-1.4772796497410208]
step  3 :  [-1.420744591387245]
step  4 :  [-1.3325448998754656]
step  5 :  [-1.218588880881261]
step  6 :  [-1.0843270887217047]
step  7 :  [-0.93433580906464]
step  8 :  [-0.7826723460431056]
step  9 :  [-0.6265797056272914]
step  10 :  [-0.4793393742265927]
step  11 :  [-0.3660965687398009]
step  12 :  [-0.2605814306138016]
step  13 :  [-0.14439570643219685]
step  14 :  [-0.0323339606008658]
step  15 :  [-0.027428765245945754]
step  16 :  [-0.03181515603432416]
step  17 :  [-0.015211359572491662]
step  18 :  [-0.010231570502256992]
step  19 :  [-0.024304932533918855]
step  20 :  [-0.01423032307537003]
step  21 :  [-0.007501997642025065]
step  22 :  [-0.02749806057301576]
step  23 :  [-0.006010427421222047]
step  24 :  [-0.03500475320071769]
episode  108 : steps 25 , return [-13.47]
step  0 :  [-1.6554095589837425]
step  1 :  [-1.6246713770335988]
step  2 :  [-1.5905382928691891]
step  3 :  [-1.5212013752604727]
step  4 :  [-1.4223711065848152]
step  5 :  [-1.299950253171781]
step  6 :  [-1.1591275494232975]
step  7 :  [-1.004185119325157]
step  8 :  [-0.8385736141794813]
step  9 :  [-0.8293421402192936]
step  10 :  [-0.8915781478301131]
step  11 :  [-0.9072484853090185]
step  12 :  [-0.8740267225644033]
step  13 :  [-0.8037825397587465]
step  14 :  [-0.7069375312540568]
step  15 :  [-0.5931613772872578]
step  16 :  [-0.473516712132511]
step  17 :  [-0.3630788440093367]
step  18 :  [-0.2487886544350566]
step  19 :  [-0.1295336494004177]
step  20 :  [-0.01796697287211218]
step  21 :  [-0.0758235059430439]
step  22 :  [-0.07642966518239085]
step  23 :  [-0.07374165363033507]
step  24 :  [-0.05062331911212304]
episode  109 : steps 25 , return [-19.23]
step  0 :  [-1.597318708037643]
step  1 :  [-1.554443264606379]
step  2 :  [-1.5037324662078155]
step  3 :  [-1.453388053938352]
step  4 :  [-1.4108006770873747]
step  5 :  [-1.3396248064303555]
step  6 :  [-1.241838030450591]
step  7 :  [-1.1216245013734214]
step  8 :  [-0.9834116392516137]
step  9 :  [-0.8312041962108391]
step  10 :  [-0.6862651915069248]
step  11 :  [-0.5369877377241198]
step  12 :  [-0.3914397686645778]
step  13 :  [-0.2716465659548588]
step  14 :  [-0.1551502006776824]
step  15 :  [-0.11193392917681148]
step  16 :  [-0.05454054754671176]
step  17 :  [-0.016671080035067495]
step  18 :  [-0.039312272973105016]
step  19 :  [-0.06817872946861522]
step  20 :  [-0.07530395448103933]
step  21 :  [-0.04933907389039198]
step  22 :  [-0.03698486019673551]
step  23 :  [-0.07170582039540714]
step  24 :  [-0.06676275352621489]
episode  110 : steps 25 , return [-15.67]
step  0 :  [-1.6788830695793004]
step  1 :  [-1.652370563809251]
step  2 :  [-1.623916991060879]
step  3 :  [-1.5583834358685682]
step  4 :  [-1.4621463266444499]
step  5 :  [-1.3414887273707123]
step  6 :  [-1.2018146974724047]
step  7 :  [-1.0475131641912336]
step  8 :  [-0.8820465940368689]
step  9 :  [-0.774854392624006]
step  10 :  [-0.6519291232389468]
step  11 :  [-0.5335895073582815]
step  12 :  [-0.4286511682133331]
step  13 :  [-0.3452765990126195]
step  14 :  [-0.2552872568860525]
step  15 :  [-0.14860473792108045]
step  16 :  [-0.023937790028888486]
step  17 :  [-0.03199621099659996]
step  18 :  [-0.04050470225406381]
step  19 :  [-0.012856870340963394]
step  20 :  [-0.03216137377783277]
step  21 :  [-0.06135265481847059]
step  22 :  [-0.07940526202171044]
step  23 :  [-0.05114609793046189]
step  24 :  [-0.07943152365713886]
episode  111 : steps 25 , return [-16.]
step  0 :  [-1.550078307997193]
step  1 :  [-1.5190921622505853]
step  2 :  [-1.485078158898644]
step  3 :  [-1.4161252042311336]
step  4 :  [-1.3176955169563964]
step  5 :  [-1.1956012284894992]
step  6 :  [-1.054996032327954]
step  7 :  [-0.9001416353948759]
step  8 :  [-0.7917996929519722]
step  9 :  [-0.6618695460724946]
step  10 :  [-0.5588507304711373]
step  11 :  [-0.4915360448792162]
step  12 :  [-0.4221206169127861]
step  13 :  [-0.3420183638795945]
step  14 :  [-0.2509997897342416]
step  15 :  [-0.14183386786558888]
step  16 :  [-0.0631065447048622]
step  17 :  [-0.025192725942367402]
step  18 :  [-0.031507130058630324]
step  19 :  [-0.046415848144540965]
step  20 :  [-0.020980573058134378]
step  21 :  [-0.052245142154019444]
step  22 :  [-0.03676903039875599]
step  23 :  [-0.038364239460772206]
step  24 :  [-0.05376294117029692]
episode  112 : steps 25 , return [-14.47]
step  0 :  [-1.5666348421940344]
step  1 :  [-1.5390001290529127]
step  2 :  [-1.5095026740428834]
step  3 :  [-1.4435814782985148]
step  4 :  [-1.34723801226131]
step  5 :  [-1.2265928918880713]
step  6 :  [-1.0869769310981738]
step  7 :  [-0.9327449263991147]
step  8 :  [-0.7865447401327099]
step  9 :  [-0.6330845497396458]
step  10 :  [-0.49654944379948296]
step  11 :  [-0.39697885102021513]
step  12 :  [-0.3023630549867099]
step  13 :  [-0.201601859007648]
step  14 :  [-0.08719300600583237]
step  15 :  [-0.039533496783131776]
step  16 :  [-0.03882134144216058]
step  17 :  [-0.051699684424153305]
step  18 :  [-0.04317839985991663]
step  19 :  [-0.026214392875188935]
step  20 :  [-0.04498579476462415]
step  21 :  [-0.020601742455899037]
step  22 :  [-0.040826392396910396]
step  23 :  [-0.032627158243473335]
step  24 :  [-0.043694604189351297]
episode  113 : steps 25 , return [-13.94]
step  0 :  [-1.4640014922038727]
step  1 :  [-1.4360659465031291]
step  2 :  [-1.406668489525926]
step  3 :  [-1.3411689512353002]
step  4 :  [-1.2453099295282657]
step  5 :  [-1.125124401383804]
step  6 :  [-0.9859199482616313]
step  7 :  [-0.8320541385706768]
step  8 :  [-0.7361075902719627]
step  9 :  [-0.6284873012821494]
step  10 :  [-0.5156548778524914]
step  11 :  [-0.42126669647214177]
step  12 :  [-0.31689538126130357]
step  13 :  [-0.2137529656988958]
step  14 :  [-0.09986142538934853]
step  15 :  [-0.05773019405536088]
step  16 :  [-0.05441707414885672]
step  17 :  [-0.015083660410798802]
step  18 :  [-0.05263961980658503]
step  19 :  [-0.07274917370645766]
step  20 :  [-0.04339462231918336]
step  21 :  [-0.04990681309425313]
step  22 :  [-0.03860746341061218]
step  23 :  [-0.05463540624251985]
step  24 :  [-0.07530873014358772]
episode  114 : steps 25 , return [-13.28]
step  0 :  [-1.683181832057464]
step  1 :  [-1.653648635384161]
step  2 :  [-1.621054273801527]
step  3 :  [-1.5526797700373332]
step  4 :  [-1.4544645705605663]
step  5 :  [-1.3324313056807933]
step  6 :  [-1.1918306060650812]
step  7 :  [-1.036970026154218]
step  8 :  [-0.8712928774583909]
step  9 :  [-0.7835201909613214]
step  10 :  [-0.6674718518967]
step  11 :  [-0.5733558788077977]
step  12 :  [-0.5108813681131619]
step  13 :  [-0.44261457885423355]
step  14 :  [-0.37011627826676713]
step  15 :  [-0.27910670327879483]
step  16 :  [-0.1678023943361987]
step  17 :  [-0.04532348374657331]
step  18 :  [-0.018374236629904728]
step  19 :  [-0.09982627157169095]
step  20 :  [-0.11461707531899318]
step  21 :  [-0.08187443121146502]
step  22 :  [-0.03770675800978316]
step  23 :  [-0.027745630594080167]
step  24 :  [-0.011889875640828558]
episode  115 : steps 25 , return [-16.63]
step  0 :  [-1.742804791656193]
step  1 :  [-1.709161551641438]
step  2 :  [-1.6707049385212134]
step  3 :  [-1.6346451153643273]
step  4 :  [-1.5653836993893622]
step  5 :  [-1.467395448300698]
step  6 :  [-1.3459983737105654]
step  7 :  [-1.2060999170063378]
step  8 :  [-1.0518315721520752]
step  9 :  [-0.8865240149825673]
step  10 :  [-0.759943395777505]
step  11 :  [-0.6244642427933145]
step  12 :  [-0.49023770451295073]
step  13 :  [-0.36933017260451423]
step  14 :  [-0.27381423189420484]
step  15 :  [-0.17665679620259286]
step  16 :  [-0.07076597628531027]
step  17 :  [-0.00839391687820505]
step  18 :  [-0.06477653011606527]
step  19 :  [-0.08514576752963873]
step  20 :  [-0.06098449393594819]
step  21 :  [-0.040955327971373204]
step  22 :  [-0.025631507747276846]
step  23 :  [-0.06009784706517139]
step  24 :  [-0.04225863990451137]
episode  116 : steps 25 , return [-17.43]
step  0 :  [-1.7079515591688428]
step  1 :  [-1.6705647477857761]
step  2 :  [-1.627071197731049]
step  3 :  [-1.5850139986040352]
step  4 :  [-1.5117229003346078]
step  5 :  [-1.4109347491535065]
step  6 :  [-1.2875386165559455]
step  7 :  [-1.1461847728125079]
step  8 :  [-0.9908466212899093]
step  9 :  [-0.8247586555766596]
step  10 :  [-0.7798701301894881]
step  11 :  [-0.6998663765783621]
step  12 :  [-0.6183714409169444]
step  13 :  [-0.5380905642427447]
step  14 :  [-0.4690348611110191]
step  15 :  [-0.3888833335786847]
step  16 :  [-0.29965390209697096]
step  17 :  [-0.19819492207983916]
step  18 :  [-0.07971168342461855]
step  19 :  [-0.05121024338500265]
step  20 :  [-0.05880244654270686]
step  21 :  [-0.02982851518569862]
step  22 :  [-0.058837169226027095]
step  23 :  [-0.09232810579887446]
step  24 :  [-0.10263610113003807]
episode  117 : steps 25 , return [-18.23]
step  0 :  [-1.6265727353407746]
step  1 :  [-1.5989051035513313]
step  2 :  [-1.569094583145293]
step  3 :  [-1.502774789103257]
step  4 :  [-1.4060569842171364]
step  5 :  [-1.2850932771307797]
step  6 :  [-1.1452194138474359]
step  7 :  [-0.9907874996346746]
step  8 :  [-0.8252408750084573]
step  9 :  [-0.7648783803430536]
step  10 :  [-0.6827564270473493]
step  11 :  [-0.5925147272809542]
step  12 :  [-0.5014220404612051]
step  13 :  [-0.421242125430431]
step  14 :  [-0.33145589893039207]
step  15 :  [-0.23660427946796692]
step  16 :  [-0.13280539328973434]
step  17 :  [-0.074302206080771]
step  18 :  [-0.042164729804211216]
step  19 :  [-0.0274639634597152]
step  20 :  [-0.03773118514190292]
step  21 :  [-0.05796480496800995]
step  22 :  [-0.07243234666945829]
step  23 :  [-0.053455160489836444]
step  24 :  [-0.03937940615915261]
episode  118 : steps 25 , return [-16.02]
step  0 :  [-1.472114243980838]
step  1 :  [-1.4376247563940796]
step  2 :  [-1.3991564480206427]
step  3 :  [-1.3649558822741177]
step  4 :  [-1.2983025077611872]
step  5 :  [-1.2029698546912164]
step  6 :  [-1.0840999979718544]
step  7 :  [-0.9466388155608687]
step  8 :  [-0.7948862196799237]
step  9 :  [-0.6374773469170407]
step  10 :  [-0.47955059131663996]
step  11 :  [-0.35252982846056413]
step  12 :  [-0.2401677120807137]
step  13 :  [-0.10925480528183364]
step  14 :  [-0.04519669160137138]
step  15 :  [-0.05539509617735934]
step  16 :  [-0.0246178756106257]
step  17 :  [-0.045509131418285005]
step  18 :  [-0.0392254884599123]
step  19 :  [-0.029371286559502274]
step  20 :  [-0.037695872212921054]
step  21 :  [-0.09639587338701879]
step  22 :  [-0.1315385531511131]
step  23 :  [-0.11885565610292198]
step  24 :  [-0.06258390796384844]
episode  119 : steps 25 , return [-13.51]
step  0 :  [-1.5334313819863303]
step  1 :  [-1.5031056322716074]
step  2 :  [-1.4700778123440088]
step  3 :  [-1.401845176758137]
step  4 :  [-1.3039342901931394]
step  5 :  [-1.182204062213159]
step  6 :  [-1.0418371358824123]
step  7 :  [-0.8871070596392769]
step  8 :  [-0.789831313703834]
step  9 :  [-0.6700290044993874]
step  10 :  [-0.5668580260701722]
step  11 :  [-0.49452281892969435]
step  12 :  [-0.4163685307911291]
step  13 :  [-0.3366134798990838]
step  14 :  [-0.24056863796764613]
step  15 :  [-0.12592986146488602]
step  16 :  [-0.043951461121812425]
step  17 :  [-0.10020952862255057]
step  18 :  [-0.10011569338595584]
step  19 :  [-0.05183776651038772]
step  20 :  [-0.06359040618391831]
step  21 :  [-0.025289977165162018]
step  22 :  [-0.0430774290194496]
step  23 :  [-0.012204733383624837]
step  24 :  [-0.0705278034215918]
episode  120 : steps 25 , return [-14.48]
step  0 :  [-1.657536415931559]
step  1 :  [-1.6183665557171956]
step  2 :  [-1.5725887364867996]
step  3 :  [-1.5280090538782993]
step  4 :  [-1.4531905691601978]
step  5 :  [-1.3514411032912903]
step  6 :  [-1.2274262389895276]
step  7 :  [-1.0856772843316613]
step  8 :  [-0.9301066874766675]
step  9 :  [-0.7919330919719425]
step  10 :  [-0.6402984771737662]
step  11 :  [-0.5263507528604854]
step  12 :  [-0.45614010614592826]
step  13 :  [-0.38618575353106505]
step  14 :  [-0.3000567694663104]
step  15 :  [-0.21237948522980735]
step  16 :  [-0.11508062127129946]
step  17 :  [-0.05442368696899366]
step  18 :  [-0.011090147611549587]
step  19 :  [-0.027154056307000556]
step  20 :  [-0.05189604831949615]
step  21 :  [-0.05080021085147628]
step  22 :  [-0.0659251763922996]
step  23 :  [-0.0857470853515785]
step  24 :  [-0.07442611580429964]
episode  121 : steps 25 , return [-16.27]
step  0 :  [-1.4914304681033799]
step  1 :  [-1.4627076906356904]
step  2 :  [-1.4320878152879024]
step  3 :  [-1.3656437844502076]
step  4 :  [-1.2690563835959865]
step  5 :  [-1.1483019759056476]
step  6 :  [-1.008643111896536]
step  7 :  [-0.8544009200170828]
step  8 :  [-0.7805822655737584]
step  9 :  [-0.6853314574902476]
step  10 :  [-0.5848933484046981]
step  11 :  [-0.4863688651760783]
step  12 :  [-0.4022010215459346]
step  13 :  [-0.31015253288344047]
step  14 :  [-0.21545788311289119]
step  15 :  [-0.11506636598068731]
step  16 :  [-0.047106090751881775]
step  17 :  [-0.09696185174936008]
step  18 :  [-0.0924004432030503]
step  19 :  [-0.06761936623518192]
step  20 :  [-0.039539033107639496]
step  21 :  [-0.062063061070269314]
step  22 :  [-0.042943928737223004]
step  23 :  [-0.02411681015564652]
step  24 :  [-0.06869577412637745]
episode  122 : steps 25 , return [-14.15]
step  0 :  [-1.611145308465851]
step  1 :  [-1.567803041367852]
step  2 :  [-1.5163846934257148]
step  3 :  [-1.4650624516165454]
step  4 :  [-1.421200401719382]
step  5 :  [-1.3490281074568138]
step  6 :  [-1.250444346711855]
step  7 :  [-1.1295622082536267]
step  8 :  [-0.9907457552324725]
step  9 :  [-0.8379324054123003]
step  10 :  [-0.7021405881894046]
step  11 :  [-0.5603962373613063]
step  12 :  [-0.42019189035720844]
step  13 :  [-0.30421813596852143]
step  14 :  [-0.19143252428810648]
step  15 :  [-0.07470132196949002]
step  16 :  [-0.03226434383109354]
step  17 :  [-0.013966125863187904]
step  18 :  [-0.02660026504681993]
step  19 :  [-0.029483935397446884]
step  20 :  [-0.02127267590831469]
step  21 :  [-0.04242027558696543]
step  22 :  [-0.04638526025045279]
step  23 :  [-0.019105413363812804]
step  24 :  [-0.062087204613029884]
episode  123 : steps 25 , return [-15.69]
step  0 :  [-1.760632468555004]
step  1 :  [-1.7303556146998618]
step  2 :  [-1.6964512923863788]
step  3 :  [-1.6270036412597932]
step  4 :  [-1.5279797835787696]
step  5 :  [-1.4053846779556978]
step  6 :  [-1.264449642206622]
step  7 :  [-1.1094777031565783]
step  8 :  [-0.943934600923796]
step  9 :  [-0.8320271807543176]
step  10 :  [-0.8234749351902537]
step  11 :  [-0.8399709184272166]
step  12 :  [-0.8158015039495933]
step  13 :  [-0.758564246196146]
step  14 :  [-0.6780663945025132]
step  15 :  [-0.5854508014474491]
step  16 :  [-0.495113825071595]
step  17 :  [-0.4065052540942557]
step  18 :  [-0.30443951606148584]
step  19 :  [-0.18506365169734323]
step  20 :  [-0.10076737858884297]
step  21 :  [-0.06618863499194257]
step  22 :  [-0.08418128012305805]
step  23 :  [-0.06021125450757951]
step  24 :  [-0.07759716094201874]
episode  124 : steps 25 , return [-20.18]
step  0 :  [-1.5753801961954703]
step  1 :  [-1.546661905659078]
step  2 :  [-1.515641934364335]
step  3 :  [-1.4486463036813375]
step  4 :  [-1.3515305600694767]
step  5 :  [-1.2303232479711101]
step  6 :  [-1.0902972349954403]
step  7 :  [-0.9357718445839996]
step  8 :  [-0.7885183446699062]
step  9 :  [-0.63260007957062]
step  10 :  [-0.5021076397143842]
step  11 :  [-0.4123069924069171]
step  12 :  [-0.3262030962722047]
step  13 :  [-0.23979037794193206]
step  14 :  [-0.15168533326881947]
step  15 :  [-0.0717209022263734]
step  16 :  [-0.051838757878224444]
step  17 :  [-0.05430959933787892]
step  18 :  [-0.05630219503624321]
step  19 :  [-0.02780701751554367]
step  20 :  [-0.03254774815974348]
step  21 :  [-0.030187968821832972]
step  22 :  [-0.031118055694710985]
step  23 :  [-0.014648481746500396]
step  24 :  [-0.012313293174177667]
episode  125 : steps 25 , return [-14.13]
step  0 :  [-1.7886057822237211]
step  1 :  [-1.7519736040502143]
step  2 :  [-1.7092424330231435]
step  3 :  [-1.6676708052567135]
step  4 :  [-1.59441283610663]
step  5 :  [-1.4934973152981077]
step  6 :  [-1.3699362883554316]
step  7 :  [-1.2284329630000714]
step  8 :  [-1.0729854231794014]
step  9 :  [-0.9068439900389226]
step  10 :  [-0.7818520992774635]
step  11 :  [-0.6400905255844387]
step  12 :  [-0.5261595727641454]
step  13 :  [-0.4508658484486853]
step  14 :  [-0.3756322193861587]
step  15 :  [-0.29490756940600066]
step  16 :  [-0.20564934182927816]
step  17 :  [-0.10170478203117737]
step  18 :  [-0.03229773997103366]
step  19 :  [-0.03024826452634581]
step  20 :  [-0.06101676749331355]
step  21 :  [-0.04996488376616244]
step  22 :  [-0.03147193520028793]
step  23 :  [-0.02814200368012164]
step  24 :  [-0.06252746161270202]
episode  126 : steps 25 , return [-18.26]
step  0 :  [-1.5313057844074165]
step  1 :  [-1.49435239390401]
step  2 :  [-1.4521806657209686]
step  3 :  [-1.4129399460898349]
step  4 :  [-1.3424001922694682]
step  5 :  [-1.2439961774200086]
step  6 :  [-1.1225837238923067]
step  7 :  [-0.9828634388541981]
step  8 :  [-0.8288821934893588]
step  9 :  [-0.7195670440869737]
step  10 :  [-0.6015310141787148]
step  11 :  [-0.4812140303942675]
step  12 :  [-0.3806303843515017]
step  13 :  [-0.2801554574818516]
step  14 :  [-0.16626089160866195]
step  15 :  [-0.04930153417047005]
step  16 :  [-0.040930433487047266]
step  17 :  [-0.03470880330226674]
step  18 :  [-0.06896352609147693]
step  19 :  [-0.09997390830582913]
step  20 :  [-0.07576224455500295]
step  21 :  [-0.02502465238768604]
step  22 :  [-0.024431656290836726]
step  23 :  [-0.02594913461391639]
step  24 :  [-0.013774828305128597]
episode  127 : steps 25 , return [-14.5]
step  0 :  [-1.7502403494723715]
step  1 :  [-1.7208347603920628]
step  2 :  [-1.6881592628691056]
step  3 :  [-1.6591172319736065]
step  4 :  [-1.5947998919572273]
step  5 :  [-1.5004491510659048]
step  6 :  [-1.38185903693068]
step  7 :  [-1.2442525616903484]
step  8 :  [-1.0919967178801726]
step  9 :  [-0.9286377525902589]
step  10 :  [-0.7570701057953583]
step  11 :  [-0.5808211827237728]
step  12 :  [-0.40269313398692264]
step  13 :  [-0.2587221754957386]
step  14 :  [-0.10297494812858458]
step  15 :  [-0.06778630110064934]
step  16 :  [-0.11198268931903343]
step  17 :  [-0.12183633750988569]
step  18 :  [-0.08220566938558113]
step  19 :  [-0.05484169860471645]
step  20 :  [-0.02940305261293755]
step  21 :  [-0.03714192129167003]
step  22 :  [-0.042968398656124486]
step  23 :  [-0.04453796900144463]
step  24 :  [-0.042184785251192354]
episode  128 : steps 25 , return [-17.3]
step  0 :  [-1.6359029160410374]
step  1 :  [-1.6003794548866204]
step  2 :  [-1.5597384646458208]
step  3 :  [-1.5216517415900992]
step  4 :  [-1.4514174046964334]
step  5 :  [-1.3529635149392065]
step  6 :  [-1.2313539920449945]
step  7 :  [-1.091374104768385]
step  8 :  [-0.9370959949860352]
step  9 :  [-0.7830164686148541]
step  10 :  [-0.6251155675994213]
step  11 :  [-0.5116015368991998]
step  12 :  [-0.3862656152376546]
step  13 :  [-0.27739965397588384]
step  14 :  [-0.15809367479382383]
step  15 :  [-0.046075562976922654]
step  16 :  [-0.009581367359572135]
step  17 :  [-0.025036234583273805]
step  18 :  [-0.019972740161752395]
step  19 :  [-0.024645076586760937]
step  20 :  [-0.03442584872221152]
step  21 :  [-0.03941666107429573]
step  22 :  [-0.09869178710186392]
step  23 :  [-0.09441190314971491]
step  24 :  [-0.09289981232553732]
episode  129 : steps 25 , return [-15.61]
step  0 :  [-1.615212883178291]
step  1 :  [-1.5769514334279913]
step  2 :  [-1.5326013991441276]
step  3 :  [-1.4900668987561083]
step  4 :  [-1.4168347088601108]
step  5 :  [-1.3162850951822052]
step  6 :  [-1.193161086030302]
step  7 :  [-1.0520527841973644]
step  8 :  [-0.8969072950207976]
step  9 :  [-0.7882533255563322]
step  10 :  [-0.6620326919349557]
step  11 :  [-0.5501679498775792]
step  12 :  [-0.4695162997091247]
step  13 :  [-0.38461489851476033]
step  14 :  [-0.3003914051539294]
step  15 :  [-0.20133264624527367]
step  16 :  [-0.08393189460969308]
step  17 :  [-0.05030286400337194]
step  18 :  [-0.030473426646424686]
step  19 :  [-0.0746942144285448]
step  20 :  [-0.07136649968463936]
step  21 :  [-0.08200035137809522]
step  22 :  [-0.07265658966257386]
step  23 :  [-0.02019687241040256]
step  24 :  [-0.02948085272177979]
episode  130 : steps 25 , return [-15.96]
step  0 :  [-1.5628259115489374]
step  1 :  [-1.5347093476733742]
step  2 :  [-1.5045707658417522]
step  3 :  [-1.4382197002519934]
step  4 :  [-1.3415773528295865]
step  5 :  [-1.2207186124865275]
step  6 :  [-1.0809471811206703]
step  7 :  [-0.9266013784633688]
step  8 :  [-0.7873659519363175]
step  9 :  [-0.6384971950355578]
step  10 :  [-0.5072239487191841]
step  11 :  [-0.4124150565235995]
step  12 :  [-0.3215089871815317]
step  13 :  [-0.22376690082718173]
step  14 :  [-0.1235582919614242]
step  15 :  [-0.0717109426277262]
step  16 :  [-0.021487352918951142]
step  17 :  [-0.033834846173761875]
step  18 :  [-0.06248899115408062]
step  19 :  [-0.059184836012042476]
step  20 :  [-0.015369703264229224]
step  21 :  [-0.027123498757218287]
step  22 :  [-0.01159971437107004]
step  23 :  [-0.01681508479636745]
step  24 :  [-0.044714920048638265]
episode  131 : steps 25 , return [-13.99]
step  0 :  [-1.838872961291065]
step  1 :  [-1.8017938791674895]
step  2 :  [-1.7582845198360268]
step  3 :  [-1.7154910833835704]
step  4 :  [-1.6412246581825258]
step  5 :  [-1.539528395780489]
step  6 :  [-1.4153921765612512]
step  7 :  [-1.2734951221708761]
step  8 :  [-1.117821601348642]
step  9 :  [-0.9516264453425342]
step  10 :  [-0.7858948633328977]
step  11 :  [-0.6095455631548586]
step  12 :  [-0.5115071426600944]
step  13 :  [-0.4374268439503328]
step  14 :  [-0.3530110048749022]
step  15 :  [-0.26694555292590216]
step  16 :  [-0.16580263912231222]
step  17 :  [-0.0838164040623343]
step  18 :  [-0.05602364422264176]
step  19 :  [-0.012364634616563246]
step  20 :  [-0.06597010258849191]
step  21 :  [-0.07599396701616969]
step  22 :  [-0.13037388563613456]
step  23 :  [-0.12516636728171776]
step  24 :  [-0.10545956662285468]
episode  132 : steps 25 , return [-18.84]
step  0 :  [-1.5520163575680812]
step  1 :  [-1.5272842008994332]
step  2 :  [-1.501814349310137]
step  3 :  [-1.4387505997264542]
step  4 :  [-1.3445056357714964]
step  5 :  [-1.2254594113374946]
step  6 :  [-1.0871152753045217]
step  7 :  [-0.9339552798886783]
step  8 :  [-0.7712445184544129]
step  9 :  [-0.6060229459541402]
step  10 :  [-0.4466774353269428]
step  11 :  [-0.32154060545659985]
step  12 :  [-0.20758414665405509]
step  13 :  [-0.15099524730944866]
step  14 :  [-0.0810347812958022]
step  15 :  [-0.031242209633204992]
step  16 :  [-0.02916153689568919]
step  17 :  [-0.014653373711113383]
step  18 :  [-0.0298866262733541]
step  19 :  [-0.04023925135036729]
step  20 :  [-0.04324605374604418]
step  21 :  [-0.03991874065939953]
step  22 :  [-0.0727018669936411]
step  23 :  [-0.06490396936406502]
step  24 :  [-0.08471801692636154]
episode  133 : steps 25 , return [-13.65]
step  0 :  [-1.66711548050007]
step  1 :  [-1.6249066115309645]
step  2 :  [-1.5748625280521362]
step  3 :  [-1.5249097591882441]
step  4 :  [-1.4821313116744632]
step  5 :  [-1.4103696459955353]
step  6 :  [-1.311884705729649]
step  7 :  [-1.1909480056267452]
step  8 :  [-1.0519875968405181]
step  9 :  [-0.8989519861069651]
step  10 :  [-0.7543956509773557]
step  11 :  [-0.6030397278341747]
step  12 :  [-0.45044209188653883]
step  13 :  [-0.32661966568030626]
step  14 :  [-0.19603809693684796]
step  15 :  [-0.0781401778133072]
step  16 :  [-0.023976111306206974]
step  17 :  [-0.03855554093159519]
step  18 :  [-0.05800029319068856]
step  19 :  [-0.03870692865481276]
step  20 :  [-0.006340484886172949]
step  21 :  [-0.031999846333031476]
step  22 :  [-0.03836388775847865]
step  23 :  [-0.0519183078457159]
step  24 :  [-0.032991307570333264]
episode  134 : steps 25 , return [-16.47]
step  0 :  [-1.780681267145348]
step  1 :  [-1.7436473110351751]
step  2 :  [-1.700388085426649]
step  3 :  [-1.658207925754211]
step  4 :  [-1.5845604012174723]
step  5 :  [-1.4833883311005767]
step  6 :  [-1.3596566337147895]
step  7 :  [-1.2180424047806766]
step  8 :  [-1.0625301215589826]
step  9 :  [-0.8963658109774908]
step  10 :  [-0.7824036289012116]
step  11 :  [-0.6483623684986798]
step  12 :  [-0.5408994681479258]
step  13 :  [-0.4700164680947853]
step  14 :  [-0.39785131656536954]
step  15 :  [-0.31687892443810384]
step  16 :  [-0.2258801967854628]
step  17 :  [-0.11734902418802169]
step  18 :  [-0.01810432131699103]
step  19 :  [-0.069512233193453]
step  20 :  [-0.08368743046643921]
step  21 :  [-0.05109177907473509]
step  22 :  [-0.07806999519563848]
step  23 :  [-0.1059608553745519]
step  24 :  [-0.0945934556139298]
episode  135 : steps 25 , return [-18.49]
step  0 :  [-1.444039721876564]
step  1 :  [-1.415558843415313]
step  2 :  [-1.3855218866448415]
step  3 :  [-1.3196535538552616]
step  4 :  [-1.2235675107194823]
step  5 :  [-1.1032335594194584]
step  6 :  [-0.9639260005611815]
step  7 :  [-0.8099832912358154]
step  8 :  [-0.6802056390512686]
step  9 :  [-0.5563572905097167]
step  10 :  [-0.46218510845421373]
step  11 :  [-0.3596104575345033]
step  12 :  [-0.2615043620805959]
step  13 :  [-0.15341317337174834]
step  14 :  [-0.06110249852468052]
step  15 :  [-0.0429966887903387]
step  16 :  [-0.01985244127734511]
step  17 :  [-0.04097827883238457]
step  18 :  [-0.025170225380963304]
step  19 :  [-0.02124897924371845]
step  20 :  [-0.04676807367937755]
step  21 :  [-0.06585510476298789]
step  22 :  [-0.08429819169350686]
step  23 :  [-0.06240328611206614]
step  24 :  [-0.01931015419176204]
episode  136 : steps 25 , return [-12.63]
step  0 :  [-1.695752635171393]
step  1 :  [-1.6537828431943165]
step  2 :  [-1.6039696092573756]
step  3 :  [-1.554134633167964]
step  4 :  [-1.511245162533974]
step  5 :  [-1.439233634263702]
step  6 :  [-1.340465673500456]
step  7 :  [-1.2192456426407356]
step  8 :  [-1.0800031933323848]
step  9 :  [-0.9266701133924496]
step  10 :  [-0.7675500567215163]
step  11 :  [-0.6054388841756121]
step  12 :  [-0.4470786906483876]
step  13 :  [-0.3212457596724439]
step  14 :  [-0.19416327406112982]
step  15 :  [-0.08574166649678809]
step  16 :  [-0.041558516065575576]
step  17 :  [-0.018428081420392078]
step  18 :  [-0.020974512052254913]
step  19 :  [-0.03247733231235309]
step  20 :  [-0.030387135063527592]
step  21 :  [-0.03425669644508256]
step  22 :  [-0.06325765814029698]
step  23 :  [-0.07021469495823233]
step  24 :  [-0.03809550749220515]
episode  137 : steps 25 , return [-16.8]
step  0 :  [-1.4437169370685317]
step  1 :  [-1.402600455660815]
step  2 :  [-1.3550375809204533]
step  3 :  [-1.3097853716823142]
step  4 :  [-1.2355418675270238]
step  5 :  [-1.1347241827083565]
step  6 :  [-1.0116490433487872]
step  7 :  [-0.870713629998034]
step  8 :  [-0.7997020324601934]
step  9 :  [-0.7032493159616379]
step  10 :  [-0.6107524899553006]
step  11 :  [-0.525647803100858]
step  12 :  [-0.45458035771781413]
step  13 :  [-0.3726468190831308]
step  14 :  [-0.273808515528437]
step  15 :  [-0.17154333909935088]
step  16 :  [-0.05871140255297643]
step  17 :  [-0.012764753874701131]
step  18 :  [-0.0825727083682556]
step  19 :  [-0.10212727192507308]
step  20 :  [-0.07830616714812795]
step  21 :  [-0.04619968053663233]
step  22 :  [-0.032075956003511354]
step  23 :  [-0.02829278191741442]
step  24 :  [-0.024695097063601512]
episode  138 : steps 25 , return [-14.14]
step  0 :  [-1.4858845952036102]
step  1 :  [-1.4418310705665973]
step  2 :  [-1.3899389684839154]
step  3 :  [-1.3389085670118286]
step  4 :  [-1.2967001898977708]
step  5 :  [-1.2266272857898772]
step  6 :  [-1.1301720046628634]
step  7 :  [-1.0113831557208084]
step  8 :  [-0.8747257851209905]
step  9 :  [-0.7417739931880633]
step  10 :  [-0.5974947563781695]
step  11 :  [-0.44791271717815323]
step  12 :  [-0.3236612754713362]
step  13 :  [-0.18937558831096066]
step  14 :  [-0.06555638167292431]
step  15 :  [-0.016896426321949088]
step  16 :  [-0.012502011361599298]
step  17 :  [-0.03681909770863113]
step  18 :  [-0.03672882366208947]
step  19 :  [-0.0457324145580745]
step  20 :  [-0.018039658311985195]
step  21 :  [-0.033297320628143466]
step  22 :  [-0.03786382689713439]
step  23 :  [-0.04377200849146631]
step  24 :  [-0.0632480724981416]
episode  139 : steps 25 , return [-13.91]
step  0 :  [-1.4047332521239844]
step  1 :  [-1.3713747855192056]
step  2 :  [-1.3348340651919932]
step  3 :  [-1.2646759746214569]
step  4 :  [-1.1656610651109867]
step  5 :  [-1.0432836539114163]
step  6 :  [-0.9025480034999306]
step  7 :  [-0.8043759814442707]
step  8 :  [-0.832854248875571]
step  9 :  [-0.9259009441166951]
step  10 :  [-0.9725510701197151]
step  11 :  [-0.9577610009161179]
step  12 :  [-0.8967688418463825]
step  13 :  [-0.8453582992635212]
step  14 :  [-0.8069509284940978]
step  15 :  [-0.7370471915056566]
step  16 :  [-0.6431726385535629]
step  17 :  [-0.5343274536550964]
step  18 :  [-0.42278830689666225]
step  19 :  [-0.3215384310687975]
step  20 :  [-0.2132419283959515]
step  21 :  [-0.09597663693440994]
step  22 :  [-0.043194404198210086]
step  23 :  [-0.0440415778679008]
step  24 :  [-0.0035808665258212293]
episode  140 : steps 25 , return [-18.59]
step  0 :  [-1.5542295060701223]
step  1 :  [-1.5100979485140884]
step  2 :  [-1.4577999431074906]
step  3 :  [-1.405755804069454]
step  4 :  [-1.3616152735243188]
step  5 :  [-1.2896407898431574]
step  6 :  [-1.1914355394168534]
step  7 :  [-1.0710062915074854]
step  8 :  [-0.9326981068724645]
step  9 :  [-0.7831634937969034]
step  10 :  [-0.62880868226413]
step  11 :  [-0.47643556160464556]
step  12 :  [-0.3548153836136964]
step  13 :  [-0.2283196966154356]
step  14 :  [-0.11419586358065784]
step  15 :  [-0.06281891000282745]
step  16 :  [-0.061304293034595454]
step  17 :  [-0.025421914849119702]
step  18 :  [-0.05438149850951116]
step  19 :  [-0.07577775512990409]
step  20 :  [-0.06266253278672143]
step  21 :  [-0.02398816799235276]
step  22 :  [-0.041847084942377794]
step  23 :  [-0.022472389994018585]
step  24 :  [-0.05306094306744585]
episode  141 : steps 25 , return [-14.84]
step  0 :  [-1.4630489982596773]
step  1 :  [-1.4323060389030924]
step  2 :  [-1.3990583279371407]
step  3 :  [-1.3309142543532075]
step  4 :  [-1.2331806183103484]
step  5 :  [-1.111630715312351]
step  6 :  [-0.971412555846666]
step  7 :  [-0.8167827474711723]
step  8 :  [-0.7882084950119005]
step  9 :  [-0.7212007776714354]
step  10 :  [-0.6467462519800385]
step  11 :  [-0.5676574517176556]
step  12 :  [-0.4946540633881772]
step  13 :  [-0.4260603513144834]
step  14 :  [-0.34142122669388547]
step  15 :  [-0.23589768720814533]
step  16 :  [-0.15253191914879266]
step  17 :  [-0.10679021005597156]
step  18 :  [-0.04797387287638571]
step  19 :  [-0.0503395155195041]
step  20 :  [-0.05292722947301358]
step  21 :  [-0.04175665815751051]
step  22 :  [-0.04069890377736432]
step  23 :  [-0.025817553614201762]
step  24 :  [-0.013043088980483156]
episode  142 : steps 25 , return [-14.51]
step  0 :  [-1.4639594924267065]
step  1 :  [-1.4364427735591672]
step  2 :  [-1.407619105166356]
step  3 :  [-1.3425186916806466]
step  4 :  [-1.2469489404738834]
step  5 :  [-1.12698225468129]
step  6 :  [-0.98795191541153]
step  7 :  [-0.8342345757662404]
step  8 :  [-0.7309147776903084]
step  9 :  [-0.6167608558631629]
step  10 :  [-0.49824799729553476]
step  11 :  [-0.38838212580316345]
step  12 :  [-0.2961416118988533]
step  13 :  [-0.19767364826788042]
step  14 :  [-0.08523461931115842]
step  15 :  [-0.038260453418256665]
step  16 :  [-0.0483770236985153]
step  17 :  [-0.03572476591516222]
step  18 :  [-0.04847751109138416]
step  19 :  [-0.03934093298222363]
step  20 :  [-0.026682117982104955]
step  21 :  [-0.01834840391358939]
step  22 :  [-0.044248025336966555]
step  23 :  [-0.03624667003548841]
step  24 :  [-0.03024664831968037]
episode  143 : steps 25 , return [-13.03]
step  0 :  [-1.532291833928633]
step  1 :  [-1.497137694970193]
step  2 :  [-1.4574564984691802]
step  3 :  [-1.4212842859521655]
step  4 :  [-1.3528980764064156]
step  5 :  [-1.2560757491886008]
step  6 :  [-1.1358889196154691]
step  7 :  [-0.9971851117083754]
step  8 :  [-0.8441299715234115]
step  9 :  [-0.715739296429073]
step  10 :  [-0.5784427350243011]
step  11 :  [-0.43904706537031263]
step  12 :  [-0.3232274337986094]
step  13 :  [-0.20461810696095756]
step  14 :  [-0.0976515460608798]
step  15 :  [-0.04801839646664419]
step  16 :  [-0.06772836509020393]
step  17 :  [-0.04587776540232043]
step  18 :  [-0.0013591579194030508]
step  19 :  [-0.03972675935576278]
step  20 :  [-0.049761757733353076]
step  21 :  [-0.027042375464106868]
step  22 :  [-0.05519912118048413]
step  23 :  [-0.05829469184702265]
step  24 :  [-0.03602931922740823]
episode  144 : steps 25 , return [-14.28]
step  0 :  [-1.4971177790707342]
step  1 :  [-1.4712364279111765]
step  2 :  [-1.44447366943287]
step  3 :  [-1.3806925254257867]
step  4 :  [-1.2860225664961982]
step  5 :  [-1.1667086173890284]
step  6 :  [-1.0281850906204058]
step  7 :  [-0.8748968547841439]
step  8 :  [-0.7536639837244471]
step  9 :  [-0.6219182633471985]
step  10 :  [-0.4866888665872164]
step  11 :  [-0.3598589419831225]
step  12 :  [-0.256371006666341]
step  13 :  [-0.1514079386355028]
step  14 :  [-0.03771050399665888]
step  15 :  [-0.06553270435460933]
step  16 :  [-0.10079091259848592]
step  17 :  [-0.08944769685558233]
step  18 :  [-0.07709713943272506]
step  19 :  [-0.06379667882206079]
step  20 :  [-0.09636960507684318]
step  21 :  [-0.07439622741546666]
step  22 :  [-0.04682759697557539]
step  23 :  [-0.0314941509681667]
step  24 :  [-0.037271858378343015]
episode  145 : steps 25 , return [-13.5]
step  0 :  [-1.513875310499639]
step  1 :  [-1.4720886790056142]
step  2 :  [-1.4232541241161063]
step  3 :  [-1.3758506527223437]
step  4 :  [-1.3375526295134035]
step  5 :  [-1.2700516533355226]
step  6 :  [-1.1754200147516134]
step  7 :  [-1.0580431743269727]
step  8 :  [-0.9225983118976387]
step  9 :  [-0.7734332502117109]
step  10 :  [-0.6146370187396742]
step  11 :  [-0.4508861103335804]
step  12 :  [-0.3164761973549954]
step  13 :  [-0.16939941934384314]
step  14 :  [-0.043045442535523976]
step  15 :  [-0.03995520585481246]
step  16 :  [-0.05220818592209167]
step  17 :  [-0.011757023765628311]
step  18 :  [-0.030973278403926628]
step  19 :  [-0.0066871303968106515]
step  20 :  [-0.05467847234107228]
step  21 :  [-0.0604244736385463]
step  22 :  [-0.027564637675414682]
step  23 :  [-0.04271926504830947]
step  24 :  [-0.012336418105514927]
episode  146 : steps 25 , return [-14.26]
step  0 :  [-1.6058127728519018]
step  1 :  [-1.5693673001270654]
step  2 :  [-1.527574252225191]
step  3 :  [-1.4882675322113557]
step  4 :  [-1.4173175892201095]
step  5 :  [-1.3184194347823546]
step  6 :  [-1.1965186474088711]
step  7 :  [-1.0563369290201985]
step  8 :  [-0.9019097790109069]
step  9 :  [-0.7821150481463323]
step  10 :  [-0.6509477584217296]
step  11 :  [-0.5245494806836141]
step  12 :  [-0.42675524406985016]
step  13 :  [-0.33289835548291385]
step  14 :  [-0.22225120875211296]
step  15 :  [-0.11048381385446056]
step  16 :  [-0.07260324540099308]
step  17 :  [-0.06538733433387055]
step  18 :  [-0.10700977550683015]
step  19 :  [-0.09182659116712122]
step  20 :  [-0.04807373802393569]
step  21 :  [-0.029548250488896245]
step  22 :  [-0.04066024382366264]
step  23 :  [-0.014805994135054412]
step  24 :  [-0.04725675525504213]
episode  147 : steps 25 , return [-15.65]
step  0 :  [-1.4982086252896472]
step  1 :  [-1.4715195967217813]
step  2 :  [-1.4436484791312147]
step  3 :  [-1.3790873890710273]
step  4 :  [-1.2838438871606561]
step  5 :  [-1.1640872397293414]
step  6 :  [-1.025201095441399]
step  7 :  [-0.8715905007290962]
step  8 :  [-0.7620014773779615]
step  9 :  [-0.6401199313804211]
step  10 :  [-0.5144149370522227]
step  11 :  [-0.41222906251137986]
step  12 :  [-0.31508924012888506]
step  13 :  [-0.19773943377228329]
step  14 :  [-0.08921933766567758]
step  15 :  [-0.026275277821939728]
step  16 :  [-0.026322008985645667]
step  17 :  [-0.058004645640513885]
step  18 :  [-0.045351140201777045]
step  19 :  [-0.030653385764238573]
step  20 :  [-0.015646954250386425]
step  21 :  [-0.04760505757120795]
step  22 :  [-0.027186566410718937]
step  23 :  [-0.04984665231028872]
step  24 :  [-0.03300337782830805]
episode  148 : steps 25 , return [-13.43]
step  0 :  [-1.6497794988035785]
step  1 :  [-1.6150500483645651]
step  2 :  [-1.5754497249262922]
step  3 :  [-1.538553782456824]
step  4 :  [-1.4690921355360482]
step  5 :  [-1.3711663462350046]
step  6 :  [-1.2499365194082932]
step  7 :  [-1.1102447681166405]
step  8 :  [-0.9562002732403007]
step  9 :  [-0.7911363386550084]
step  10 :  [-0.624696197761363]
step  11 :  [-0.47110507158482856]
step  12 :  [-0.3547312958513861]
step  13 :  [-0.24703807987654006]
step  14 :  [-0.13979633738740727]
step  15 :  [-0.08510330501479872]
step  16 :  [-0.04841332562146499]
step  17 :  [-0.05639438567608777]
step  18 :  [-0.03214271446650081]
step  19 :  [-0.04203580305326819]
step  20 :  [-0.0249185147670857]
step  21 :  [-0.03398315844202689]
step  22 :  [-0.02217890587334341]
step  23 :  [-0.029468111597379297]
step  24 :  [-0.021257151941599245]
episode  149 : steps 25 , return [-15.56]
step  0 :  [-1.7826229325823177]
step  1 :  [-1.748530825823971]
step  2 :  [-1.709317670172105]
step  3 :  [-1.6721056425737837]
step  4 :  [-1.6018873962891365]
step  5 :  [-1.5031296685644828]
step  6 :  [-1.3811170039745022]
step  7 :  [-1.2407219154773883]
step  8 :  [-1.0860448579586808]
step  9 :  [-0.9203884940050984]
step  10 :  [-0.7751816354554759]
step  11 :  [-0.6232700672264835]
step  12 :  [-0.4845884309288685]
step  13 :  [-0.3811071205265253]
step  14 :  [-0.2829877563607001]
step  15 :  [-0.18116664049723238]
step  16 :  [-0.06318073605746104]
step  17 :  [-0.025422194235767286]
step  18 :  [-0.011373215015195375]
step  19 :  [-0.02847106665175046]
step  20 :  [-0.023549315759745885]
step  21 :  [-0.03468473037594229]
step  22 :  [-0.028451497196270187]
step  23 :  [-0.03601238395099954]
step  24 :  [-0.02035041525847153]
episode  150 : steps 25 , return [-17.65]
step  0 :  [-1.7564448069318697]
step  1 :  [-1.7249914746861597]
step  2 :  [-1.6894915874951428]
step  3 :  [-1.656971593311211]
step  4 :  [-1.5901517942756738]
step  5 :  [-1.493920902678211]
step  6 :  [-1.3738453302564009]
step  7 :  [-1.2349907178724926]
step  8 :  [-1.081599673325907]
step  9 :  [-0.9170955456461959]
step  10 :  [-0.7498859840761816]
step  11 :  [-0.5807458921573395]
step  12 :  [-0.4152329957971851]
step  13 :  [-0.2832607703328846]
step  14 :  [-0.1648242751159171]
step  15 :  [-0.10047637933745601]
step  16 :  [-0.026255328637731782]
step  17 :  [-0.03049824846428697]
step  18 :  [-0.031349159283950594]
step  19 :  [-0.042896420225734]
step  20 :  [-0.037341825867158174]
step  21 :  [-0.02214896695504114]
step  22 :  [-0.04905691926437372]
step  23 :  [-0.048588300514368576]
step  24 :  [-0.013962766158849012]
episode  151 : steps 25 , return [-17.12]
step  0 :  [-1.651953741936191]
step  1 :  [-1.615658325117596]
step  2 :  [-1.5738861434704081]
step  3 :  [-1.5343002440643703]
step  4 :  [-1.4629497045535098]
step  5 :  [-1.3636543166633273]
step  6 :  [-1.2413971723684867]
step  7 :  [-1.1009049380716611]
step  8 :  [-0.9462053069898612]
step  9 :  [-0.7867003242228766]
step  10 :  [-0.6238148514668802]
step  11 :  [-0.4821989394711043]
step  12 :  [-0.38080616120942484]
step  13 :  [-0.28532161195222394]
step  14 :  [-0.18171534607074344]
step  15 :  [-0.08044331149741248]
step  16 :  [-0.03760864720640232]
step  17 :  [-0.020096563029725623]
step  18 :  [-0.04519668876690872]
step  19 :  [-0.037024350918408645]
step  20 :  [-0.01779275198810969]
step  21 :  [-0.03102264372319335]
step  22 :  [-0.03655801008432591]
step  23 :  [-0.023619580860720447]
step  24 :  [-0.022825751381658006]
episode  152 : steps 25 , return [-15.58]
step  0 :  [-1.7412762727105853]
step  1 :  [-1.7136339326523016]
step  2 :  [-1.6833979839783924]
step  3 :  [-1.6164761221925015]
step  4 :  [-1.5191855865658377]
step  5 :  [-1.3977443059430308]
step  6 :  [-1.2575056163793652]
step  7 :  [-1.1028262230315515]
step  8 :  [-0.9371577310586733]
step  9 :  [-0.7814189306408984]
step  10 :  [-0.6165705367696257]
step  11 :  [-0.4863088113737309]
step  12 :  [-0.4024273409541081]
step  13 :  [-0.32273151776401504]
step  14 :  [-0.22930075934913244]
step  15 :  [-0.1437561087480932]
step  16 :  [-0.07654028412459439]
step  17 :  [-0.06095417800977374]
step  18 :  [-0.05677128875524046]
step  19 :  [-0.04227174283067673]
step  20 :  [-0.030801821591890627]
step  21 :  [-0.028578457960240077]
step  22 :  [-0.01631260341280073]
step  23 :  [-0.024629146749550773]
step  24 :  [-0.062360955074260746]
episode  153 : steps 25 , return [-16.35]
step  0 :  [-1.7745037378036452]
step  1 :  [-1.7351078242900022]
step  2 :  [-1.6886026835298515]
step  3 :  [-1.6424408934693127]
step  4 :  [-1.603176608745506]
step  5 :  [-1.5332963667318649]
step  6 :  [-1.4358568905066862]
step  7 :  [-1.3155171386823543]
step  8 :  [-1.176897621617295]
step  9 :  [-1.0240383984309356]
step  10 :  [-0.8603070708176987]
step  11 :  [-0.7025511338104974]
step  12 :  [-0.5384908662367468]
step  13 :  [-0.3735884074614542]
step  14 :  [-0.23792824720816566]
step  15 :  [-0.11827907021247343]
step  16 :  [-0.045374367568608326]
step  17 :  [-0.03778737815266558]
step  18 :  [-0.025569433199890534]
step  19 :  [-0.017149596366889903]
step  20 :  [-0.04550338019277793]
step  21 :  [-0.03791038306977053]
step  22 :  [-0.020350310672582066]
step  23 :  [-0.012681772539714005]
step  24 :  [-0.054659844356499926]
episode  154 : steps 25 , return [-18.06]
step  0 :  [-1.6557349333425722]
step  1 :  [-1.6283850539755995]
step  2 :  [-1.5988849616558463]
step  3 :  [-1.532694851097444]
step  4 :  [-1.4360265294776862]
step  5 :  [-1.3150766052098841]
step  6 :  [-1.175201477509451]
step  7 :  [-1.0207633098014852]
step  8 :  [-0.8552107482145163]
step  9 :  [-0.7767666928090011]
step  10 :  [-0.6747898282646879]
step  11 :  [-0.5726451401860987]
step  12 :  [-0.47666225693305664]
step  13 :  [-0.3967889819520817]
step  14 :  [-0.3082303062557954]
step  15 :  [-0.20440139801543966]
step  16 :  [-0.099854012257812]
step  17 :  [-0.048301849641374836]
step  18 :  [-0.04753898839405824]
step  19 :  [-0.025666727030447856]
step  20 :  [-0.015532824746054568]
step  21 :  [-0.01702968401911204]
step  22 :  [-0.028857604347055546]
step  23 :  [-0.032465617872228285]
step  24 :  [-0.08905918263528345]
episode  155 : steps 25 , return [-16.03]
step  0 :  [-1.5232672520088335]
step  1 :  [-1.4873783598585033]
step  2 :  [-1.4467211296870712]
step  3 :  [-1.4094137063925345]
step  4 :  [-1.3402740096861827]
step  5 :  [-1.2429206058100648]
step  6 :  [-1.122334075242378]
step  7 :  [-0.9833049266960329]
step  8 :  [-0.8299564796059733]
step  9 :  [-0.7024327208677337]
step  10 :  [-0.5696395358125619]
step  11 :  [-0.4390231745454545]
step  12 :  [-0.3311334667639121]
step  13 :  [-0.22833291068249922]
step  14 :  [-0.13802931108067626]
step  15 :  [-0.07748848677253188]
step  16 :  [-0.0761888349454359]
step  17 :  [-0.08352405902150423]
step  18 :  [-0.043841892144758775]
step  19 :  [-0.027301406596212323]
step  20 :  [-0.07863968910278368]
step  21 :  [-0.08474683222357439]
step  22 :  [-0.08718104308156288]
step  23 :  [-0.06973258208133996]
step  24 :  [-0.03644627142286592]
episode  156 : steps 25 , return [-14.46]
step  0 :  [-1.545738711260216]
step  1 :  [-1.5038063133225292]
step  2 :  [-1.4546279342362871]
step  3 :  [-1.4065593734380062]
step  4 :  [-1.3671447178615772]
step  5 :  [-1.2985984470897576]
step  6 :  [-1.2030169516717395]
step  7 :  [-1.0847442603372817]
step  8 :  [-0.9483824746153521]
step  9 :  [-0.7981571872803997]
step  10 :  [-0.6391561063688698]
step  11 :  [-0.4753505146275885]
step  12 :  [-0.31480951096288234]
step  13 :  [-0.18213529562476127]
step  14 :  [-0.055454036190465524]
step  15 :  [-0.025643952755145662]
step  16 :  [-0.01394003900223792]
step  17 :  [-0.03250355798446939]
step  18 :  [-0.00903844262413166]
step  19 :  [-0.04048044359346312]
step  20 :  [-0.014819339292157686]
step  21 :  [-0.05294152385037333]
step  22 :  [-0.045618805751569874]
step  23 :  [-0.038770277272271635]
step  24 :  [-0.026748472185810536]
episode  157 : steps 25 , return [-14.58]
step  0 :  [-1.5560769112664483]
step  1 :  [-1.5265248098550686]
step  2 :  [-1.4944516287572662]
step  3 :  [-1.4267965761048769]
step  4 :  [-1.3292505594238304]
step  5 :  [-1.2077559097881567]
step  6 :  [-1.0675388560799177]
step  7 :  [-0.9128943762237284]
step  8 :  [-0.7892674393286849]
step  9 :  [-0.6502863757600262]
step  10 :  [-0.5331480586386254]
step  11 :  [-0.45208072077509565]
step  12 :  [-0.37192151557572756]
step  13 :  [-0.283078517878559]
step  14 :  [-0.18692634166991334]
step  15 :  [-0.07565520711700773]
step  16 :  [-0.06319874573581767]
step  17 :  [-0.04276682107214004]
step  18 :  [-0.0276880065100545]
step  19 :  [-0.05591303328481803]
step  20 :  [-0.036641642268293036]
step  21 :  [-0.02223390592508475]
step  22 :  [-0.011553412223475418]
step  23 :  [-0.0538798308923273]
step  24 :  [-0.03582166572822355]
episode  158 : steps 25 , return [-14.21]
step  0 :  [-1.4541715407826916]
step  1 :  [-1.4232186253166994]
step  2 :  [-1.3897288867259805]
step  3 :  [-1.3214518205958814]
step  4 :  [-1.2236412659745868]
step  5 :  [-1.102045247171582]
step  6 :  [-0.9617991566643426]
step  7 :  [-0.8071587576596657]
step  8 :  [-0.7882367409893485]
step  9 :  [-0.7284320885440401]
step  10 :  [-0.6589133287176204]
step  11 :  [-0.582344081487339]
step  12 :  [-0.5089477045007363]
step  13 :  [-0.4390512449944401]
step  14 :  [-0.3532099189910388]
step  15 :  [-0.24718435605770736]
step  16 :  [-0.15435431913800624]
step  17 :  [-0.1036262280779478]
step  18 :  [-0.06881288197128227]
step  19 :  [-0.04356163447889905]
step  20 :  [-0.01773809891320537]
step  21 :  [-0.06737028114666378]
step  22 :  [-0.06761263870560175]
step  23 :  [-0.02488329198910235]
step  24 :  [-0.03827555312677549]
episode  159 : steps 25 , return [-14.58]
step  0 :  [-1.5974256724290388]
step  1 :  [-1.5619297467656048]
step  2 :  [-1.5214861985422081]
step  3 :  [-1.483902283690987]
step  4 :  [-1.414196996847273]
step  5 :  [-1.316223505033301]
step  6 :  [-1.195033926716864]
step  7 :  [-1.0554239748272218]
step  8 :  [-0.9014861411458605]
step  9 :  [-0.773589527006319]
step  10 :  [-0.6367489390533111]
step  11 :  [-0.5014313555705023]
step  12 :  [-0.39416731620164075]
step  13 :  [-0.28026129755475615]
step  14 :  [-0.1737245888770608]
step  15 :  [-0.05900517011219438]
step  16 :  [-0.021450912960989606]
step  17 :  [-0.015012828981206662]
step  18 :  [-0.05699850502455422]
step  19 :  [-0.040808784075270985]
step  20 :  [-0.06314329437140247]
step  21 :  [-0.047428046818494884]
step  22 :  [-0.020206154257357497]
step  23 :  [-0.013067351829287753]
step  24 :  [-0.007869505972269715]
episode  160 : steps 25 , return [-15.15]
step  0 :  [-1.7462825525667884]
step  1 :  [-1.7109487700864723]
step  2 :  [-1.6701527455023943]
step  3 :  [-1.6311992232538384]
step  4 :  [-1.5599053025677578]
step  5 :  [-1.4604505621233537]
step  6 :  [-1.3379678480436732]
step  7 :  [-1.197245655255881]
step  8 :  [-1.0423358612583848]
step  9 :  [-0.8765122862492609]
step  10 :  [-0.7761415305892795]
step  11 :  [-0.6582716396528455]
step  12 :  [-0.5445406354988647]
step  13 :  [-0.45742934665765306]
step  14 :  [-0.360779371618394]
step  15 :  [-0.266205152990392]
step  16 :  [-0.16002468096371297]
step  17 :  [-0.11592256419591604]
step  18 :  [-0.04706617861637143]
step  19 :  [-0.0504931399107067]
step  20 :  [-0.10027641807513481]
step  21 :  [-0.10814388374927608]
step  22 :  [-0.07905321456790587]
step  23 :  [-0.021358095998009193]
step  24 :  [-0.036178581429732654]
episode  161 : steps 25 , return [-18.01]
step  0 :  [-1.5665389520183235]
step  1 :  [-1.5365036804960082]
step  2 :  [-1.5037193167039538]
step  3 :  [-1.4355478937316712]
step  4 :  [-1.379863903528752]
step  5 :  [-1.2938527686487498]
step  6 :  [-1.1826300702757613]
step  7 :  [-1.051382856838418]
step  8 :  [-0.9047243593445631]
step  9 :  [-0.7466478525395114]
step  10 :  [-0.5808568887973952]
step  11 :  [-0.4118651639475345]
step  12 :  [-0.25012806894188633]
step  13 :  [-0.12027815736077331]
step  14 :  [-0.06880195330092516]
step  15 :  [-0.02418981661828207]
step  16 :  [-0.06156498165226733]
step  17 :  [-0.05397033361827832]
step  18 :  [-0.023266399253128848]
step  19 :  [-0.03158280464860083]
step  20 :  [-0.01543694155860101]
step  21 :  [-0.04705999412618218]
step  22 :  [-0.025810170101595104]
step  23 :  [-0.03085252415896838]
step  24 :  [-0.07578432676971589]
episode  162 : steps 25 , return [-14.42]
step  0 :  [-1.6739331160656885]
step  1 :  [-1.6498713843826462]
step  2 :  [-1.5858481548851913]
step  3 :  [-1.4899662752725922]
step  4 :  [-1.4101034070476821]
step  5 :  [-1.3031728855789964]
step  6 :  [-1.1745664647701766]
step  7 :  [-1.0290037533582153]
step  8 :  [-0.8703611603043222]
step  9 :  [-0.7609262744927899]
step  10 :  [-0.6395196463768876]
step  11 :  [-0.5152346600447861]
step  12 :  [-0.39895788847111185]
step  13 :  [-0.3031368473738643]
step  14 :  [-0.20270609041767151]
step  15 :  [-0.08805539051254188]
step  16 :  [-0.06107595682992753]
step  17 :  [-0.04467450090341979]
step  18 :  [-0.017991456070208346]
step  19 :  [-0.018420629563757437]
step  20 :  [-0.03292551793644396]
step  21 :  [-0.0868087392218592]
step  22 :  [-0.10036077637635818]
step  23 :  [-0.06789118953664018]
step  24 :  [-0.027724205376126004]
episode  163 : steps 25 , return [-15.55]
step  0 :  [-1.712295038952254]
step  1 :  [-1.6861837294427622]
step  2 :  [-1.6581435411475247]
step  3 :  [-1.5928049242818165]
step  4 :  [-1.496660217611814]
step  5 :  [-1.3760452486240142]
step  6 :  [-1.2363893512039297]
step  7 :  [-1.0820940991694081]
step  8 :  [-0.9166285567558078]
step  9 :  [-0.7770310111963801]
step  10 :  [-0.6282097116552446]
step  11 :  [-0.49389520687900795]
step  12 :  [-0.3949624901065643]
step  13 :  [-0.3005796193634886]
step  14 :  [-0.1983988781224159]
step  15 :  [-0.09547352932200828]
step  16 :  [-0.041808689694938804]
step  17 :  [-0.05108225250622875]
step  18 :  [-0.05517144398163651]
step  19 :  [-0.0667117849871711]
step  20 :  [-0.046939177669423855]
step  21 :  [-0.013015594174386773]
step  22 :  [-0.030887636121093166]
step  23 :  [-0.014951913988551285]
step  24 :  [-0.027307960190962044]
episode  164 : steps 25 , return [-15.99]
step  0 :  [-1.7324106826789603]
step  1 :  [-1.6910501821638335]
step  2 :  [-1.6419585787171]
step  3 :  [-1.592813628979229]
step  4 :  [-1.5504226005125952]
step  5 :  [-1.4785542743942466]
step  6 :  [-1.3797730307891425]
step  7 :  [-1.2584684246149873]
step  8 :  [-1.1191037411733467]
step  9 :  [-0.965617281659049]
step  10 :  [-0.8012984201765764]
step  11 :  [-0.6357809976636245]
step  12 :  [-0.475198373210349]
step  13 :  [-0.3485031715025035]
step  14 :  [-0.21935518179316738]
step  15 :  [-0.10591614210356567]
step  16 :  [-0.034562054221696684]
step  17 :  [-0.07992058950849987]
step  18 :  [-0.08680783058230374]
step  19 :  [-0.06659248112299186]
step  20 :  [-0.02166082539375952]
step  21 :  [-0.024742095096961923]
step  22 :  [-0.09465561480254311]
step  23 :  [-0.13407667880417476]
step  24 :  [-0.12153886462345692]
episode  165 : steps 25 , return [-17.66]
step  0 :  [-1.8182241521843046]
step  1 :  [-1.782956818803783]
step  2 :  [-1.7420087731300176]
step  3 :  [-1.702475214476897]
step  4 :  [-1.6305178894514274]
step  5 :  [-1.5304600107733197]
step  6 :  [-1.407474365036023]
step  7 :  [-1.2663538331691255]
step  8 :  [-1.1111451887697643]
step  9 :  [-0.9451190696452236]
step  10 :  [-0.7802365632663745]
step  11 :  [-0.6102609922249809]
step  12 :  [-0.4736329924407988]
step  13 :  [-0.3840336511704413]
step  14 :  [-0.3001405854791347]
step  15 :  [-0.20356420634735137]
step  16 :  [-0.0906744652767563]
step  17 :  [-0.06298858002738456]
step  18 :  [-0.06884334367818025]
step  19 :  [-0.02512511581689918]
step  20 :  [-0.040652024256404816]
step  21 :  [-0.0160145912747319]
step  22 :  [-0.04331183300829727]
step  23 :  [-0.053673452649108944]
step  24 :  [-0.018480324261350187]
episode  166 : steps 25 , return [-18.11]
step  0 :  [-1.6232096753457768]
step  1 :  [-1.5850806410043663]
step  2 :  [-1.5408821874185483]
step  3 :  [-1.4984825501038563]
step  4 :  [-1.4253079796292034]
step  5 :  [-1.3247808494203421]
step  6 :  [-1.2016633423022784]
step  7 :  [-1.060554574962769]
step  8 :  [-0.905406071601149]
step  9 :  [-0.7883441854858169]
step  10 :  [-0.655772803702765]
step  11 :  [-0.5402939699640074]
step  12 :  [-0.45800667495092323]
step  13 :  [-0.3764121641878478]
step  14 :  [-0.28295278357409603]
step  15 :  [-0.18252874740777514]
step  16 :  [-0.11005081923593477]
step  17 :  [-0.09120194803602491]
step  18 :  [-0.05671282629921149]
step  19 :  [-0.03131621504138027]
step  20 :  [-0.01409266420384676]
step  21 :  [-0.039858554049684664]
step  22 :  [-0.020523395658244032]
step  23 :  [-0.05613695723395758]
step  24 :  [-0.035114725662275637]
episode  167 : steps 25 , return [-15.9]
step  0 :  [-1.6119779805308696]
step  1 :  [-1.5733730185568173]
step  2 :  [-1.5285589436384934]
step  3 :  [-1.4854704251224573]
step  4 :  [-1.411870712973712]
step  5 :  [-1.3110695328096544]
step  6 :  [-1.1877694369881562]
step  7 :  [-1.0465369029058327]
step  8 :  [-0.8913054355610432]
step  9 :  [-0.7886583984613229]
step  10 :  [-0.6665778210675808]
step  11 :  [-0.5589575126858467]
step  12 :  [-0.48183030895399886]
step  13 :  [-0.4040712718477352]
step  14 :  [-0.31085396797878184]
step  15 :  [-0.21027679407926045]
step  16 :  [-0.09760626837323669]
step  17 :  [-0.05176913935472628]
step  18 :  [-0.04874742488437704]
step  19 :  [-0.017752447100445854]
step  20 :  [-0.022342151739953357]
step  21 :  [-0.013839167979228548]
step  22 :  [-0.01104572146346744]
step  23 :  [-0.05158016166075001]
step  24 :  [-0.050490571872166934]
episode  168 : steps 25 , return [-15.83]
step  0 :  [-1.6274611990992103]
step  1 :  [-1.5896678868903913]
step  2 :  [-1.545918222956936]
step  3 :  [-1.5040466088331164]
step  4 :  [-1.4312179608728033]
step  5 :  [-1.3309256724108667]
step  6 :  [-1.2079719639509219]
step  7 :  [-1.0669791302101672]
step  8 :  [-0.9119121968403806]
step  9 :  [-0.7880013006025192]
step  10 :  [-0.6506137473538088]
step  11 :  [-0.5306552863464802]
step  12 :  [-0.44487942565187133]
step  13 :  [-0.360657271369931]
step  14 :  [-0.2661226525850832]
step  15 :  [-0.16547055492277235]
step  16 :  [-0.050292718776007515]
step  17 :  [-0.028978561207546057]
step  18 :  [-0.033251496031585365]
step  19 :  [-0.02449200296892961]
step  20 :  [-0.017616419875564376]
step  21 :  [-0.045032531664109234]
step  22 :  [-0.027242685141795075]
step  23 :  [-0.057669454678611946]
step  24 :  [-0.03554220997808445]
episode  169 : steps 25 , return [-15.74]
step  0 :  [-1.784030342530367]
step  1 :  [-1.750738088957601]
step  2 :  [-1.7126190271689947]
step  3 :  [-1.676740711779343]
step  4 :  [-1.607449476318133]
step  5 :  [-1.509355941595535]
step  6 :  [-1.3878327862417217]
step  7 :  [-1.2478082760934923]
step  8 :  [-1.0934198203897032]
step  9 :  [-0.9279963441766048]
step  10 :  [-0.7712551357840268]
step  11 :  [-0.6110410293422806]
step  12 :  [-0.4625622175077226]
step  13 :  [-0.3499369869869108]
step  14 :  [-0.2447060521187073]
step  15 :  [-0.13907527581485893]
step  16 :  [-0.019246960172681783]
step  17 :  [-0.06005620585792878]
step  18 :  [-0.12635453129653762]
step  19 :  [-0.13733613714296855]
step  20 :  [-0.11931269794847026]
step  21 :  [-0.07555179088712731]
step  22 :  [-0.06345970814410246]
step  23 :  [-0.03357784454304674]
step  24 :  [-0.03373300652315661]
episode  170 : steps 25 , return [-17.95]
step  0 :  [-1.748909560123595]
step  1 :  [-1.7147797798597024]
step  2 :  [-1.675632239189634]
step  3 :  [-1.6386896137789344]
step  4 :  [-1.5687865305110569]
step  5 :  [-1.4703221106084092]
step  6 :  [-1.3485629146667075]
step  7 :  [-1.2083811033067986]
step  8 :  [-1.053882738960411]
step  9 :  [-0.8883780626765804]
step  10 :  [-0.7671718079735169]
step  11 :  [-0.6355045723087613]
step  12 :  [-0.5066339823322589]
step  13 :  [-0.40550729181499545]
step  14 :  [-0.2980564605558227]
step  15 :  [-0.1963589589213728]
step  16 :  [-0.08492540371979805]
step  17 :  [-0.03315880606801606]
step  18 :  [-0.029608690541789523]
step  19 :  [-0.03582543902895316]
step  20 :  [-0.07658062299732438]
step  21 :  [-0.10268003957766346]
step  22 :  [-0.0746987944129825]
step  23 :  [-0.0054442520176952005]
step  24 :  [-0.009344858060404049]
episode  171 : steps 25 , return [-17.58]
step  0 :  [-1.6825885118587203]
step  1 :  [-1.640642066090211]
step  2 :  [-1.590908105064394]
step  3 :  [-1.541249750414084]
step  4 :  [-1.498678803815352]
step  5 :  [-1.4269705080442094]
step  6 :  [-1.3284713847757432]
step  7 :  [-1.2074894004635088]
step  8 :  [-1.0684661440641885]
step  9 :  [-0.9153510088111861]
step  10 :  [-0.7615973810996614]
step  11 :  [-0.6032806173951066]
step  12 :  [-0.4462018174316499]
step  13 :  [-0.32006148078269075]
step  14 :  [-0.20616797766852857]
step  15 :  [-0.07484588568982188]
step  16 :  [-0.0537806835338631]
step  17 :  [-0.09480557757973142]
step  18 :  [-0.09814514327106798]
step  19 :  [-0.06222663842817234]
step  20 :  [-0.06742097915916112]
step  21 :  [-0.0857804454736634]
step  22 :  [-0.06927200442866074]
step  23 :  [-0.022745080546136488]
step  24 :  [-0.02426344518802755]
episode  172 : steps 25 , return [-16.89]
step  0 :  [-1.585282595780641]
step  1 :  [-1.553493199995522]
step  2 :  [-1.5182146061793385]
step  3 :  [-1.4483059780648724]
step  4 :  [-1.349182853187811]
step  5 :  [-1.2266122331669573]
step  6 :  [-1.0857191617335473]
step  7 :  [-0.9307590964079511]
step  8 :  [-0.795581652422399]
step  9 :  [-0.8073564611065803]
step  10 :  [-0.9159784911210136]
step  11 :  [-0.9872481388977649]
step  12 :  [-0.9910275418894877]
step  13 :  [-0.9440580040939929]
step  14 :  [-0.8681941247800794]
step  15 :  [-0.8462023184125554]
step  16 :  [-0.8854925106342562]
step  17 :  [-0.9295984483157662]
step  18 :  [-0.9306148453209758]
step  19 :  [-0.8928289618776432]
step  20 :  [-0.8466854941201797]
step  21 :  [-0.7851962682966257]
step  22 :  [-0.6941051416787573]
step  23 :  [-0.5818773623729679]
step  24 :  [-0.4576490923258741]
episode  173 : steps 25 , return [-24.86]
step  0 :  [-1.4700914769087694]
step  1 :  [-1.4286654604868618]
step  2 :  [-1.3805393729700628]
step  3 :  [-1.3343646063637944]
step  4 :  [-1.2593392261030651]
step  5 :  [-1.1578922422430449]
step  6 :  [-1.0343189919369165]
step  7 :  [-0.8929908727827851]
step  8 :  [-0.8011963113545298]
step  9 :  [-0.6880956851603341]
step  10 :  [-0.5908245385430672]
step  11 :  [-0.5224705461865065]
step  12 :  [-0.4513616024027013]
step  13 :  [-0.3631057030924535]
step  14 :  [-0.26599519133671656]
step  15 :  [-0.17033605694949408]
step  16 :  [-0.07837685277875217]
step  17 :  [-0.034969479503757665]
step  18 :  [-0.03325796676904957]
step  19 :  [-0.0428247528450723]
step  20 :  [-0.01343050123034468]
step  21 :  [-0.05804135321252446]
step  22 :  [-0.06145135163605206]
step  23 :  [-0.06439192423257334]
step  24 :  [-0.023157510994394555]
episode  174 : steps 25 , return [-14.22]
step  0 :  [-1.6110833611164967]
step  1 :  [-1.5828938619637516]
step  2 :  [-1.5524375499747622]
step  3 :  [-1.4857199832950847]
step  4 :  [-1.3887454572854503]
step  5 :  [-1.2676108665311197]
step  6 :  [-1.1276221402785995]
step  7 :  [-0.9731152094744571]
step  8 :  [-0.8075259505997323]
step  9 :  [-0.728560349840865]
step  10 :  [-0.6404013856130955]
step  11 :  [-0.548621860230527]
step  12 :  [-0.47141872287069203]
step  13 :  [-0.3836485465284623]
step  14 :  [-0.29173386304384813]
step  15 :  [-0.18507382444891804]
step  16 :  [-0.0931847705862803]
step  17 :  [-0.054369792483514576]
step  18 :  [-0.04847071499215801]
step  19 :  [-0.017305150264464886]
step  20 :  [-0.0478130678165733]
step  21 :  [-0.04668716924691716]
step  22 :  [-0.022151475229001374]
step  23 :  [-0.024525684899310455]
step  24 :  [-0.035482786146936465]
episode  175 : steps 25 , return [-15.44]
step  0 :  [-1.6834996987807367]
step  1 :  [-1.6586882854999512]
step  2 :  [-1.6325300840878325]
step  3 :  [-1.568577947543208]
step  4 :  [-1.4734668335833427]
step  5 :  [-1.3536333278252553]
step  6 :  [-1.2145765204002725]
step  7 :  [-1.0607467327332545]
step  8 :  [-0.8956478897566604]
step  9 :  [-0.7619550659892934]
step  10 :  [-0.6202906757891292]
step  11 :  [-0.481619490177567]
step  12 :  [-0.37227632677554195]
step  13 :  [-0.2587041812213248]
step  14 :  [-0.15416460207571067]
step  15 :  [-0.045696280966126795]
step  16 :  [-0.06662453690740239]
step  17 :  [-0.0573353733915287]
step  18 :  [-0.012355394142886273]
step  19 :  [-0.011087220012732086]
step  20 :  [-0.05421323654644177]
step  21 :  [-0.0418302470184822]
step  22 :  [-0.0793527481439515]
step  23 :  [-0.06785662352837235]
step  24 :  [-0.012223416293297379]
episode  176 : steps 25 , return [-15.64]
step  0 :  [-1.7607305659561536]
step  1 :  [-1.7199466957193854]
step  2 :  [-1.6715618218239987]
step  3 :  [-1.6231403480809186]
step  4 :  [-1.5813642745806618]
step  5 :  [-1.5097761990925973]
step  6 :  [-1.4111140011069354]
step  7 :  [-1.2898473924226257]
step  8 :  [-1.1504764952689952]
step  9 :  [-0.9969543458467535]
step  10 :  [-0.8325699564889792]
step  11 :  [-0.6837371945930008]
step  12 :  [-0.5315908719870187]
step  13 :  [-0.38400953514413066]
step  14 :  [-0.26350952403728395]
step  15 :  [-0.14684750238808644]
step  16 :  [-0.03625864882980952]
step  17 :  [-0.03103619146446241]
step  18 :  [-0.04369808511646833]
step  19 :  [-0.006957753241004583]
step  20 :  [-0.028437232142580354]
step  21 :  [-0.006697083829899795]
step  22 :  [-0.021838208142570772]
step  23 :  [-0.014301870615600688]
step  24 :  [-0.051615688479913976]
episode  177 : steps 25 , return [-17.8]
step  0 :  [-1.4413590404992027]
step  1 :  [-1.403940248026041]
step  2 :  [-1.3615598170981462]
step  3 :  [-1.3227851410275493]
step  4 :  [-1.2530726652558535]
step  5 :  [-1.155554416316044]
step  6 :  [-1.0350008474248402]
step  7 :  [-0.8961170896274262]
step  8 :  [-0.7844334011332629]
step  9 :  [-0.6604739654378461]
step  10 :  [-0.5332631519728133]
step  11 :  [-0.41268736589926297]
step  12 :  [-0.3130375476886638]
step  13 :  [-0.2098224002204888]
step  14 :  [-0.09403469795428952]
step  15 :  [-0.055801658705530874]
step  16 :  [-0.03534537360784934]
step  17 :  [-0.059521127935297805]
step  18 :  [-0.04471022965088307]
step  19 :  [-0.021280381790365614]
step  20 :  [-0.06607981548711174]
step  21 :  [-0.07247652855511755]
step  22 :  [-0.04431525816997758]
step  23 :  [-0.07379718371694703]
step  24 :  [-0.053954607035589824]
episode  178 : steps 25 , return [-13.4]
step  0 :  [-1.7492686351053217]
step  1 :  [-1.7182913272937672]
step  2 :  [-1.6834694161665047]
step  3 :  [-1.6134363324229108]
step  4 :  [-1.554153073032956]
step  5 :  [-1.4648321405615143]
step  6 :  [-1.3505905361708026]
step  7 :  [-1.2164737675217225]
step  8 :  [-1.0668596254472094]
step  9 :  [-0.9053515729645493]
step  10 :  [-0.746414570361292]
step  11 :  [-0.5835167742418989]
step  12 :  [-0.42179343584140194]
step  13 :  [-0.2915693990110013]
step  14 :  [-0.15816681982524797]
step  15 :  [-0.048625013686816675]
step  16 :  [-0.031873858963025886]
step  17 :  [-0.031170584787596364]
step  18 :  [-0.08242604038644066]
step  19 :  [-0.1146687663842348]
step  20 :  [-0.10037509922011988]
step  21 :  [-0.04463173531773615]
step  22 :  [-0.02100908450600519]
step  23 :  [-0.03545434402529365]
step  24 :  [-0.020831739014335424]
episode  179 : steps 25 , return [-17.06]
step  0 :  [-1.7706308936439838]
step  1 :  [-1.739743719417362]
step  2 :  [-1.7049685964054953]
step  3 :  [-1.673252553401409]
step  4 :  [-1.6069476914813854]
step  5 :  [-1.51106702024121]
step  6 :  [-1.3912442991948588]
step  7 :  [-1.2525844071547048]
step  8 :  [-1.0993552449261081]
step  9 :  [-0.9349993262334857]
step  10 :  [-0.7622649636281127]
step  11 :  [-0.5883415005711375]
step  12 :  [-0.41779004387820035]
step  13 :  [-0.2816428383802428]
step  14 :  [-0.16165324242289622]
step  15 :  [-0.09190790674350896]
step  16 :  [-0.017671373336297546]
step  17 :  [-0.04000974257049367]
step  18 :  [-0.0295607897086424]
step  19 :  [-0.020079580161566163]
step  20 :  [-0.020699148876331702]
step  21 :  [-0.021419761470830127]
step  22 :  [-0.016249731552880026]
step  23 :  [-0.031026852772649223]
step  24 :  [-0.02759497465894174]
episode  180 : steps 25 , return [-17.21]
step  0 :  [-1.696816619314384]
step  1 :  [-1.6713586050573574]
step  2 :  [-1.644268016240027]
step  3 :  [-1.5796293257796472]
step  4 :  [-1.484004742109955]
step  5 :  [-1.3637798729057409]
step  6 :  [-1.224418315496666]
step  7 :  [-1.0703448772431547]
step  8 :  [-0.9050437199070129]
step  9 :  [-0.7712055381617696]
step  10 :  [-0.6285422752093044]
step  11 :  [-0.49323639046322215]
step  12 :  [-0.38936834087718436]
step  13 :  [-0.2836239089572676]
step  14 :  [-0.1860828546968943]
step  15 :  [-0.08190796690858569]
step  16 :  [-0.020040090614569774]
step  17 :  [-0.05090198392411206]
step  18 :  [-0.07662447934559151]
step  19 :  [-0.050020714223206045]
step  20 :  [-0.06744692294014631]
step  21 :  [-0.05650292962786988]
step  22 :  [-0.005044259424822933]
step  23 :  [-0.009459874419058134]
step  24 :  [-0.043639143037659256]
episode  181 : steps 25 , return [-15.85]
step  0 :  [-1.4380991590342194]
step  1 :  [-1.3982451301129297]
step  2 :  [-1.3524798779205773]
step  3 :  [-1.3095221774144814]
step  4 :  [-1.2369009580970365]
step  5 :  [-1.1372640068449205]
step  6 :  [-1.015078716775722]
step  7 :  [-0.8748437541062252]
step  8 :  [-0.7976266543298021]
step  9 :  [-0.6984805992502235]
step  10 :  [-0.5972675559877386]
step  11 :  [-0.5000127450139918]
step  12 :  [-0.4180111231572304]
step  13 :  [-0.3388414842766389]
step  14 :  [-0.25670530123181656]
step  15 :  [-0.1622204371632956]
step  16 :  [-0.07731081197084325]
step  17 :  [-0.06349191135242618]
step  18 :  [-0.06811667883604487]
step  19 :  [-0.06110226435857743]
step  20 :  [-0.06829513842357314]
step  21 :  [-0.025285539315564754]
step  22 :  [-0.042921068096161634]
step  23 :  [-0.06319292529356635]
step  24 :  [-0.06564996440117958]
episode  182 : steps 25 , return [-14.07]
step  0 :  [-1.42428985043186]
step  1 :  [-1.3954150803997896]
step  2 :  [-1.3649472756610426]
step  3 :  [-1.2988564227716894]
step  4 :  [-1.2026496703457898]
step  5 :  [-1.082247561665183]
step  6 :  [-0.9429002556889493]
step  7 :  [-0.798360547646574]
step  8 :  [-0.6471485644219908]
step  9 :  [-0.5120563672268452]
step  10 :  [-0.41298757509325423]
step  11 :  [-0.31773740808557105]
step  12 :  [-0.23046524666425336]
step  13 :  [-0.13517960422248873]
step  14 :  [-0.07755982843309796]
step  15 :  [-0.035481295389792965]
step  16 :  [-0.013682901034088401]
step  17 :  [-0.03849559743959657]
step  18 :  [-0.04265259072127819]
step  19 :  [-0.005061836525591017]
step  20 :  [-0.02623543310341492]
step  21 :  [-0.013771995432829372]
step  22 :  [-0.024600724756660267]
step  23 :  [-0.02435234582121717]
step  24 :  [-0.02708210745998171]
episode  183 : steps 25 , return [-12.09]
step  0 :  [-1.6717671312659421]
step  1 :  [-1.6448741595512764]
step  2 :  [-1.6159311182849463]
step  3 :  [-1.5500796024680703]
step  4 :  [-1.4536274867424264]
step  5 :  [-1.332820454604844]
step  6 :  [-1.1930412647681672]
step  7 :  [-1.038666514859329]
step  8 :  [-0.873152081164403]
step  9 :  [-0.7762435774160774]
step  10 :  [-0.6605041637475274]
step  11 :  [-0.5482988111480923]
step  12 :  [-0.4473126534139798]
step  13 :  [-0.3658550523089212]
step  14 :  [-0.2766723142723664]
step  15 :  [-0.17064985366745944]
step  16 :  [-0.08533716860678603]
step  17 :  [-0.08853896139635367]
step  18 :  [-0.12686627704903972]
step  19 :  [-0.1332739604250277]
step  20 :  [-0.11031446410727817]
step  21 :  [-0.05441585735828911]
step  22 :  [-0.0701115804329147]
step  23 :  [-0.046607190973997736]
step  24 :  [-0.0712377117598466]
episode  184 : steps 25 , return [-16.41]
step  0 :  [-1.4201956018538189]
step  1 :  [-1.391886478364766]
step  2 :  [-1.3622182525418804]
step  3 :  [-1.2966980947577311]
step  4 :  [-1.200912301537881]
step  5 :  [-1.0808327363988266]
step  6 :  [-0.9417446500197312]
step  7 :  [-0.7969779703870354]
step  8 :  [-0.6460112277042346]
step  9 :  [-0.5393351883216271]
step  10 :  [-0.41991317975902215]
step  11 :  [-0.31567087227378854]
step  12 :  [-0.215715966977782]
step  13 :  [-0.09606708057177579]
step  14 :  [-0.04224095016054741]
step  15 :  [-0.05103274459563262]
step  16 :  [-0.05642337591008809]
step  17 :  [-0.05519769805659785]
step  18 :  [-0.08583905302017257]
step  19 :  [-0.08399076573679709]
step  20 :  [-0.04919821155145302]
step  21 :  [-0.046364420837223023]
step  22 :  [-0.015299545687917573]
step  23 :  [-0.03793087474006376]
step  24 :  [-0.012500118253054136]
episode  185 : steps 25 , return [-12.26]
step  0 :  [-1.538970944844089]
step  1 :  [-1.5012655444834846]
step  2 :  [-1.4580139918275168]
step  3 :  [-1.4173783313290202]
step  4 :  [-1.3458249429783684]
step  5 :  [-1.2466640869559]
step  6 :  [-1.1246656621835949]
step  7 :  [-0.984469156179426]
step  8 :  [-0.8300722508358979]
step  9 :  [-0.7435904701275935]
step  10 :  [-0.6440684909910156]
step  11 :  [-0.5378850983197666]
step  12 :  [-0.43616736413865176]
step  13 :  [-0.34787001448285176]
step  14 :  [-0.2507331249711973]
step  15 :  [-0.13781279310081693]
step  16 :  [-0.08822733450972332]
step  17 :  [-0.026158553039758635]
step  18 :  [-0.01234260082007078]
step  19 :  [-0.01838820980688322]
step  20 :  [-0.07583618658374908]
step  21 :  [-0.11253747547301886]
step  22 :  [-0.10059417485623331]
step  23 :  [-0.08026025001552427]
step  24 :  [-0.02424557066118984]
episode  186 : steps 25 , return [-15.08]
step  0 :  [-1.4794242399066075]
step  1 :  [-1.4491949508435962]
step  2 :  [-1.4165684458304162]
step  3 :  [-1.3487901454276716]
step  4 :  [-1.2512830989613681]
step  5 :  [-1.1298783938557428]
step  6 :  [-0.9897539943402917]
step  7 :  [-0.8351817898925455]
step  8 :  [-0.7879893311266405]
step  9 :  [-0.7072346742958261]
step  10 :  [-0.622764344813931]
step  11 :  [-0.5380897844373185]
step  12 :  [-0.4651692595775617]
step  13 :  [-0.3824540604478114]
step  14 :  [-0.2869103595879666]
step  15 :  [-0.1781114466241305]
step  16 :  [-0.06487327039844044]
step  17 :  [-0.010530094414107903]
step  18 :  [-0.017543498426427547]
step  19 :  [-0.03163616780276553]
step  20 :  [-0.028337301358931536]
step  21 :  [-0.01734019332936658]
step  22 :  [-0.05142460013102988]
step  23 :  [-0.03404662401543668]
step  24 :  [-0.056007436636452024]
episode  187 : steps 25 , return [-14.18]
step  0 :  [-1.6795286421341828]
step  1 :  [-1.6418924913777178]
step  2 :  [-1.5981587635413]
step  3 :  [-1.5559760434310723]
step  4 :  [-1.5220837011980923]
step  5 :  [-1.4565935047213774]
step  6 :  [-1.362790185500977]
step  7 :  [-1.245591828350245]
step  8 :  [-1.109874113028836]
step  9 :  [-0.9599578223893326]
step  10 :  [-0.7995994041991626]
step  11 :  [-0.632312732274944]
step  12 :  [-0.46234560360698407]
step  13 :  [-0.32215624119610103]
step  14 :  [-0.17152898876856457]
step  15 :  [-0.039619984696081134]
step  16 :  [-0.04618302059848403]
step  17 :  [-0.059875291413489816]
step  18 :  [-0.02029931902473762]
step  19 :  [-0.04062546640125938]
step  20 :  [-0.07191552719326078]
step  21 :  [-0.07437650422829156]
step  22 :  [-0.03382550083037449]
step  23 :  [-0.04685903489010071]
step  24 :  [-0.012456278216070817]
episode  188 : steps 25 , return [-16.97]
step  0 :  [-1.7627367115350792]
step  1 :  [-1.7223886905741321]
step  2 :  [-1.6746022220055838]
step  3 :  [-1.6269137135686895]
step  4 :  [-1.5859723873736022]
step  5 :  [-1.514964556472833]
step  6 :  [-1.4167246708782861]
step  7 :  [-1.2957819950723508]
step  8 :  [-1.1566758184921535]
step  9 :  [-1.0033884915167137]
step  10 :  [-0.8392366500151142]
step  11 :  [-0.6881705264611825]
step  12 :  [-0.532536153681199]
step  13 :  [-0.37957535852694435]
step  14 :  [-0.25399436543254594]
step  15 :  [-0.13450921818719727]
step  16 :  [-0.08419312328627299]
step  17 :  [-0.03138992923174489]
step  18 :  [-0.01625062688837932]
step  19 :  [-0.00980883978243497]
step  20 :  [-0.05527241357779574]
step  21 :  [-0.04993242455352802]
step  22 :  [-0.05102741121653669]
step  23 :  [-0.012524806530154869]
step  24 :  [-0.06249378139396202]
episode  189 : steps 25 , return [-17.96]
step  0 :  [-1.7250941217907296]
step  1 :  [-1.6836671728753978]
step  2 :  [-1.6345080288589122]
step  3 :  [-1.5853201043603466]
step  4 :  [-1.5429387036649653]
step  5 :  [-1.4711181081364582]
step  6 :  [-1.3723952936668034]
step  7 :  [-1.251150464186974]
step  8 :  [-1.1118452575059308]
step  9 :  [-0.9584204657822254]
step  10 :  [-0.794172120318535]
step  11 :  [-0.6279510677222697]
step  12 :  [-0.4666538408828919]
step  13 :  [-0.3392475424551451]
step  14 :  [-0.21000568234659592]
step  15 :  [-0.09770602088004805]
step  16 :  [-0.04883128824885182]
step  17 :  [-0.03486456176186704]
step  18 :  [-0.005005577990988809]
step  19 :  [-0.0796215012156769]
step  20 :  [-0.08909359624662816]
step  21 :  [-0.05685328281097603]
step  22 :  [-0.0023449239116925483]
step  23 :  [-0.04112583379450897]
step  24 :  [-0.045024812498905775]
episode  190 : steps 25 , return [-17.27]
step  0 :  [-1.6781009282027008]
step  1 :  [-1.6481183518710927]
step  2 :  [-1.6149291555574092]
step  3 :  [-1.5461666367445133]
step  4 :  [-1.4476949126245817]
step  5 :  [-1.3254951427936899]
step  6 :  [-1.1847957130033024]
step  7 :  [-1.02989479262413]
step  8 :  [-0.8642383549909681]
step  9 :  [-0.8288661985789199]
step  10 :  [-0.8606538933637017]
step  11 :  [-0.8514506029563048]
step  12 :  [-0.8031319966774128]
step  13 :  [-0.7258112583814754]
step  14 :  [-0.6298555856854371]
step  15 :  [-0.5271242439412342]
step  16 :  [-0.42870058600401373]
step  17 :  [-0.3217827543921741]
step  18 :  [-0.21159879858710762]
step  19 :  [-0.0943496043664716]
step  20 :  [-0.028079116567697227]
step  21 :  [-0.06449010621755567]
step  22 :  [-0.0901687355380954]
step  23 :  [-0.11970359138035315]
step  24 :  [-0.11767906077904336]
episode  191 : steps 25 , return [-19.04]
step  0 :  [-1.643001138852059]
step  1 :  [-1.6060993635440823]
step  2 :  [-1.5635233961202004]
step  3 :  [-1.523002483516473]
step  4 :  [-1.4510411832758887]
step  5 :  [-1.3513297181138089]
step  6 :  [-1.2287785591269373]
step  7 :  [-1.0880718648189238]
step  8 :  [-0.933211162156746]
step  9 :  [-0.787306761508155]
step  10 :  [-0.6341158214079726]
step  11 :  [-0.5010103118663424]
step  12 :  [-0.40590434022278066]
step  13 :  [-0.3149091041999833]
step  14 :  [-0.21549002541862758]
step  15 :  [-0.11777832135927342]
step  16 :  [-0.0727869521184073]
step  17 :  [-0.05729183462620811]
step  18 :  [-0.022654216679120417]
step  19 :  [-0.05362889791655703]
step  20 :  [-0.037199820748394896]
step  21 :  [-0.016055220525344638]
step  22 :  [-0.06969402677197811]
step  23 :  [-0.08332894105278324]
step  24 :  [-0.060169715579914476]
episode  192 : steps 25 , return [-15.84]
step  0 :  [-1.6249748815581948]
step  1 :  [-1.5877683251719703]
step  2 :  [-1.544842215637521]
step  3 :  [-1.5040063091661815]
step  4 :  [-1.4319057421469008]
step  5 :  [-1.332136348710687]
step  6 :  [-1.2095654726288265]
step  7 :  [-1.068856917553732]
step  8 :  [-0.9140023486356456]
step  9 :  [-0.7871494290384977]
step  10 :  [-0.6483160403558261]
step  11 :  [-0.5235094744827586]
step  12 :  [-0.43201082584695477]
step  13 :  [-0.34324923397357243]
step  14 :  [-0.24312699759915007]
step  15 :  [-0.13842617263760287]
step  16 :  [-0.08195601118836458]
step  17 :  [-0.08679605164324344]
step  18 :  [-0.05820391157998745]
step  19 :  [-0.05362223518528436]
step  20 :  [-0.029216019050154453]
step  21 :  [-0.04019533189995596]
step  22 :  [-0.013908657936978128]
step  23 :  [-0.03657302277465453]
step  24 :  [-0.008017581360554507]
episode  193 : steps 25 , return [-15.74]
step  0 :  [-1.7131724337942782]
step  1 :  [-1.6800880405084402]
step  2 :  [-1.6425082472678383]
step  3 :  [-1.6076977379700226]
step  4 :  [-1.5394330073567055]
step  5 :  [-1.4422348508642784]
step  6 :  [-1.321472814441657]
step  7 :  [-1.1820996710507818]
step  8 :  [-1.028286875031604]
step  9 :  [-0.8634054778154695]
step  10 :  [-0.7318273780723532]
step  11 :  [-0.5922614611311404]
step  12 :  [-0.4512046434707432]
step  13 :  [-0.3358988267158059]
step  14 :  [-0.21571542868689875]
step  15 :  [-0.10592822762105866]
step  16 :  [-0.031607020498190065]
step  17 :  [-0.07891158726807934]
step  18 :  [-0.08454352808847672]
step  19 :  [-0.05775274544474163]
step  20 :  [-0.017531816157525748]
step  21 :  [-0.0489316153647117]
step  22 :  [-0.03764715141096614]
step  23 :  [-0.010664434782736598]
step  24 :  [-0.028527704626148676]
episode  194 : steps 25 , return [-16.85]
step  0 :  [-1.6414740553766325]
step  1 :  [-1.6100565161161808]
step  2 :  [-1.5750484625499943]
step  3 :  [-1.5438366009325146]
step  4 :  [-1.478436619443304]
step  5 :  [-1.3835401569473305]
step  6 :  [-1.2646870533706729]
step  7 :  [-1.1269819720974308]
step  8 :  [-0.9747446101274887]
step  9 :  [-0.8115266954671458]
step  10 :  [-0.6454251274639042]
step  11 :  [-0.4769827432589059]
step  12 :  [-0.34124534872523865]
step  13 :  [-0.19346437548605383]
step  14 :  [-0.06518169323673029]
step  15 :  [-0.027639468310933283]
step  16 :  [-0.03955874531690017]
step  17 :  [-0.020372038381489332]
step  18 :  [-0.02532164514284641]
step  19 :  [-0.028962768315942227]
step  20 :  [-0.021688707697207755]
step  21 :  [-0.035685320005583006]
step  22 :  [-0.02201580651562869]
step  23 :  [-0.03268035335612155]
step  24 :  [-0.0679065791572138]
episode  195 : steps 25 , return [-15.45]
step  0 :  [-1.764502020221228]
step  1 :  [-1.7237620663351831]
step  2 :  [-1.675425768252141]
step  3 :  [-1.6270442721903935]
step  4 :  [-1.5852851761588391]
step  5 :  [-1.5136889491922079]
step  6 :  [-1.4150093471113534]
step  7 :  [-1.2937222384519622]
step  8 :  [-1.1543296596081352]
step  9 :  [-1.0007843768966767]
step  10 :  [-0.8363732987187149]
step  11 :  [-0.6891469567437292]
step  12 :  [-0.5376676359321929]
step  13 :  [-0.38945657156499025]
step  14 :  [-0.26799642160350867]
step  15 :  [-0.15109321906205678]
step  16 :  [-0.04401658736630674]
step  17 :  [-0.04650953405532427]
step  18 :  [-0.03416501449219585]
step  19 :  [-0.01678648305125232]
step  20 :  [-0.06218454805661754]
step  21 :  [-0.0585080834828269]
step  22 :  [-0.09117886021692165]
step  23 :  [-0.0964427186827843]
step  24 :  [-0.06489148916362444]
episode  196 : steps 25 , return [-18.14]
step  0 :  [-1.6755259776465032]
step  1 :  [-1.6324925940425505]
step  2 :  [-1.5812672533933867]
step  3 :  [-1.529786650014081]
step  4 :  [-1.485152753618292]
step  5 :  [-1.412029457022953]
step  6 :  [-1.3125104344874796]
step  7 :  [-1.1907500053643314]
step  8 :  [-1.0510895088949093]
step  9 :  [-0.8974024612704322]
step  10 :  [-0.7643237978199131]
step  11 :  [-0.6232651062953475]
step  12 :  [-0.48157261150081143]
step  13 :  [-0.3513577595313158]
step  14 :  [-0.24764627536910166]
step  15 :  [-0.14478989433264325]
step  16 :  [-0.09304923979137662]
step  17 :  [-0.06391601335993095]
step  18 :  [-0.0448992981965062]
step  19 :  [-0.01507967271647931]
step  20 :  [-0.008218261789038958]
step  21 :  [-0.03188709777588658]
step  22 :  [-0.018480208176361295]
step  23 :  [-0.04897085752878447]
step  24 :  [-0.03198244203464448]
episode  197 : steps 25 , return [-16.74]
step  0 :  [-1.8070306103873395]
step  1 :  [-1.7677595320191233]
step  2 :  [-1.7213222242441113]
step  3 :  [-1.6750726568130347]
step  4 :  [-1.6354611335853322]
step  5 :  [-1.5651653904103904]
step  6 :  [-1.46732108338748]
step  7 :  [-1.3466043562094814]
step  8 :  [-1.207628133259562]
step  9 :  [-1.0544112317178485]
step  10 :  [-0.8902839932987338]
step  11 :  [-0.7305029180549762]
step  12 :  [-0.5660328139913609]
step  13 :  [-0.40139442994325053]
step  14 :  [-0.2675901683399923]
step  15 :  [-0.12977174256969923]
step  16 :  [-0.030643768082719524]
step  17 :  [-0.05771682522972352]
step  18 :  [-0.06607565808688967]
step  19 :  [-0.038107061893984925]
step  20 :  [-0.030741800023016345]
step  21 :  [-0.03364591842379536]
step  22 :  [-0.04288512143863018]
step  23 :  [-0.033425344374921395]
step  24 :  [-0.01848109791491624]
episode  198 : steps 25 , return [-18.59]
step  0 :  [-1.4829509413811197]
step  1 :  [-1.4526122646130932]
step  2 :  [-1.4198171829523398]
step  3 :  [-1.3519115856235313]
step  4 :  [-1.2543096595087022]
step  5 :  [-1.1328350027864789]
step  6 :  [-0.9926603620026357]
step  7 :  [-0.8380547060972292]
step  8 :  [-0.7882314735732597]
step  9 :  [-0.7053133225080539]
step  10 :  [-0.6203168026076811]
step  11 :  [-0.5364894813706409]
step  12 :  [-0.4659377480819837]
step  13 :  [-0.402072897435663]
step  14 :  [-0.3223524970079069]
step  15 :  [-0.2217011610814749]
step  16 :  [-0.10413356700573963]
step  17 :  [-0.016082350954055472]
step  18 :  [-0.009842914621632575]
step  19 :  [-0.02062583467362924]
step  20 :  [-0.032732322695030874]
step  21 :  [-0.027424692760034765]
step  22 :  [-0.061281823361498566]
step  23 :  [-0.060675723847559045]
step  24 :  [-0.04966407030182704]
episode  199 : steps 25 , return [-14.37]
step  0 :  [-1.6664741907398979]
step  1 :  [-1.635886114258693]
step  2 :  [-1.6019139931456663]
step  3 :  [-1.532655630479693]
step  4 :  [-1.4338644963256988]
step  5 :  [-1.3114630501097215]
step  6 :  [-1.170649260891899]
step  7 :  [-1.0157092312454463]
step  8 :  [-0.8500939729060677]
step  9 :  [-0.8294290889752155]
step  10 :  [-0.8844890458213827]
step  11 :  [-0.900587849793353]
step  12 :  [-0.8681074111544749]
step  13 :  [-0.7987378752497113]
step  14 :  [-0.7029002250308706]
step  15 :  [-0.5903820235494767]
step  16 :  [-0.47252423440606495]
step  17 :  [-0.36335391718404864]
step  18 :  [-0.2573139065764643]
step  19 :  [-0.15437894170688546]
step  20 :  [-0.09897379040825588]
step  21 :  [-0.08753517217789027]
step  22 :  [-0.07257146337097757]
step  23 :  [-0.06795768625799793]
step  24 :  [-0.020534518501665232]
episode  200 : steps 25 , return [-19.39]
step  0 :  [-1.5034259920339095]
step  1 :  [-1.4643844796990757]
step  2 :  [-1.4194355212557617]
step  3 :  [-1.376962187347944]
step  4 :  [-1.304314442911009]
step  5 :  [-1.2044638374983079]
step  6 :  [-1.082005984691208]
step  7 :  [-0.9414854532053957]
step  8 :  [-0.7992324232648179]
step  9 :  [-0.6500038807830817]
step  10 :  [-0.5218239328140211]
step  11 :  [-0.43090051112099653]
step  12 :  [-0.3430374591752313]
step  13 :  [-0.2502130837889358]
step  14 :  [-0.1534848304553015]
step  15 :  [-0.05268717820827828]
step  16 :  [-0.07535409005336978]
step  17 :  [-0.05945736954709649]
step  18 :  [-0.004387440211048312]
step  19 :  [-0.015149381740245526]
step  20 :  [-0.06362431899064873]
step  21 :  [-0.05732191172797238]
step  22 :  [-0.031490454076182534]
step  23 :  [-0.03394118807597951]
step  24 :  [-0.05660728846802142]
episode  201 : steps 25 , return [-13.9]
step  0 :  [-1.508514101005861]
step  1 :  [-1.468058756432664]
step  2 :  [-1.4211117774345599]
step  3 :  [-1.3761090940393292]
step  4 :  [-1.3406530169040614]
step  5 :  [-1.2752397730038318]
step  6 :  [-1.1822442425401483]
step  7 :  [-1.0662622463831561]
step  8 :  [-0.9321389439260759]
step  9 :  [-0.784396983846801]
step  10 :  [-0.6273787525900337]
step  11 :  [-0.46625172779112317]
step  12 :  [-0.33235699848259104]
step  13 :  [-0.18805974879174867]
step  14 :  [-0.05752692313399363]
step  15 :  [-0.031114436720313554]
step  16 :  [-0.01600685559064456]
step  17 :  [-0.025513399172772518]
step  18 :  [-0.0017088812531354657]
step  19 :  [-0.02883520124496844]
step  20 :  [-0.007895989000714594]
step  21 :  [-0.03235108497986995]
step  22 :  [-0.012635610577836414]
step  23 :  [-0.03469200208121518]
step  24 :  [-0.015316989715181837]
episode  202 : steps 25 , return [-14.23]
step  0 :  [-1.6445352042957635]
step  1 :  [-1.6015467228045734]
step  2 :  [-1.5504968975584486]
step  3 :  [-1.4994245696055368]
step  4 :  [-1.4555432478782333]
step  5 :  [-1.3831415211360896]
step  6 :  [-1.2842630892784865]
step  7 :  [-1.1630692473023574]
step  8 :  [-1.0239293836196082]
step  9 :  [-0.8707594880756617]
step  10 :  [-0.7408948694856256]
step  11 :  [-0.6013070019561761]
step  12 :  [-0.45798274411314516]
step  13 :  [-0.32384131319147963]
step  14 :  [-0.21537055987047388]
step  15 :  [-0.10961477766771921]
step  16 :  [-0.05438519175592646]
step  17 :  [-0.06570322469322594]
step  18 :  [-0.03176151657159162]
step  19 :  [-0.05242047154972038]
step  20 :  [-0.03828562038596713]
step  21 :  [-0.052336030189533894]
step  22 :  [-0.04728256439329593]
step  23 :  [-0.06146904751490533]
step  24 :  [-0.03126101026658556]
episode  203 : steps 25 , return [-16.36]
step  0 :  [-1.6205868841623927]
step  1 :  [-1.5963465622065987]
step  2 :  [-1.5712301970972151]
step  3 :  [-1.5081938756600595]
step  4 :  [-1.413849170243729]
step  5 :  [-1.2946541098370588]
step  6 :  [-1.1561398763371713]
step  7 :  [-1.0027917071429286]
step  8 :  [-0.8381541105279067]
step  9 :  [-0.6993940263099487]
step  10 :  [-0.5542937833138251]
step  11 :  [-0.4098047516595654]
step  12 :  [-0.2909428838062095]
step  13 :  [-0.17742090215297693]
step  14 :  [-0.05516982776050077]
step  15 :  [-0.015281647776612409]
step  16 :  [-0.0180892689612582]
step  17 :  [-0.02746517674183615]
step  18 :  [-0.039855091157301854]
step  19 :  [-0.04488168451908036]
step  20 :  [-0.027001863287718128]
step  21 :  [-0.01103430828544134]
step  22 :  [-0.04497411548767347]
step  23 :  [-0.05550769255780026]
step  24 :  [-0.03375421824863729]
episode  204 : steps 25 , return [-14.51]
step  0 :  [-1.5934262148959741]
step  1 :  [-1.5492579274446674]
step  2 :  [-1.4967507972689207]
step  3 :  [-1.4441773320483855]
step  4 :  [-1.399023001982295]
step  5 :  [-1.3260560149290546]
step  6 :  [-1.2269517036787372]
step  7 :  [-1.1057038337678262]
step  8 :  [-0.9666087134121483]
step  9 :  [-0.81356116099161]
step  10 :  [-0.6683306728998769]
step  11 :  [-0.5251018851809999]
step  12 :  [-0.39373820106572216]
step  13 :  [-0.2892990137292864]
step  14 :  [-0.18485994999591152]
step  15 :  [-0.06911343101700547]
step  16 :  [-0.056331122290839065]
step  17 :  [-0.039185447997733595]
step  18 :  [-0.07021562162414521]
step  19 :  [-0.051187323351414196]
step  20 :  [-0.014291883843005873]
step  21 :  [-0.010602441258644941]
step  22 :  [-0.04151800991362534]
step  23 :  [-0.03090947992520879]
step  24 :  [-0.047993628466094784]
episode  205 : steps 25 , return [-15.41]
step  0 :  [-1.742177603979363]
step  1 :  [-1.70489405937722]
step  2 :  [-1.6614214808529995]
step  3 :  [-1.6191916005867888]
step  4 :  [-1.5456505677527548]
step  5 :  [-1.4446222555497066]
step  6 :  [-1.3210247905409636]
step  7 :  [-1.1795168210763782]
step  8 :  [-1.0240744829823174]
step  9 :  [-0.8579368455576163]
step  10 :  [-0.7811077196759605]
step  11 :  [-0.6760959120535303]
step  12 :  [-0.5825003733469107]
step  13 :  [-0.5156818450172855]
step  14 :  [-0.43780858008999923]
step  15 :  [-0.3570126834079361]
step  16 :  [-0.2607852305099888]
step  17 :  [-0.1504650203833563]
step  18 :  [-0.035244334340732736]
step  19 :  [-0.02630726153248851]
step  20 :  [-0.022092930451388736]
step  21 :  [-0.024766107113823252]
step  22 :  [-0.023861807406688158]
step  23 :  [-0.007343591855377519]
step  24 :  [-0.04109594747289824]
episode  206 : steps 25 , return [-18.04]
step  0 :  [-1.6359631028677248]
step  1 :  [-1.609015466296763]
step  2 :  [-1.580147282380352]
step  3 :  [-1.5144493129377228]
step  4 :  [-1.4181572253602868]
step  5 :  [-1.2974923553708329]
step  6 :  [-1.1578304876193175]
step  7 :  [-1.0035470763436336]
step  8 :  [-0.8380977335728088]
step  9 :  [-0.7584184030992104]
step  10 :  [-0.6618834806871134]
step  11 :  [-0.5596385110722474]
step  12 :  [-0.4605939169684611]
step  13 :  [-0.3754008326481767]
step  14 :  [-0.2815187825395591]
step  15 :  [-0.17316673360144139]
step  16 :  [-0.0669737273994202]
step  17 :  [-0.016934135786043775]
step  18 :  [-0.03700447873647127]
step  19 :  [-0.039317737952430105]
step  20 :  [-0.04727871027474531]
step  21 :  [-0.021849985965362227]
step  22 :  [-0.03916999352161933]
step  23 :  [-0.03649504577709225]
step  24 :  [-0.04633968976268886]
episode  207 : steps 25 , return [-15.68]
step  0 :  [-1.784595144119817]
step  1 :  [-1.744883884213126]
step  2 :  [-1.697908887701927]
step  3 :  [-1.6511104193444812]
step  4 :  [-1.6110319602829148]
step  5 :  [-1.5405203150499167]
step  6 :  [-1.4425818229943015]
step  7 :  [-1.3218327259013924]
step  8 :  [-1.1828582765386992]
step  9 :  [-1.0296660805345246]
step  10 :  [-0.8655863493862891]
step  11 :  [-0.7128147677080685]
step  12 :  [-0.553402367492954]
step  13 :  [-0.3927859931981833]
step  14 :  [-0.26089394098610824]
step  15 :  [-0.1431463908695113]
step  16 :  [-0.0644114811254978]
step  17 :  [-0.008071605361343501]
step  18 :  [-0.01715044107930992]
step  19 :  [-0.06527606783076494]
step  20 :  [-0.05964320767038619]
step  21 :  [-0.05064345245469669]
step  22 :  [-0.0545594837113304]
step  23 :  [-0.08014352677146011]
step  24 :  [-0.05037686961443492]
episode  208 : steps 25 , return [-18.39]
step  0 :  [-1.7454963981185652]
step  1 :  [-1.7051151206202957]
step  2 :  [-1.6573400108969474]
step  3 :  [-1.6097602683750056]
step  4 :  [-1.5690812334299635]
step  5 :  [-1.4983529844034937]
step  6 :  [-1.4003735618254658]
step  7 :  [-1.2796675697419664]
step  8 :  [-1.1407819674734234]
step  9 :  [-0.9877138687315496]
step  10 :  [-0.8238042705737018]
step  11 :  [-0.6659729483900922]
step  12 :  [-0.5063360897984622]
step  13 :  [-0.353416355585495]
step  14 :  [-0.22946966550883813]
step  15 :  [-0.11012677575854579]
step  16 :  [-0.05650796047857719]
step  17 :  [-0.05227286667915016]
step  18 :  [-0.012715196531895675]
step  19 :  [-0.023334816958901286]
step  20 :  [-0.014090323904560066]
step  21 :  [-0.01713795449411428]
step  22 :  [-0.04316301917911462]
step  23 :  [-0.04481783434219841]
step  24 :  [-0.00471439429245549]
episode  209 : steps 25 , return [-17.55]
step  0 :  [-1.4162432750075118]
step  1 :  [-1.3848422763688066]
step  2 :  [-1.3509425300579683]
step  3 :  [-1.2825266889879834]
step  4 :  [-1.1846884335996317]
step  5 :  [-1.0631076024919386]
step  6 :  [-0.9228890788812081]
step  7 :  [-0.8013325355710298]
step  8 :  [-0.6648861351746154]
step  9 :  [-0.5518871472097189]
step  10 :  [-0.4746811140267997]
step  11 :  [-0.3975216904762033]
step  12 :  [-0.3109848096675918]
step  13 :  [-0.21587900387864595]
step  14 :  [-0.1042390774968574]
step  15 :  [-0.045421148578410425]
step  16 :  [-0.044717774513552744]
step  17 :  [-0.027248635901783825]
step  18 :  [-0.05675698092452293]
step  19 :  [-0.07141303626953853]
step  20 :  [-0.04612433071582071]
step  21 :  [-0.021015031793424593]
step  22 :  [-0.023217399164204296]
step  23 :  [-0.03732569329303086]
step  24 :  [-0.02386278050198523]
episode  210 : steps 25 , return [-12.52]
step  0 :  [-1.7105141001520432]
step  1 :  [-1.6798574707302094]
step  2 :  [-1.6456189250674584]
step  3 :  [-1.6149088618633485]
step  4 :  [-1.5495628288052152]
step  5 :  [-1.4545329969877006]
step  6 :  [-1.3354625881969258]
step  7 :  [-1.1974902809681696]
step  8 :  [-1.0449315418360265]
step  9 :  [-0.8812974486816827]
step  10 :  [-0.7160415943850079]
step  11 :  [-0.5457587849375826]
step  12 :  [-0.3744202180828738]
step  13 :  [-0.23469150071077585]
step  14 :  [-0.11757181685270456]
step  15 :  [-0.04069184101187461]
step  16 :  [-0.033367932631707856]
step  17 :  [-0.02352235262966405]
step  18 :  [-0.06488157836958972]
step  19 :  [-0.04693812664924266]
step  20 :  [-0.03411273371483826]
step  21 :  [-0.032571480840450015]
step  22 :  [-0.028973043114996856]
step  23 :  [-0.039983458395312484]
step  24 :  [-0.0279770571087201]
episode  211 : steps 25 , return [-16.48]
step  0 :  [-1.5917747285234853]
step  1 :  [-1.5588133434919504]
step  2 :  [-1.521892896575481]
step  3 :  [-1.4886796172707668]
step  4 :  [-1.4220894391826802]
step  5 :  [-1.3264348659959382]
step  6 :  [-1.2070637558132193]
step  7 :  [-1.068977131799821]
step  8 :  [-0.9164349375076433]
step  9 :  [-0.7551726036673765]
step  10 :  [-0.5899446439594187]
step  11 :  [-0.4252925363024933]
step  12 :  [-0.2926103281870805]
step  13 :  [-0.175843968331164]
step  14 :  [-0.10604138538410339]
step  15 :  [-0.03692641710884121]
step  16 :  [-0.015102816030220671]
step  17 :  [-0.02706875731838706]
step  18 :  [-0.03926627884942126]
step  19 :  [-0.03687068839581103]
step  20 :  [-0.0532255649415663]
step  21 :  [-0.058928795417961616]
step  22 :  [-0.049207989993321426]
step  23 :  [-0.017759129137738562]
step  24 :  [-0.052270527833722644]
episode  212 : steps 25 , return [-14.83]
step  0 :  [-1.6194029283566558]
step  1 :  [-1.5941119256049947]
step  2 :  [-1.5293875601267095]
step  3 :  [-1.4724988239227994]
step  4 :  [-1.3839223171580217]
step  5 :  [-1.2696149732524988]
step  6 :  [-1.135035190874258]
step  7 :  [-0.9847501929041059]
step  8 :  [-0.8224243767655463]
step  9 :  [-0.6976169426701404]
step  10 :  [-0.569199570089118]
step  11 :  [-0.44433378934116036]
step  12 :  [-0.34197455876078414]
step  13 :  [-0.24554551061319024]
step  14 :  [-0.1589856878761253]
step  15 :  [-0.08848441110637072]
step  16 :  [-0.06576258188534598]
step  17 :  [-0.07253696306341746]
step  18 :  [-0.027619417350095075]
step  19 :  [-0.050270707533465624]
step  20 :  [-0.04867452023830809]
step  21 :  [-0.027757528355262587]
step  22 :  [-0.03730124689043121]
step  23 :  [-0.04616059989662215]
step  24 :  [-0.017205402496476677]
episode  213 : steps 25 , return [-14.75]
step  0 :  [-1.5958859218959767]
step  1 :  [-1.5688934527568936]
step  2 :  [-1.5401395006750727]
step  3 :  [-1.4746406244937287]
step  4 :  [-1.378551379485045]
step  5 :  [-1.2580669479887263]
step  6 :  [-1.1185567675404378]
step  7 :  [-0.964396757013786]
step  8 :  [-0.7990446482036894]
step  9 :  [-0.6310627757010309]
step  10 :  [-0.5142737071544935]
step  11 :  [-0.39047871496532405]
step  12 :  [-0.28402989747468876]
step  13 :  [-0.17853933528286636]
step  14 :  [-0.05856201311145577]
step  15 :  [-0.00832791250358579]
step  16 :  [-0.07244852781746466]
step  17 :  [-0.08741631951679106]
step  18 :  [-0.06742617704800208]
step  19 :  [-0.022311863063341007]
step  20 :  [-0.022243569167397018]
step  21 :  [-0.04538370927361475]
step  22 :  [-0.05408704191961001]
step  23 :  [-0.03154202503956086]
step  24 :  [-0.056109475181892146]
episode  214 : steps 25 , return [-14.22]
step  0 :  [-1.7641661825311081]
step  1 :  [-1.729014366877498]
step  2 :  [-1.6884065355416749]
step  3 :  [-1.6495835268114414]
step  4 :  [-1.5783127424734378]
step  5 :  [-1.4788395608098723]
step  6 :  [-1.3563247759206338]
step  7 :  [-1.2155688568932619]
step  8 :  [-1.060628822742924]
step  9 :  [-0.8947808476611432]
step  10 :  [-0.7776806536756025]
step  11 :  [-0.6459820736748454]
step  12 :  [-0.5244241473179712]
step  13 :  [-0.4337787820532867]
step  14 :  [-0.339238717476724]
step  15 :  [-0.24836038125616575]
step  16 :  [-0.14503649801513735]
step  17 :  [-0.02600240701441962]
step  18 :  [-0.04245712357774567]
step  19 :  [-0.03633141797792555]
step  20 :  [-0.012773115983532177]
step  21 :  [-0.057798486575054146]
step  22 :  [-0.06611736876086063]
step  23 :  [-0.04224724572521094]
step  24 :  [-0.052069598440354754]
episode  215 : steps 25 , return [-17.87]
step  0 :  [-1.366386248849978]
step  1 :  [-1.3342897827922722]
step  2 :  [-1.299719690644]
step  3 :  [-1.231044162279462]
step  4 :  [-1.133121762030334]
step  5 :  [-1.0115307976815031]
step  6 :  [-0.8713300501823109]
step  7 :  [-0.8006501843773411]
step  8 :  [-0.7028058544412934]
step  9 :  [-0.6116354617081747]
step  10 :  [-0.5296273996111427]
step  11 :  [-0.4617847284543693]
step  12 :  [-0.38235621802422254]
step  13 :  [-0.2849539539640102]
step  14 :  [-0.18553549972272018]
step  15 :  [-0.07517428413048936]
step  16 :  [-0.07170701224883332]
step  17 :  [-0.054302280876098265]
step  18 :  [-0.0362471932905235]
step  19 :  [-0.025432792128926993]
step  20 :  [-0.04399685842662714]
step  21 :  [-0.03443714801470868]
step  22 :  [-0.024562465718275247]
step  23 :  [-0.01643204391201121]
step  24 :  [-0.04868710935982129]
episode  216 : steps 25 , return [-12.64]
step  0 :  [-1.7364855646363913]
step  1 :  [-1.697797667777435]
step  2 :  [-1.652401701578551]
step  3 :  [-1.6078248143395926]
step  4 :  [-1.570692890246143]
step  5 :  [-1.5025410306814624]
step  6 :  [-1.4065157585305634]
step  7 :  [-1.2873755639751623]
step  8 :  [-1.1498355605599089]
step  9 :  [-0.9980343327517148]
step  10 :  [-0.8354674211557964]
step  11 :  [-0.6671634080174611]
step  12 :  [-0.4944311867354446]
step  13 :  [-0.32291366197845084]
step  14 :  [-0.18123578285302297]
step  15 :  [-0.05617960151014409]
step  16 :  [-0.022133356090190525]
step  17 :  [-0.03179626346224636]
step  18 :  [-0.020190132621109448]
step  19 :  [-0.050074859713064475]
step  20 :  [-0.03039597978589587]
step  21 :  [-0.025787472849435288]
step  22 :  [-0.01690546032182898]
step  23 :  [-0.02694277474497059]
step  24 :  [-0.009554952128770729]
episode  217 : steps 25 , return [-17.4]
step  0 :  [-1.7309629945140783]
step  1 :  [-1.6921680174936626]
step  2 :  [-1.64664289736501]
step  3 :  [-1.6019374201648247]
step  4 :  [-1.526745151655695]
step  5 :  [-1.4648413736677797]
step  6 :  [-1.3749723559888312]
step  7 :  [-1.2611895388592398]
step  8 :  [-1.1280535469212156]
step  9 :  [-0.979762278610204]
step  10 :  [-0.8199409472059691]
step  11 :  [-0.6562231245323313]
step  12 :  [-0.48892090254923515]
step  13 :  [-0.35378836576001155]
step  14 :  [-0.20553359597848797]
step  15 :  [-0.07944746146803758]
step  16 :  [-0.012786820904219459]
step  17 :  [-0.021987416228565208]
step  18 :  [-0.02526256017424052]
step  19 :  [-0.013019062257962967]
step  20 :  [-0.03947285754702237]
step  21 :  [-0.01897766442775175]
step  22 :  [-0.04777170043353179]
step  23 :  [-0.024157746850383598]
step  24 :  [-0.05248585272041732]
episode  218 : steps 25 , return [-17.27]
step  0 :  [-1.3647648697483692]
step  1 :  [-1.334938300615041]
step  2 :  [-1.3035111645065445]
step  3 :  [-1.2369984364944533]
step  4 :  [-1.1406140282024346]
step  5 :  [-1.0201500148256804]
step  6 :  [-0.880798299011705]
step  7 :  [-0.7963395837730695]
step  8 :  [-0.6917130962147006]
step  9 :  [-0.5852920009682844]
step  10 :  [-0.48380641686064313]
step  11 :  [-0.39889024146633734]
step  12 :  [-0.30670185113986725]
step  13 :  [-0.2148813961553629]
step  14 :  [-0.11960252461070699]
step  15 :  [-0.06324133448833213]
step  16 :  [-0.07336256733650216]
step  17 :  [-0.06719737224067501]
step  18 :  [-0.038805722029068415]
step  19 :  [-0.02811579649170127]
step  20 :  [-0.02063347977690828]
step  21 :  [-0.0377227298305127]
step  22 :  [-0.018291878322802102]
step  23 :  [-0.08138539851146358]
step  24 :  [-0.09111434073849985]
episode  219 : steps 25 , return [-12.4]
step  0 :  [-1.60420572434807]
step  1 :  [-1.567633075991064]
step  2 :  [-1.5256705776890256]
step  3 :  [-1.4861654864405378]
step  4 :  [-1.4150846177519598]
step  5 :  [-1.3160959888773405]
step  6 :  [-1.194129845294309]
step  7 :  [-1.0538986791091232]
step  8 :  [-0.8994319454253471]
step  9 :  [-0.7824729092361669]
step  10 :  [-0.653433065189045]
step  11 :  [-0.528865773427954]
step  12 :  [-0.4184227316855776]
step  13 :  [-0.3310798980226364]
step  14 :  [-0.23862935991839648]
step  15 :  [-0.13061325817692396]
step  16 :  [-0.01150561019541505]
step  17 :  [-0.05544325148536279]
step  18 :  [-0.06207949647509474]
step  19 :  [-0.028810488042341657]
step  20 :  [-0.0044880206480212665]
step  21 :  [-0.03899563874589632]
step  22 :  [-0.02044876158314482]
step  23 :  [-0.029807940468470507]
step  24 :  [-0.02370255433163874]
episode  220 : steps 25 , return [-15.42]
step  0 :  [-1.5072477628207417]
step  1 :  [-1.46565436748267]
step  2 :  [-1.4171204332053313]
step  3 :  [-1.3701435989015995]
step  4 :  [-1.3324145351842152]
step  5 :  [-1.2653749003064165]
step  6 :  [-1.1711304862050822]
step  7 :  [-1.054101500651929]
step  8 :  [-0.9190014427250122]
step  9 :  [-0.7702254714436214]
step  10 :  [-0.6119455671865707]
step  11 :  [-0.4490334590804398]
step  12 :  [-0.3147623460404845]
step  13 :  [-0.16867007012281512]
step  14 :  [-0.039908112137890625]
step  15 :  [-0.04430502642388364]
step  16 :  [-0.03789748769014497]
step  17 :  [-0.04470726293098527]
step  18 :  [-0.01874134430047754]
step  19 :  [-0.027851712141449235]
step  20 :  [-0.013829702561105085]
step  21 :  [-0.018468242956247636]
step  22 :  [-0.01561278401781446]
step  23 :  [-0.013294287869910392]
step  24 :  [-0.017843000843401596]
episode  221 : steps 25 , return [-14.11]
step  0 :  [-1.4799165240963537]
step  1 :  [-1.4423751469628745]
step  2 :  [-1.39962945872029]
step  3 :  [-1.360079696542999]
step  4 :  [-1.2895995367052133]
step  5 :  [-1.1913908306900791]
step  6 :  [-1.07022010483837]
step  7 :  [-0.9307600948080575]
step  8 :  [-0.7949595074373955]
step  9 :  [-0.6519127777573598]
step  10 :  [-0.5166133163399178]
step  11 :  [-0.41268266196249337]
step  12 :  [-0.31418227664479914]
step  13 :  [-0.201838253261031]
step  14 :  [-0.0882264409054821]
step  15 :  [-0.06288102492180145]
step  16 :  [-0.05923627583046976]
step  17 :  [-0.05497731731089702]
step  18 :  [-0.03802236351391085]
step  19 :  [-0.030305911232409447]
step  20 :  [-0.041156673767570436]
step  21 :  [-0.02385157642867594]
step  22 :  [-0.056688514429925355]
step  23 :  [-0.05541752668010013]
step  24 :  [-0.014104825166214377]
episode  222 : steps 25 , return [-13.58]
step  0 :  [-1.4760504589682109]
step  1 :  [-1.4487136044458278]
step  2 :  [-1.4200718764991591]
step  3 :  [-1.355053514027271]
step  4 :  [-1.259519751598005]
step  5 :  [-1.139566768894476]
step  6 :  [-1.000538713770694]
step  7 :  [-0.8468170102830833]
step  8 :  [-0.7479457843234089]
step  9 :  [-0.6361447280621753]
step  10 :  [-0.518570220423916]
step  11 :  [-0.42112725683687907]
step  12 :  [-0.32619534836084974]
step  13 :  [-0.2113447797190736]
step  14 :  [-0.09570138918950336]
step  15 :  [-0.054921453520398796]
step  16 :  [-0.088272754177538]
step  17 :  [-0.09351203248326964]
step  18 :  [-0.0652840055872704]
step  19 :  [-0.006836864146972328]
step  20 :  [-0.008132175424661632]
step  21 :  [-0.03242374737345837]
step  22 :  [-0.012461625186881995]
step  23 :  [-0.050517762089481354]
step  24 :  [-0.039993965357572124]
episode  223 : steps 25 , return [-13.36]
step  0 :  [-1.6419632575559073]
step  1 :  [-1.5977302604063273]
step  2 :  [-1.5449484811639367]
step  3 :  [-1.4917200011270269]
step  4 :  [-1.445341029291202]
step  5 :  [-1.371194715567621]
step  6 :  [-1.2710413187552352]
step  7 :  [-1.1488632415357196]
step  8 :  [-1.0089089240530313]
step  9 :  [-0.8549983683926543]
step  10 :  [-0.744787564007944]
step  11 :  [-0.6230185525916663]
step  12 :  [-0.4962389657126149]
step  13 :  [-0.3911300792426076]
step  14 :  [-0.29054141740143413]
step  15 :  [-0.1709751074312484]
step  16 :  [-0.06192870578716103]
step  17 :  [-0.0046328657028677145]
step  18 :  [-0.012109938876649504]
step  19 :  [-0.031855932699382083]
step  20 :  [-0.014997834587136724]
step  21 :  [-0.04658810618082499]
step  22 :  [-0.034233942833400775]
step  23 :  [-0.0749788395511616]
step  24 :  [-0.05727485497985567]
episode  224 : steps 25 , return [-16.43]
step  0 :  [-1.6509294120804394]
step  1 :  [-1.6107286357084387]
step  2 :  [-1.5635427032241342]
step  3 :  [-1.5172541152313712]
step  4 :  [-1.4788765703692088]
step  5 :  [-1.4103465956359098]
step  6 :  [-1.3143396342739622]
step  7 :  [-1.1954168701485355]
step  8 :  [-1.0582240291777505]
step  9 :  [-0.906906689184274]
step  10 :  [-0.7450497919134488]
step  11 :  [-0.5760242853311255]
step  12 :  [-0.40376749319703636]
step  13 :  [-0.2634614579855359]
step  14 :  [-0.15179274232824422]
step  15 :  [-0.0770757612738666]
step  16 :  [-0.03471124778027654]
step  17 :  [-0.06688645099935918]
step  18 :  [-0.08783555662032588]
step  19 :  [-0.07491810024470212]
step  20 :  [-0.04048430684036779]
step  21 :  [-0.05945478030517485]
step  22 :  [-0.031621742896278664]
step  23 :  [-0.04069511284248049]
step  24 :  [-0.019208926985675542]
episode  225 : steps 25 , return [-16.38]
step  0 :  [-1.635864340139319]
step  1 :  [-1.5940660459338258]
step  2 :  [-1.54471118837658]
step  3 :  [-1.4958133419867452]
step  4 :  [-1.4545451986821782]
step  5 :  [-1.3840511336993424]
step  6 :  [-1.2866243810749378]
step  7 :  [-1.1665990206758363]
step  8 :  [-1.0284728735449504]
step  9 :  [-0.8762767741018899]
step  10 :  [-0.7291662212558825]
step  11 :  [-0.5734213115363889]
step  12 :  [-0.41432226369420405]
step  13 :  [-0.2645779277870068]
step  14 :  [-0.1465260307947837]
step  15 :  [-0.053910106647007926]
step  16 :  [-0.049385689637027115]
step  17 :  [-0.0537144147545873]
step  18 :  [-0.03300599246248148]
step  19 :  [-0.033333855723004895]
step  20 :  [-0.052605868310332524]
step  21 :  [-0.020255017557851]
step  22 :  [-0.04670536711135354]
step  23 :  [-0.018417871546282126]
step  24 :  [-0.0450951513616446]
episode  226 : steps 25 , return [-16.]
step  0 :  [-1.5730339681935652]
step  1 :  [-1.5359547693144748]
step  2 :  [-1.493422467364726]
step  3 :  [-1.4534299573407405]
step  4 :  [-1.3821565385483092]
step  5 :  [-1.283107656343842]
step  6 :  [-1.1611413738968535]
step  7 :  [-1.020937747888942]
step  8 :  [-0.8665124262484436]
step  9 :  [-0.7754958862760584]
step  10 :  [-0.6682576105135658]
step  11 :  [-0.5570025842183511]
step  12 :  [-0.4505020095440975]
step  13 :  [-0.3608318256229529]
step  14 :  [-0.2644099901571615]
step  15 :  [-0.1544552718289202]
step  16 :  [-0.05013276485136946]
step  17 :  [-0.02156228518561996]
step  18 :  [-0.041365401191478114]
step  19 :  [-0.06008101425656921]
step  20 :  [-0.06365803508156816]
step  21 :  [-0.02135424487487682]
step  22 :  [-0.042171910777654004]
step  23 :  [-0.09133989004479823]
step  24 :  [-0.09279036738284993]
episode  227 : steps 25 , return [-15.49]
step  0 :  [-1.6128872700756636]
step  1 :  [-1.5764524105074587]
step  2 :  [-1.5346447070808071]
step  3 :  [-1.495271909589721]
step  4 :  [-1.4242433630488651]
step  5 :  [-1.3252711796342806]
step  6 :  [-1.2033052134933002]
step  7 :  [-1.063066803610466]
step  8 :  [-0.9085892335013761]
step  9 :  [-0.7834072774097747]
step  10 :  [-0.6477687429088432]
step  11 :  [-0.5192176156457023]
step  12 :  [-0.42081620658288327]
step  13 :  [-0.3181733196397767]
step  14 :  [-0.22106906154424424]
step  15 :  [-0.11346727214676643]
step  16 :  [-0.057607199259997126]
step  17 :  [-0.08038069031233722]
step  18 :  [-0.07170248998213279]
step  19 :  [-0.05106855962681677]
step  20 :  [-0.07198991465969273]
step  21 :  [-0.06943574613601664]
step  22 :  [-0.065861859309558]
step  23 :  [-0.06432763897117726]
step  24 :  [-0.08558602833249945]
episode  228 : steps 25 , return [-15.79]
step  0 :  [-1.5788811868634005]
step  1 :  [-1.5410064096569207]
step  2 :  [-1.497344453574247]
step  3 :  [-1.4559116195345465]
step  4 :  [-1.3836085523118746]
step  5 :  [-1.2838054233115004]
step  6 :  [-1.1612708618823493]
step  7 :  [-1.0206248361833188]
step  8 :  [-0.8658397800527008]
step  9 :  [-0.7847858798096435]
step  10 :  [-0.6825503390456457]
step  11 :  [-0.5789942696817079]
step  12 :  [-0.48078307194373726]
step  13 :  [-0.3985558123773634]
step  14 :  [-0.30816529151072447]
step  15 :  [-0.20333661982176182]
step  16 :  [-0.09640317216674482]
step  17 :  [-0.04389329838350167]
step  18 :  [-0.05556029775611266]
step  19 :  [-0.021887236757872262]
step  20 :  [-0.02892115689934204]
step  21 :  [-0.035530460854879105]
step  22 :  [-0.00881688926023413]
step  23 :  [-0.032994626837056944]
step  24 :  [-0.05010549544295061]
episode  229 : steps 25 , return [-15.6]
step  0 :  [-1.4831114223746438]
step  1 :  [-1.4557640102902756]
step  2 :  [-1.4270708199162034]
step  3 :  [-1.3619909070044431]
step  4 :  [-1.2663988909427222]
step  5 :  [-1.1463939348660315]
step  6 :  [-1.0073194611114908]
step  7 :  [-0.8535544610708132]
step  8 :  [-0.7563749122403811]
step  9 :  [-0.6454349529981631]
step  10 :  [-0.5286870858367059]
step  11 :  [-0.43255614928183067]
step  12 :  [-0.32384171922677624]
step  13 :  [-0.2182601110453075]
step  14 :  [-0.12047076912597258]
step  15 :  [-0.07063846526475934]
step  16 :  [-0.08099625652189053]
step  17 :  [-0.09394846773502781]
step  18 :  [-0.0544991139937042]
step  19 :  [-0.02599842463249554]
step  20 :  [-0.03513709257279787]
step  21 :  [-0.007781208625342757]
step  22 :  [-0.06288933726477705]
step  23 :  [-0.07294231353901452]
step  24 :  [-0.040515750305691045]
episode  230 : steps 25 , return [-13.57]
step  0 :  [-1.7771167883867796]
step  1 :  [-1.7424256659405717]
step  2 :  [-1.7024074794443065]
step  3 :  [-1.66423735446167]
step  4 :  [-1.5933721620458452]
step  5 :  [-1.4941627293676398]
step  6 :  [-1.3718258545964652]
step  7 :  [-1.2311930885959421]
step  8 :  [-1.0763393052006698]
step  9 :  [-0.9105509241158675]
step  10 :  [-0.7771354744943544]
step  11 :  [-0.6334508353518917]
step  12 :  [-0.5341227043099188]
step  13 :  [-0.42128988791012834]
step  14 :  [-0.32206535789852936]
step  15 :  [-0.21035267598290527]
step  16 :  [-0.10058763014460083]
step  17 :  [-0.01919814111754363]
step  18 :  [-0.07356126317274371]
step  19 :  [-0.07640802794170606]
step  20 :  [-0.047933298396922126]
step  21 :  [-0.08878618866572371]
step  22 :  [-0.07759416156085797]
step  23 :  [-0.0589212331259981]
step  24 :  [-0.029633657504008315]
episode  231 : steps 25 , return [-18.03]
step  0 :  [-1.748869943731825]
step  1 :  [-1.7214747636340133]
step  2 :  [-1.6915473763803013]
step  3 :  [-1.6248173037763862]
step  4 :  [-1.5276503651347475]
step  5 :  [-1.406289833162434]
step  6 :  [-1.2661026504582524]
step  7 :  [-1.1114524951854403]
step  8 :  [-0.9457932541418658]
step  9 :  [-0.7811524498625628]
step  10 :  [-0.6099271023700111]
step  11 :  [-0.47497850751861104]
step  12 :  [-0.38863912723765814]
step  13 :  [-0.3079160112976864]
step  14 :  [-0.21376658202840418]
step  15 :  [-0.10189302202058187]
step  16 :  [-0.018387735676742064]
step  17 :  [-0.021110540159486404]
step  18 :  [-0.0617830275032822]
step  19 :  [-0.06999348330424915]
step  20 :  [-0.03618538773848694]
step  21 :  [-0.05161827731907175]
step  22 :  [-0.02181440237389167]
step  23 :  [-0.017050279142111394]
step  24 :  [-0.023540448291956298]
episode  232 : steps 25 , return [-16.24]
step  0 :  [-1.4453133341318527]
step  1 :  [-1.4110308508388854]
step  2 :  [-1.3729882395634445]
step  3 :  [-1.301680763530931]
step  4 :  [-1.2018294172843493]
step  5 :  [-1.078881705109884]
step  6 :  [-0.9378147777347975]
step  7 :  [-0.8089112689148479]
step  8 :  [-0.857917431656159]
step  9 :  [-0.9411398063311248]
step  10 :  [-0.9570628676621421]
step  11 :  [-0.9210653558336581]
step  12 :  [-0.8458885751170873]
step  13 :  [-0.7417013504063044]
step  14 :  [-0.6168384299508758]
step  15 :  [-0.47906156080375767]
step  16 :  [-0.33879312402619705]
step  17 :  [-0.21572896280369427]
step  18 :  [-0.09304504150066707]
step  19 :  [-0.05307068736942148]
step  20 :  [-0.03935840039625271]
step  21 :  [-0.05393514328117223]
step  22 :  [-0.037510515912424526]
step  23 :  [-0.03385169727812798]
step  24 :  [-0.028109546015151653]
episode  233 : steps 25 , return [-16.81]
step  0 :  [-1.6193207626717014]
step  1 :  [-1.5957987724081029]
step  2 :  [-1.5321951244067387]
step  3 :  [-1.436596883233232]
step  4 :  [-1.3161351872892908]
step  5 :  [-1.2183811786077048]
step  6 :  [-1.097557135085226]
step  7 :  [-0.9583455146161319]
step  8 :  [-0.8048048116343622]
step  9 :  [-0.6564194989800397]
step  10 :  [-0.5188664007979648]
step  11 :  [-0.41480197704442495]
step  12 :  [-0.3164787525751947]
step  13 :  [-0.20639186294268982]
step  14 :  [-0.09482243285020486]
step  15 :  [-0.0439522803495804]
step  16 :  [-0.042899636364365924]
step  17 :  [-0.013219835884066002]
step  18 :  [-0.01404894455672361]
step  19 :  [-0.02290923451669416]
step  20 :  [-0.005102339728772396]
step  21 :  [-0.019056370824430548]
step  22 :  [-0.022586250097825562]
step  23 :  [-0.012572766594169678]
step  24 :  [-0.02329480014539038]
episode  234 : steps 25 , return [-14.01]
step  0 :  [-1.8134709104316917]
step  1 :  [-1.775392550801054]
step  2 :  [-1.7305840654319948]
step  3 :  [-1.6863167402008736]
step  4 :  [-1.648947422450453]
step  5 :  [-1.5802143222724618]
step  6 :  [-1.4835133724047236]
step  7 :  [-1.3636805870831858]
step  8 :  [-1.2254341037020546]
step  9 :  [-1.0728715368261357]
step  10 :  [-0.9093967155425983]
step  11 :  [-0.7378370532317547]
step  12 :  [-0.5623485163239159]
step  13 :  [-0.3860116577521748]
step  14 :  [-0.24300739909412028]
step  15 :  [-0.12730016468982316]
step  16 :  [-0.05015375719123061]
step  17 :  [-0.0361508522046796]
step  18 :  [-0.056237387053439954]
step  19 :  [-0.03656745650665864]
step  20 :  [-0.023574393600801543]
step  21 :  [-0.04169555208456348]
step  22 :  [-0.022564669667839987]
step  23 :  [-0.0517533084155956]
step  24 :  [-0.09909713942924316]
episode  235 : steps 25 , return [-18.76]
step  0 :  [-1.4634550129472041]
step  1 :  [-1.4215323908098814]
step  2 :  [-1.3727413643269308]
step  3 :  [-1.325787115829817]
step  4 :  [-1.2885904553429766]
step  5 :  [-1.222298388950413]
step  6 :  [-1.1288609982625804]
step  7 :  [-1.0126844622363802]
step  8 :  [-0.8785452009153916]
step  9 :  [-0.7309908449221301]
step  10 :  [-0.5745503860027038]
step  11 :  [-0.4151184520267284]
step  12 :  [-0.28198754484767535]
step  13 :  [-0.14271279921776303]
step  14 :  [-0.02387497533496336]
step  15 :  [-0.11605477711039386]
step  16 :  [-0.18129625945072897]
step  17 :  [-0.19101032569139578]
step  18 :  [-0.1674554516034793]
step  19 :  [-0.11402488189668775]
step  20 :  [-0.03192319696834513]
step  21 :  [-0.01282997853789936]
step  22 :  [-0.06599037858413011]
step  23 :  [-0.06569487190177146]
step  24 :  [-0.016014958720715892]
episode  236 : steps 25 , return [-14.25]
step  0 :  [-1.7747980809879413]
step  1 :  [-1.7428385593343358]
step  2 :  [-1.7065798984567286]
step  3 :  [-1.6730292039869787]
step  4 :  [-1.6054094585281085]
step  5 :  [-1.5085509831235109]
step  6 :  [-1.387969919113789]
step  7 :  [-1.2486912345167904]
step  8 :  [-1.0949224362094223]
step  9 :  [-0.9300508564759862]
step  10 :  [-0.7606068322531048]
step  11 :  [-0.5903401642260299]
step  12 :  [-0.4275651099334399]
step  13 :  [-0.3002357854709795]
step  14 :  [-0.1840435328277044]
step  15 :  [-0.059564292606195585]
step  16 :  [-0.022242303494375656]
step  17 :  [-0.005759438439821594]
step  18 :  [-0.033052298719565096]
step  19 :  [-0.02535488934952363]
step  20 :  [-0.03542415441711289]
step  21 :  [-0.042103055727397296]
step  22 :  [-0.040814463891270004]
step  23 :  [-0.052695505891083017]
step  24 :  [-0.07082429392390499]
episode  237 : steps 25 , return [-17.32]
step  0 :  [-1.5619629057944546]
step  1 :  [-1.520262328266705]
step  2 :  [-1.4713394932141644]
step  3 :  [-1.4234753258095696]
step  4 :  [-1.3841293613925498]
step  5 :  [-1.315512469397551]
step  6 :  [-1.2198042547459786]
step  7 :  [-1.1013759960845668]
step  8 :  [-0.9648296538008626]
step  9 :  [-0.8143684837927256]
step  10 :  [-0.6563883406955207]
step  11 :  [-0.49344288234426276]
step  12 :  [-0.333162142988272]
step  13 :  [-0.2004503002337425]
step  14 :  [-0.07451489086860374]
step  15 :  [-0.03782476193163415]
step  16 :  [-0.017102350881705173]
step  17 :  [-0.04846105081626174]
step  18 :  [-0.10719982248985503]
step  19 :  [-0.11555880696625867]
step  20 :  [-0.09184344604385035]
step  21 :  [-0.0407179472822591]
step  22 :  [-0.03250789251533475]
step  23 :  [-0.04489461022167137]
step  24 :  [-0.0436721680806218]
episode  238 : steps 25 , return [-15.11]
step  0 :  [-1.5404623896684608]
step  1 :  [-1.5012012819090401]
step  2 :  [-1.4557773956902356]
step  3 :  [-1.4124328739365]
step  4 :  [-1.3785437234096234]
step  5 :  [-1.3140115864703046]
step  6 :  [-1.2215403976059644]
step  7 :  [-1.1058833907145464]
step  8 :  [-0.9719566437649293]
step  9 :  [-0.8242948212454404]
step  10 :  [-0.6671683788871863]
step  11 :  [-0.5054168047755759]
step  12 :  [-0.34757464815511124]
step  13 :  [-0.2149430730039367]
step  14 :  [-0.08689521312345526]
step  15 :  [-0.053180780572599846]
step  16 :  [-0.04904388926563228]
step  17 :  [-0.0462006410453808]
step  18 :  [-0.03632433258468243]
step  19 :  [-0.03288142822210764]
step  20 :  [-0.0239388620259773]
step  21 :  [-0.022429044087973218]
step  22 :  [-0.02416066696807844]
step  23 :  [-0.009522568559329621]
step  24 :  [-0.046573863878770924]
episode  239 : steps 25 , return [-14.89]
step  0 :  [-1.7578189962417503]
step  1 :  [-1.7173527823835129]
step  2 :  [-1.6694185553406273]
step  3 :  [-1.6215732096403972]
step  4 :  [-1.5804885121901644]
step  5 :  [-1.509405545700563]
step  6 :  [-1.4111251449190763]
step  7 :  [-1.2901603333281073]
step  8 :  [-1.1510423796786118]
step  9 :  [-0.9977497999158544]
step  10 :  [-0.8335980467196806]
step  11 :  [-0.681380425123999]
step  12 :  [-0.5256716544166554]
step  13 :  [-0.3742093722399497]
step  14 :  [-0.25036893192060017]
step  15 :  [-0.13133657493432224]
step  16 :  [-0.08361909061697312]
step  17 :  [-0.07467397660768284]
step  18 :  [-0.04467208267213443]
step  19 :  [-0.04282828887015863]
step  20 :  [-0.027814197485974565]
step  21 :  [-0.024960113445640142]
step  22 :  [-0.04650327913978401]
step  23 :  [-0.05136938666109524]
step  24 :  [-0.018346044672065662]
episode  240 : steps 25 , return [-17.92]
step  0 :  [-1.7703699524671512]
step  1 :  [-1.7314721618097133]
step  2 :  [-1.6856705513182502]
step  3 :  [-1.6404030216500276]
step  4 :  [-1.6022046527559437]
step  5 :  [-1.5331052309759627]
step  6 :  [-1.4362605788171183]
step  7 :  [-1.3163975209570118]
step  8 :  [-1.178185824561298]
step  9 :  [-1.0257068363034108]
step  10 :  [-0.8623724023756661]
step  11 :  [-0.6986537036468515]
step  12 :  [-0.5292202145140968]
step  13 :  [-0.35902941764526225]
step  14 :  [-0.21916131618970294]
step  15 :  [-0.0997749468616757]
step  16 :  [-0.02284608440685894]
step  17 :  [-0.06439186414136151]
step  18 :  [-0.09036540483160263]
step  19 :  [-0.07213856871586799]
step  20 :  [-0.058674155012465805]
step  21 :  [-0.034770792673718985]
step  22 :  [-0.03069898901192419]
step  23 :  [-0.022801033267828136]
step  24 :  [-0.011419057504255667]
episode  241 : steps 25 , return [-18.1]
step  0 :  [-1.534930030329025]
step  1 :  [-1.502811450151747]
step  2 :  [-1.4673102994601446]
step  3 :  [-1.3974042749502986]
step  4 :  [-1.2983523360757492]
step  5 :  [-1.175857732678318]
step  6 :  [-1.0350178659195979]
step  7 :  [-0.8800738030560249]
step  8 :  [-0.8379685984912396]
step  9 :  [-0.8668357501505586]
step  10 :  [-0.8636480319122742]
step  11 :  [-0.8188510438458271]
step  12 :  [-0.7427126426217159]
step  13 :  [-0.64535501188298]
step  14 :  [-0.5377096108408433]
step  15 :  [-0.43641696345853]
step  16 :  [-0.3294177140068889]
step  17 :  [-0.2194162700326702]
step  18 :  [-0.09739605435247628]
step  19 :  [-0.06521366997788589]
step  20 :  [-0.04554506863395398]
step  21 :  [-0.056844206080998515]
step  22 :  [-0.036377373105722026]
step  23 :  [-0.06541022025979673]
step  24 :  [-0.11047071648571725]
episode  242 : steps 25 , return [-17.07]
step  0 :  [-1.571067152225709]
step  1 :  [-1.5340186125214272]
step  2 :  [-1.4915373784567834]
step  3 :  [-1.4516220578406827]
step  4 :  [-1.3804119719480226]
step  5 :  [-1.2814139042035773]
step  6 :  [-1.1594886350548603]
step  7 :  [-1.019318936339808]
step  8 :  [-0.8649230311627519]
step  9 :  [-0.7740380887493808]
step  10 :  [-0.6671211909186161]
step  11 :  [-0.555753299082469]
step  12 :  [-0.44886065231926425]
step  13 :  [-0.358663006916586]
step  14 :  [-0.26176230183644084]
step  15 :  [-0.1514749392370829]
step  16 :  [-0.047015589068922344]
step  17 :  [-0.023213549102518046]
step  18 :  [-0.04182161036483324]
step  19 :  [-0.018435895039331292]
step  20 :  [-0.03658564330500352]
step  21 :  [-0.048239249152791396]
step  22 :  [-0.05412703357266237]
step  23 :  [-0.03601434600297117]
step  24 :  [-0.07377709151103602]
episode  243 : steps 25 , return [-15.35]
step  0 :  [-1.6270678391722169]
step  1 :  [-1.598550122265715]
step  2 :  [-1.567575908247307]
step  3 :  [-1.5004570710441776]
step  4 :  [-1.4031793004327398]
step  5 :  [-1.2818199553699356]
step  6 :  [-1.141670197991067]
step  7 :  [-0.9870571427796115]
step  8 :  [-0.82141507892061]
step  9 :  [-0.7794700425496315]
step  10 :  [-0.7015327647012051]
step  11 :  [-0.6192287083897535]
step  12 :  [-0.5359398426764338]
step  13 :  [-0.4639824341945985]
step  14 :  [-0.38630688095509963]
step  15 :  [-0.30136503921649205]
step  16 :  [-0.19879566051631115]
step  17 :  [-0.07773993587921436]
step  18 :  [-0.023884991794880586]
step  19 :  [-0.036297379020307545]
step  20 :  [-0.09134921733680382]
step  21 :  [-0.08638280096499883]
step  22 :  [-0.12930811862632674]
step  23 :  [-0.11476023383552746]
step  24 :  [-0.09293348904764485]
episode  244 : steps 25 , return [-16.57]
step  0 :  [-1.4333529780658902]
step  1 :  [-1.4008555565110754]
step  2 :  [-1.365347260131935]
step  3 :  [-1.2957782001853655]
step  4 :  [-1.1971140090948809]
step  5 :  [-1.074948478676468]
step  6 :  [-0.9343346143105272]
step  7 :  [-0.849077922963584]
step  8 :  [-0.8284145864498942]
step  9 :  [-0.7808559175465029]
step  10 :  [-0.7072472913141201]
step  11 :  [-0.6160744363468537]
step  12 :  [-0.5186046676589674]
step  13 :  [-0.4265482127961227]
step  14 :  [-0.3344338369075333]
step  15 :  [-0.23771226029454404]
step  16 :  [-0.12933926887817573]
step  17 :  [-0.05769530931055546]
step  18 :  [-0.004986397845257387]
step  19 :  [-0.05738132847689984]
step  20 :  [-0.08175474274390022]
step  21 :  [-0.05680128420926956]
step  22 :  [-0.014384484838141424]
step  23 :  [-0.021235918490413577]
step  24 :  [-0.04525997301333627]
episode  245 : steps 25 , return [-14.47]
step  0 :  [-1.5310134325927378]
step  1 :  [-1.5058560704303965]
step  2 :  [-1.479909519001164]
step  3 :  [-1.416582033934222]
step  4 :  [-1.322181405187844]
step  5 :  [-1.2030375931747754]
step  6 :  [-1.064628510613337]
step  7 :  [-0.9114225850956781]
step  8 :  [-0.766695195161557]
step  9 :  [-0.615760229634387]
step  10 :  [-0.466550071185185]
step  11 :  [-0.3477020204699533]
step  12 :  [-0.22412980865914658]
step  13 :  [-0.11276757882010847]
step  14 :  [-0.06282850934535578]
step  15 :  [-0.02731325981481223]
step  16 :  [-0.035493190981598824]
step  17 :  [-0.015117043119377399]
step  18 :  [-0.02745755900554156]
step  19 :  [-0.024836917943321015]
step  20 :  [-0.019362417752498702]
step  21 :  [-0.025857141908420186]
step  22 :  [-0.026699877376315278]
step  23 :  [-0.03348588795652668]
step  24 :  [-0.02004131908071231]
episode  246 : steps 25 , return [-13.29]
step  0 :  [-1.5876632725386137]
step  1 :  [-1.5571472187446262]
step  2 :  [-1.5236075547452617]
step  3 :  [-1.4548609576191405]
step  4 :  [-1.3565180421708627]
step  5 :  [-1.2344570219260749]
step  6 :  [-1.0938623052119496]
step  7 :  [-0.9390100998916889]
step  8 :  [-0.7924327446350425]
step  9 :  [-0.6911647697576133]
step  10 :  [-0.6339585783336337]
step  11 :  [-0.6068347050150383]
step  12 :  [-0.5662736283030129]
step  13 :  [-0.5011592636536257]
step  14 :  [-0.4242545826033098]
step  15 :  [-0.32775368428668666]
step  16 :  [-0.21209016062912603]
step  17 :  [-0.10782518493662373]
step  18 :  [-0.04828898902742597]
step  19 :  [-0.03760134623895097]
step  20 :  [-0.069059088862561]
step  21 :  [-0.05047949722578016]
step  22 :  [-0.016114582752365603]
step  23 :  [-0.014126204694522318]
step  24 :  [-0.024945899948074803]
episode  247 : steps 25 , return [-15.87]
step  0 :  [-1.5219269495044394]
step  1 :  [-1.4868914089030636]
step  2 :  [-1.4474229629487945]
step  3 :  [-1.4115921902548265]
step  4 :  [-1.3435024574420817]
step  5 :  [-1.2469316084072677]
step  6 :  [-1.126962973306441]
step  7 :  [-0.988459534971809]
step  8 :  [-0.8356066932549701]
step  9 :  [-0.7009819946691546]
step  10 :  [-0.5602235005682706]
step  11 :  [-0.4207860318788876]
step  12 :  [-0.30547717793846146]
step  13 :  [-0.19328989315693362]
step  14 :  [-0.07637717570631707]
step  15 :  [-0.032683587896583294]
step  16 :  [-0.06579690680818567]
step  17 :  [-0.06162817555277978]
step  18 :  [-0.023648120586551937]
step  19 :  [-0.05208926837052126]
step  20 :  [-0.036304284942591455]
step  21 :  [-0.009887383726347995]
step  22 :  [-0.04657017159762145]
step  23 :  [-0.05232190561956726]
step  24 :  [-0.022092065666811708]
episode  248 : steps 25 , return [-14.07]
step  0 :  [-1.7452375953919517]
step  1 :  [-1.7094535315664712]
step  2 :  [-1.668040433775292]
step  3 :  [-1.6283332720024486]
step  4 :  [-1.5565206678279648]
step  5 :  [-1.456699907026652]
step  6 :  [-1.3339539932005384]
step  7 :  [-1.1930407817215714]
step  8 :  [-1.0379932809398116]
step  9 :  [-0.8720744799066344]
step  10 :  [-0.7784340534798992]
step  11 :  [-0.6635499602731042]
step  12 :  [-0.5543407618329608]
step  13 :  [-0.47208772534615845]
step  14 :  [-0.3796480618742287]
step  15 :  [-0.2882929929360622]
step  16 :  [-0.18466656758407057]
step  17 :  [-0.08828272777923085]
step  18 :  [-0.048193407919829484]
step  19 :  [-0.019006033742586675]
step  20 :  [-0.01820685562129946]
step  21 :  [-0.03043098673197689]
step  22 :  [-0.0361117548205652]
step  23 :  [-0.03690277116992127]
step  24 :  [-0.025457868916449043]
episode  249 : steps 25 , return [-17.82]
step  0 :  [-1.7703411183634994]
step  1 :  [-1.7304462900802433]
step  2 :  [-1.6832633779175543]
step  3 :  [-1.6362832248104708]
step  4 :  [-1.5961037347089884]
step  5 :  [-1.5255955307793565]
step  6 :  [-1.4277024328362564]
step  7 :  [-1.3070155688486507]
step  8 :  [-1.1681116825211053]
step  9 :  [-1.014998583414259]
step  10 :  [-0.8510140260868333]
step  11 :  [-0.6980548230552968]
step  12 :  [-0.5390541183573191]
step  13 :  [-0.3802770288687951]
step  14 :  [-0.24948611033624052]
step  15 :  [-0.1293479673160271]
step  16 :  [-0.06542508789053939]
step  17 :  [-0.011799699699089816]
step  18 :  [-0.043890313264425274]
step  19 :  [-0.023505153262619996]
step  20 :  [-0.05876312377212707]
step  21 :  [-0.04937699383678067]
step  22 :  [-0.014568418497051656]
step  23 :  [-0.018985793814420397]
step  24 :  [-0.02669701353615156]
episode  250 : steps 25 , return [-18.02]
step  0 :  [-1.790805167816446]
step  1 :  [-1.7516841414712105]
step  2 :  [-1.7055064938721622]
step  3 :  [-1.659663573984158]
step  4 :  [-1.6206436745032473]
step  5 :  [-1.5508515588074883]
step  6 :  [-1.453428481516351]
step  7 :  [-1.3330705221987076]
step  8 :  [-1.1944136104106329]
step  9 :  [-1.0415018373948983]
step  10 :  [-0.8776980166746439]
step  11 :  [-0.7170738163209482]
step  12 :  [-0.5508297873027554]
step  13 :  [-0.3835116419745843]
step  14 :  [-0.24671036931492055]
step  15 :  [-0.1287040252746435]
step  16 :  [-0.053833687842728]
step  17 :  [-0.04629987270516605]
step  18 :  [-0.014396464836255694]
step  19 :  [-0.007920252881339752]
step  20 :  [-0.0441332238731382]
step  21 :  [-0.03396869696905405]
step  22 :  [-0.029130400004852147]
step  23 :  [-0.02547888222779146]
step  24 :  [-0.03528096011410741]
episode  251 : steps 25 , return [-18.3]
step  0 :  [-1.8202327669301377]
step  1 :  [-1.7833618801625666]
step  2 :  [-1.740198468235482]
step  3 :  [-1.697926970924423]
step  4 :  [-1.6240795541746769]
step  5 :  [-1.522701735088012]
step  6 :  [-1.398795973365864]
step  7 :  [-1.2570526257353984]
step  8 :  [-1.101461965495571]
step  9 :  [-0.9352765490696945]
step  10 :  [-0.7841342545247926]
step  11 :  [-0.6205263129625065]
step  12 :  [-0.5262225302867397]
step  13 :  [-0.43607080065453446]
step  14 :  [-0.3598117752703079]
step  15 :  [-0.27296685070106275]
step  16 :  [-0.1693687563222142]
step  17 :  [-0.06363648360373794]
step  18 :  [-0.031760901279317875]
step  19 :  [-0.0075039351533391745]
step  20 :  [-0.030213094016778404]
step  21 :  [-0.03099745337826061]
step  22 :  [-0.04616740599893809]
step  23 :  [-0.051941244065961234]
step  24 :  [-0.05610128738608258]
episode  252 : steps 25 , return [-18.37]
step  0 :  [-1.714178041897009]
step  1 :  [-1.6907830101201915]
step  2 :  [-1.6664241985655164]
step  3 :  [-1.6036482445777194]
step  4 :  [-1.5093481902068044]
step  5 :  [-1.3901016999366613]
step  6 :  [-1.2514908902608857]
step  7 :  [-1.0980195743536458]
step  8 :  [-0.9332313319691498]
step  9 :  [-0.7618922808723678]
step  10 :  [-0.5898921372322669]
step  11 :  [-0.4262404865384471]
step  12 :  [-0.2988385858014296]
step  13 :  [-0.1826775662474842]
step  14 :  [-0.05992239330624062]
step  15 :  [-0.026320296785191554]
step  16 :  [-0.0010675763002713074]
step  17 :  [-0.06496648543238928]
step  18 :  [-0.06617736139406097]
step  19 :  [-0.057122612407913276]
step  20 :  [-0.05489687095551961]
step  21 :  [-0.05871046597525879]
step  22 :  [-0.05149642972180237]
step  23 :  [-0.061473684353763054]
step  24 :  [-0.05922965782923495]
episode  253 : steps 25 , return [-15.68]
step  0 :  [-1.7322297456784694]
step  1 :  [-1.702413574993791]
step  2 :  [-1.6692434119279078]
step  3 :  [-1.6003561705883678]
step  4 :  [-1.5017370453571481]
step  5 :  [-1.3794133854675885]
step  6 :  [-1.2386319533968162]
step  7 :  [-1.0837002987299778]
step  8 :  [-0.9180733529436702]
step  9 :  [-0.7867293142439795]
step  10 :  [-0.6923989475188371]
step  11 :  [-0.6475204973327222]
step  12 :  [-0.6318731716324721]
step  13 :  [-0.6000821674818456]
step  14 :  [-0.5414840198400586]
step  15 :  [-0.46933891946894146]
step  16 :  [-0.37623397419608867]
step  17 :  [-0.26345401041013783]
step  18 :  [-0.1574490146232457]
step  19 :  [-0.04658614373961072]
step  20 :  [-0.06833894858357085]
step  21 :  [-0.054980097067478646]
step  22 :  [-0.0499337925615809]
step  23 :  [-0.03700641359351846]
step  24 :  [-0.08413202003564313]
episode  254 : steps 25 , return [-18.33]
step  0 :  [-1.6196332070177226]
step  1 :  [-1.582255009526525]
step  2 :  [-1.5391126019155714]
step  3 :  [-1.4980445433143394]
step  4 :  [-1.465980000454615]
step  5 :  [-1.402197830325992]
step  6 :  [-1.3099490433960383]
step  7 :  [-1.1942145970331357]
step  8 :  [-1.0599781817684424]
step  9 :  [-0.9117228859833839]
step  10 :  [-0.753486718801746]
step  11 :  [-0.5893841006761619]
step  12 :  [-0.4252877969060032]
step  13 :  [-0.2872494261472626]
step  14 :  [-0.14845676984532816]
step  15 :  [-0.0395158213426594]
step  16 :  [-0.050527101979456375]
step  17 :  [-0.06159130427907748]
step  18 :  [-0.037457242452753885]
step  19 :  [-0.04835317715078966]
step  20 :  [-0.023266864083739777]
step  21 :  [-0.04643717961668237]
step  22 :  [-0.04665565049884961]
step  23 :  [-0.008950738515924546]
step  24 :  [-0.04245639309800017]
episode  255 : steps 25 , return [-16.19]
step  0 :  [-1.5607300812512481]
step  1 :  [-1.5236401130114017]
step  2 :  [-1.4811465695618726]
step  3 :  [-1.4412902345944063]
step  4 :  [-1.370171764730949]
step  5 :  [-1.2712670024522936]
step  6 :  [-1.1494274718527229]
step  7 :  [-1.0093349986207807]
step  8 :  [-0.8550105715766989]
step  9 :  [-0.7667466408904648]
step  10 :  [-0.6628561766700048]
step  11 :  [-0.552721443752341]
step  12 :  [-0.4624488152315698]
step  13 :  [-0.3578036369917894]
step  14 :  [-0.25537407747384766]
step  15 :  [-0.1467352804825909]
step  16 :  [-0.09812635138977441]
step  17 :  [-0.028234449619839983]
step  18 :  [-0.01982183678629908]
step  19 :  [-0.039079589768061716]
step  20 :  [-0.04656987031620555]
step  21 :  [-0.0077672819649262015]
step  22 :  [-0.030959675643970175]
step  23 :  [-0.05810140708024854]
step  24 :  [-0.06131769988122054]
episode  256 : steps 25 , return [-15.26]
step  0 :  [-1.5169242297587164]
step  1 :  [-1.4833951172080937]
step  2 :  [-1.4460339798543702]
step  3 :  [-1.4128343652502668]
step  4 :  [-1.3466413663209387]
step  5 :  [-1.251508870831667]
step  6 :  [-1.132702796476771]
step  7 :  [-0.9952200864915028]
step  8 :  [-0.8433682274181622]
step  9 :  [-0.6959714703808323]
step  10 :  [-0.5418199966287075]
step  11 :  [-0.38776410311940923]
step  12 :  [-0.2601295046079672]
step  13 :  [-0.14081093174722997]
step  14 :  [-0.08078109026614964]
step  15 :  [-0.010017855631418692]
step  16 :  [-0.029946639716372087]
step  17 :  [-0.015508910009813517]
step  18 :  [-0.04651670205940474]
step  19 :  [-0.028675009474950604]
step  20 :  [-0.05518985607837547]
step  21 :  [-0.05713698812590475]
step  22 :  [-0.028267183356360276]
step  23 :  [-0.03279694793433872]
step  24 :  [-0.03971603360824612]
episode  257 : steps 25 , return [-13.88]
step  0 :  [-1.4987219390655726]
step  1 :  [-1.4609868334955192]
step  2 :  [-1.4178805335910807]
step  3 :  [-1.3777331503342565]
step  4 :  [-1.3067310960615077]
step  5 :  [-1.2080841023324405]
step  6 :  [-1.0865419781263752]
step  7 :  [-0.9467537294032423]
step  8 :  [-0.7973657936644308]
step  9 :  [-0.6436822291598141]
step  10 :  [-0.5048446791387153]
step  11 :  [-0.4017149374040088]
step  12 :  [-0.30399621044765884]
step  13 :  [-0.1995689584288454]
step  14 :  [-0.09544773515377478]
step  15 :  [-0.04081932639000449]
step  16 :  [-0.04508978922443632]
step  17 :  [-0.03554684215576489]
step  18 :  [-0.004877683907299486]
step  19 :  [-0.029521537241238984]
step  20 :  [-0.0177603910196469]
step  21 :  [-0.03281354005863864]
step  22 :  [-0.03791687578136363]
step  23 :  [-0.07490800222542682]
step  24 :  [-0.1043727837974489]
episode  258 : steps 25 , return [-13.67]
step  0 :  [-1.6318476418666503]
step  1 :  [-1.603122991758713]
step  2 :  [-1.5718454185119797]
step  3 :  [-1.504505742693588]
step  4 :  [-1.40706790579293]
step  5 :  [-1.2855939536852097]
step  6 :  [-1.1453652078184213]
step  7 :  [-0.990703497914943]
step  8 :  [-0.8250425422622494]
step  9 :  [-0.7799391020102726]
step  10 :  [-0.6992263215544303]
step  11 :  [-0.6167030377265127]
step  12 :  [-0.5352217805032423]
step  13 :  [-0.46528857913700133]
step  14 :  [-0.38460280397853325]
step  15 :  [-0.2946415257329401]
step  16 :  [-0.1927288513220862]
step  17 :  [-0.07395840985582003]
step  18 :  [-0.031213398431138156]
step  19 :  [-0.06804255387968039]
step  20 :  [-0.07835652383094015]
step  21 :  [-0.06109131438761784]
step  22 :  [-0.008812308887612981]
step  23 :  [-0.012140227982061873]
step  24 :  [-0.039665300666532906]
episode  259 : steps 25 , return [-16.31]
step  0 :  [-1.593645598083667]
step  1 :  [-1.5515120914730618]
step  2 :  [-1.5018538475340453]
step  3 :  [-1.4528520335589425]
step  4 :  [-1.411864864805592]
step  5 :  [-1.341852043036661]
step  6 :  [-1.2449528124698548]
step  7 :  [-1.1254619848961918]
step  8 :  [-0.9878900844783762]
step  9 :  [-0.8363192510186005]
step  10 :  [-0.6862026776583631]
step  11 :  [-0.5306190126554178]
step  12 :  [-0.3769789910237389]
step  13 :  [-0.24987178473026886]
step  14 :  [-0.12902011176601932]
step  15 :  [-0.07648356460261437]
step  16 :  [-0.027422712560068986]
step  17 :  [-0.02584406551130327]
step  18 :  [-0.007082396429386643]
step  19 :  [-0.04987079725198076]
step  20 :  [-0.04671687165516338]
step  21 :  [-0.08918265351342078]
step  22 :  [-0.07668875835369207]
step  23 :  [-0.04625868742402506]
step  24 :  [-0.05010711140745226]
episode  260 : steps 25 , return [-15.52]
step  0 :  [-1.661938370066161]
step  1 :  [-1.6323912367843645]
step  2 :  [-1.5998632032451907]
step  3 :  [-1.5315902518803741]
step  4 :  [-1.4334708063074881]
step  5 :  [-1.311513569878059]
step  6 :  [-1.1709644602748295]
step  7 :  [-1.0161284553852041]
step  8 :  [-0.8504448225881703]
step  9 :  [-0.7826401921329811]
step  10 :  [-0.6824256049945782]
step  11 :  [-0.5956762558346121]
step  12 :  [-0.5229410452404354]
step  13 :  [-0.46425781465652405]
step  14 :  [-0.3916351626444275]
step  15 :  [-0.29799203309448946]
step  16 :  [-0.20770985417427948]
step  17 :  [-0.10728304549723856]
step  18 :  [-0.04065786944233767]
step  19 :  [-0.04059648209242903]
step  20 :  [-0.07601103411079707]
step  21 :  [-0.06638625074579659]
step  22 :  [-0.03646942931127402]
step  23 :  [-0.03620226076803345]
step  24 :  [-0.03672860054567656]
episode  261 : steps 25 , return [-16.59]
step  0 :  [-1.6275445016103762]
step  1 :  [-1.5980265609420607]
step  2 :  [-1.5656816649710201]
step  3 :  [-1.4976281823603528]
step  4 :  [-1.399704036742352]
step  5 :  [-1.2778994761462696]
step  6 :  [-1.1374553405671268]
step  7 :  [-0.9826736645138588]
step  8 :  [-0.8169868182706185]
step  9 :  [-0.7812390152576504]
step  10 :  [-0.7063712304883724]
step  11 :  [-0.6318653129107997]
step  12 :  [-0.558581884702565]
step  13 :  [-0.4967014684668186]
step  14 :  [-0.43812050888166737]
step  15 :  [-0.3612547438303274]
step  16 :  [-0.2615716306837918]
step  17 :  [-0.14117837169218808]
step  18 :  [-0.058844340010625905]
step  19 :  [-0.009512159085760972]
step  20 :  [-0.021871439544380235]
step  21 :  [-0.06525870153330297]
step  22 :  [-0.060926425195782646]
step  23 :  [-0.05464011010990897]
step  24 :  [-0.06364595868583532]
episode  262 : steps 25 , return [-16.62]
step  0 :  [-1.421900529379104]
step  1 :  [-1.3886338824381332]
step  2 :  [-1.3521245158808797]
step  3 :  [-1.320765942406345]
step  4 :  [-1.2564557676214132]
step  5 :  [-1.1630970728384684]
step  6 :  [-1.045988796110184]
step  7 :  [-0.9102484951704493]
step  8 :  [-0.7604035169479603]
step  9 :  [-0.6006859016875516]
step  10 :  [-0.43553260711819924]
step  11 :  [-0.30071622509066487]
step  12 :  [-0.1522739024852738]
step  13 :  [-0.03398775743382217]
step  14 :  [-0.054610421881442314]
step  15 :  [-0.06687057997505644]
step  16 :  [-0.030828781110836673]
step  17 :  [-0.04772390667035256]
step  18 :  [-0.06376943842439844]
step  19 :  [-0.06737758177368051]
step  20 :  [-0.10036638907603446]
step  21 :  [-0.08343109134503893]
step  22 :  [-0.04432815923491183]
step  23 :  [-0.04477386006159186]
step  24 :  [-0.012928793576202144]
episode  263 : steps 25 , return [-12.76]
step  0 :  [-1.483001889402483]
step  1 :  [-1.4430796337195892]
step  2 :  [-1.3969972995962472]
step  3 :  [-1.353273041647905]
step  4 :  [-1.2798674445902867]
step  5 :  [-1.1795321445428009]
step  6 :  [-1.0567478733976123]
step  7 :  [-0.9159958800619238]
step  8 :  [-0.7996111495271886]
step  9 :  [-0.6693730417616565]
step  10 :  [-0.5548635854842925]
step  11 :  [-0.4723990208939509]
step  12 :  [-0.387228690505712]
step  13 :  [-0.30316955442187776]
step  14 :  [-0.20442892453232017]
step  15 :  [-0.1357921768991904]
step  16 :  [-0.04605373349979534]
step  17 :  [-0.054614728482215505]
step  18 :  [-0.02557150751152774]
step  19 :  [-0.05292691766296791]
step  20 :  [-0.0262064362794434]
step  21 :  [-0.04569692029247867]
step  22 :  [-0.049411554116158184]
step  23 :  [-0.01753443605979815]
step  24 :  [-0.02392870232923361]
episode  264 : steps 25 , return [-13.98]
step  0 :  [-1.4859456095552617]
step  1 :  [-1.454508395772596]
step  2 :  [-1.4201861024697542]
step  3 :  [-1.3512331088601852]
step  4 :  [-1.2529022485855712]
step  5 :  [-1.1309209221937873]
step  6 :  [-0.9904064777563958]
step  7 :  [-0.8356017604085583]
step  8 :  [-0.8362755219629204]
step  9 :  [-0.8577411015305942]
step  10 :  [-0.836597836640325]
step  11 :  [-0.7810991403722226]
step  12 :  [-0.7012682382392457]
step  13 :  [-0.6080783157815735]
step  14 :  [-0.5151980672109794]
step  15 :  [-0.4239353144638487]
step  16 :  [-0.3197693216634317]
step  17 :  [-0.19930327962478828]
step  18 :  [-0.09934706831387805]
step  19 :  [-0.049438318724190855]
step  20 :  [-0.06513717384662454]
step  21 :  [-0.05712749666423572]
step  22 :  [-0.0353529661185221]
step  23 :  [-0.015150460423073721]
step  24 :  [-0.03828451107455978]
episode  265 : steps 25 , return [-16.36]
step  0 :  [-1.4298567121557915]
step  1 :  [-1.402291053324762]
step  2 :  [-1.373587482688589]
step  3 :  [-1.308701192733181]
step  4 :  [-1.2133568677760245]
step  5 :  [-1.0936030885122832]
step  6 :  [-0.9547717827593794]
step  7 :  [-0.8012533554056507]
step  8 :  [-0.645398441773484]
step  9 :  [-0.5012276157831999]
step  10 :  [-0.39217223986158395]
step  11 :  [-0.29015039842187385]
step  12 :  [-0.1784473223445412]
step  13 :  [-0.0678065513764978]
step  14 :  [-0.01158604212219981]
step  15 :  [-0.020316077642110898]
step  16 :  [-0.041733931839960145]
step  17 :  [-0.034137228284021805]
step  18 :  [-0.01423979199717619]
step  19 :  [-0.015232799164611467]
step  20 :  [-0.029542679219729976]
step  21 :  [-0.023520923659045297]
step  22 :  [-0.022159212345320634]
step  23 :  [-0.01802248357202824]
step  24 :  [-0.06480367070542838]
episode  266 : steps 25 , return [-11.95]
step  0 :  [-1.6002074943304245]
step  1 :  [-1.5553855407975]
step  2 :  [-1.5019347046834188]
step  3 :  [-1.4481295585817633]
step  4 :  [-1.4014658484010951]
step  5 :  [-1.327389073801188]
step  6 :  [-1.227439675793412]
step  7 :  [-1.105514563383112]
step  8 :  [-0.9658365246883421]
step  9 :  [-0.8122331745732395]
step  10 :  [-0.6708515968306297]
step  11 :  [-0.5338971217288293]
step  12 :  [-0.4273175775278542]
step  13 :  [-0.31422777790942863]
step  14 :  [-0.2086175561578659]
step  15 :  [-0.09481663195776013]
step  16 :  [-0.04804809212951266]
step  17 :  [-0.04289065422498978]
step  18 :  [-0.027539523668934574]
step  19 :  [-0.02521976778676556]
step  20 :  [-0.05780594887139035]
step  21 :  [-0.04361781497412932]
step  22 :  [-0.031389596630033746]
step  23 :  [-0.015307511617864816]
step  24 :  [-0.04532151020349545]
episode  267 : steps 25 , return [-15.53]
step  0 :  [-1.418460966326178]
step  1 :  [-1.3857900296613253]
step  2 :  [-1.3501238252326166]
step  3 :  [-1.2805029802595513]
step  4 :  [-1.1818294130748268]
step  5 :  [-1.0596697682299336]
step  6 :  [-0.9190648015185482]
step  7 :  [-0.8036559254792003]
step  8 :  [-0.819232577167678]
step  9 :  [-0.9156742536260639]
step  10 :  [-0.9739878356990948]
step  11 :  [-0.9679826570466453]
step  12 :  [-0.9135861806091065]
step  13 :  [-0.8482125243857593]
step  14 :  [-0.7939732149482712]
step  15 :  [-0.7110973530309094]
step  16 :  [-0.6074645018287663]
step  17 :  [-0.4920157907596179]
step  18 :  [-0.37839903819920606]
step  19 :  [-0.2776499128964535]
step  20 :  [-0.16998570516679748]
step  21 :  [-0.048320765636190914]
step  22 :  [-0.03848778491800064]
step  23 :  [-0.04597810181155691]
step  24 :  [-0.021559742437049983]
episode  268 : steps 25 , return [-18.42]
step  0 :  [-1.5335565480403468]
step  1 :  [-1.5024131133604275]
step  2 :  [-1.4682607837158967]
step  3 :  [-1.3992663046402896]
step  4 :  [-1.300832815839289]
step  5 :  [-1.1787473142752176]
step  6 :  [-1.0381522260566978]
step  7 :  [-0.8833037017823333]
step  8 :  [-0.7914123194058679]
step  9 :  [-0.6741803105466142]
step  10 :  [-0.577750250081263]
step  11 :  [-0.5127485149972598]
step  12 :  [-0.44461059473450926]
step  13 :  [-0.3608939297708653]
step  14 :  [-0.266832159351142]
step  15 :  [-0.15734496828399577]
step  16 :  [-0.05448712513583272]
step  17 :  [-0.019408333893457117]
step  18 :  [-0.038281774215806336]
step  19 :  [-0.04227258301100025]
step  20 :  [-0.008860518789868802]
step  21 :  [-0.037891052423559037]
step  22 :  [-0.02298984771726786]
step  23 :  [-0.027014150854962327]
step  24 :  [-0.03404414253218554]
episode  269 : steps 25 , return [-14.38]
step  0 :  [-1.5870281160254784]
step  1 :  [-1.5497101652584995]
step  2 :  [-1.506786623773421]
step  3 :  [-1.4662114582572738]
step  4 :  [-1.3944656271034932]
step  5 :  [-1.2950412538574898]
step  6 :  [-1.1727750192861066]
step  7 :  [-1.032326765482609]
step  8 :  [-0.8776939499507682]
step  9 :  [-0.7830159359199277]
step  10 :  [-0.6711231032524619]
step  11 :  [-0.5594394637817687]
step  12 :  [-0.4558424515909764]
step  13 :  [-0.3704923123818816]
step  14 :  [-0.2779059928034048]
step  15 :  [-0.17002529861237559]
step  16 :  [-0.07316750480586187]
step  17 :  [-0.034078502784940956]
step  18 :  [-0.014203531747966682]
step  19 :  [-0.034333852133791185]
step  20 :  [-0.028571863800485008]
step  21 :  [-0.02531148153005165]
step  22 :  [-0.03735522922787069]
step  23 :  [-0.03292390834621551]
step  24 :  [-0.014461854888989753]
episode  270 : steps 25 , return [-15.46]
step  0 :  [-1.7175988038090304]
step  1 :  [-1.6928770860277274]
step  2 :  [-1.6667050680913886]
step  3 :  [-1.6026494148094304]
step  4 :  [-1.5074145925212517]
step  5 :  [-1.3874616807843285]
step  6 :  [-1.2482969585182515]
step  7 :  [-1.0943709222550986]
step  8 :  [-0.9291843143130163]
step  9 :  [-0.7708105178666849]
step  10 :  [-0.6089372856989068]
step  11 :  [-0.458812413256462]
step  12 :  [-0.34494521724754934]
step  13 :  [-0.2376230585759823]
step  14 :  [-0.14803482180334424]
step  15 :  [-0.07978085993994315]
step  16 :  [-0.06407992076797722]
step  17 :  [-0.07379361139214603]
step  18 :  [-0.031363692235303706]
step  19 :  [-0.049396971724372435]
step  20 :  [-0.014652500781569558]
step  21 :  [-0.036124016345126575]
step  22 :  [-0.009725091695923054]
step  23 :  [-0.029020456031470444]
step  24 :  [-0.011219068760523757]
episode  271 : steps 25 , return [-15.81]
step  0 :  [-1.7870305704233305]
step  1 :  [-1.7490498993460804]
step  2 :  [-1.7044619213515317]
step  3 :  [-1.6606063881418]
step  4 :  [-1.6239098113366632]
step  5 :  [-1.55579366855816]
step  6 :  [-1.459633878580834]
step  7 :  [-1.3402807088127509]
step  8 :  [-1.2024784326165652]
step  9 :  [-1.0503590353242511]
step  10 :  [-0.8873759800157034]
step  11 :  [-0.7164454325696166]
step  12 :  [-0.540313827989211]
step  13 :  [-0.3626567821542376]
step  14 :  [-0.21788258312952632]
step  15 :  [-0.1329007817305669]
step  16 :  [-0.05338166278223331]
step  17 :  [-0.02650621967471608]
step  18 :  [-0.05074931279023299]
step  19 :  [-0.0228428111865715]
step  20 :  [-0.003307839160249186]
step  21 :  [-0.035625640256474946]
step  22 :  [-0.0115966923458068]
step  23 :  [-0.047328281330168864]
step  24 :  [-0.03888344169154173]
episode  272 : steps 25 , return [-18.28]
step  0 :  [-1.55994248641078]
step  1 :  [-1.5164566961449866]
step  2 :  [-1.4650416335776384]
step  3 :  [-1.4140676800417031]
step  4 :  [-1.3711195259432412]
step  5 :  [-1.2999496766169691]
step  6 :  [-1.2023223754731684]
step  7 :  [-1.0823403704984695]
step  8 :  [-0.9444117391247107]
step  9 :  [-0.7925636040525474]
step  10 :  [-0.6357239741292997]
step  11 :  [-0.47951497381475955]
step  12 :  [-0.35417767235553316]
step  13 :  [-0.22190291935050238]
step  14 :  [-0.10217346943813117]
step  15 :  [-0.04869572923071178]
step  16 :  [-0.05466673257666343]
step  17 :  [-0.02044671775207314]
step  18 :  [-0.0276245021120561]
step  19 :  [-0.029978815867630015]
step  20 :  [-0.014977426873399013]
step  21 :  [-0.03311469481391293]
step  22 :  [-0.03893973814738417]
step  23 :  [-0.04588126871183129]
step  24 :  [-0.03254694836502227]
episode  273 : steps 25 , return [-14.79]
step  0 :  [-1.7317900024478574]
step  1 :  [-1.7034118128243576]
step  2 :  [-1.6722077983763894]
step  3 :  [-1.6046504550633842]
step  4 :  [-1.5069337966641]
step  5 :  [-1.3852073458126548]
step  6 :  [-1.2447863355743487]
step  7 :  [-1.090008396897281]
step  8 :  [-0.9243215928263249]
step  9 :  [-0.7827438280775085]
step  10 :  [-0.6848914325571949]
step  11 :  [-0.625275556596837]
step  12 :  [-0.593949660519536]
step  13 :  [-0.5497445137522248]
step  14 :  [-0.49203452977461315]
step  15 :  [-0.41477344684239936]
step  16 :  [-0.3145738640793297]
step  17 :  [-0.22696694805412698]
step  18 :  [-0.1318143772566312]
step  19 :  [-0.06612405028203978]
step  20 :  [-0.01104488681946379]
step  21 :  [-0.047911879546309974]
step  22 :  [-0.029118679338255994]
step  23 :  [-0.04880195934766712]
step  24 :  [-0.05111116132489262]
episode  274 : steps 25 , return [-17.93]
step  0 :  [-1.6412238778315698]
step  1 :  [-1.5996761904106294]
step  2 :  [-1.5506506281148897]
step  3 :  [-1.502130117600687]
step  4 :  [-1.4612513946853496]
step  5 :  [-1.3909998376593389]
step  6 :  [-1.2937344443630945]
step  7 :  [-1.173824560349124]
step  8 :  [-1.0357881952587613]
step  9 :  [-0.8836689595986021]
step  10 :  [-0.7329921967471212]
step  11 :  [-0.5744168158093453]
step  12 :  [-0.41281836669220673]
step  13 :  [-0.28028143105318953]
step  14 :  [-0.1656872169270955]
step  15 :  [-0.09345906159242857]
step  16 :  [-0.042787793474862675]
step  17 :  [-0.016811127759034542]
step  18 :  [-0.01434610861794394]
step  19 :  [-0.02364233369500692]
step  20 :  [-0.050401762907061616]
step  21 :  [-0.021194958830740757]
step  22 :  [-0.04866484719676397]
step  23 :  [-0.021124998767169854]
step  24 :  [-0.04800554966941563]
episode  275 : steps 25 , return [-16.08]
step  0 :  [-1.5679016731613815]
step  1 :  [-1.5259383308451995]
step  2 :  [-1.4766231288433993]
step  3 :  [-1.4282265017714861]
step  4 :  [-1.3882007951066315]
step  5 :  [-1.3190550547878483]
step  6 :  [-1.2229194465580828]
step  7 :  [-1.1041231466419272]
step  8 :  [-0.9672301013890894]
step  9 :  [-0.816400679229305]
step  10 :  [-0.6599282973262711]
step  11 :  [-0.4990343311186966]
step  12 :  [-0.34174362952875176]
step  13 :  [-0.21197093167593245]
step  14 :  [-0.08776492760738029]
step  15 :  [-0.04138362760626231]
step  16 :  [-0.02480937456429384]
step  17 :  [-0.06055676796217085]
step  18 :  [-0.041422866579074936]
step  19 :  [-0.07225367931724669]
step  20 :  [-0.05089407176220793]
step  21 :  [-0.041637651654621806]
step  22 :  [-0.04406815165553342]
step  23 :  [-0.034662873424333274]
step  24 :  [-0.03193576201661573]
episode  276 : steps 25 , return [-15.06]
step  0 :  [-1.3574160391208983]
step  1 :  [-1.3258427426784791]
step  2 :  [-1.292050606554485]
step  3 :  [-1.2239427915926835]
step  4 :  [-1.1264371397349477]
step  5 :  [-1.0051541117600071]
step  6 :  [-0.8651803941063742]
step  7 :  [-0.7997281016988528]
step  8 :  [-0.706502068276054]
step  9 :  [-0.6147716747497117]
step  10 :  [-0.5280907847032491]
step  11 :  [-0.4551576464513093]
step  12 :  [-0.3720383929571019]
step  13 :  [-0.28442465042025]
step  14 :  [-0.18573839448862325]
step  15 :  [-0.07401207598256226]
step  16 :  [-0.0050559877512691654]
step  17 :  [-0.012300588887206565]
step  18 :  [-0.05482864665562193]
step  19 :  [-0.04676345396745416]
step  20 :  [-0.03990620841067049]
step  21 :  [-0.02744900701929284]
step  22 :  [-0.021782449252417676]
step  23 :  [-0.042407113192905216]
step  24 :  [-0.02487623908338253]
episode  277 : steps 25 , return [-12.49]
step  0 :  [-1.682407271006033]
step  1 :  [-1.6573758802612204]
step  2 :  [-1.5927299467255038]
step  3 :  [-1.4964749962683215]
step  4 :  [-1.4156030477630566]
step  5 :  [-1.307917836125073]
step  6 :  [-1.178730250819576]
step  7 :  [-1.0327034798803612]
step  8 :  [-0.873670665698279]
step  9 :  [-0.7759650464170229]
step  10 :  [-0.6623424422132741]
step  11 :  [-0.5481087824186968]
step  12 :  [-0.44192713919055193]
step  13 :  [-0.3544345440915518]
step  14 :  [-0.26017323446916824]
step  15 :  [-0.15070973199068252]
step  16 :  [-0.1039111994087789]
step  17 :  [-0.03738495307286894]
step  18 :  [-0.02264083596788091]
step  19 :  [-0.03382031956275235]
step  20 :  [-0.04770353211902095]
step  21 :  [-0.029944808854177416]
step  22 :  [-0.011631120431492377]
step  23 :  [-0.05037999139562126]
step  24 :  [-0.05671770183697703]
episode  278 : steps 25 , return [-15.83]
step  0 :  [-1.4738296065022167]
step  1 :  [-1.4456531147627245]
step  2 :  [-1.4158734090017944]
step  3 :  [-1.3500727271667343]
step  4 :  [-1.2539778199440461]
step  5 :  [-1.1336049172714022]
step  6 :  [-0.994247300909853]
step  7 :  [-0.8402499891644098]
step  8 :  [-0.756936614005326]
step  9 :  [-0.6581461590009039]
step  10 :  [-0.5519791607751864]
step  11 :  [-0.44834096980190624]
step  12 :  [-0.35870744018583334]
step  13 :  [-0.26118369472704406]
step  14 :  [-0.17038448845719775]
step  15 :  [-0.09011168245177428]
step  16 :  [-0.05509382244183406]
step  17 :  [-0.026941043215054472]
step  18 :  [-0.020446710473925107]
step  19 :  [-0.00973052160252786]
step  20 :  [-0.04855214567228629]
step  21 :  [-0.04943661581247548]
step  22 :  [-0.008687612884511305]
step  23 :  [-0.02924365268991143]
step  24 :  [-0.01517852261247345]
episode  279 : steps 25 , return [-13.47]
step  0 :  [-1.5780445001583883]
step  1 :  [-1.547477475884935]
step  2 :  [-1.5139109444446899]
step  3 :  [-1.4451748543679719]
step  4 :  [-1.3468526134862373]
step  5 :  [-1.2248116712799202]
step  6 :  [-1.0842319398158256]
step  7 :  [-0.9293872945157461]
step  8 :  [-0.7921149254537997]
step  9 :  [-0.6402027495005507]
step  10 :  [-0.5516300469909834]
step  11 :  [-0.4612535016176606]
step  12 :  [-0.38263858736803713]
step  13 :  [-0.29450583625821314]
step  14 :  [-0.20031815836082428]
step  15 :  [-0.09872153462349716]
step  16 :  [-0.040146990729449335]
step  17 :  [-0.04584369468887883]
step  18 :  [-0.0683452514829739]
step  19 :  [-0.06178084043740111]
step  20 :  [-0.06667896980202812]
step  21 :  [-0.0813291903664693]
step  22 :  [-0.07103073884029097]
step  23 :  [-0.05499571230076353]
step  24 :  [-0.014484561206728693]
episode  280 : steps 25 , return [-14.6]
step  0 :  [-1.8082472586567784]
step  1 :  [-1.7706201673680537]
step  2 :  [-1.7264516790858098]
step  3 :  [-1.6830022469233439]
step  4 :  [-1.646614424175065]
step  5 :  [-1.5786087189466789]
step  6 :  [-1.4824675684038313]
step  7 :  [-1.363087610882239]
step  8 :  [-1.2252318017370707]
step  9 :  [-1.0730358102810609]
step  10 :  [-0.9099442614869775]
step  11 :  [-0.7388435905950798]
step  12 :  [-0.5624495779546967]
step  13 :  [-0.3840985652145435]
step  14 :  [-0.21303983713285923]
step  15 :  [-0.07922593551548725]
step  16 :  [-0.039601024828849356]
step  17 :  [-0.01444210342563274]
step  18 :  [-0.0477969449394421]
step  19 :  [-0.04424697878753341]
step  20 :  [-0.038403733364581145]
step  21 :  [-0.028681436507208197]
step  22 :  [-0.029512112491842702]
step  23 :  [-0.06859725751845924]
step  24 :  [-0.06828032287851743]
episode  281 : steps 25 , return [-18.62]
step  0 :  [-1.4886115743833297]
step  1 :  [-1.4618745262583754]
step  2 :  [-1.4339872876771176]
step  3 :  [-1.3694494486233162]
step  4 :  [-1.2742412889816421]
step  5 :  [-1.1545223769563937]
step  6 :  [-1.0156736767971701]
step  7 :  [-0.8621009349037101]
step  8 :  [-0.7547868702367246]
step  9 :  [-0.6350835652666366]
step  10 :  [-0.5105781847024214]
step  11 :  [-0.3925223670539652]
step  12 :  [-0.2941428853655126]
step  13 :  [-0.1913109322272452]
step  14 :  [-0.07472930089301759]
step  15 :  [-0.03361530480297352]
step  16 :  [-0.03362949079463753]
step  17 :  [-0.03390300581584542]
step  18 :  [-0.022796516533335726]
step  19 :  [-0.016158163145506655]
step  20 :  [-0.0162849856274533]
step  21 :  [-0.03451273668917279]
step  22 :  [-0.07829762149537471]
step  23 :  [-0.08365089887099343]
step  24 :  [-0.05374404133985731]
episode  282 : steps 25 , return [-13.32]
step  0 :  [-1.6530890670511493]
step  1 :  [-1.6132088774254119]
step  2 :  [-1.566460710115787]
step  3 :  [-1.5207031650072942]
step  4 :  [-1.4829208579539985]
step  5 :  [-1.4148028587669708]
step  6 :  [-1.3190992183807377]
step  7 :  [-1.2004165706864953]
step  8 :  [-1.063431171004664]
step  9 :  [-0.9123132754341019]
step  10 :  [-0.7506743588737557]
step  11 :  [-0.5818489171750791]
step  12 :  [-0.4098565007932881]
step  13 :  [-0.2694868720853707]
step  14 :  [-0.1174015181915728]
step  15 :  [-0.02395674550335754]
step  16 :  [-0.08736373425256971]
step  17 :  [-0.09551093457781366]
step  18 :  [-0.08823286901412242]
step  19 :  [-0.10386236387687865]
step  20 :  [-0.06733895127940379]
step  21 :  [-0.030472077552797298]
step  22 :  [-0.03839402467318958]
step  23 :  [-0.03704379247258809]
step  24 :  [-0.055904548467974366]
episode  283 : steps 25 , return [-16.5]
step  0 :  [-1.7169076946475237]
step  1 :  [-1.6788718310269892]
step  2 :  [-1.634447729266887]
step  3 :  [-1.5911869153405767]
step  4 :  [-1.517034618163332]
step  5 :  [-1.4156293898598928]
step  6 :  [-1.2917942665592783]
step  7 :  [-1.1501379196530466]
step  8 :  [-0.9946110478123193]
step  9 :  [-0.8284436870424838]
step  10 :  [-0.7815057805084649]
step  11 :  [-0.6985323884710386]
step  12 :  [-0.6203827706739571]
step  13 :  [-0.5476558615368754]
step  14 :  [-0.48580060036643635]
step  15 :  [-0.41065370132898027]
step  16 :  [-0.3290976185856459]
step  17 :  [-0.23331198316098706]
step  18 :  [-0.11948454736235946]
step  19 :  [-0.049495820454365895]
step  20 :  [-0.02480545021150007]
step  21 :  [-0.05787142691945086]
step  22 :  [-0.04028794423749012]
step  23 :  [-0.07772968987413302]
step  24 :  [-0.057875121047919136]
episode  284 : steps 25 , return [-18.35]
step  0 :  [-1.5185350665439994]
step  1 :  [-1.4713925680330644]
step  2 :  [-1.4149994863907533]
step  3 :  [-1.3580339225761544]
step  4 :  [-1.3084849072828606]
step  5 :  [-1.2329598942377025]
step  6 :  [-1.1322778942999892]
step  7 :  [-1.0099926736419425]
step  8 :  [-0.8701645463357389]
step  9 :  [-0.7846208247925337]
step  10 :  [-0.6822697919188458]
step  11 :  [-0.5722806825894189]
step  12 :  [-0.4634778153444157]
step  13 :  [-0.3700981862718458]
step  14 :  [-0.2708146835576092]
step  15 :  [-0.16131589509804978]
step  16 :  [-0.12926668006640185]
step  17 :  [-0.07656222077668856]
step  18 :  [-0.03904810091292331]
step  19 :  [-0.05737666993443064]
step  20 :  [-0.05086180235876137]
step  21 :  [-0.02442086782857118]
step  22 :  [-0.03581371034590179]
step  23 :  [-0.012907361365533516]
step  24 :  [-0.02114808419795827]
episode  285 : steps 25 , return [-15.07]
step  0 :  [-1.3727257981617496]
step  1 :  [-1.3436829525482]
step  2 :  [-1.3132858581181306]
step  3 :  [-1.2474532463566057]
step  4 :  [-1.1515432639510483]
step  5 :  [-1.031428800313327]
step  6 :  [-0.892351276247671]
step  7 :  [-0.7938333067126098]
step  8 :  [-0.6791416616803299]
step  9 :  [-0.5635513574974078]
step  10 :  [-0.4724248716035094]
step  11 :  [-0.3686712744525956]
step  12 :  [-0.2681878929068048]
step  13 :  [-0.1601504477903156]
step  14 :  [-0.0674533342220922]
step  15 :  [-0.04695452021758938]
step  16 :  [-0.014383163312604343]
step  17 :  [-0.022786200040545608]
step  18 :  [-0.02136290485348433]
step  19 :  [-0.03579304681618779]
step  20 :  [-0.046926026830953024]
step  21 :  [-0.019183382579621013]
step  22 :  [-0.04225912468806349]
step  23 :  [-0.0496518323076633]
step  24 :  [-0.045250158567950234]
episode  286 : steps 25 , return [-12.07]
step  0 :  [-1.602533356567425]
step  1 :  [-1.5722017991171258]
step  2 :  [-1.538849670351511]
step  3 :  [-1.4701861444496462]
step  4 :  [-1.4135870114601237]
step  5 :  [-1.3267456009128247]
step  6 :  [-1.2147585795570182]
step  7 :  [-1.0827645079930353]
step  8 :  [-0.9353020752373862]
step  9 :  [-0.7762372081365062]
step  10 :  [-0.6091961929273592]
step  11 :  [-0.43789775107623846]
step  12 :  [-0.26990892232721725]
step  13 :  [-0.13163323036965513]
step  14 :  [-0.003258766519055696]
step  15 :  [-0.06454316564632338]
step  16 :  [-0.0726500314883738]
step  17 :  [-0.05176680660164618]
step  18 :  [-0.011145950309958297]
step  19 :  [-0.04699975755458934]
step  20 :  [-0.04822170566142254]
step  21 :  [-0.01215229246609387]
step  22 :  [-0.03571595299874401]
step  23 :  [-0.013942592841815404]
step  24 :  [-0.03692773493366794]
episode  287 : steps 25 , return [-14.78]
step  0 :  [-1.7177866791230139]
step  1 :  [-1.694783120215577]
step  2 :  [-1.6709405607366297]
step  3 :  [-1.6085184085893953]
step  4 :  [-1.5144726666534833]
step  5 :  [-1.3954176696010643]
step  6 :  [-1.2569585556487546]
step  7 :  [-1.1036152022549615]
step  8 :  [-0.9389445247168682]
step  9 :  [-0.7657191406638334]
step  10 :  [-0.5920235542336543]
step  11 :  [-0.42542417283390915]
step  12 :  [-0.2948132214773201]
step  13 :  [-0.17677932628143736]
step  14 :  [-0.08079373863558514]
step  15 :  [-0.03777981630882316]
step  16 :  [-0.02305238162896384]
step  17 :  [-0.03201707383439344]
step  18 :  [-0.007504111259769121]
step  19 :  [-0.03901360388350341]
step  20 :  [-0.03977466956014986]
step  21 :  [-0.0013973500877222979]
step  22 :  [-0.046825441030208116]
step  23 :  [-0.066713368952088]
step  24 :  [-0.04475514947324369]
episode  288 : steps 25 , return [-15.58]
step  0 :  [-1.4968862017162134]
step  1 :  [-1.4563358045675496]
step  2 :  [-1.4093095887308145]
step  3 :  [-1.3642978054265766]
step  4 :  [-1.2899295506264459]
step  5 :  [-1.1888721553944726]
step  6 :  [-1.0655398213533978]
step  7 :  [-0.9243655625159748]
step  8 :  [-0.8010168321744812]
step  9 :  [-0.6644827569204017]
step  10 :  [-0.5520498863980875]
step  11 :  [-0.47541246774992063]
step  12 :  [-0.39855567232781813]
step  13 :  [-0.31306692939595104]
step  14 :  [-0.21878170815922127]
step  15 :  [-0.10790143002534322]
step  16 :  [-0.04623916572824347]
step  17 :  [-0.045152280146175894]
step  18 :  [-0.03343658943353489]
step  19 :  [-0.027921618862706474]
step  20 :  [-0.024189765408391115]
step  21 :  [-0.017961688725842386]
step  22 :  [-0.05621876378041879]
step  23 :  [-0.04102229181498758]
step  24 :  [-0.040388097577510496]
episode  289 : steps 25 , return [-14.06]
step  0 :  [-1.7427179726611413]
step  1 :  [-1.7069214222489948]
step  2 :  [-1.665499988285121]
step  3 :  [-1.6257969488776522]
step  4 :  [-1.5539967920162643]
step  5 :  [-1.4541897695166803]
step  6 :  [-1.3314563433971605]
step  7 :  [-1.1905535481528524]
step  8 :  [-1.0355141847044382]
step  9 :  [-0.8696011582113362]
step  10 :  [-0.77824366544025]
step  11 :  [-0.6653510167169492]
step  12 :  [-0.5571837446895777]
step  13 :  [-0.47534246517478185]
step  14 :  [-0.39412912018557095]
step  15 :  [-0.2926808964030313]
step  16 :  [-0.18837074620923433]
step  17 :  [-0.07557198111850993]
step  18 :  [-0.02836924215886554]
step  19 :  [-0.03122033040243926]
step  20 :  [-0.020669058459885852]
step  21 :  [-0.044987597935279754]
step  22 :  [-0.04670571653964284]
step  23 :  [-0.03299441531108517]
step  24 :  [-0.014832268771896572]
episode  290 : steps 25 , return [-17.82]
step  0 :  [-1.577451456009487]
step  1 :  [-1.531136419395563]
step  2 :  [-1.475673821816018]
step  3 :  [-1.419480329936802]
step  4 :  [-1.3702311047955407]
step  5 :  [-1.2944927122683778]
step  6 :  [-1.1934138585566136]
step  7 :  [-1.0706711750784423]
step  8 :  [-0.9303550832441508]
step  9 :  [-0.7969347609804796]
step  10 :  [-0.6560778598611892]
step  11 :  [-0.5252881216082679]
step  12 :  [-0.4262113350861644]
step  13 :  [-0.33124981954238936]
step  14 :  [-0.22372532720380692]
step  15 :  [-0.11339571766650584]
step  16 :  [-0.06430900608198079]
step  17 :  [-0.06347453256469365]
step  18 :  [-0.06565773293182062]
step  19 :  [-0.07070308125554062]
step  20 :  [-0.07314983199031586]
step  21 :  [-0.05438179240885629]
step  22 :  [-0.04032270391032252]
step  23 :  [-0.03555820904993603]
step  24 :  [-0.045387100384790824]
episode  291 : steps 25 , return [-15.45]
step  0 :  [-1.5499341330612297]
step  1 :  [-1.5114873819343186]
step  2 :  [-1.4671557619906608]
step  3 :  [-1.4250993735671384]
step  4 :  [-1.3925940912240837]
step  5 :  [-1.3289915029500625]
step  6 :  [-1.2371969468029693]
step  7 :  [-1.1220793110236094]
step  8 :  [-0.9886283824251764]
step  9 :  [-0.8414340059061356]
step  10 :  [-0.6848146216443103]
step  11 :  [-0.5236370290190274]
step  12 :  [-0.3662483963974707]
step  13 :  [-0.2334181655088792]
step  14 :  [-0.10520579568048406]
step  15 :  [-0.06125771745285284]
step  16 :  [-0.05486400659159333]
step  17 :  [-0.09809833415513226]
step  18 :  [-0.08126803276140611]
step  19 :  [-0.0719355991384006]
step  20 :  [-0.05737068532906247]
step  21 :  [-0.0022361141654721056]
step  22 :  [-0.008940975954766407]
step  23 :  [-0.0374817041103001]
step  24 :  [-0.023325477794746925]
episode  292 : steps 25 , return [-15.27]
step  0 :  [-1.5652607943226948]
step  1 :  [-1.5316122351597643]
step  2 :  [-1.493861602028249]
step  3 :  [-1.4598194405268046]
step  4 :  [-1.3927721891852933]
step  5 :  [-1.2968509285630638]
step  6 :  [-1.177315877354701]
step  7 :  [-1.0391240378799897]
step  8 :  [-0.8865137056523906]
step  9 :  [-0.7425754004675462]
step  10 :  [-0.5907546844775501]
step  11 :  [-0.4362475159025511]
step  12 :  [-0.3099498729084111]
step  13 :  [-0.17569086364178152]
step  14 :  [-0.054553940658370485]
step  15 :  [-0.002314463654213695]
step  16 :  [-0.04294004104956393]
step  17 :  [-0.04514572772495057]
step  18 :  [-0.010249822563425973]
step  19 :  [-0.03728183634914673]
step  20 :  [-0.02948686765774925]
step  21 :  [-0.04455516459982739]
step  22 :  [-0.043240026524148434]
step  23 :  [-0.05066234401721295]
step  24 :  [-0.05133356095964446]
episode  293 : steps 25 , return [-14.51]
step  0 :  [-1.6019058853097399]
step  1 :  [-1.5739797524776142]
step  2 :  [-1.5439238386411938]
step  3 :  [-1.4775086000158273]
step  4 :  [-1.3807601744906561]
step  5 :  [-1.259793491874703]
step  6 :  [-1.1199273045848872]
step  7 :  [-0.9655055532980923]
step  8 :  [-0.7999672351953884]
step  9 :  [-0.6307520576624208]
step  10 :  [-0.5179848263460307]
step  11 :  [-0.40201582098296823]
step  12 :  [-0.3029081969526814]
step  13 :  [-0.2005472893182804]
step  14 :  [-0.09365369721210552]
step  15 :  [-0.04318165866148091]
step  16 :  [-0.08421042443521419]
step  17 :  [-0.08918090774638177]
step  18 :  [-0.06232366872678866]
step  19 :  [-0.010429696095311747]
step  20 :  [-0.03699902532824171]
step  21 :  [-0.038871889517940496]
step  22 :  [-0.004532047086557513]
step  23 :  [-0.029870340447329866]
step  24 :  [-0.04968558288234307]
episode  294 : steps 25 , return [-14.32]
step  0 :  [-1.5817283719974453]
step  1 :  [-1.5546042406486673]
step  2 :  [-1.5257346922567312]
step  3 :  [-1.4601998409399195]
step  4 :  [-1.3641074562684412]
step  5 :  [-1.2436329302325504]
step  6 :  [-1.1041370988583417]
step  7 :  [-0.9499921529935734]
step  8 :  [-0.7863317630232892]
step  9 :  [-0.6198493249498161]
step  10 :  [-0.47374306846403624]
step  11 :  [-0.3683048421757382]
step  12 :  [-0.2698089709997029]
step  13 :  [-0.16427000396089486]
step  14 :  [-0.12265863449295482]
step  15 :  [-0.054516752502960085]
step  16 :  [-0.04248923739729223]
step  17 :  [-0.06741858298314056]
step  18 :  [-0.07318498215447937]
step  19 :  [-0.04154820334193979]
step  20 :  [-0.007777298170469416]
step  21 :  [-0.026976729413910615]
step  22 :  [-0.037793160218261755]
step  23 :  [-0.051098310395152946]
step  24 :  [-0.05977472836811039]
episode  295 : steps 25 , return [-14.05]
step  0 :  [-1.57537661518005]
step  1 :  [-1.5319468084563617]
step  2 :  [-1.480547184034848]
step  3 :  [-1.4294862696998947]
step  4 :  [-1.3862796527059744]
step  5 :  [-1.3148162377568005]
step  6 :  [-1.2169038882177796]
step  7 :  [-1.09664947281797]
step  8 :  [-0.9584473580817009]
step  9 :  [-0.8062952476495345]
step  10 :  [-0.652248516540206]
step  11 :  [-0.4988548616823019]
step  12 :  [-0.3761831556014168]
step  13 :  [-0.24575284350490723]
step  14 :  [-0.12690506961102171]
step  15 :  [-0.006278186086504297]
step  16 :  [-0.058250240748740044]
step  17 :  [-0.06050784474327395]
step  18 :  [-0.041523306512938826]
step  19 :  [-0.040634182380106985]
step  20 :  [-0.03847906761649144]
step  21 :  [-0.008271242011549123]
step  22 :  [-0.045574816414905815]
step  23 :  [-0.035817783875964376]
step  24 :  [-0.013067587574956352]
episode  296 : steps 25 , return [-15.05]
step  0 :  [-1.4676867869144854]
step  1 :  [-1.4404897170146445]
step  2 :  [-1.4120835812883532]
step  3 :  [-1.3472602915866776]
step  4 :  [-1.2518848240062612]
step  5 :  [-1.1320618815217436]
step  6 :  [-0.993144514309218]
step  7 :  [-0.8395233149128435]
step  8 :  [-0.7340302213756971]
step  9 :  [-0.6173157859363629]
step  10 :  [-0.4959655502753633]
step  11 :  [-0.38281164413837243]
step  12 :  [-0.2881245161452678]
step  13 :  [-0.18801225549466144]
step  14 :  [-0.07451904926177001]
step  15 :  [-0.06389531217331236]
step  16 :  [-0.04342008261376751]
step  17 :  [-0.07393977359509125]
step  18 :  [-0.05107849457679427]
step  19 :  [-0.06529978593461055]
step  20 :  [-0.045101434570843035]
step  21 :  [-0.07859092291447776]
step  22 :  [-0.10617708827989387]
step  23 :  [-0.07734177105003703]
step  24 :  [-0.05595725295154301]
episode  297 : steps 25 , return [-13.33]
step  0 :  [-1.5583473511644426]
step  1 :  [-1.5167750118658394]
step  2 :  [-1.4680467622616604]
step  3 :  [-1.4204514659321497]
step  4 :  [-1.3814551304354838]
step  5 :  [-1.3131148435508049]
step  6 :  [-1.217633131858009]
step  7 :  [-1.0994023165803717]
step  8 :  [-0.9630443225125553]
step  9 :  [-0.8127858975073113]
step  10 :  [-0.6540980543332562]
step  11 :  [-0.4901655096145946]
step  12 :  [-0.328400901259718]
step  13 :  [-0.1942241270790139]
step  14 :  [-0.06765846013405229]
step  15 :  [-0.03325923421981143]
step  16 :  [-0.03349478047015566]
step  17 :  [-0.03515398715339454]
step  18 :  [-0.022022130491388243]
step  19 :  [-0.012739603787531676]
step  20 :  [-0.04063645997699868]
step  21 :  [-0.02039727226183777]
step  22 :  [-0.04867224684391673]
step  23 :  [-0.047954946696736014]
step  24 :  [-0.04742242319808691]
episode  298 : steps 25 , return [-14.83]
step  0 :  [-1.4952708658607947]
step  1 :  [-1.4539505086774214]
step  2 :  [-1.4058539460325636]
step  3 :  [-1.3595167100069818]
step  4 :  [-1.284246223413585]
step  5 :  [-1.1825589694688383]
step  6 :  [-1.0587783860314497]
step  7 :  [-0.9172829630495495]
step  8 :  [-0.802240569292547]
step  9 :  [-0.8184711077327894]
step  10 :  [-0.8850131480813033]
step  11 :  [-0.9012085526120693]
step  12 :  [-0.8690587045309508]
step  13 :  [-0.8003780922970197]
step  14 :  [-0.7057394759968797]
step  15 :  [-0.5951975308212425]
step  16 :  [-0.4805744001443584]
step  17 :  [-0.37331838425835107]
step  18 :  [-0.2596120090084793]
step  19 :  [-0.14746170157808636]
step  20 :  [-0.04641749250174845]
step  21 :  [-0.04669218263238075]
step  22 :  [-0.05641245795110259]
step  23 :  [-0.03364065901326301]
step  24 :  [-0.04149128501706797]
episode  299 : steps 25 , return [-18.02]
Averaged episode return over  300  episodes:  [-15.7]
Total number of samples:  7500

Process finished with exit code 0



/home/yu/anaconda3/envs/marl-minigrid/bin/python /home/yu/Music/MARL-ARL/current/simple-gridworld/evaluate_mpe_1a.py
frames: 4756000
step  0 :  [-1.573707001029488]
step  1 :  [-1.5437288090628605]
step  2 :  [-1.5109899864314371]
step  3 :  [-1.442827541391775]
step  4 :  [-1.3449043393623847]
step  5 :  [-1.2231364462882197]
step  6 :  [-1.1111385311701267]
step  7 :  [-0.979902489329689]
step  8 :  [-0.8333502416058479]
step  9 :  [-0.6750640673572851]
step  10 :  [-0.5083869177450883]
step  11 :  [-0.33736075514887975]
step  12 :  [-0.17328423647705568]
step  13 :  [-0.05666099628562314]
step  14 :  [-0.052749688940211446]
step  15 :  [-0.03551119020015042]
step  16 :  [-0.025740194212123042]
step  17 :  [-0.07040884153202241]
step  18 :  [-0.07178058667131469]
step  19 :  [-0.042684917286167516]
step  20 :  [-0.05826382717943356]
step  21 :  [-0.02973032751527772]
step  22 :  [-0.053575153939247395]
step  23 :  [-0.024847860140221417]
step  24 :  [-0.052175341874833636]
episode  0 : steps 25 , return [-13.83]
step  0 :  [-1.6350560250501516]
step  1 :  [-1.5915596438314812]
step  2 :  [-1.5398347556555119]
step  3 :  [-1.487975605830041]
step  4 :  [-1.4432620790458748]
step  5 :  [-1.3703325882773651]
step  6 :  [-1.271098568377585]
step  7 :  [-1.1511732173452556]
step  8 :  [-1.0130773132012414]
step  9 :  [-0.8607459241002647]
step  10 :  [-0.6975434433427713]
step  11 :  [-0.5263960377933842]
step  12 :  [-0.35039122626909797]
step  13 :  [-0.21142988211393185]
step  14 :  [-0.11830361158564137]
step  15 :  [-0.03531063183931159]
step  16 :  [-0.029599682249364774]
step  17 :  [-0.02745414897575382]
step  18 :  [-0.019815741622418025]
step  19 :  [-0.025031047900231692]
step  20 :  [-0.01432458287110222]
step  21 :  [-0.024546686449777234]
step  22 :  [-0.01124605672568525]
step  23 :  [-0.024577813670542813]
step  24 :  [-0.00952113528076271]
episode  1 : steps 25 , return [-15.49]
step  0 :  [-1.6279074923897172]
step  1 :  [-1.601961927032349]
step  2 :  [-1.5744940736819748]
step  3 :  [-1.509790330099057]
step  4 :  [-1.41422091369955]
step  5 :  [-1.2940925935794538]
step  6 :  [-1.1548364445931578]
step  7 :  [-1.000864728127353]
step  8 :  [-0.8356583240052073]
step  9 :  [-0.6619191840126541]
step  10 :  [-0.48172738339117827]
step  11 :  [-0.2966914651332137]
step  12 :  [-0.10823650300279802]
step  13 :  [-0.02076432378214876]
step  14 :  [-0.016556499358359837]
step  15 :  [-0.034877323855862466]
step  16 :  [-0.031332902548235016]
step  17 :  [-0.06531366710553205]
step  18 :  [-0.053353950614662374]
step  19 :  [-0.019812726544179714]
step  20 :  [-0.039920868580829175]
step  21 :  [-0.01488719686063964]
step  22 :  [-0.04720409203883734]
step  23 :  [-0.02397241225942143]
step  24 :  [-0.053271279141071784]
episode  2 : steps 25 , return [-13.98]
step  0 :  [-1.5009280090780344]
step  1 :  [-1.4658344132234582]
step  2 :  [-1.426386049849749]
step  3 :  [-1.3907442581627094]
step  4 :  [-1.3229026891621183]
step  5 :  [-1.226582052198913]
step  6 :  [-1.1075690324941678]
step  7 :  [-0.9699383733071836]
step  8 :  [-0.8179023802258436]
step  9 :  [-0.6550193273332446]
step  10 :  [-0.4844610219500143]
step  11 :  [-0.310040666975087]
step  12 :  [-0.1697477870715858]
step  13 :  [-0.11499579279364604]
step  14 :  [-0.08362857841825706]
step  15 :  [-0.04795579887480306]
step  16 :  [-0.04194635595392115]
step  17 :  [-0.01071255087364299]
step  18 :  [-0.032290579000739665]
step  19 :  [-0.011774323687224645]
step  20 :  [-0.03666402516825732]
step  21 :  [-0.05959003239461712]
step  22 :  [-0.06344352346128872]
step  23 :  [-0.09621190285990441]
step  24 :  [-0.0827053874530472]
episode  3 : steps 25 , return [-13.53]
step  0 :  [-1.4757118867881946]
step  1 :  [-1.4372967922701803]
step  2 :  [-1.393354193848584]
step  3 :  [-1.3523526912050647]
step  4 :  [-1.280880397028438]
step  5 :  [-1.222531059419909]
step  6 :  [-1.1526720570188098]
step  7 :  [-1.0548720132982643]
step  8 :  [-0.9346894810571309]
step  9 :  [-0.7974018352323627]
step  10 :  [-0.6479110079109536]
step  11 :  [-0.4914733033524262]
step  12 :  [-0.3366666827867957]
step  13 :  [-0.21032079518060404]
step  14 :  [-0.13986800186854392]
step  15 :  [-0.13180951436427618]
step  16 :  [-0.1069638391765572]
step  17 :  [-0.06773134391722466]
step  18 :  [-0.03647707223150653]
step  19 :  [-0.06933249484299533]
step  20 :  [-0.04452336679244495]
step  21 :  [-0.027896708939668478]
step  22 :  [-0.030044050787429114]
step  23 :  [-0.03165745868905748]
step  24 :  [-0.024549048795943624]
episode  4 : steps 25 , return [-14.5]
step  0 :  [-1.6555600148144043]
step  1 :  [-1.6297986966992073]
step  2 :  [-1.6024639736748734]
step  3 :  [-1.537771609768655]
step  4 :  [-1.4421683347542067]
step  5 :  [-1.3219917901954468]
step  6 :  [-1.182685392668221]
step  7 :  [-1.0286657859088288]
step  8 :  [-0.8634144570753519]
step  9 :  [-0.6896314665878073]
step  10 :  [-0.5093911954007296]
step  11 :  [-0.3242823366998114]
step  12 :  [-0.135562102991979]
step  13 :  [-0.0446904285630588]
step  14 :  [-0.027854595545383023]
step  15 :  [-0.06297441713685631]
step  16 :  [-0.04169007694928243]
step  17 :  [-0.03832223631532675]
step  18 :  [-0.020074240630075457]
step  19 :  [-0.052210965498401936]
step  20 :  [-0.046355921309493384]
step  21 :  [-0.009254698797209825]
step  22 :  [-0.009859917075887762]
step  23 :  [-0.04281804468240737]
step  24 :  [-0.02759860047279831]
episode  5 : steps 25 , return [-14.35]
step  0 :  [-1.7869034233395233]
step  1 :  [-1.7466434228525716]
step  2 :  [-1.6989003373553009]
step  3 :  [-1.6511363633716643]
step  4 :  [-1.6099216670330643]
step  5 :  [-1.5385928681259269]
step  6 :  [-1.4400438548887344]
step  7 :  [-1.3188167567786973]
step  8 :  [-1.1794453312650306]
step  9 :  [-1.025896625432094]
step  10 :  [-0.861460797970924]
step  11 :  [-0.688830826878528]
step  12 :  [-0.5103153719614242]
step  13 :  [-0.3284525657568309]
step  14 :  [-0.15040628616970497]
step  15 :  [-0.02505418944630463]
step  16 :  [-0.06392963115218445]
step  17 :  [-0.06462255606580627]
step  18 :  [-0.04958004804855433]
step  19 :  [-0.053013120376373145]
step  20 :  [-0.04187543638745895]
step  21 :  [-0.04648879133168098]
step  22 :  [-0.037737828553941366]
step  23 :  [-0.03028309371533808]
step  24 :  [-0.05291399485041308]
episode  6 : steps 25 , return [-18.]
step  0 :  [-1.615848798464621]
step  1 :  [-1.5838895558939583]
step  2 :  [-1.5482446716081377]
step  3 :  [-1.5164265673263915]
step  4 :  [-1.4507139792082668]
step  5 :  [-1.3556513809878756]
step  6 :  [-1.2367099311456302]
step  7 :  [-1.0989618177242035]
step  8 :  [-0.9467133726029857]
step  9 :  [-0.7835177458591981]
step  10 :  [-0.6123798916697583]
step  11 :  [-0.4362645343985487]
step  12 :  [-0.2601970733766124]
step  13 :  [-0.11577762960192277]
step  14 :  [-0.053722749171456856]
step  15 :  [-0.044514062429795734]
step  16 :  [-0.023826526446672748]
step  17 :  [-0.01217132097046755]
step  18 :  [-0.03598557600788044]
step  19 :  [-0.04293948185010668]
step  20 :  [-0.06152914451138053]
step  21 :  [-0.0629969385710231]
step  22 :  [-0.07645681098133494]
step  23 :  [-0.07439312399733786]
step  24 :  [-0.08492761803780817]
episode  7 : steps 25 , return [-15.13]
step  0 :  [-1.7264979644537692]
step  1 :  [-1.687325633990034]
step  2 :  [-1.6412930516990936]
step  3 :  [-1.5959839900109063]
step  4 :  [-1.5580877024225714]
step  5 :  [-1.4894463787924785]
step  6 :  [-1.393086358158694]
step  7 :  [-1.2737003524033643]
step  8 :  [-1.1359648032119132]
step  9 :  [-0.9839929026995922]
step  10 :  [-0.8212605919374213]
step  11 :  [-0.6507766877213824]
step  12 :  [-0.4755852452721125]
step  13 :  [-0.30071507824060534]
step  14 :  [-0.14831813641866784]
step  15 :  [-0.08802638398104777]
step  16 :  [-0.11305047064830945]
step  17 :  [-0.0990595266295942]
step  18 :  [-0.10333669341048991]
step  19 :  [-0.08995702248916346]
step  20 :  [-0.03418533437686159]
step  21 :  [-0.036907115761306154]
step  22 :  [-0.06443521788095857]
step  23 :  [-0.04380172800897944]
step  24 :  [-0.09098840682903972]
episode  8 : steps 25 , return [-17.65]
step  0 :  [-1.768208998778781]
step  1 :  [-1.7385954743162302]
step  2 :  [-1.7055707921651653]
step  3 :  [-1.6366949001863027]
step  4 :  [-1.5380438317430085]
step  5 :  [-1.4156825047968025]
step  6 :  [-1.2748738187668587]
step  7 :  [-1.1433127956990552]
step  8 :  [-0.9896138262763264]
step  9 :  [-0.8281345460440144]
step  10 :  [-0.6603348011760254]
step  11 :  [-0.48863672679130193]
step  12 :  [-0.31818947000007614]
step  13 :  [-0.18034736420905204]
step  14 :  [-0.12330403228325668]
step  15 :  [-0.044937880057638845]
step  16 :  [-0.05496202272157563]
step  17 :  [-0.05123530945987797]
step  18 :  [-0.011843844192505027]
step  19 :  [-0.06876552005088463]
step  20 :  [-0.078245563342422]
step  21 :  [-0.047197147329939675]
step  22 :  [-0.02472877152630251]
step  23 :  [-0.0514153595335991]
step  24 :  [-0.02613909012185985]
episode  9 : steps 25 , return [-16.27]
step  0 :  [-1.664843798822091]
step  1 :  [-1.6250228759270644]
step  2 :  [-1.5783127791306772]
step  3 :  [-1.5325293506803475]
step  4 :  [-1.456859883808126]
step  5 :  [-1.3946545195429527]
step  6 :  [-1.3048571701487914]
step  7 :  [-1.191321966779815]
step  8 :  [-1.0585400724107488]
step  9 :  [-0.9107114774353747]
step  10 :  [-0.7515335572431291]
step  11 :  [-0.5843899411141057]
step  12 :  [-0.4131757994458028]
step  13 :  [-0.246339290143824]
step  14 :  [-0.11077840623282867]
step  15 :  [-0.054409231687533734]
step  16 :  [-0.042954323251585894]
step  17 :  [-0.012128622862157754]
step  18 :  [-0.06110855142432894]
step  19 :  [-0.0683998450551163]
step  20 :  [-0.03284000706376473]
step  21 :  [-0.05816966318697909]
step  22 :  [-0.030954042505585627]
step  23 :  [-0.028981529360600854]
step  24 :  [-0.016700973449311585]
episode  10 : steps 25 , return [-16.23]
step  0 :  [-1.6893368813019891]
step  1 :  [-1.6511659343514296]
step  2 :  [-1.6066548191547274]
step  3 :  [-1.563450097603099]
step  4 :  [-1.4894442191358712]
step  5 :  [-1.3881943057661394]
step  6 :  [-1.2644935659357666]
step  7 :  [-1.1526034080738425]
step  8 :  [-1.0177514917009347]
step  9 :  [-0.8699995965885602]
step  10 :  [-0.7120628544873356]
step  11 :  [-0.547039512054201]
step  12 :  [-0.37941398938546284]
step  13 :  [-0.22159590804161117]
step  14 :  [-0.10276742031450721]
step  15 :  [-0.06740147266015574]
step  16 :  [-0.046535923109270655]
step  17 :  [-0.06586260784636752]
step  18 :  [-0.05497870411231916]
step  19 :  [-0.07701278199509205]
step  20 :  [-0.09313502767243437]
step  21 :  [-0.08174510565481513]
step  22 :  [-0.05414018313525603]
step  23 :  [-0.08230700221688533]
step  24 :  [-0.05751070963701839]
episode  11 : steps 25 , return [-16.34]
step  0 :  [-1.5707972930540754]
step  1 :  [-1.526956152351203]
step  2 :  [-1.4749981245589157]
step  3 :  [-1.4232670000146572]
step  4 :  [-1.3793231863491315]
step  5 :  [-1.3073693601478957]
step  6 :  [-1.214063724019108]
step  7 :  [-1.1023492104759554]
step  8 :  [-0.9716447498915397]
step  9 :  [-0.826036683168665]
step  10 :  [-0.6693844212696833]
step  11 :  [-0.5056760167650729]
step  12 :  [-0.34090827905892507]
step  13 :  [-0.20444165119523022]
step  14 :  [-0.08385657236663745]
step  15 :  [-0.010337397209526079]
step  16 :  [-0.0017399659908983402]
step  17 :  [-0.04686971953240394]
step  18 :  [-0.03168359364199758]
step  19 :  [-0.04471433936561197]
step  20 :  [-0.0766529667538704]
step  21 :  [-0.11571745048915956]
step  22 :  [-0.11252272466350967]
step  23 :  [-0.07841808342494018]
step  24 :  [-0.09280947798982356]
episode  12 : steps 25 , return [-15.21]
step  0 :  [-1.4604674943614713]
step  1 :  [-1.4287563500351916]
step  2 :  [-1.3941882816981308]
step  3 :  [-1.3251571768453578]
step  4 :  [-1.2309798212085787]
step  5 :  [-1.172666632313268]
step  6 :  [-1.0847498777372264]
step  7 :  [-0.9732829579920039]
step  8 :  [-0.8431879324794344]
step  9 :  [-0.6993165247693789]
step  10 :  [-0.5467370253603051]
step  11 :  [-0.3926186571105779]
step  12 :  [-0.254822678863659]
step  13 :  [-0.15239977628914297]
step  14 :  [-0.11853332567631208]
step  15 :  [-0.09674730322809387]
step  16 :  [-0.08936640580143834]
step  17 :  [-0.0712376435840598]
step  18 :  [-0.08094567158296025]
step  19 :  [-0.06145133594618015]
step  20 :  [-0.0798181755153957]
step  21 :  [-0.05828941973851905]
step  22 :  [-0.04525861703849114]
step  23 :  [-0.01213355233061206]
step  24 :  [-0.006040719094280682]
episode  13 : steps 25 , return [-13.68]
step  0 :  [-1.5504295761630542]
step  1 :  [-1.516403497468111]
step  2 :  [-1.47133781742792]
step  3 :  [-1.424265844075578]
step  4 :  [-1.3831731470978463]
step  5 :  [-1.313599390934223]
step  6 :  [-1.2246561230959172]
step  7 :  [-1.1270599583447025]
step  8 :  [-1.0081558242891517]
step  9 :  [-0.8721814605593577]
step  10 :  [-0.7233611198573543]
step  11 :  [-0.5660347777022922]
step  12 :  [-0.4060477988949178]
step  13 :  [-0.2574720150372884]
step  14 :  [-0.14192109413945259]
step  15 :  [-0.06318386537350781]
step  16 :  [-0.06625460076587586]
step  17 :  [-0.08522644418033637]
step  18 :  [-0.04984469242394155]
step  19 :  [-0.05132234134845293]
step  20 :  [-0.030898319791757035]
step  21 :  [-0.03261571317680819]
step  22 :  [-0.034818430188898776]
step  23 :  [-0.04080267517246511]
step  24 :  [-0.040689327278737475]
episode  14 : steps 25 , return [-15.48]
step  0 :  [-1.6463001704939395]
step  1 :  [-1.6181891037017309]
step  2 :  [-1.5876892270114036]
step  3 :  [-1.5208398523932563]
step  4 :  [-1.4237228740494292]
step  5 :  [-1.3024625914680745]
step  6 :  [-1.1623741206558345]
step  7 :  [-1.006615039974079]
step  8 :  [-0.841071064316523]
step  9 :  [-0.6678645733440656]
step  10 :  [-0.48893891982545923]
step  11 :  [-0.30648105539760945]
step  12 :  [-0.16538426144009483]
step  13 :  [-0.06673767706676607]
step  14 :  [-0.017949011175118334]
step  15 :  [-0.04071275252050434]
step  16 :  [-0.031102616131901906]
step  17 :  [-0.04518117769918069]
step  18 :  [-0.03944679592789062]
step  19 :  [-0.04882843389556062]
step  20 :  [-0.0442561727565191]
step  21 :  [-0.05115919052981594]
step  22 :  [-0.04698562223778293]
step  23 :  [-0.02760604693607112]
step  24 :  [-0.04510089520350552]
episode  15 : steps 25 , return [-14.24]
step  0 :  [-1.583589654140682]
step  1 :  [-1.5401668968329072]
step  2 :  [-1.4887441089489055]
step  3 :  [-1.437598456986266]
step  4 :  [-1.3942108228042658]
step  5 :  [-1.3225615932785983]
step  6 :  [-1.2244766208737816]
step  7 :  [-1.1078993568480113]
step  8 :  [-0.9730428182557094]
step  9 :  [-0.8238878237791584]
step  10 :  [-0.664074633607492]
step  11 :  [-0.497227851551649]
step  12 :  [-0.32859334211640956]
step  13 :  [-0.18997108362985313]
step  14 :  [-0.13259625435493133]
step  15 :  [-0.11434202309725718]
step  16 :  [-0.07439607446128212]
step  17 :  [-0.04401679497946342]
step  18 :  [-0.0345984686378218]
step  19 :  [-0.021416112709157803]
step  20 :  [-0.005286232738883681]
step  21 :  [-0.04309465025963672]
step  22 :  [-0.08350806962313555]
step  23 :  [-0.08394970003547819]
step  24 :  [-0.05124955450947517]
episode  16 : steps 25 , return [-15.26]
step  0 :  [-1.5740506309415558]
step  1 :  [-1.5418506380001782]
step  2 :  [-1.5060571529980347]
step  3 :  [-1.4743508802291792]
step  4 :  [-1.4089234981831822]
step  5 :  [-1.3141946868132264]
step  6 :  [-1.1955994430809314]
step  7 :  [-1.0582123686701008]
step  8 :  [-0.9063677320724022]
step  9 :  [-0.743682621577575]
step  10 :  [-0.5733159269662823]
step  11 :  [-0.3987104626897801]
step  12 :  [-0.2272429287490115]
step  13 :  [-0.08780113524867765]
step  14 :  [-0.029898723482110555]
step  15 :  [-0.02013663418918815]
step  16 :  [-0.04523095926108701]
step  17 :  [-0.06317001523682571]
step  18 :  [-0.058871144952295326]
step  19 :  [-0.026971244275383558]
step  20 :  [-0.037617185740444946]
step  21 :  [-0.012409423766587789]
step  22 :  [-0.044541737167935226]
step  23 :  [-0.028289799003891287]
step  24 :  [-0.05337582969656733]
episode  17 : steps 25 , return [-14.43]
step  0 :  [-1.444538224924975]
step  1 :  [-1.4147205516424182]
step  2 :  [-1.382844989984353]
step  3 :  [-1.3157065693090553]
step  4 :  [-1.2248736675041396]
step  5 :  [-1.1385964408296634]
step  6 :  [-1.0278741164982363]
step  7 :  [-0.8975399328522962]
step  8 :  [-0.7521662191938585]
step  9 :  [-0.5960274042630488]
step  10 :  [-0.43388396826162673]
step  11 :  [-0.27474202855649577]
step  12 :  [-0.14359082538023332]
step  13 :  [-0.08836892999848013]
step  14 :  [-0.057510292703942076]
step  15 :  [-0.057475560774045385]
step  16 :  [-0.021836687025437087]
step  17 :  [-0.021515715973323895]
step  18 :  [-0.040461516324827446]
step  19 :  [-0.0065577761052416994]
step  20 :  [-0.03143129509689717]
step  21 :  [-0.07624322867056543]
step  22 :  [-0.07922726195085514]
step  23 :  [-0.07433624713043865]
step  24 :  [-0.061977057758006014]
episode  18 : steps 25 , return [-12.66]
step  0 :  [-1.5125545571547658]
step  1 :  [-1.4977864641382894]
step  2 :  [-1.470331836500469]
step  3 :  [-1.4398644361409103]
step  4 :  [-1.3767766606553602]
step  5 :  [-1.2842942923824459]
step  6 :  [-1.2079216323681081]
step  7 :  [-1.1452754004338732]
step  8 :  [-1.0543726160103117]
step  9 :  [-0.940213374679968]
step  10 :  [-0.8080260922983759]
step  11 :  [-0.6628672861552114]
step  12 :  [-0.5102201796968489]
step  13 :  [-0.35873018062975964]
step  14 :  [-0.23278610250705056]
step  15 :  [-0.15274788161756164]
step  16 :  [-0.127632684827751]
step  17 :  [-0.13113110942478798]
step  18 :  [-0.10452806205706928]
step  19 :  [-0.07827623008149985]
step  20 :  [-0.009961926439402377]
step  21 :  [-0.011843798732114283]
step  22 :  [-0.03691739699816164]
step  23 :  [-0.020116627537776235]
step  24 :  [-0.04158730593360264]
episode  19 : steps 25 , return [-16.22]
step  0 :  [-1.7634006518741985]
step  1 :  [-1.7259693725229894]
step  2 :  [-1.6822195825653574]
step  3 :  [-1.6395283595921952]
step  4 :  [-1.5655926668866063]
step  5 :  [-1.4642516784945914]
step  6 :  [-1.3404186725076555]
step  7 :  [-1.198744305995114]
step  8 :  [-1.0629536758660725]
step  9 :  [-0.914872282708553]
step  10 :  [-0.7567581728003482]
step  11 :  [-0.5913091828907978]
step  12 :  [-0.4221947375679689]
step  13 :  [-0.25795904483861587]
step  14 :  [-0.1259148732745348]
step  15 :  [-0.07254887748645138]
step  16 :  [-0.06724797143231011]
step  17 :  [-0.07464220639400468]
step  18 :  [-0.03641259154301446]
step  19 :  [-0.059538018486218584]
step  20 :  [-0.04413690958621182]
step  21 :  [-0.032079042342620365]
step  22 :  [-0.01773670331764829]
step  23 :  [-0.026514136386098158]
step  24 :  [-0.0028870466786912875]
episode  20 : steps 25 , return [-16.95]
step  0 :  [-1.749950903531574]
step  1 :  [-1.7155945634943186]
step  2 :  [-1.6761316113503955]
step  3 :  [-1.6387957904685955]
step  4 :  [-1.568614066323985]
step  5 :  [-1.4699470960940015]
step  6 :  [-1.3480368623879808]
step  7 :  [-1.2077394850339611]
step  8 :  [-1.0531511997015075]
step  9 :  [-0.8875728863098132]
step  10 :  [-0.7136031315923148]
step  11 :  [-0.5332584011514481]
step  12 :  [-0.3480945720351901]
step  13 :  [-0.15934779045587413]
step  14 :  [-0.06831106680172323]
step  15 :  [-0.037102085971260974]
step  16 :  [-0.056572928197043786]
step  17 :  [-0.042109273067594995]
step  18 :  [-0.06019119931154016]
step  19 :  [-0.04092090561366735]
step  20 :  [-0.07332470314982154]
step  21 :  [-0.05555645715554704]
step  22 :  [-0.06476160336408061]
step  23 :  [-0.04523271249390592]
step  24 :  [-0.02771650300944941]
episode  21 : steps 25 , return [-16.64]
step  0 :  [-1.5546574717403996]
step  1 :  [-1.515615469756127]
step  2 :  [-1.4704344470251727]
step  3 :  [-1.4272884528394763]
step  4 :  [-1.353915671340758]
step  5 :  [-1.2534118420732383]
step  6 :  [-1.1769810704282273]
step  7 :  [-1.075703493416793]
step  8 :  [-0.9539356119416735]
step  9 :  [-0.8159568285980751]
step  10 :  [-0.6660884147917646]
step  11 :  [-0.5090976757882382]
step  12 :  [-0.3525900333981821]
step  13 :  [-0.2193265467664297]
step  14 :  [-0.1355056723808286]
step  15 :  [-0.11971996174989279]
step  16 :  [-0.09549461949495795]
step  17 :  [-0.03981148960406601]
step  18 :  [-0.03469224111768756]
step  19 :  [-0.032397795677467554]
step  20 :  [-0.02594773875093316]
step  21 :  [-0.04465806434595835]
step  22 :  [-0.038215146887454025]
step  23 :  [-0.030588030179184787]
step  24 :  [-0.024982171276630008]
episode  22 : steps 25 , return [-14.97]
step  0 :  [-1.6281566525135398]
step  1 :  [-1.6003676468330008]
step  2 :  [-1.5703845680601987]
step  3 :  [-1.5039415807999192]
step  4 :  [-1.4071348298269741]
step  5 :  [-1.2861065760569974]
step  6 :  [-1.146186333670198]
step  7 :  [-0.9904061774399577]
step  8 :  [-0.8243041309161308]
step  9 :  [-0.6502175147182199]
step  10 :  [-0.4700697068145874]
step  11 :  [-0.28557583356657895]
step  12 :  [-0.10011326565068067]
step  13 :  [-0.0353168770757346]
step  14 :  [-0.04310784053831988]
step  15 :  [-0.05030470570536491]
step  16 :  [-0.049148461261908215]
step  17 :  [-0.07065904386950331]
step  18 :  [-0.04243907075683617]
step  19 :  [-0.018950883709581732]
step  20 :  [-0.011280100282358277]
step  21 :  [-0.028975317711229565]
step  22 :  [-0.02654497050981315]
step  23 :  [-0.0477456261818816]
step  24 :  [-0.04107859105528234]
episode  23 : steps 25 , return [-13.93]
step  0 :  [-1.6775525593802203]
step  1 :  [-1.6392987916456403]
step  2 :  [-1.594716675636974]
step  3 :  [-1.5514957857196328]
step  4 :  [-1.4775262284673045]
step  5 :  [-1.37632528712069]
step  6 :  [-1.2526706061409034]
step  7 :  [-1.1450940925739281]
step  8 :  [-1.0149058374596118]
step  9 :  [-0.8702602250974009]
step  10 :  [-0.7143104577423127]
step  11 :  [-0.5503601804109693]
step  12 :  [-0.3827664972612165]
step  13 :  [-0.2226499745382017]
step  14 :  [-0.09882104731396792]
step  15 :  [-0.05807094869483238]
step  16 :  [-0.03816640705794238]
step  17 :  [-0.026982157604420003]
step  18 :  [-0.06409982499734623]
step  19 :  [-0.04709450981040256]
step  20 :  [-0.07896028543877245]
step  21 :  [-0.05841774139743017]
step  22 :  [-0.08735678980669898]
step  23 :  [-0.0647883808766174]
step  24 :  [-0.09208807761353961]
episode  24 : steps 25 , return [-16.18]
step  0 :  [-1.532687944093733]
step  1 :  [-1.5008308545199025]
step  2 :  [-1.4657004947992203]
step  3 :  [-1.3960502225268256]
step  4 :  [-1.2971735209876685]
step  5 :  [-1.199223437500051]
step  6 :  [-1.1095156224773954]
step  7 :  [-0.9983685348986235]
step  8 :  [-0.8694037477367101]
step  9 :  [-0.7268224203599962]
step  10 :  [-0.5752720692354747]
step  11 :  [-0.42122998920968835]
step  12 :  [-0.2795871970843121]
step  13 :  [-0.16828657942957986]
step  14 :  [-0.12649604628734765]
step  15 :  [-0.055629942326385774]
step  16 :  [-0.06606776064161586]
step  17 :  [-0.05129476991652492]
step  18 :  [-0.009322011199247356]
step  19 :  [-0.027220834942366906]
step  20 :  [-0.022244409961357924]
step  21 :  [-0.026498779672248816]
step  22 :  [-0.03248410197142664]
step  23 :  [-0.03775106063231434]
step  24 :  [-0.09696238554097837]
episode  25 : steps 25 , return [-14.09]
step  0 :  [-1.490682381228152]
step  1 :  [-1.4516963316628888]
step  2 :  [-1.4068849349217978]
step  3 :  [-1.3646828467145298]
step  4 :  [-1.2922915397277108]
step  5 :  [-1.2257819111138386]
step  6 :  [-1.162149005826836]
step  7 :  [-1.0695281235848575]
step  8 :  [-0.9534499611589732]
step  9 :  [-0.8192944588459858]
step  10 :  [-0.6720463813564924]
step  11 :  [-0.5168642227612303]
step  12 :  [-0.36145659254402984]
step  13 :  [-0.23026821110742735]
step  14 :  [-0.10630855274155983]
step  15 :  [-0.047168511817323344]
step  16 :  [-0.037484658605890536]
step  17 :  [-0.07646450442527561]
step  18 :  [-0.05721339459070372]
step  19 :  [-0.06225026123772668]
step  20 :  [-0.04350156992137411]
step  21 :  [-0.029756595179581992]
step  22 :  [-0.02000780638160395]
step  23 :  [-0.03643459914467195]
step  24 :  [-0.027473763334569804]
episode  26 : steps 25 , return [-14.56]
step  0 :  [-1.483915012299619]
step  1 :  [-1.444855205198869]
step  2 :  [-1.3999732725564935]
step  3 :  [-1.3577373300445648]
step  4 :  [-1.2853592733458445]
step  5 :  [-1.225519678375268]
step  6 :  [-1.1656740859261296]
step  7 :  [-1.0758569639196172]
step  8 :  [-0.9618344862018936]
step  9 :  [-0.829159884918748]
step  10 :  [-0.6829218719049224]
step  11 :  [-0.5282759508700021]
step  12 :  [-0.3726086313870153]
step  13 :  [-0.24109142991595103]
step  14 :  [-0.11551944267292474]
step  15 :  [-0.08002719999251952]
step  16 :  [-0.06442082733502981]
step  17 :  [-0.004998176396712464]
step  18 :  [-0.009386562456821606]
step  19 :  [-0.060004029447147895]
step  20 :  [-0.05002770249968819]
step  21 :  [-0.07376800596741298]
step  22 :  [-0.06083681811506794]
step  23 :  [-0.044943726954516816]
step  24 :  [-0.035529341832100166]
episode  27 : steps 25 , return [-14.65]
step  0 :  [-1.6225186933063758]
step  1 :  [-1.5903873097487995]
step  2 :  [-1.5544774982104377]
step  3 :  [-1.5222899011797404]
step  4 :  [-1.4562822479871118]
step  5 :  [-1.3609798917677072]
step  6 :  [-1.2418352415393221]
step  7 :  [-1.1039032535422653]
step  8 :  [-0.9514721466232041]
step  9 :  [-0.7880704923947639]
step  10 :  [-0.6166578444760574]
step  11 :  [-0.44008268381780474]
step  12 :  [-0.2629181494389102]
step  13 :  [-0.11807823417899689]
step  14 :  [-0.0569987414177216]
step  15 :  [-0.040696982203936145]
step  16 :  [-0.016821880367970832]
step  17 :  [-0.01955999290494685]
step  18 :  [-0.036909133475782785]
step  19 :  [-0.042300072453308274]
step  20 :  [-0.030236407430148996]
step  21 :  [-0.01303396115928348]
step  22 :  [-0.03174309798374669]
step  23 :  [-0.04435840078984791]
step  24 :  [-0.034505508060801444]
episode  28 : steps 25 , return [-15.]
step  0 :  [-1.6469890350528593]
step  1 :  [-1.622198268351501]
step  2 :  [-1.5962197529145523]
step  3 :  [-1.5324985558187845]
step  4 :  [-1.437610385688878]
step  5 :  [-1.3179758705702713]
step  6 :  [-1.1790937008353057]
step  7 :  [-1.025419903250238]
step  8 :  [-0.8604678523416999]
step  9 :  [-0.6869707971377588]
step  10 :  [-0.5070557352815793]
step  11 :  [-0.3224560389331013]
step  12 :  [-0.1353389186860484]
step  13 :  [-0.050508963267246465]
step  14 :  [-0.039553263425922795]
step  15 :  [-0.06858739011172041]
step  16 :  [-0.051624060263020195]
step  17 :  [-0.04955133729608591]
step  18 :  [-0.050728233970794255]
step  19 :  [-0.03333812468439121]
step  20 :  [-0.03241807223561873]
step  21 :  [-0.02221117341628663]
step  22 :  [-0.02151960813996517]
step  23 :  [-0.02394202423832456]
step  24 :  [-0.013489091611428992]
episode  29 : steps 25 , return [-14.33]
step  0 :  [-1.7730770247760002]
step  1 :  [-1.7421722587943558]
step  2 :  [-1.7073644039304496]
step  3 :  [-1.6755946762207354]
step  4 :  [-1.6092422446060741]
step  5 :  [-1.5133210852356034]
step  6 :  [-1.393463731944371]
step  7 :  [-1.2547732329821717]
step  8 :  [-1.1015153720006052]
step  9 :  [-0.9371299866478506]
step  10 :  [-0.7643611610297217]
step  11 :  [-0.5854525029921903]
step  12 :  [-0.402512727693736]
step  13 :  [-0.21910883308068121]
step  14 :  [-0.07085422978074896]
step  15 :  [-0.019439855242533097]
step  16 :  [-0.03145804148632208]
step  17 :  [-0.031095074285148586]
step  18 :  [-0.007342930782193453]
step  19 :  [-0.020601863131205378]
step  20 :  [-0.02635121048060346]
step  21 :  [-0.0278499602534414]
step  22 :  [-0.03773367190668368]
step  23 :  [-0.034363136182852756]
step  24 :  [-0.028493100112764885]
episode  30 : steps 25 , return [-17.01]
step  0 :  [-1.4388965124114388]
step  1 :  [-1.4111547327805587]
step  2 :  [-1.382159399541947]
step  3 :  [-1.3170344592800416]
step  4 :  [-1.2214979167913746]
step  5 :  [-1.111894967464976]
step  6 :  [-0.9819610829405057]
step  7 :  [-0.836119569307473]
step  8 :  [-0.6782343331860481]
step  9 :  [-0.5118177283327291]
step  10 :  [-0.34104082836478494]
step  11 :  [-0.1772933567061775]
step  12 :  [-0.05931372597568505]
step  13 :  [-0.05138368153670772]
step  14 :  [-0.03315527785887706]
step  15 :  [-0.04533897540028092]
step  16 :  [-0.02285796317034242]
step  17 :  [-0.04583492863899123]
step  18 :  [-0.020210630459664616]
step  19 :  [-0.047377631702000676]
step  20 :  [-0.02027103675562388]
step  21 :  [-0.04861047479708417]
step  22 :  [-0.020817221727346687]
step  23 :  [-0.04941045762306882]
step  24 :  [-0.02127547249744618]
episode  31 : steps 25 , return [-11.89]
step  0 :  [-1.6480866457934837]
step  1 :  [-1.6085727478517589]
step  2 :  [-1.5623529738307045]
step  3 :  [-1.5172838448861687]
step  4 :  [-1.4803432335418598]
step  5 :  [-1.412860014079125]
step  6 :  [-1.31765686469491]
step  7 :  [-1.1993944140314141]
step  8 :  [-1.0627924104187423]
step  9 :  [-0.9120639844920868]
step  10 :  [-0.7508774357683264]
step  11 :  [-0.5826699360802987]
step  12 :  [-0.41171447371980585]
step  13 :  [-0.24820599242416147]
step  14 :  [-0.11725549719098528]
step  15 :  [-0.06570337225903575]
step  16 :  [-0.04729878809011353]
step  17 :  [-0.07962146269842597]
step  18 :  [-0.05999132742869832]
step  19 :  [-0.09473738023396261]
step  20 :  [-0.14570286545580366]
step  21 :  [-0.1435786387713232]
step  22 :  [-0.1201958532447299]
step  23 :  [-0.07589020585411338]
step  24 :  [-0.05094870170542284]
episode  32 : steps 25 , return [-16.72]
step  0 :  [-1.553767928985811]
step  1 :  [-1.5113359349423297]
step  2 :  [-1.4614238466702436]
step  3 :  [-1.412378993092571]
step  4 :  [-1.334977229522115]
step  5 :  [-1.2811243749846226]
step  6 :  [-1.2289660759097336]
step  7 :  [-1.1451869229200387]
step  8 :  [-1.0356050602496338]
step  9 :  [-0.9058750272646411]
step  10 :  [-0.7610351403423631]
step  11 :  [-0.6057206989388602]
step  12 :  [-0.44519179615647114]
step  13 :  [-0.289572950690909]
step  14 :  [-0.16075413249914328]
step  15 :  [-0.10613688701324385]
step  16 :  [-0.07239533764645384]
step  17 :  [-0.06697071192155973]
step  18 :  [-0.03768204597674197]
step  19 :  [-0.08061364387142793]
step  20 :  [-0.10833079111905132]
step  21 :  [-0.0857678242952864]
step  22 :  [-0.060847081298286684]
step  23 :  [-0.10024585470312812]
step  24 :  [-0.08721536285416283]
episode  33 : steps 25 , return [-15.94]
step  0 :  [-1.5047991131798124]
step  1 :  [-1.4833930121687857]
step  2 :  [-1.450951911244412]
step  3 :  [-1.4168650681003094]
step  4 :  [-1.3509584798817442]
step  5 :  [-1.2563238931906515]
step  6 :  [-1.2009070557242691]
step  7 :  [-1.1346477819626173]
step  8 :  [-1.0410210723221995]
step  9 :  [-0.9250283885015438]
step  10 :  [-0.7918987499985504]
step  11 :  [-0.6468238500296134]
step  12 :  [-0.4958089167418098]
step  13 :  [-0.3492465544056996]
step  14 :  [-0.22545300659078232]
step  15 :  [-0.10324823013484254]
step  16 :  [-0.04486106711775365]
step  17 :  [-0.03817378673808882]
step  18 :  [-0.05909800183953169]
step  19 :  [-0.05980973973708809]
step  20 :  [-0.04061671960308599]
step  21 :  [-0.040110085926147496]
step  22 :  [-0.04315485289673981]
step  23 :  [-0.04251174598964346]
step  24 :  [-0.03645340834456946]
episode  34 : steps 25 , return [-15.78]
step  0 :  [-1.4720188019501212]
step  1 :  [-1.4417999926176657]
step  2 :  [-1.409226362379332]
step  3 :  [-1.3415102146108435]
step  4 :  [-1.244059506469629]
step  5 :  [-1.1608560244415966]
step  6 :  [-1.0513289880971255]
step  7 :  [-0.922018630249118]
step  8 :  [-0.77732897985567]
step  9 :  [-0.6213580039277875]
step  10 :  [-0.4584212222710402]
step  11 :  [-0.2956913937528071]
step  12 :  [-0.16087013393230018]
step  13 :  [-0.036617960099524484]
step  14 :  [-0.03942794850909431]
step  15 :  [-0.04588161193309776]
step  16 :  [-0.07835479585974432]
step  17 :  [-0.0741624140618517]
step  18 :  [-0.044962350166779914]
step  19 :  [-0.03118322650699941]
step  20 :  [-0.052128007766072314]
step  21 :  [-0.03468576136005752]
step  22 :  [-0.03140237620424301]
step  23 :  [-0.008326436944218515]
step  24 :  [-0.05155891477223244]
episode  35 : steps 25 , return [-12.89]
step  0 :  [-1.5603403784502126]
step  1 :  [-1.5246931680028004]
step  2 :  [-1.4842015805586395]
step  3 :  [-1.446821650132105]
step  4 :  [-1.377440090769904]
step  5 :  [-1.2798026348737248]
step  6 :  [-1.158936015689801]
step  7 :  [-1.0196286646631845]
step  8 :  [-0.865989030590498]
step  9 :  [-0.7013852555608762]
step  10 :  [-0.528573002880166]
step  11 :  [-0.3500321374881967]
step  12 :  [-0.16976755562439175]
step  13 :  [-0.02483703584276926]
step  14 :  [-0.04008593116624529]
step  15 :  [-0.05461783489186306]
step  16 :  [-0.022749258280946323]
step  17 :  [-0.04255971272093911]
step  18 :  [-0.041145489656675305]
step  19 :  [-0.04356335341174782]
step  20 :  [-0.04967270477286925]
step  21 :  [-0.010460331178544648]
step  22 :  [-0.023716162599965156]
step  23 :  [-0.03691603787357455]
step  24 :  [-0.002989066937388748]
episode  36 : steps 25 , return [-13.86]
step  0 :  [-1.7520269827377228]
step  1 :  [-1.7179019571308003]
step  2 :  [-1.6787499030207442]
step  3 :  [-1.6417839446148046]
step  4 :  [-1.5718525607087892]
step  5 :  [-1.4733614183025352]
step  6 :  [-1.3515788700410967]
step  7 :  [-1.2113771527286321]
step  8 :  [-1.056861800785296]
step  9 :  [-0.8913422502580849]
step  10 :  [-0.7174229906062345]
step  11 :  [-0.537127132466804]
step  12 :  [-0.3520240384270266]
step  13 :  [-0.16341472142848254]
step  14 :  [-0.043523340590810464]
step  15 :  [-0.07879994993677587]
step  16 :  [-0.09937005586222661]
step  17 :  [-0.06764228007439467]
step  18 :  [-0.053052229684585304]
step  19 :  [-0.03386992272174612]
step  20 :  [-0.020374824329979]
step  21 :  [-0.051686337463409594]
step  22 :  [-0.03142433785265612]
step  23 :  [-0.06550217211982676]
step  24 :  [-0.04168763268155994]
episode  37 : steps 25 , return [-16.7]
step  0 :  [-1.576397611703585]
step  1 :  [-1.5493807779975086]
step  2 :  [-1.520682177282081]
step  3 :  [-1.4552825175905515]
step  4 :  [-1.3592954575651839]
step  5 :  [-1.238903126827604]
step  6 :  [-1.0995380998319597]
step  7 :  [-0.9454979098628589]
step  8 :  [-0.7802444017073911]
step  9 :  [-0.6064677672603717]
step  10 :  [-0.42623809975532934]
step  11 :  [-0.24114704053450509]
step  12 :  [-0.11204530885283381]
step  13 :  [-0.028093964228920278]
step  14 :  [-0.03323621300115566]
step  15 :  [-0.005255421844127899]
step  16 :  [-0.05229334476795656]
step  17 :  [-0.04781959453403559]
step  18 :  [-0.0163671933910657]
step  19 :  [-0.06316188800712505]
step  20 :  [-0.061700332353430414]
step  21 :  [-0.09695002057675697]
step  22 :  [-0.09111506458033006]
step  23 :  [-0.047157188135561884]
step  24 :  [-0.017136611697514167]
episode  38 : steps 25 , return [-13.47]
step  0 :  [-1.7003474210143927]
step  1 :  [-1.6641389115646663]
step  2 :  [-1.6223021314728199]
step  3 :  [-1.582335878218466]
step  4 :  [-1.510519364489418]
step  5 :  [-1.4107863350106093]
step  6 :  [-1.2881519976480422]
step  7 :  [-1.1473533427139118]
step  8 :  [-0.9908694302764082]
step  9 :  [-0.824656009685869]
step  10 :  [-0.6508647907699479]
step  11 :  [-0.47144142910147335]
step  12 :  [-0.2885957215409624]
step  13 :  [-0.14718154297277453]
step  14 :  [-0.04907499758898043]
step  15 :  [-0.04252438395242602]
step  16 :  [-0.006277497473438876]
step  17 :  [-0.032141825058878616]
step  18 :  [-0.043211004030096346]
step  19 :  [-0.05238641526460758]
step  20 :  [-0.02380408025948039]
step  21 :  [-0.04502663162893005]
step  22 :  [-0.04226205654511596]
step  23 :  [-0.03144833663554623]
step  24 :  [-0.033707574808847084]
episode  39 : steps 25 , return [-15.7]
step  0 :  [-1.569756831667943]
step  1 :  [-1.5238624911909093]
step  2 :  [-1.469022564743112]
step  3 :  [-1.4136673087990757]
step  4 :  [-1.3654821769660495]
step  5 :  [-1.2905433431339108]
step  6 :  [-1.223254743733664]
step  7 :  [-1.1480877477030282]
step  8 :  [-1.0468287824898062]
step  9 :  [-0.9245044767971385]
step  10 :  [-0.78611450164072]
step  11 :  [-0.6365224524675671]
step  12 :  [-0.4813376278470844]
step  13 :  [-0.3306042791092652]
step  14 :  [-0.20422670453218822]
step  15 :  [-0.08074586854295333]
step  16 :  [-0.02267900414851027]
step  17 :  [-0.015264490410697525]
step  18 :  [-0.07064480706731123]
step  19 :  [-0.06445966701211486]
step  20 :  [-0.058127842241973204]
step  21 :  [-0.04923185210015099]
step  22 :  [-0.05990789764260458]
step  23 :  [-0.045586380006924755]
step  24 :  [-0.009584490025496094]
episode  40 : steps 25 , return [-15.89]
step  0 :  [-1.599699132206213]
step  1 :  [-1.554659105082283]
step  2 :  [-1.5009039803562962]
step  3 :  [-1.446718971251486]
step  4 :  [-1.3996143701031991]
step  5 :  [-1.3252308346451287]
step  6 :  [-1.225228787298129]
step  7 :  [-1.1255742093515573]
step  8 :  [-1.0057452812804608]
step  9 :  [-0.8695461400447928]
step  10 :  [-0.7210215813849435]
step  11 :  [-0.5645459100077969]
step  12 :  [-0.4063472000669151]
step  13 :  [-0.274296906901593]
step  14 :  [-0.15451801146489197]
step  15 :  [-0.08562875543759654]
step  16 :  [-0.0790097723430469]
step  17 :  [-0.04083090059457971]
step  18 :  [-0.08524916083463864]
step  19 :  [-0.10097180948977032]
step  20 :  [-0.06695327079487583]
step  21 :  [-0.03728354027732812]
step  22 :  [-0.08340704995178637]
step  23 :  [-0.0772732831064091]
step  24 :  [-0.06908001651219955]
episode  41 : steps 25 , return [-15.9]
step  0 :  [-1.5966091873246822]
step  1 :  [-1.5651663237475886]
step  2 :  [-1.530314269325628]
step  3 :  [-1.4606585130748166]
step  4 :  [-1.3616895019688362]
step  5 :  [-1.2392115593471087]
step  6 :  [-1.1510755056390347]
step  7 :  [-1.0347804452300018]
step  8 :  [-0.9021185615569736]
step  9 :  [-0.7564167976087816]
step  10 :  [-0.6014859815520223]
step  11 :  [-0.44238054005256666]
step  12 :  [-0.28988130199175893]
step  13 :  [-0.1659956597972537]
step  14 :  [-0.11601233447667236]
step  15 :  [-0.03733844194770613]
step  16 :  [-0.03111709979365579]
step  17 :  [-0.03495478180870747]
step  18 :  [-0.028769941056981278]
step  19 :  [-0.037619672931771375]
step  20 :  [-0.061429605358753976]
step  21 :  [-0.049796893868842416]
step  22 :  [-0.08854627241866542]
step  23 :  [-0.0802098722870857]
step  24 :  [-0.039084742552581916]
episode  42 : steps 25 , return [-14.7]
step  0 :  [-1.503740034212254]
step  1 :  [-1.4741323819400325]
step  2 :  [-1.4422361606416192]
step  3 :  [-1.374873121593958]
step  4 :  [-1.2776151873953883]
step  5 :  [-1.1757391194698414]
step  6 :  [-1.0534863267455898]
step  7 :  [-0.9147594527742449]
step  8 :  [-0.7630706876687812]
step  9 :  [-0.6018726808321868]
step  10 :  [-0.4350790057694579]
step  11 :  [-0.27014941017672073]
step  12 :  [-0.14283750648195476]
step  13 :  [-0.12094718316296324]
step  14 :  [-0.1474211392839911]
step  15 :  [-0.1306830452900632]
step  16 :  [-0.07120222097364888]
step  17 :  [-0.06388696451568904]
step  18 :  [-0.037434258036557276]
step  19 :  [-0.0768596093058399]
step  20 :  [-0.09546812379238609]
step  21 :  [-0.06896525249537513]
step  22 :  [-0.0415948006625026]
step  23 :  [-0.0798046157034679]
step  24 :  [-0.09782538384751491]
episode  43 : steps 25 , return [-13.46]
step  0 :  [-1.557976389954402]
step  1 :  [-1.5305074996512629]
step  2 :  [-1.5012771900478306]
step  3 :  [-1.4355683900553617]
step  4 :  [-1.339390531995963]
step  5 :  [-1.21887427933277]
step  6 :  [-1.0831747578914879]
step  7 :  [-0.932220064701118]
step  8 :  [-0.7695220208248391]
step  9 :  [-0.5978896591244839]
step  10 :  [-0.41959500176485653]
step  11 :  [-0.23679205807903128]
step  12 :  [-0.0989104554573559]
step  13 :  [-0.06515568060021643]
step  14 :  [-0.021916118929483638]
step  15 :  [-0.05792589322138701]
step  16 :  [-0.05438925982901717]
step  17 :  [-0.016009351752933765]
step  18 :  [-0.06038958503890054]
step  19 :  [-0.06935336851654929]
step  20 :  [-0.07229192418681811]
step  21 :  [-0.07340630659569944]
step  22 :  [-0.030022453700968104]
step  23 :  [-0.02609373690190569]
step  24 :  [-0.036453778403409035]
episode  44 : steps 25 , return [-13.31]
step  0 :  [-1.755012222904316]
step  1 :  [-1.7248562807641212]
step  2 :  [-1.6911376358759649]
step  3 :  [-1.6218274816460783]
step  4 :  [-1.5229008889851343]
step  5 :  [-1.4422313303911143]
step  6 :  [-1.335494491169509]
step  7 :  [-1.2075592517797111]
step  8 :  [-1.062912273056603]
step  9 :  [-0.9053608024932683]
step  10 :  [-0.7380497408012889]
step  11 :  [-0.563652525960748]
step  12 :  [-0.38489445342665046]
step  13 :  [-0.2072696368912068]
step  14 :  [-0.06278277551837781]
step  15 :  [-0.003389032000240036]
step  16 :  [-0.022477027031807366]
step  17 :  [-0.01672314013869297]
step  18 :  [-0.04709127133398619]
step  19 :  [-0.05486991175497028]
step  20 :  [-0.016466937398335883]
step  21 :  [-0.039075436352020564]
step  22 :  [-0.013545248484434138]
step  23 :  [-0.035479300789723646]
step  24 :  [-0.05751136693565385]
episode  45 : steps 25 , return [-16.53]
step  0 :  [-1.7528643458220245]
step  1 :  [-1.7134297345042757]
step  2 :  [-1.6669430470423552]
step  3 :  [-1.6209222847210243]
step  4 :  [-1.5819903170101974]
step  5 :  [-1.512463202580259]
step  6 :  [-1.4153540891851306]
step  7 :  [-1.2953173257540873]
step  8 :  [-1.1569841935853953]
step  9 :  [-1.004414922183246]
step  10 :  [-0.841010617588747]
step  11 :  [-0.6696428554140831]
step  12 :  [-0.4930192804572619]
step  13 :  [-0.31497972321855894]
step  14 :  [-0.17019501254741087]
step  15 :  [-0.11035240224047077]
step  16 :  [-0.08179326182711773]
step  17 :  [-0.06618264792852853]
step  18 :  [-0.07842787373370097]
step  19 :  [-0.06776524639836788]
step  20 :  [-0.021177827614460222]
step  21 :  [-0.03253943360822686]
step  22 :  [-0.04627775265410371]
step  23 :  [-0.017906765495128363]
step  24 :  [-0.021006083909442173]
episode  46 : steps 25 , return [-17.75]
step  0 :  [-1.6551631330652352]
step  1 :  [-1.6117857439464314]
step  2 :  [-1.5601531035403429]
step  3 :  [-1.5082852096353423]
step  4 :  [-1.463378840375091]
step  5 :  [-1.3901872678943825]
step  6 :  [-1.2906882356300298]
step  7 :  [-1.168987177763253]
step  8 :  [-1.02940711409045]
step  9 :  [-0.8758187748971826]
step  10 :  [-0.7114912788048235]
step  11 :  [-0.5391945335043115]
step  12 :  [-0.3616247818362239]
step  13 :  [-0.22340110163831867]
step  14 :  [-0.12628959071108367]
step  15 :  [-0.0459144823569108]
step  16 :  [-0.04715256636457395]
step  17 :  [-0.03401173438657698]
step  18 :  [-0.03750020807082656]
step  19 :  [-0.027833964512581265]
step  20 :  [-0.03213634037485434]
step  21 :  [-0.02466263489982318]
step  22 :  [-0.029152706183227413]
step  23 :  [-0.023020028191623396]
step  24 :  [-0.04325859478018224]
episode  47 : steps 25 , return [-15.86]
step  0 :  [-1.5657964911121787]
step  1 :  [-1.5399315576357147]
step  2 :  [-1.5128535622437682]
step  3 :  [-1.4486156632798808]
step  4 :  [-1.3534850472664393]
step  5 :  [-1.2337434189848775]
step  6 :  [-1.0948241368276357]
step  7 :  [-0.9411524014514966]
step  8 :  [-0.7762293709549382]
step  9 :  [-0.6027911927081785]
step  10 :  [-0.42299774219603936]
step  11 :  [-0.23877120167789928]
step  12 :  [-0.056363782393706506]
step  13 :  [-0.05351594577074861]
step  14 :  [-0.07105894218680972]
step  15 :  [-0.07592696093174575]
step  16 :  [-0.08569576215548426]
step  17 :  [-0.045838498421221334]
step  18 :  [-0.029823728328401786]
step  19 :  [-0.01465714901530306]
step  20 :  [-0.02110547264538279]
step  21 :  [-0.016662514649037986]
step  22 :  [-0.03423050023643672]
step  23 :  [-0.031409374869525816]
step  24 :  [-0.036247045143724926]
episode  48 : steps 25 , return [-13.3]
step  0 :  [-1.5112906591997313]
step  1 :  [-1.4697742962528817]
step  2 :  [-1.421329968463014]
step  3 :  [-1.374434556284614]
step  4 :  [-1.2986999862277078]
step  5 :  [-1.2344359031941399]
step  6 :  [-1.2164887135611169]
step  7 :  [-1.172025293191386]
step  8 :  [-1.0931261203343257]
step  9 :  [-0.9868851314341613]
step  10 :  [-0.859726091396481]
step  11 :  [-0.7172626596936816]
step  12 :  [-0.5648022882516133]
step  13 :  [-0.4090214087811274]
step  14 :  [-0.26493434277812195]
step  15 :  [-0.15134568417245492]
step  16 :  [-0.06937308213062429]
step  17 :  [-0.06388219852161961]
step  18 :  [-0.08271877871778181]
step  19 :  [-0.047155646244605456]
step  20 :  [-0.0466202295553005]
step  21 :  [-0.027662442587651312]
step  22 :  [-0.038562795373052225]
step  23 :  [-0.0845464940072479]
step  24 :  [-0.08991253644367922]
episode  49 : steps 25 , return [-16.3]
step  0 :  [-1.7363856100834976]
step  1 :  [-1.6979153839813803]
step  2 :  [-1.6528212352288414]
step  3 :  [-1.6086187410902644]
step  4 :  [-1.5719197750823704]
step  5 :  [-1.504078159090859]
step  6 :  [-1.4082869111947849]
step  7 :  [-1.2893345708498183]
step  8 :  [-1.151957379170653]
step  9 :  [-1.0003114993016278]
step  10 :  [-0.8379115382906228]
step  11 :  [-0.66781256983499]
step  12 :  [-0.4931270811399181]
step  13 :  [-0.31893894360908576]
step  14 :  [-0.16558272225530785]
step  15 :  [-0.0885646092119232]
step  16 :  [-0.10237167565524431]
step  17 :  [-0.08551881171569121]
step  18 :  [-0.02672080067136767]
step  19 :  [-0.01760638029686621]
step  20 :  [-0.05738980611821865]
step  21 :  [-0.09430876150584348]
step  22 :  [-0.09281544641547285]
step  23 :  [-0.05310165344508635]
step  24 :  [-0.05971748123192571]
episode  50 : steps 25 , return [-17.78]
step  0 :  [-1.6614382333506523]
step  1 :  [-1.6187707371634574]
step  2 :  [-1.568107179451569]
step  3 :  [-1.517414378083253]
step  4 :  [-1.4738237600577622]
step  5 :  [-1.4015223637401033]
step  6 :  [-1.3026578269251734]
step  7 :  [-1.181436587949391]
step  8 :  [-1.0422460519636074]
step  9 :  [-0.8890053596226526]
step  10 :  [-0.7250311698463503]
step  11 :  [-0.5531618722469178]
step  12 :  [-0.37624253307947647]
step  13 :  [-0.19980781325530872]
step  14 :  [-0.056649256582763194]
step  15 :  [-0.006464313617600025]
step  16 :  [-0.02382264723555758]
step  17 :  [-0.01346038301436961]
step  18 :  [-0.022734671887130974]
step  19 :  [-0.023989082707826584]
step  20 :  [-0.046310959693577784]
step  21 :  [-0.06301128129844831]
step  22 :  [-0.04408369748326322]
step  23 :  [-0.02455038541843808]
step  24 :  [-0.016877637821107412]
episode  51 : steps 25 , return [-15.85]
step  0 :  [-1.737037492002243]
step  1 :  [-1.7035878045780257]
step  2 :  [-1.6654180781677201]
step  3 :  [-1.629743458994566]
step  4 :  [-1.5607749553802772]
step  5 :  [-1.463011410844215]
step  6 :  [-1.3417901528303517]
step  7 :  [-1.2020333078620702]
step  8 :  [-1.0478839821125623]
step  9 :  [-0.8826833068559805]
step  10 :  [-0.7090695661262563]
step  11 :  [-0.5291193016891494]
step  12 :  [-0.3445430239494842]
step  13 :  [-0.15742545064739277]
step  14 :  [-0.07104941853644832]
step  15 :  [-0.015189766509222165]
step  16 :  [-0.056387507176503926]
step  17 :  [-0.046883388540073685]
step  18 :  [-0.025857074201464266]
step  19 :  [-0.029622581160347456]
step  20 :  [-0.016591591027233545]
step  21 :  [-0.000581131336472288]
step  22 :  [-0.03805843993535942]
step  23 :  [-0.017067075954422528]
step  24 :  [-0.05049303170639598]
episode  52 : steps 25 , return [-16.34]
step  0 :  [-1.4866957886357457]
step  1 :  [-1.4685006389227708]
step  2 :  [-1.4396869186358896]
step  3 :  [-1.4096821156025063]
step  4 :  [-1.3467064303295915]
step  5 :  [-1.2541944546013295]
step  6 :  [-1.1780276429270518]
step  7 :  [-1.0762531090278828]
step  8 :  [-0.9533736811590128]
step  9 :  [-0.8139530510755743]
step  10 :  [-0.6623325848552433]
step  11 :  [-0.5030371239339997]
step  12 :  [-0.3429156191570006]
step  13 :  [-0.2031041048758125]
step  14 :  [-0.11593772636035432]
step  15 :  [-0.10357257899645542]
step  16 :  [-0.0791473365339151]
step  17 :  [-0.04895290369769005]
step  18 :  [-0.035467041525790215]
step  19 :  [-0.024305443054378737]
step  20 :  [-0.019033707075580844]
step  21 :  [-0.046750940206019775]
step  22 :  [-0.08862033156801402]
step  23 :  [-0.09647795305193907]
step  24 :  [-0.06992582873047565]
episode  53 : steps 25 , return [-14.87]
step  0 :  [-1.5226477559371259]
step  1 :  [-1.48503439719152]
step  2 :  [-1.4419852840267928]
step  3 :  [-1.401723429049992]
step  4 :  [-1.3305145357779222]
step  5 :  [-1.2316488847253353]
step  6 :  [-1.1363858086898873]
step  7 :  [-1.0190297721603976]
step  8 :  [-0.8838988606543131]
step  9 :  [-0.7352035741614178]
step  10 :  [-0.5770660175586395]
step  11 :  [-0.4145368344699577]
step  12 :  [-0.2808377813979517]
step  13 :  [-0.16816710074301514]
step  14 :  [-0.09494914534958068]
step  15 :  [-0.05743714116895342]
step  16 :  [-0.03307192708339676]
step  17 :  [-0.04018077866881351]
step  18 :  [-0.05788474581971384]
step  19 :  [-0.025187163929455185]
step  20 :  [-0.04880867974640558]
step  21 :  [-0.01778857115072093]
step  22 :  [-0.0443716630474055]
step  23 :  [-0.014540059107838937]
step  24 :  [-0.05307666558282081]
episode  54 : steps 25 , return [-14.12]
step  0 :  [-1.4620074179112088]
step  1 :  [-1.435152472775011]
step  2 :  [-1.4072447366064174]
step  3 :  [-1.342790832293405]
step  4 :  [-1.2476966318583176]
step  5 :  [-1.1294824410468267]
step  6 :  [-0.9918895573104932]
step  7 :  [-0.8393645939237833]
step  8 :  [-0.6754758457381688]
step  9 :  [-0.5030930681429605]
step  10 :  [-0.32475157866280535]
step  11 :  [-0.1446904184662819]
step  12 :  [-0.000780975550624811]
step  13 :  [-0.06347166418987131]
step  14 :  [-0.0727189956268364]
step  15 :  [-0.04535459160277689]
step  16 :  [-0.06095279036761716]
step  17 :  [-0.035264792070156856]
step  18 :  [-0.02512896394016492]
step  19 :  [-0.07218807477970965]
step  20 :  [-0.09491275987032957]
step  21 :  [-0.06824940559681364]
step  22 :  [-0.05180438118338195]
step  23 :  [-0.030809707977543403]
step  24 :  [-0.03778927570652705]
episode  55 : steps 25 , return [-12.16]
step  0 :  [-1.4877857410421098]
step  1 :  [-1.4522202634369716]
step  2 :  [-1.412181949669394]
step  3 :  [-1.3759177775987375]
step  4 :  [-1.3077086900064514]
step  5 :  [-1.211355323345356]
step  6 :  [-1.0952515643140508]
step  7 :  [-0.9604175193846788]
step  8 :  [-0.811005299962295]
step  9 :  [-0.650703987803351]
step  10 :  [-0.4830715605757038]
step  11 :  [-0.31309932994009243]
step  12 :  [-0.1738946375876511]
step  13 :  [-0.0641938919913567]
step  14 :  [-0.029092711644641556]
step  15 :  [-0.03817066099751668]
step  16 :  [-0.028127497406410965]
step  17 :  [-0.029099148309111887]
step  18 :  [-0.02422149432779566]
step  19 :  [-0.059285815233748616]
step  20 :  [-0.08049483646595751]
step  21 :  [-0.050980459986038736]
step  22 :  [-0.041001475086616446]
step  23 :  [-0.08509497334006798]
step  24 :  [-0.08901451224099285]
episode  56 : steps 25 , return [-13.35]
step  0 :  [-1.5830934083773598]
step  1 :  [-1.5534569204565998]
step  2 :  [-1.5211441659625395]
step  3 :  [-1.4532427172305242]
step  4 :  [-1.3554856672859816]
step  5 :  [-1.233825108427436]
step  6 :  [-1.1191334674130407]
step  7 :  [-0.9850119709241212]
step  8 :  [-0.8359075707370089]
step  9 :  [-0.6752896995596898]
step  10 :  [-0.5062383334979597]
step  11 :  [-0.33211077098441677]
step  12 :  [-0.16137222599412968]
step  13 :  [-0.03549859793226345]
step  14 :  [-0.04851233067904875]
step  15 :  [-0.04214575427132844]
step  16 :  [-0.039863537959062924]
step  17 :  [-0.0625732737245646]
step  18 :  [-0.05417376060206513]
step  19 :  [-0.054425052889725135]
step  20 :  [-0.0687800343233494]
step  21 :  [-0.03187511993523775]
step  22 :  [-0.05156945903049815]
step  23 :  [-0.019617094592497542]
step  24 :  [-0.04189286797021511]
episode  57 : steps 25 , return [-13.87]
step  0 :  [-1.5326513879653791]
step  1 :  [-1.506254954791536]
step  2 :  [-1.468292981785802]
step  3 :  [-1.4280621508285425]
step  4 :  [-1.393642169433385]
step  5 :  [-1.3289947089846108]
step  6 :  [-1.2362548363368655]
step  7 :  [-1.11990688708942]
step  8 :  [-0.9846378530326403]
step  9 :  [-0.8346824651673225]
step  10 :  [-0.673709983651553]
step  11 :  [-0.5051080572746133]
step  12 :  [-0.3331629239409612]
step  13 :  [-0.19341765388305784]
step  14 :  [-0.11337129277852023]
step  15 :  [-0.04191257084542193]
step  16 :  [-0.015450774208299389]
step  17 :  [-0.04794696021083297]
step  18 :  [-0.08741931874378919]
step  19 :  [-0.08137710258872183]
step  20 :  [-0.04761025417203049]
step  21 :  [-0.060880919491822914]
step  22 :  [-0.029887168108616694]
step  23 :  [-0.05472293261164287]
step  24 :  [-0.025353041199451646]
episode  58 : steps 25 , return [-15.14]
step  0 :  [-1.5959665305148818]
step  1 :  [-1.562390857174099]
step  2 :  [-1.5246055158853127]
step  3 :  [-1.4903017764271222]
step  4 :  [-1.4229169475006775]
step  5 :  [-1.3266577269292925]
step  6 :  [-1.2068005325378321]
step  7 :  [-1.0682941177141045]
step  8 :  [-0.9153526633767713]
step  9 :  [-0.7514391474025719]
step  10 :  [-0.5794323630311091]
step  11 :  [-0.4020486746945006]
step  12 :  [-0.22374386906451327]
step  13 :  [-0.07878227220342274]
step  14 :  [-0.020400887677333283]
step  15 :  [-0.029931467195512054]
step  16 :  [-0.051787246112160304]
step  17 :  [-0.03946595717294814]
step  18 :  [-0.003769376395155964]
step  19 :  [-0.026589341629362245]
step  20 :  [-0.024401067416797772]
step  21 :  [-0.035442730917063535]
step  22 :  [-0.049174274447628646]
step  23 :  [-0.034693234409349134]
step  24 :  [-0.005728675880596504]
episode  59 : steps 25 , return [-14.47]
step  0 :  [-1.5748490308387744]
step  1 :  [-1.5297682067274474]
step  2 :  [-1.476052730987587]
step  3 :  [-1.4220820329411978]
step  4 :  [-1.375473261173769]
step  5 :  [-1.3016079340732412]
step  6 :  [-1.2208433910365526]
step  7 :  [-1.1284552439119624]
step  8 :  [-1.013646607501642]
step  9 :  [-0.880881345200799]
step  10 :  [-0.7346002904139696]
step  11 :  [-0.579325108916462]
step  12 :  [-0.4209847745216676]
step  13 :  [-0.2730183114177075]
step  14 :  [-0.15540439911033851]
step  15 :  [-0.06173862807659287]
step  16 :  [-0.0498282202462102]
step  17 :  [-0.06920919266758514]
step  18 :  [-0.034657054812853166]
step  19 :  [-0.013910752168080331]
step  20 :  [-0.01962284960788192]
step  21 :  [-0.04370261273939533]
step  22 :  [-0.04392323161530769]
step  23 :  [-0.06287099452799924]
step  24 :  [-0.06509261145148104]
episode  60 : steps 25 , return [-15.55]
step  0 :  [-1.6978163293767232]
step  1 :  [-1.6663736325430334]
step  2 :  [-1.631106295593773]
step  3 :  [-1.5992182020530694]
step  4 :  [-1.5330866461128825]
step  5 :  [-1.4375002390045721]
step  6 :  [-1.3180095418887787]
step  7 :  [-1.179696055617101]
step  8 :  [-1.026834874559678]
step  9 :  [-0.8629015597733026]
step  10 :  [-0.6907218382785971]
step  11 :  [-0.5127500060934277]
step  12 :  [-0.33184183367678455]
step  13 :  [-0.1566277123041338]
step  14 :  [-0.03501569432010574]
step  15 :  [-0.06231150351419425]
step  16 :  [-0.05930696415977155]
step  17 :  [-0.04913240239463262]
step  18 :  [-0.04789467922642671]
step  19 :  [-0.03968329699531521]
step  20 :  [-0.04935541593816455]
step  21 :  [-0.037084394514068884]
step  22 :  [-0.016045031121697063]
step  23 :  [-0.020097437301691726]
step  24 :  [-0.011087286945085751]
episode  61 : steps 25 , return [-16.07]
step  0 :  [-1.5333377046886243]
step  1 :  [-1.5136864060938022]
step  2 :  [-1.4811993587078192]
step  3 :  [-1.4454408746876586]
step  4 :  [-1.3785508056188371]
step  5 :  [-1.2833541774512909]
step  6 :  [-1.2143042323472584]
step  7 :  [-1.209000229239024]
step  8 :  [-1.1775204687685237]
step  9 :  [-1.1092261195270496]
step  10 :  [-1.011433122523256]
step  11 :  [-0.8909713563721408]
step  12 :  [-0.7538584913863413]
step  13 :  [-0.6057188521055663]
step  14 :  [-0.4532251672524822]
step  15 :  [-0.30934842546451613]
step  16 :  [-0.19002749490969859]
step  17 :  [-0.07845273195194945]
step  18 :  [-0.025861720547360852]
step  19 :  [-0.04337232857068711]
step  20 :  [-0.055434817436635676]
step  21 :  [-0.05879342883544122]
step  22 :  [-0.03886890242955248]
step  23 :  [-0.018020419041111447]
step  24 :  [-0.020844711867047946]
episode  62 : steps 25 , return [-17.9]
step  0 :  [-1.390344834679418]
step  1 :  [-1.3952872279284085]
step  2 :  [-1.39187858148774]
step  3 :  [-1.3464944519214495]
step  4 :  [-1.2659284018851396]
step  5 :  [-1.1572949628421794]
step  6 :  [-1.026800389665381]
step  7 :  [-0.8795108786235509]
step  8 :  [-0.7194386865265214]
step  9 :  [-0.5497346578064287]
step  10 :  [-0.37295182738073857]
step  11 :  [-0.19179222802883203]
step  12 :  [-0.05351080599592507]
step  13 :  [-0.045161106639488795]
step  14 :  [-0.07024215475382278]
step  15 :  [-0.04163155784925694]
step  16 :  [-0.06817575889994985]
step  17 :  [-0.04349150859622739]
step  18 :  [-0.022496178461697873]
step  19 :  [-0.07019101865888697]
step  20 :  [-0.07545790353596357]
step  21 :  [-0.03961601564206428]
step  22 :  [-0.05162914296847073]
step  23 :  [-0.027529196827699012]
step  24 :  [-0.020067971633490986]
episode  63 : steps 25 , return [-12.32]
step  0 :  [-1.685365271122474]
step  1 :  [-1.6537657103948393]
step  2 :  [-1.6183314622920553]
step  3 :  [-1.586316658064266]
step  4 :  [-1.5201483735446286]
step  5 :  [-1.4245647051708183]
step  6 :  [-1.3050949972643298]
step  7 :  [-1.1668124898814984]
step  8 :  [-1.0139907621494337]
step  9 :  [-0.8501092935245989]
step  10 :  [-0.6780066701267112]
step  11 :  [-0.5001763833964751]
step  12 :  [-0.31963830037948465]
step  13 :  [-0.14648012616865008]
step  14 :  [-0.04068492174617115]
step  15 :  [-0.07520252389582853]
step  16 :  [-0.07079873345807583]
step  17 :  [-0.062063733966706995]
step  18 :  [-0.05948074010686731]
step  19 :  [-0.0551466800483787]
step  20 :  [-0.05313328790720818]
step  21 :  [-0.05147396330426498]
step  22 :  [-0.04957139421681427]
step  23 :  [-0.0494944085851211]
step  24 :  [-0.047571210523938305]
episode  64 : steps 25 , return [-16.08]
step  0 :  [-1.5420691296274227]
step  1 :  [-1.4979208340933086]
step  2 :  [-1.4456499329990808]
step  3 :  [-1.3937256313478887]
step  4 :  [-1.3498524365594557]
step  5 :  [-1.278156790522289]
step  6 :  [-1.205918500772236]
step  7 :  [-1.10626758583323]
step  8 :  [-0.9843828118365533]
step  9 :  [-0.8452254293867983]
step  10 :  [-0.6932546185038845]
step  11 :  [-0.5327845982647956]
step  12 :  [-0.3695437606863832]
step  13 :  [-0.21885684063178298]
step  14 :  [-0.1086187460620591]
step  15 :  [-0.07873408505007638]
step  16 :  [-0.05389450787460191]
step  17 :  [-0.03557820062241755]
step  18 :  [-0.022465792590625287]
step  19 :  [-0.06313336455662875]
step  20 :  [-0.10181627376422396]
step  21 :  [-0.10051976581709667]
step  22 :  [-0.06912720206877133]
step  23 :  [-0.08940123500680305]
step  24 :  [-0.06117176098221056]
episode  65 : steps 25 , return [-15.25]
step  0 :  [-1.7154514475191223]
step  1 :  [-1.6813111005383026]
step  2 :  [-1.6422702876292268]
step  3 :  [-1.605654048056589]
step  4 :  [-1.5361113739409202]
step  5 :  [-1.4379775147329152]
step  6 :  [-1.3165044881568997]
step  7 :  [-1.1765672214376504]
step  8 :  [-1.0222807282840343]
step  9 :  [-0.8569674772782528]
step  10 :  [-0.6832505012697279]
step  11 :  [-0.5031881585422393]
step  12 :  [-0.3184555995715277]
step  13 :  [-0.13107232537531377]
step  14 :  [-0.026641549731026188]
step  15 :  [-0.08886803332683178]
step  16 :  [-0.1016593774238075]
step  17 :  [-0.07424142820806849]
step  18 :  [-0.02693678432518426]
step  19 :  [-0.01309983358062625]
step  20 :  [-0.048816208085380126]
step  21 :  [-0.031816639054079256]
step  22 :  [-0.07544763974347973]
step  23 :  [-0.06579149335698604]
step  24 :  [-0.01734924495886884]
episode  66 : steps 25 , return [-16.2]
step  0 :  [-1.633997871751007]
step  1 :  [-1.5964942888267024]
step  2 :  [-1.5531202861767586]
step  3 :  [-1.5116709318292842]
step  4 :  [-1.4790330963860991]
step  5 :  [-1.4147398019181352]
step  6 :  [-1.3220358095535394]
step  7 :  [-1.2058765642475366]
step  8 :  [-1.0712108350931353]
step  9 :  [-0.9224723812472705]
step  10 :  [-0.7636151890362239]
step  11 :  [-0.5985753081283237]
step  12 :  [-0.4327459533960904]
step  13 :  [-0.27918626549579784]
step  14 :  [-0.1572247229895592]
step  15 :  [-0.1091433730576704]
step  16 :  [-0.08917135366757507]
step  17 :  [-0.04093961667543656]
step  18 :  [-0.045656547616376615]
step  19 :  [-0.015612452934546115]
step  20 :  [-0.019387181897231]
step  21 :  [-0.02990089003273846]
step  22 :  [-0.015288383935321658]
step  23 :  [-0.04147948881565659]
step  24 :  [-0.07372347422131648]
episode  67 : steps 25 , return [-16.42]
step  0 :  [-1.5729554696943406]
step  1 :  [-1.538331246637348]
step  2 :  [-1.4991988826837221]
step  3 :  [-1.4634024437196387]
step  4 :  [-1.395074110904052]
step  5 :  [-1.2981781508237409]
step  6 :  [-1.1778608135966557]
step  7 :  [-1.038995080007228]
step  8 :  [-0.8857449749983806]
step  9 :  [-0.7215321587551129]
step  10 :  [-0.5491886504283828]
step  11 :  [-0.3713638076421208]
step  12 :  [-0.1925961525432754]
step  13 :  [-0.047672949903055394]
step  14 :  [-0.017176816904108376]
step  15 :  [-0.06298896663926275]
step  16 :  [-0.08089029305111534]
step  17 :  [-0.10822507739030364]
step  18 :  [-0.08713608786287147]
step  19 :  [-0.048508933014330104]
step  20 :  [-0.047724155560877404]
step  21 :  [-0.015070432087014267]
step  22 :  [-0.03245606000023833]
step  23 :  [-0.004935926631819039]
step  24 :  [-0.03038772140910116]
episode  68 : steps 25 , return [-14.29]
step  0 :  [-1.6159856014180367]
step  1 :  [-1.583572935778293]
step  2 :  [-1.5473038510614774]
step  3 :  [-1.5147208836171877]
step  4 :  [-1.4484625249105934]
step  5 :  [-1.3529898734849302]
step  6 :  [-1.2337209118614496]
step  7 :  [-1.0956905456775732]
step  8 :  [-0.943173755530133]
step  9 :  [-0.7796884860491227]
step  10 :  [-0.6081834075259975]
step  11 :  [-0.4314959309781018]
step  12 :  [-0.25424151123373323]
step  13 :  [-0.10941701270468775]
step  14 :  [-0.04838511866194383]
step  15 :  [-0.0357252232515322]
step  16 :  [-0.023834099394519356]
step  17 :  [-0.018479651229744556]
step  18 :  [-0.02841384503499142]
step  19 :  [-0.04091384605093243]
step  20 :  [-0.037386876829449626]
step  21 :  [-0.01666209840001738]
step  22 :  [-0.07464495117399446]
step  23 :  [-0.12153018032876674]
step  24 :  [-0.11666401622293952]
episode  69 : steps 25 , return [-15.08]
step  0 :  [-1.5243261716444978]
step  1 :  [-1.4968226155793969]
step  2 :  [-1.4677069479404266]
step  3 :  [-1.4021890225537492]
step  4 :  [-1.3062053185662856]
step  5 :  [-1.1858639961478443]
step  6 :  [-1.0482381390087145]
step  7 :  [-0.8959890808401458]
step  8 :  [-0.7324760556153437]
step  9 :  [-0.560453188751809]
step  10 :  [-0.3823142220368712]
step  11 :  [-0.20119260327599758]
step  12 :  [-0.0583846903557997]
step  13 :  [-0.03050902220607058]
step  14 :  [-0.05538300299534258]
step  15 :  [-0.030158233222097264]
step  16 :  [-0.023126923149704826]
step  17 :  [-0.022561026819252716]
step  18 :  [-0.05632880565770891]
step  19 :  [-0.05068433780875019]
step  20 :  [-0.006553891201137388]
step  21 :  [-0.02266180830466]
step  22 :  [-0.03877253792872347]
step  23 :  [-0.02319637903109918]
step  24 :  [-0.03215757188535211]
episode  70 : steps 25 , return [-12.65]
step  0 :  [-1.6679609992685411]
step  1 :  [-1.6376605436166103]
step  2 :  [-1.6040765781196653]
step  3 :  [-1.5350750909545379]
step  4 :  [-1.436454674043169]
step  5 :  [-1.3141631824443936]
step  6 :  [-1.1735807628572297]
step  7 :  [-1.0209769056624278]
step  8 :  [-0.8617656703902432]
step  9 :  [-0.6969260828069086]
step  10 :  [-0.5288773364581092]
step  11 :  [-0.36314069456793235]
step  12 :  [-0.22860550237550026]
step  13 :  [-0.10640506966547038]
step  14 :  [-0.04366727588630222]
step  15 :  [-0.038988174521311404]
step  16 :  [-0.01748252280369324]
step  17 :  [-0.0058415046898664886]
step  18 :  [-0.04464511895310538]
step  19 :  [-0.02557629329669965]
step  20 :  [-0.06132993568615213]
step  21 :  [-0.03825646856621244]
step  22 :  [-0.07081718164400089]
step  23 :  [-0.0454378977216955]
step  24 :  [-0.05094057147727483]
episode  71 : steps 25 , return [-14.62]
step  0 :  [-1.7359730801473325]
step  1 :  [-1.7101882047462282]
step  2 :  [-1.6450060215514422]
step  3 :  [-1.5869899995279513]
step  4 :  [-1.4973750155200813]
step  5 :  [-1.3821812502611948]
step  6 :  [-1.2468655193835878]
step  7 :  [-1.0960123324903626]
step  8 :  [-0.9332112074151049]
step  9 :  [-0.7613144756183357]
step  10 :  [-0.5825315755371713]
step  11 :  [-0.39858035063174113]
step  12 :  [-0.21090495412121663]
step  13 :  [-0.1200967122194035]
step  14 :  [-0.1015507691823137]
step  15 :  [-0.03851606378024047]
step  16 :  [-0.040177699557437586]
step  17 :  [-0.011097922392824266]
step  18 :  [-0.007104793118345508]
step  19 :  [-0.04823451368997768]
step  20 :  [-0.04103923462133602]
step  21 :  [-0.03297555184177175]
step  22 :  [-0.01911691079494629]
step  23 :  [-0.04390869101496169]
step  24 :  [-0.02210354664574301]
episode  72 : steps 25 , return [-15.31]
step  0 :  [-1.7550672566481103]
step  1 :  [-1.725234061803396]
step  2 :  [-1.6919565419916531]
step  3 :  [-1.6621540287877699]
step  4 :  [-1.5972733084095485]
step  5 :  [-1.5024883260372293]
step  6 :  [-1.383546265075031]
step  7 :  [-1.2456356956373382]
step  8 :  [-1.0930944051655471]
step  9 :  [-0.9294373883642251]
step  10 :  [-0.7575140719370983]
step  11 :  [-0.5797713527883542]
step  12 :  [-0.39886587618588765]
step  13 :  [-0.22069435765369994]
step  14 :  [-0.07539399613834954]
step  15 :  [-0.013036523723108874]
step  16 :  [-0.017091561833029963]
step  17 :  [-0.025868250143952415]
step  18 :  [-0.0478233482842192]
step  19 :  [-0.027314779248736206]
step  20 :  [-0.04536274317424396]
step  21 :  [-0.05867085110932644]
step  22 :  [-0.05963124700220132]
step  23 :  [-0.03416168195010265]
step  24 :  [-0.028064006803681735]
episode  73 : steps 25 , return [-16.98]
step  0 :  [-1.6988803346302201]
step  1 :  [-1.6631272295446637]
step  2 :  [-1.6219247440859024]
step  3 :  [-1.582749203418797]
step  4 :  [-1.511487573275567]
step  5 :  [-1.4121528349832901]
step  6 :  [-1.2898101194604976]
step  7 :  [-1.14922095476479]
step  8 :  [-0.9936663292283164]
step  9 :  [-0.8277213839927627]
step  10 :  [-0.6537578671959958]
step  11 :  [-0.47373029881002515]
step  12 :  [-0.2894119840923064]
step  13 :  [-0.15122893134609422]
step  14 :  [-0.04591274544206403]
step  15 :  [-0.04701097253738064]
step  16 :  [-0.07289129259967703]
step  17 :  [-0.055878150978829776]
step  18 :  [-0.007588383533652741]
step  19 :  [-0.02041781220530013]
step  20 :  [-0.03010962184938204]
step  21 :  [-0.051605253819337546]
step  22 :  [-0.06977414237190842]
step  23 :  [-0.03942656134836329]
step  24 :  [-0.06631656447963277]
episode  74 : steps 25 , return [-15.83]
step  0 :  [-1.571956359850666]
step  1 :  [-1.546062246691905]
step  2 :  [-1.518915687967641]
step  3 :  [-1.4546098694681673]
step  4 :  [-1.3594192778001823]
step  5 :  [-1.239626139868592]
step  6 :  [-1.1006621567493633]
step  7 :  [-0.946949993719852]
step  8 :  [-0.7819873037228411]
step  9 :  [-0.6085042035724376]
step  10 :  [-0.42864560419899383]
step  11 :  [-0.2442699505796896]
step  12 :  [-0.10766359233702695]
step  13 :  [-0.07651603415580097]
step  14 :  [-0.033327719945657364]
step  15 :  [-0.06574897756902907]
step  16 :  [-0.05588952728879949]
step  17 :  [-0.01854823915314315]
step  18 :  [-0.035428847995086485]
step  19 :  [-0.011750759914730938]
step  20 :  [-0.07151050481350185]
step  21 :  [-0.07814142161386525]
step  22 :  [-0.04108468596716655]
step  23 :  [-0.01744493239966012]
step  24 :  [-0.03329145409783772]
episode  75 : steps 25 , return [-13.45]
step  0 :  [-1.6461246007081007]
step  1 :  [-1.6147540094544655]
step  2 :  [-1.5797912493949464]
step  3 :  [-1.5099236955761646]
step  4 :  [-1.4107507400948363]
step  5 :  [-1.3298932485128796]
step  6 :  [-1.2232979943801912]
step  7 :  [-1.095668458533794]
step  8 :  [-0.9514397410733773]
step  9 :  [-0.794442526995078]
step  10 :  [-0.6279444944066033]
step  11 :  [-0.4550109921146427]
step  12 :  [-0.2800123567353528]
step  13 :  [-0.13771656037180552]
step  14 :  [-0.0796359341132624]
step  15 :  [-0.05573155690514499]
step  16 :  [-0.014081064934952276]
step  17 :  [-0.039721465038079426]
step  18 :  [-0.0625111969055338]
step  19 :  [-0.05247816437557853]
step  20 :  [-0.015310791520226644]
step  21 :  [-0.03050810036549777]
step  22 :  [-0.057797581309637316]
step  23 :  [-0.052505434219425745]
step  24 :  [-0.01761033748133989]
episode  76 : steps 25 , return [-15.13]
step  0 :  [-1.677204553901373]
step  1 :  [-1.641392743239851]
step  2 :  [-1.6001910248769762]
step  3 :  [-1.5611493061302972]
step  4 :  [-1.4900701010877553]
step  5 :  [-1.3909126617135323]
step  6 :  [-1.2687258507341141]
step  7 :  [-1.128382318508942]
step  8 :  [-0.9736049228704634]
step  9 :  [-0.8079788344344492]
step  10 :  [-0.6340424859295388]
step  11 :  [-0.4537933631215482]
step  12 :  [-0.26883433372987714]
step  13 :  [-0.13524029083513292]
step  14 :  [-0.03180225878225355]
step  15 :  [-0.004634677831824019]
step  16 :  [-0.04933222418174145]
step  17 :  [-0.07408459621020345]
step  18 :  [-0.05852361577836333]
step  19 :  [-0.02532499240490042]
step  20 :  [-0.06129569957551021]
step  21 :  [-0.04870484325599054]
step  22 :  [-0.016758848859465877]
step  23 :  [-0.03075124884200397]
step  24 :  [-0.007478068313902388]
episode  77 : steps 25 , return [-15.44]
step  0 :  [-1.757981782305611]
step  1 :  [-1.7286923409583599]
step  2 :  [-1.6961472916714693]
step  3 :  [-1.6276183470466739]
step  4 :  [-1.529211345254397]
step  5 :  [-1.4495630025362845]
step  6 :  [-1.3435998149600754]
step  7 :  [-1.2162879350676474]
step  8 :  [-1.0721838386358522]
step  9 :  [-0.9151557362936387]
step  10 :  [-0.748420679746315]
step  11 :  [-0.5747743850562962]
step  12 :  [-0.3972358238336697]
step  13 :  [-0.22229204243772932]
step  14 :  [-0.07991223449846739]
step  15 :  [-0.01980061388389501]
step  16 :  [-0.016759322232288335]
step  17 :  [-0.034795980124407364]
step  18 :  [-0.027405930294411695]
step  19 :  [-0.04401302107919322]
step  20 :  [-0.0341339964920575]
step  21 :  [-0.04929361775822226]
step  22 :  [-0.05730837529785327]
step  23 :  [-0.07263811530957032]
step  24 :  [-0.036971706160089844]
episode  78 : steps 25 , return [-16.75]
step  0 :  [-1.496370742388832]
step  1 :  [-1.4654149624112294]
step  2 :  [-1.43170282256898]
step  3 :  [-1.363127750464141]
step  4 :  [-1.2650396213877007]
step  5 :  [-1.1836463527906524]
step  6 :  [-1.081720663225792]
step  7 :  [-0.9598406717703859]
step  8 :  [-0.8219654879573699]
step  9 :  [-0.6722409824982291]
step  10 :  [-0.5152951098854508]
step  11 :  [-0.35845224469981063]
step  12 :  [-0.2232221629919257]
step  13 :  [-0.1351246582272938]
step  14 :  [-0.11636666929759996]
step  15 :  [-0.09253598597568692]
step  16 :  [-0.03334610936741553]
step  17 :  [-0.028956988486853907]
step  18 :  [-0.039784529231946794]
step  19 :  [-0.03265006812752013]
step  20 :  [-0.028014039155562064]
step  21 :  [-0.031446430562908856]
step  22 :  [-0.01847434248352683]
step  23 :  [-0.05681303797818541]
step  24 :  [-0.037089092000433685]
episode  79 : steps 25 , return [-13.49]
step  0 :  [-1.4535083953844348]
step  1 :  [-1.4273829341283077]
step  2 :  [-1.3942753447358522]
step  3 :  [-1.3271617080873026]
step  4 :  [-1.290994933698313]
step  5 :  [-1.2524667131152505]
step  6 :  [-1.190013022464329]
step  7 :  [-1.0962900928992587]
step  8 :  [-0.9779903017063631]
step  9 :  [-0.8408819089510342]
step  10 :  [-0.6898243051464871]
step  11 :  [-0.5291946857114428]
step  12 :  [-0.3642350110381304]
step  13 :  [-0.22789878658506585]
step  14 :  [-0.15220400780059237]
step  15 :  [-0.07664147688244452]
step  16 :  [-0.05319035172364399]
step  17 :  [-0.07603812519284275]
step  18 :  [-0.09300881508984875]
step  19 :  [-0.08271512462612213]
step  20 :  [-0.05109586914943413]
step  21 :  [-0.03060867690493718]
step  22 :  [-0.025566642450544585]
step  23 :  [-0.04771267496144981]
step  24 :  [-0.031643332057418344]
episode  80 : steps 25 , return [-14.78]
step  0 :  [-1.5168877008530977]
step  1 :  [-1.477319911539909]
step  2 :  [-1.4315744088442928]
step  3 :  [-1.3880059460511458]
step  4 :  [-1.3145296886980444]
step  5 :  [-1.2291223086416743]
step  6 :  [-1.1686155993470477]
step  7 :  [-1.0784695091115062]
step  8 :  [-0.9642074093101818]
step  9 :  [-0.831211292907005]
step  10 :  [-0.6844144919825278]
step  11 :  [-0.5287185445770329]
step  12 :  [-0.37088006860296147]
step  13 :  [-0.22879894530866918]
step  14 :  [-0.12697570064192212]
step  15 :  [-0.09849253779282727]
step  16 :  [-0.07394922990286659]
step  17 :  [-0.07916870423901003]
step  18 :  [-0.0569209233729306]
step  19 :  [-0.0406772610824723]
step  20 :  [-0.07744768124898056]
step  21 :  [-0.05880841413742752]
step  22 :  [-0.04533267997357972]
step  23 :  [-0.05613523019714972]
step  24 :  [-0.03926843181884612]
episode  81 : steps 25 , return [-14.97]
step  0 :  [-1.6665312987510674]
step  1 :  [-1.642900506909097]
step  2 :  [-1.6184148883366765]
step  3 :  [-1.5556847349383767]
step  4 :  [-1.4614907982740144]
step  5 :  [-1.342367934124364]
step  6 :  [-1.2038837191529637]
step  7 :  [-1.0505404502372249]
step  8 :  [-0.8858886557921495]
step  9 :  [-0.7127020259463391]
step  10 :  [-0.5331745296820863]
step  11 :  [-0.3492152247393249]
step  12 :  [-0.16380165601188146]
step  13 :  [-0.08082778545562073]
step  14 :  [-0.0020984918276103]
step  15 :  [-0.05456072847360869]
step  16 :  [-0.04844228813529893]
step  17 :  [-0.03772421922390165]
step  18 :  [-0.04154620852189505]
step  19 :  [-0.008186740021230642]
step  20 :  [-0.011405596279509872]
step  21 :  [-0.026901590417732515]
step  22 :  [-0.00554912868983371]
step  23 :  [-0.039270918517083746]
step  24 :  [-0.015085612002765971]
episode  82 : steps 25 , return [-14.56]
step  0 :  [-1.6207774835508069]
step  1 :  [-1.595905056791093]
step  2 :  [-1.5699287047345298]
step  3 :  [-1.5062878662030652]
step  4 :  [-1.4115000638578747]
step  5 :  [-1.291965680211748]
step  6 :  [-1.1531779810356788]
step  7 :  [-0.9995941191026718]
step  8 :  [-0.8347329121648149]
step  9 :  [-0.6613393538405621]
step  10 :  [-0.4815697678530565]
step  11 :  [-0.29726605007889934]
step  12 :  [-0.15895865621789396]
step  13 :  [-0.05367134907154636]
step  14 :  [-0.046921776289832164]
step  15 :  [-0.07536785092381688]
step  16 :  [-0.05511579576503674]
step  17 :  [-0.07996471320279519]
step  18 :  [-0.06087558230276267]
step  19 :  [-0.08310990170639831]
step  20 :  [-0.06437556722789908]
step  21 :  [-0.016178348774832534]
step  22 :  [-0.017667817797396117]
step  23 :  [-0.02547512172386556]
step  24 :  [-0.05631186531757267]
episode  83 : steps 25 , return [-14.22]
step  0 :  [-1.5675828680656252]
step  1 :  [-1.536733477988618]
step  2 :  [-1.5028266136120572]
step  3 :  [-1.4338922720095044]
step  4 :  [-1.3354499542707952]
step  5 :  [-1.2133355768893879]
step  6 :  [-1.109498183231982]
step  7 :  [-0.9857313267257735]
step  8 :  [-0.8457746885713779]
step  9 :  [-0.6934114981482405]
step  10 :  [-0.5324956905366454]
step  11 :  [-0.3681859885948853]
step  12 :  [-0.21427834992940273]
step  13 :  [-0.10029718464938697]
step  14 :  [-0.06930231457430476]
step  15 :  [-0.0461038080422668]
step  16 :  [-0.05828064536300192]
step  17 :  [-0.047405019206365875]
step  18 :  [-0.05709645135010698]
step  19 :  [-0.05050088398975926]
step  20 :  [-0.038144523804718604]
step  21 :  [-0.03265486013905947]
step  22 :  [-0.06042794210862482]
step  23 :  [-0.08754172076476371]
step  24 :  [-0.08401382325920254]
episode  84 : steps 25 , return [-14.07]
step  0 :  [-1.7402193917209594]
step  1 :  [-1.7018828298641853]
step  2 :  [-1.656960452549041]
step  3 :  [-1.6129488877757197]
step  4 :  [-1.538195340367781]
step  5 :  [-1.436331995827761]
step  6 :  [-1.31216226989515]
step  7 :  [-1.173699047123243]
step  8 :  [-1.023345985802202]
step  9 :  [-0.8667118084287969]
step  10 :  [-0.704662023768757]
step  11 :  [-0.5398098900204176]
step  12 :  [-0.37830505510371004]
step  13 :  [-0.2467636873271372]
step  14 :  [-0.12449647756503893]
step  15 :  [-0.06815253135614605]
step  16 :  [-0.06426917079304709]
step  17 :  [-0.021318583478317]
step  18 :  [-0.025759941638491633]
step  19 :  [-0.02387393049807817]
step  20 :  [-0.010208120214330348]
step  21 :  [-0.03764629724190742]
step  22 :  [-0.01515308018793187]
step  23 :  [-0.04627493071366759]
step  24 :  [-0.020961756135215958]
episode  85 : steps 25 , return [-16.39]
step  0 :  [-1.4869505044952518]
step  1 :  [-1.4707530705365097]
step  2 :  [-1.4435428089839901]
step  3 :  [-1.4148239824799793]
step  4 :  [-1.352822929514389]
step  5 :  [-1.261040969769178]
step  6 :  [-1.1814955486694336]
step  7 :  [-1.0778432016720367]
step  8 :  [-0.9535786349137632]
step  9 :  [-0.8131202506276212]
step  10 :  [-0.660701064475594]
step  11 :  [-0.5007604552086625]
step  12 :  [-0.34008443466064653]
step  13 :  [-0.20000572755014517]
step  14 :  [-0.1141722171405]
step  15 :  [-0.10363025235155746]
step  16 :  [-0.07947288353985127]
step  17 :  [-0.04140757285345269]
step  18 :  [-0.03536811897503685]
step  19 :  [-0.01985614051777091]
step  20 :  [-0.08101703375298734]
step  21 :  [-0.1000534849907582]
step  22 :  [-0.11543088447105417]
step  23 :  [-0.10249462636272436]
step  24 :  [-0.07293774934170143]
episode  86 : steps 25 , return [-15.02]
step  0 :  [-1.6286029809673717]
step  1 :  [-1.5901023999267827]
step  2 :  [-1.5453665787738626]
step  3 :  [-1.5022652273153274]
step  4 :  [-1.4285834658967698]
step  5 :  [-1.3276873822651316]
step  6 :  [-1.20430063082634]
step  7 :  [-1.088500452639954]
step  8 :  [-0.9566425725652814]
step  9 :  [-0.8115808070799896]
step  10 :  [-0.6567156042848263]
step  11 :  [-0.49627549183718744]
step  12 :  [-0.33789050267634557]
step  13 :  [-0.20674278592099232]
step  14 :  [-0.08235170065562755]
step  15 :  [-0.04031481631538446]
step  16 :  [-0.03769520165045154]
step  17 :  [-0.0461402986192426]
step  18 :  [-0.03441401974065078]
step  19 :  [-0.05319018069829]
step  20 :  [-0.04950745811561926]
step  21 :  [-0.02809536602082645]
step  22 :  [-0.056392438750163205]
step  23 :  [-0.038828822942334716]
step  24 :  [-0.0298498255385291]
episode  87 : steps 25 , return [-15.28]
step  0 :  [-1.4192535235256214]
step  1 :  [-1.389415051195884]
step  2 :  [-1.3559731539889985]
step  3 :  [-1.2880728524860452]
step  4 :  [-1.2326551395579328]
step  5 :  [-1.2052929566905983]
step  6 :  [-1.1448488957592866]
step  7 :  [-1.0531518827234596]
step  8 :  [-0.9369222752893538]
step  9 :  [-0.8020974625854096]
step  10 :  [-0.6539041086773816]
step  11 :  [-0.4975827116541897]
step  12 :  [-0.3409670543326987]
step  13 :  [-0.20864758808921197]
step  14 :  [-0.08365759058576522]
step  15 :  [-0.029256189558475247]
step  16 :  [-0.022589887183514082]
step  17 :  [-0.034144897291053]
step  18 :  [-0.02699775665545917]
step  19 :  [-0.04108093636566624]
step  20 :  [-0.08136348624704778]
step  21 :  [-0.09213373643394775]
step  22 :  [-0.06678510330780552]
step  23 :  [-0.048116485211337094]
step  24 :  [-0.01927020669017329]
episode  88 : steps 25 , return [-14.07]
step  0 :  [-1.7559450854188747]
step  1 :  [-1.7256162590207376]
step  2 :  [-1.691657752736723]
step  3 :  [-1.6610207966165678]
step  4 :  [-1.5955411360051994]
step  5 :  [-1.5003062559987612]
step  6 :  [-1.381008050871896]
step  7 :  [-1.242796983554205]
step  8 :  [-1.0899806784286243]
step  9 :  [-0.9260441795333524]
step  10 :  [-0.7537965635192267]
step  11 :  [-0.5756096208805874]
step  12 :  [-0.39394755203234005]
step  13 :  [-0.2139862605661239]
step  14 :  [-0.067182374088555]
step  15 :  [-0.0025220540501297494]
step  16 :  [-0.02413082621842082]
step  17 :  [-0.017092234342812148]
step  18 :  [-0.0447645125136021]
step  19 :  [-0.06511921203298247]
step  20 :  [-0.047446283277321276]
step  21 :  [-0.023692851812337695]
step  22 :  [-0.020620706083341097]
step  23 :  [-0.011817040348325073]
step  24 :  [-0.05342094309749299]
episode  89 : steps 25 , return [-16.89]
step  0 :  [-1.628280747203537]
step  1 :  [-1.6025713324575837]
step  2 :  [-1.575423423911576]
step  3 :  [-1.5109412705665564]
step  4 :  [-1.4155309507383538]
step  5 :  [-1.2955207203625159]
step  6 :  [-1.156355196477214]
step  7 :  [-1.0024557954396829]
step  8 :  [-0.8373103599499152]
step  9 :  [-0.6636275452065902]
step  10 :  [-0.4834973980179237]
step  11 :  [-0.2985559708818553]
step  12 :  [-0.11042842164264463]
step  13 :  [-0.024882216853174304]
step  14 :  [-0.058384691500511905]
step  15 :  [-0.08253759504011869]
step  16 :  [-0.06658120734368715]
step  17 :  [-0.02259370067063612]
step  18 :  [-0.019180149040842063]
step  19 :  [-0.055625902109056685]
step  20 :  [-0.08017265827620826]
step  21 :  [-0.0698592429398457]
step  22 :  [-0.03731550645324616]
step  23 :  [-0.06493118346803106]
step  24 :  [-0.042650476894108856]
episode  90 : steps 25 , return [-14.21]
step  0 :  [-1.6924413994546388]
step  1 :  [-1.662470483372813]
step  2 :  [-1.6292406454424024]
step  3 :  [-1.5604133924571437]
step  4 :  [-1.4618807048391835]
step  5 :  [-1.3821664606981519]
step  6 :  [-1.2763225816973118]
step  7 :  [-1.149224111548984]
step  8 :  [-1.005402234309669]
step  9 :  [-0.8487446138948587]
step  10 :  [-0.6825485140943438]
step  11 :  [-0.5098488414759625]
step  12 :  [-0.33457081178306186]
step  13 :  [-0.16928085152679273]
step  14 :  [-0.05962451813973129]
step  15 :  [-0.06577396350219249]
step  16 :  [-0.05107527145391197]
step  17 :  [-0.05685634405512122]
step  18 :  [-0.040554823808308035]
step  19 :  [-0.017389639048122175]
step  20 :  [-0.060261045993549055]
step  21 :  [-0.06261871572491791]
step  22 :  [-0.029680896728760474]
step  23 :  [-0.058841635842318975]
step  24 :  [-0.09378806246064665]
episode  91 : steps 25 , return [-15.96]
step  0 :  [-1.7063394057562251]
step  1 :  [-1.6728725435205059]
step  2 :  [-1.6347924565867138]
step  3 :  [-1.599409840166378]
step  4 :  [-1.5307703836655993]
step  5 :  [-1.4333134842979522]
step  6 :  [-1.3123632495846682]
step  7 :  [-1.172845320379382]
step  8 :  [-1.0189132417935176]
step  9 :  [-0.8539240172737611]
step  10 :  [-0.680542384772096]
step  11 :  [-0.5009032093248645]
step  12 :  [-0.31691111158983537]
step  13 :  [-0.13208745870310287]
step  14 :  [-0.016443339257955568]
step  15 :  [-0.0816364988758575]
step  16 :  [-0.09078921623423593]
step  17 :  [-0.06647190362021797]
step  18 :  [-0.010844166637163994]
step  19 :  [-0.013830928093739467]
step  20 :  [-0.03729805380224613]
step  21 :  [-0.03317654047217559]
step  22 :  [-0.012305895344616829]
step  23 :  [-0.011189645971654559]
step  24 :  [-0.035077519751543475]
episode  92 : steps 25 , return [-15.98]
step  0 :  [-1.771588236026495]
step  1 :  [-1.7387104626948626]
step  2 :  [-1.7012034758095471]
step  3 :  [-1.6661437517655218]
step  4 :  [-1.5974734552713787]
step  5 :  [-1.4998547763432226]
step  6 :  [-1.3787012753015617]
step  7 :  [-1.2389719454302266]
step  8 :  [-1.0848279603789726]
step  9 :  [-0.9196186538864395]
step  10 :  [-0.7459837999376023]
step  11 :  [-0.5659922770432416]
step  12 :  [-0.3813148206140902]
step  13 :  [-0.19369400852481736]
step  14 :  [-0.10490494541627406]
step  15 :  [-0.03590447251192112]
step  16 :  [-0.019479038699648673]
step  17 :  [-0.01392302907924395]
step  18 :  [-0.02981834625588326]
step  19 :  [-0.012672261460329124]
step  20 :  [-0.012203562728285463]
step  21 :  [-0.038671867501268054]
step  22 :  [-0.023359142862390204]
step  23 :  [-0.03004632168568133]
step  24 :  [-0.020041742012735585]
episode  93 : steps 25 , return [-16.83]
step  0 :  [-1.3925695889711198]
step  1 :  [-1.3954343636656659]
step  2 :  [-1.390186842578898]
step  3 :  [-1.3434361089637736]
step  4 :  [-1.2618510817444182]
step  5 :  [-1.1538459557360896]
step  6 :  [-1.023888061528144]
step  7 :  [-0.8770354286001836]
step  8 :  [-0.7173082340150851]
step  9 :  [-0.5478695492214429]
step  10 :  [-0.37128208953195796]
step  11 :  [-0.19024334968498438]
step  12 :  [-0.05239521461976144]
step  13 :  [-0.04566513880593146]
step  14 :  [-0.07044387891001104]
step  15 :  [-0.04143824744697309]
step  16 :  [-0.03163050935296338]
step  17 :  [-0.07696270743470453]
step  18 :  [-0.0885725799713832]
step  19 :  [-0.05477547231590051]
step  20 :  [-0.04818295191398191]
step  21 :  [-0.01899184137858864]
step  22 :  [-0.04982581690542556]
step  23 :  [-0.05020495809195973]
step  24 :  [-0.05049252670883048]
episode  94 : steps 25 , return [-12.34]
step  0 :  [-1.4356277946804432]
step  1 :  [-1.4012846330785835]
step  2 :  [-1.3631452349719433]
step  3 :  [-1.3295830744284687]
step  4 :  [-1.263684401828203]
step  5 :  [-1.18003685138336]
step  6 :  [-1.0709593646061115]
step  7 :  [-0.9416467333296126]
step  8 :  [-0.7968491140724625]
step  9 :  [-0.6408600666684962]
step  10 :  [-0.4781401858241859]
step  11 :  [-0.3159151473331722]
step  12 :  [-0.18061619764013198]
step  13 :  [-0.05488418583682805]
step  14 :  [-0.04686049251669147]
step  15 :  [-0.03408391847787643]
step  16 :  [-0.022030668163372274]
step  17 :  [-0.020919572083390462]
step  18 :  [-0.025127533811686704]
step  19 :  [-0.0748725094530108]
step  20 :  [-0.0864619217464362]
step  21 :  [-0.12055533661722323]
step  22 :  [-0.11621030766581025]
step  23 :  [-0.07769499208913469]
step  24 :  [-0.07938593336934]
episode  95 : steps 25 , return [-13.16]
step  0 :  [-1.533835907271145]
step  1 :  [-1.4915077999100068]
step  2 :  [-1.4418264701280845]
step  3 :  [-1.393214093808125]
step  4 :  [-1.3161993099305669]
step  5 :  [-1.2392754762035463]
step  6 :  [-1.2206202772090249]
step  7 :  [-1.2072908396204878]
step  8 :  [-1.152145780044343]
step  9 :  [-1.0635358382683406]
step  10 :  [-0.9490219779888239]
step  11 :  [-0.8149573617340973]
step  12 :  [-0.6666974616106333]
step  13 :  [-0.509269929926825]
step  14 :  [-0.3494263281961969]
step  15 :  [-0.20619159609325502]
step  16 :  [-0.10980620013680051]
step  17 :  [-0.09112493743112803]
step  18 :  [-0.06461870144305566]
step  19 :  [-0.04186194609853144]
step  20 :  [-0.027259402376252857]
step  21 :  [-0.04012596833176256]
step  22 :  [-0.03452158429659349]
step  23 :  [-0.06334038916237743]
step  24 :  [-0.0942972287776017]
episode  96 : steps 25 , return [-17.12]
step  0 :  [-1.700070401320006]
step  1 :  [-1.6682181924313408]
step  2 :  [-1.6323803441095535]
step  3 :  [-1.5997812643227916]
step  4 :  [-1.5331349646600358]
step  5 :  [-1.4371602746028447]
step  6 :  [-1.317361820016364]
step  7 :  [-1.1787887383547537]
step  8 :  [-1.0256898452774652]
step  9 :  [-0.8615135190624896]
step  10 :  [-0.689046409361805]
step  11 :  [-0.5106629308473913]
step  12 :  [-0.32898215515567375]
step  13 :  [-0.1514645688092909]
step  14 :  [-0.0268604304217816]
step  15 :  [-0.06386169401127195]
step  16 :  [-0.06421598066819768]
step  17 :  [-0.04966500785089344]
step  18 :  [-0.05284928698204652]
step  19 :  [-0.04199708482742447]
step  20 :  [-0.04646670460349727]
step  21 :  [-0.037853103682706675]
step  22 :  [-0.04288180018805383]
step  23 :  [-0.035596671526619696]
step  24 :  [-0.040867459185712676]
episode  97 : steps 25 , return [-16.14]
step  0 :  [-1.4826578941075843]
step  1 :  [-1.4482361947956985]
step  2 :  [-1.4098086012008637]
step  3 :  [-1.3755713287318032]
step  4 :  [-1.308830756118633]
step  5 :  [-1.2133966053707321]
step  6 :  [-1.0944205032897665]
step  7 :  [-0.9568457270923659]
step  8 :  [-0.8049599848289033]
step  9 :  [-0.642414573049726]
step  10 :  [-0.47258955217020265]
step  11 :  [-0.3000312922572915]
step  12 :  [-0.14185747215875125]
step  13 :  [-0.06772432500062905]
step  14 :  [-0.09450025072703111]
step  15 :  [-0.08169925447296231]
step  16 :  [-0.029733286038372886]
step  17 :  [-0.02699162431577368]
step  18 :  [-0.05040993694199038]
step  19 :  [-0.1259521265089719]
step  20 :  [-0.18087067155984127]
step  21 :  [-0.17766745945297135]
step  22 :  [-0.13334705656797874]
step  23 :  [-0.08013518306908941]
step  24 :  [-0.0704297539924611]
episode  98 : steps 25 , return [-13.77]
step  0 :  [-1.431717118989445]
step  1 :  [-1.3991745747221391]
step  2 :  [-1.3636128410442487]
step  3 :  [-1.294013709016588]
step  4 :  [-1.2732744647398655]
step  5 :  [-1.2214551393838666]
step  6 :  [-1.136808144093094]
step  7 :  [-1.026042704316012]
step  8 :  [-0.8952050060957993]
step  9 :  [-0.7495240544154222]
step  10 :  [-0.59379494449552]
step  11 :  [-0.43362451394064155]
step  12 :  [-0.2804718874595238]
step  13 :  [-0.1549013549316056]
step  14 :  [-0.10256550889446925]
step  15 :  [-0.08878297393590558]
step  16 :  [-0.1209903343327495]
step  17 :  [-0.10444172666341262]
step  18 :  [-0.07489431244764636]
step  19 :  [-0.07846244908008554]
step  20 :  [-0.03152418060051237]
step  21 :  [-0.045852624108488546]
step  22 :  [-0.007772026707390853]
step  23 :  [-0.027522071831677035]
step  24 :  [-0.06828201750988007]
episode  99 : steps 25 , return [-14.]
step  0 :  [-1.3962890046594731]
step  1 :  [-1.367603105405408]
step  2 :  [-1.3375556517973572]
step  3 :  [-1.2718768048093287]
step  4 :  [-1.208211033386325]
step  5 :  [-1.119434873946696]
step  6 :  [-1.0058156514166385]
step  7 :  [-0.8727623322944004]
step  8 :  [-0.725063663611388]
step  9 :  [-0.5670941321216594]
step  10 :  [-0.40385326766390567]
step  11 :  [-0.24591738796456136]
step  12 :  [-0.11831854017875969]
step  13 :  [-0.06744034488939839]
step  14 :  [-0.0530867240195955]
step  15 :  [-0.026088423219587247]
step  16 :  [-0.016441795252168843]
step  17 :  [-0.058520943642767054]
step  18 :  [-0.04908406258007021]
step  19 :  [-0.04800959919438081]
step  20 :  [-0.07637315004994913]
step  21 :  [-0.08673778319773837]
step  22 :  [-0.06535862508323866]
step  23 :  [-0.03775035524799534]
step  24 :  [-0.03145182840667382]
episode  100 : steps 25 , return [-12.26]
step  0 :  [-1.6404522533757853]
step  1 :  [-1.614251920705417]
step  2 :  [-1.5863831985915853]
step  3 :  [-1.5213638775748286]
step  4 :  [-1.425548801846007]
step  5 :  [-1.3052284490248427]
step  6 :  [-1.1658204017651677]
step  7 :  [-1.0117262376744227]
step  8 :  [-0.84641802755509]
step  9 :  [-0.6725892720289367]
step  10 :  [-0.49230847350157586]
step  11 :  [-0.3071546738485168]
step  12 :  [-0.11833719587839427]
step  13 :  [-0.02712871991145332]
step  14 :  [-0.011383939780362952]
step  15 :  [-0.04540505227897659]
step  16 :  [-0.024690273384452788]
step  17 :  [-0.03587661321211755]
step  18 :  [-0.02380218574606595]
step  19 :  [-0.033374074509114324]
step  20 :  [-0.01216019772050817]
step  21 :  [-0.048436572905941624]
step  22 :  [-0.03467525277427126]
step  23 :  [-0.03307307609036009]
step  24 :  [-0.05915128692785117]
episode  101 : steps 25 , return [-14.1]
step  0 :  [-1.5363949642069805]
step  1 :  [-1.500231046430131]
step  2 :  [-1.4541101421778466]
step  3 :  [-1.4069337795863988]
step  4 :  [-1.3666235764417765]
step  5 :  [-1.2976330392231963]
step  6 :  [-1.215020979541092]
step  7 :  [-1.1102296198823762]
step  8 :  [-0.9846181614931498]
step  9 :  [-0.8427169036371627]
step  10 :  [-0.6886807430675628]
step  11 :  [-0.5266000432453345]
step  12 :  [-0.3620504963002124]
step  13 :  [-0.2258481535766985]
step  14 :  [-0.10857571071428813]
step  15 :  [-0.033846016113863835]
step  16 :  [-0.027707274215206062]
step  17 :  [-0.050443580337060354]
step  18 :  [-0.0351582392873082]
step  19 :  [-0.06980994256301154]
step  20 :  [-0.05400784033547329]
step  21 :  [-0.06669393371698173]
step  22 :  [-0.0483343679478996]
step  23 :  [-0.08123714368212417]
step  24 :  [-0.06248416881215799]
episode  102 : steps 25 , return [-15.16]
step  0 :  [-1.672582579297021]
step  1 :  [-1.6332863631165513]
step  2 :  [-1.5872763916167683]
step  3 :  [-1.5423151402423723]
step  4 :  [-1.5052795614016583]
step  5 :  [-1.437574005575263]
step  6 :  [-1.3421095861044479]
step  7 :  [-1.2235713133542716]
step  8 :  [-1.0866738401624512]
step  9 :  [-0.9356035547371885]
step  10 :  [-0.773968687217077]
step  11 :  [-0.6050614966297301]
step  12 :  [-0.43271117437505374]
step  13 :  [-0.2651116508501457]
step  14 :  [-0.12781859989470262]
step  15 :  [-0.06886347063877796]
step  16 :  [-0.058678957369267336]
step  17 :  [-0.08620508796879763]
step  18 :  [-0.09131735009686778]
step  19 :  [-0.06339118444747045]
step  20 :  [-0.035289923698706475]
step  21 :  [-0.07043224171557257]
step  22 :  [-0.053924599661460654]
step  23 :  [-0.08495417585400043]
step  24 :  [-0.06938415322240253]
episode  103 : steps 25 , return [-16.85]
step  0 :  [-1.5085101932072191]
step  1 :  [-1.4665484796317303]
step  2 :  [-1.4174924934828201]
step  3 :  [-1.3698519175073585]
step  4 :  [-1.2936340310751273]
step  5 :  [-1.235676143058627]
step  6 :  [-1.226761779354959]
step  7 :  [-1.1960263828474667]
step  8 :  [-1.1271137582504502]
step  9 :  [-1.0279692778363936]
step  10 :  [-0.9056052642005534]
step  11 :  [-0.7659275618907132]
step  12 :  [-0.6140869215819965]
step  13 :  [-0.4554787085061168]
step  14 :  [-0.2993875282750248]
step  15 :  [-0.17978174611298117]
step  16 :  [-0.1358463241378585]
step  17 :  [-0.14494349671248388]
step  18 :  [-0.12236883519783323]
step  19 :  [-0.06498364208483337]
step  20 :  [-0.0617734332878744]
step  21 :  [-0.022783324214207364]
step  22 :  [-0.07710893953153759]
step  23 :  [-0.08911610168052213]
step  24 :  [-0.04855398707010515]
episode  104 : steps 25 , return [-16.86]
step  0 :  [-1.772578697390281]
step  1 :  [-1.7422377536528293]
step  2 :  [-1.7082030944367717]
step  3 :  [-1.6386405218502056]
step  4 :  [-1.5799865244876965]
step  5 :  [-1.4910600608998859]
step  6 :  [-1.3770817508780198]
step  7 :  [-1.2431526917579179]
step  8 :  [-1.0936826668020982]
step  9 :  [-0.9322952224923448]
step  10 :  [-0.7619212469776933]
step  11 :  [-0.5849971567885099]
step  12 :  [-0.4038917090810055]
step  13 :  [-0.22285303658186298]
step  14 :  [-0.14315441025595338]
step  15 :  [-0.061438688958851115]
step  16 :  [-0.05119300375651335]
step  17 :  [-0.05536313598940848]
step  18 :  [-0.04149519869911402]
step  19 :  [-0.03861388102847911]
step  20 :  [-0.02745781216719445]
step  21 :  [-0.00789969117063947]
step  22 :  [-0.048856885793416835]
step  23 :  [-0.06695893098116651]
step  24 :  [-0.04746551710074193]
episode  105 : steps 25 , return [-17.14]
step  0 :  [-1.612877808596972]
step  1 :  [-1.572372305525494]
step  2 :  [-1.5249098569639417]
step  3 :  [-1.4785219622027155]
step  4 :  [-1.4026586498155185]
step  5 :  [-1.3002821068650057]
step  6 :  [-1.2018226035016342]
step  7 :  [-1.1262094494130541]
step  8 :  [-1.0267475801961456]
step  9 :  [-0.9071654331595995]
step  10 :  [-0.7720013572900986]
step  11 :  [-0.6261787499053151]
step  12 :  [-0.4759558165274726]
step  13 :  [-0.33331621694363583]
step  14 :  [-0.21469221707023808]
step  15 :  [-0.09898571602041285]
step  16 :  [-0.037496043016259924]
step  17 :  [-0.044123295952161815]
step  18 :  [-0.021197375719702708]
step  19 :  [-0.03911369337936933]
step  20 :  [-0.04951697991922742]
step  21 :  [-0.02306028384609319]
step  22 :  [-0.026551473930731363]
step  23 :  [-0.015518404847125388]
step  24 :  [-0.027029472205549857]
episode  106 : steps 25 , return [-15.96]
step  0 :  [-1.5838738752042074]
step  1 :  [-1.540779976183319]
step  2 :  [-1.4898168537785454]
step  3 :  [-1.4392460716637712]
step  4 :  [-1.3965268305396863]
step  5 :  [-1.3253498870069775]
step  6 :  [-1.2276168343558294]
step  7 :  [-1.1084507877859804]
step  8 :  [-0.9712098336574373]
step  9 :  [-0.8199096723109511]
step  10 :  [-0.6581018165519014]
step  11 :  [-0.4891895033859848]
step  12 :  [-0.31787551819271626]
step  13 :  [-0.177925457522748]
step  14 :  [-0.10452414756530244]
step  15 :  [-0.047347200732556896]
step  16 :  [-0.026356102172329792]
step  17 :  [-0.0289479265504906]
step  18 :  [-0.07291674799352048]
step  19 :  [-0.08890579733385416]
step  20 :  [-0.10672358543833764]
step  21 :  [-0.12548742872252547]
step  22 :  [-0.10206484596728198]
step  23 :  [-0.0611532435867629]
step  24 :  [-0.06725857229534819]
episode  107 : steps 25 , return [-15.38]
step  0 :  [-1.7252043545691538]
step  1 :  [-1.6916367015089464]
step  2 :  [-1.6533479262283755]
step  3 :  [-1.6175966809385802]
step  4 :  [-1.548621453253144]
step  5 :  [-1.4508783639798046]
step  6 :  [-1.3296871514181225]
step  7 :  [-1.1899630149452185]
step  8 :  [-1.0358470149050045]
step  9 :  [-0.8706810185551056]
step  10 :  [-0.6971068965702282]
step  11 :  [-0.5172111536818007]
step  12 :  [-0.3327402272896953]
step  13 :  [-0.1460587166052973]
step  14 :  [-0.06174025399133705]
step  15 :  [-0.0503389474392485]
step  16 :  [-0.08047156605120431]
step  17 :  [-0.063471254156267]
step  18 :  [-0.029302443702818388]
step  19 :  [-0.01847241316819451]
step  20 :  [-0.031005648089465158]
step  21 :  [-0.010105898616878242]
step  22 :  [-0.04529173464125712]
step  23 :  [-0.02341483705900169]
step  24 :  [-0.06367311843630763]
episode  108 : steps 25 , return [-16.28]
step  0 :  [-1.601194527960289]
step  1 :  [-1.5698722338073061]
step  2 :  [-1.5351658386794564]
step  3 :  [-1.465594574777709]
step  4 :  [-1.4076220948142926]
step  5 :  [-1.3197582985323952]
step  6 :  [-1.2069575096002045]
step  7 :  [-1.074260044712861]
step  8 :  [-0.9261231273327866]
step  9 :  [-0.7663222347257993]
step  10 :  [-0.5981472561626537]
step  11 :  [-0.42504039227793394]
step  12 :  [-0.2534723606809188]
step  13 :  [-0.12079188970378292]
step  14 :  [-0.1283747150181753]
step  15 :  [-0.13738549598578975]
step  16 :  [-0.12353031290117521]
step  17 :  [-0.06922966587421281]
step  18 :  [-0.03102180380127637]
step  19 :  [-0.03167692583953122]
step  20 :  [-0.01952601976086752]
step  21 :  [-0.05269940527290765]
step  22 :  [-0.04744608126074303]
step  23 :  [-0.07078593305114357]
step  24 :  [-0.06322964334185836]
episode  109 : steps 25 , return [-15.05]
step  0 :  [-1.81101230748281]
step  1 :  [-1.7736118990298655]
step  2 :  [-1.729747470747592]
step  3 :  [-1.6866590247939293]
step  4 :  [-1.6506665644935612]
step  5 :  [-1.582929408593847]
step  6 :  [-1.4869815480575732]
step  7 :  [-1.3677498479931633]
step  8 :  [-1.2300164173058774]
step  9 :  [-1.0779307711089683]
step  10 :  [-0.9149499100338258]
step  11 :  [-0.7439750093007216]
step  12 :  [-0.5676780239041063]
step  13 :  [-0.38944619064771385]
step  14 :  [-0.2184119074678837]
step  15 :  [-0.08365331268680784]
step  16 :  [-0.03990056591910967]
step  17 :  [-0.0141723208399857]
step  18 :  [-0.04533372108913127]
step  19 :  [-0.02010227894947608]
step  20 :  [-0.05027141679908609]
step  21 :  [-0.02524761295045794]
step  22 :  [-0.05347615864367616]
step  23 :  [-0.028396349319668925]
step  24 :  [-0.05538866154228709]
episode  110 : steps 25 , return [-18.65]
step  0 :  [-1.666092913052003]
step  1 :  [-1.6371027575628494]
step  2 :  [-1.6053197689765573]
step  3 :  [-1.5778775094795177]
step  4 :  [-1.515070382646848]
step  5 :  [-1.4220753333830982]
step  6 :  [-1.3047184395581775]
step  7 :  [-1.168291526286098]
step  8 :  [-1.017259581257117]
step  9 :  [-0.8553209424632072]
step  10 :  [-0.6856574457431754]
step  11 :  [-0.5114948584484947]
step  12 :  [-0.3379956857996176]
step  13 :  [-0.1940537968405704]
step  14 :  [-0.13161706269747073]
step  15 :  [-0.11301188067633386]
step  16 :  [-0.07005673363840405]
step  17 :  [-0.08163825251776875]
step  18 :  [-0.048612330140827206]
step  19 :  [-0.07567336268248796]
step  20 :  [-0.048333748015386126]
step  21 :  [-0.03834380005088958]
step  22 :  [-0.08468216683081058]
step  23 :  [-0.09068690128659436]
step  24 :  [-0.054753910636866174]
episode  111 : steps 25 , return [-16.34]
step  0 :  [-1.4417364050477226]
step  1 :  [-1.4101269798921015]
step  2 :  [-1.375799128417187]
step  3 :  [-1.3069977106672022]
step  4 :  [-1.2295391284283428]
step  5 :  [-1.1762826385302312]
step  6 :  [-1.091823372000612]
step  7 :  [-0.9819989007640187]
step  8 :  [-0.8523546434966885]
step  9 :  [-0.7079603809185401]
step  10 :  [-0.5537086737039404]
step  11 :  [-0.3958252382267145]
step  12 :  [-0.24889363700382539]
step  13 :  [-0.1348195366443522]
step  14 :  [-0.09390384033535779]
step  15 :  [-0.04024756341195294]
step  16 :  [-0.0647194892991836]
step  17 :  [-0.036553420108646394]
step  18 :  [-0.03984528788387529]
step  19 :  [-0.10971908724528212]
step  20 :  [-0.12659467199584315]
step  21 :  [-0.10483186989034408]
step  22 :  [-0.06935630784608839]
step  23 :  [-0.06522396236769941]
step  24 :  [-0.013252792811402327]
episode  112 : steps 25 , return [-13.67]
step  0 :  [-1.5922515827559243]
step  1 :  [-1.5546426980378178]
step  2 :  [-1.5112933568265563]
step  3 :  [-1.4701547548466896]
step  4 :  [-1.3979930606028297]
step  5 :  [-1.2982579814870736]
step  6 :  [-1.183321385779926]
step  7 :  [-1.0541489034673979]
step  8 :  [-0.9106992496182799]
step  9 :  [-0.7559125088355759]
step  10 :  [-0.5929630063786692]
step  11 :  [-0.4259061460008033]
step  12 :  [-0.26369158439261037]
step  13 :  [-0.13249197794375675]
step  14 :  [-0.01899275633894073]
step  15 :  [-0.05344678093270399]
step  16 :  [-0.06434683972380803]
step  17 :  [-0.03458722011044894]
step  18 :  [-0.025182519545518398]
step  19 :  [-0.03864799624139012]
step  20 :  [-0.07952333614185683]
step  21 :  [-0.0707095723719859]
step  22 :  [-0.034393775697777386]
step  23 :  [-0.03604219381500143]
step  24 :  [-0.05678308558478122]
episode  113 : steps 25 , return [-14.66]
step  0 :  [-1.6941141281703296]
step  1 :  [-1.657372995886386]
step  2 :  [-1.614823289112888]
step  3 :  [-1.5740149732706705]
step  4 :  [-1.5016405307534704]
step  5 :  [-1.4015250888199344]
step  6 :  [-1.2786218426313836]
step  7 :  [-1.143962061695083]
step  8 :  [-0.9920842117859487]
step  9 :  [-0.8297329614770761]
step  10 :  [-0.6592122362572589]
step  11 :  [-0.48273801401053584]
step  12 :  [-0.303127244146913]
step  13 :  [-0.1616370609493636]
step  14 :  [-0.07138833242260609]
step  15 :  [-0.022294229789299756]
step  16 :  [-0.031754406385215865]
step  17 :  [-0.03792980533148723]
step  18 :  [-0.0397714001193366]
step  19 :  [-0.030515731941519592]
step  20 :  [-0.04338992596730364]
step  21 :  [-0.07150154349712778]
step  22 :  [-0.0900608090002128]
step  23 :  [-0.10427183139257802]
step  24 :  [-0.1163247678447927]
episode  114 : steps 25 , return [-15.95]
step  0 :  [-1.4923694971973551]
step  1 :  [-1.4555467371688917]
step  2 :  [-1.4137400808643719]
step  3 :  [-1.375253473192565]
step  4 :  [-1.3054507513192362]
step  5 :  [-1.217744632053985]
step  6 :  [-1.1163011498166457]
step  7 :  [-0.9937361822223969]
step  8 :  [-0.8544406581927266]
step  9 :  [-0.7025761907529539]
step  10 :  [-0.5422816572461301]
step  11 :  [-0.379079619033693]
step  12 :  [-0.22733140079111971]
step  13 :  [-0.11353619367598045]
step  14 :  [-0.07874828380500004]
step  15 :  [-0.05577389509258809]
step  16 :  [-0.06837617491373861]
step  17 :  [-0.05652051765808213]
step  18 :  [-0.01848522750087106]
step  19 :  [-0.011530133525962808]
step  20 :  [-0.056663866175742164]
step  21 :  [-0.042271632112981586]
step  22 :  [-0.0744867243476524]
step  23 :  [-0.12899171739788048]
step  24 :  [-0.1333146741942875]
episode  115 : steps 25 , return [-13.91]
step  0 :  [-1.7010066977186278]
step  1 :  [-1.6607638377451306]
step  2 :  [-1.613335179358181]
step  3 :  [-1.5664402873804688]
step  4 :  [-1.5269211834464873]
step  5 :  [-1.4572704247887345]
step  6 :  [-1.3602400017990506]
step  7 :  [-1.2403763041425093]
step  8 :  [-1.1022726433716528]
step  9 :  [-0.9499905842028052]
step  10 :  [-0.7869703925023864]
step  11 :  [-0.6161970219523021]
step  12 :  [-0.44073357738803676]
step  13 :  [-0.26603862107506804]
step  14 :  [-0.12254657890635709]
step  15 :  [-0.07646862085225896]
step  16 :  [-0.09364104197407255]
step  17 :  [-0.06808029481674734]
step  18 :  [-0.024167989418934097]
step  19 :  [-0.051806451351106654]
step  20 :  [-0.0722041910780403]
step  21 :  [-0.05300577433050919]
step  22 :  [-0.012044045935256441]
step  23 :  [-0.045060603675115496]
step  24 :  [-0.039477776500774955]
episode  116 : steps 25 , return [-16.95]
step  0 :  [-1.5384047196322925]
step  1 :  [-1.505977725611855]
step  2 :  [-1.4700352319480892]
step  3 :  [-1.4384103842790166]
step  4 :  [-1.3732266416286099]
step  5 :  [-1.2787908048154044]
step  6 :  [-1.1605057871878652]
step  7 :  [-1.0234502114113788]
step  8 :  [-0.8719882691587665]
step  9 :  [-0.7098071888770043]
step  10 :  [-0.5402432428217251]
step  11 :  [-0.367330581534966]
step  12 :  [-0.20168506804241448]
step  13 :  [-0.0750490456900813]
step  14 :  [-0.044703415947268475]
step  15 :  [-0.020312373855000763]
step  16 :  [-0.04637863236055397]
step  17 :  [-0.0874775418008087]
step  18 :  [-0.09505912484439222]
step  19 :  [-0.05671449171360604]
step  20 :  [-0.04282464402563632]
step  21 :  [-0.09618023025746193]
step  22 :  [-0.11608221956882449]
step  23 :  [-0.14868276408724157]
step  24 :  [-0.13159340961344201]
episode  117 : steps 25 , return [-14.44]
step  0 :  [-1.4642885133944061]
step  1 :  [-1.437513649930854]
step  2 :  [-1.409703145213098]
step  3 :  [-1.3453086769195042]
step  4 :  [-1.2502534201359443]
step  5 :  [-1.1311632682728652]
step  6 :  [-0.992847416425474]
step  7 :  [-0.8397320811570917]
step  8 :  [-0.6753538278054012]
step  9 :  [-0.5025387386908942]
step  10 :  [-0.3237353939002367]
step  11 :  [-0.14278200678459677]
step  12 :  [-0.06649779018444767]
step  13 :  [-0.05962500571924146]
step  14 :  [-0.02030010998414256]
step  15 :  [-0.02187904261849761]
step  16 :  [-0.05548719399350674]
step  17 :  [-0.055292784753548097]
step  18 :  [-0.03385075409349445]
step  19 :  [-0.03219280878821037]
step  20 :  [-0.035707901573775264]
step  21 :  [-0.02416351406043943]
step  22 :  [-0.041624709381378244]
step  23 :  [-0.02336340008705034]
step  24 :  [-0.045954100133847056]
episode  118 : steps 25 , return [-12.03]
step  0 :  [-1.731219063451327]
step  1 :  [-1.6890143420007937]
step  2 :  [-1.6387518310403262]
step  3 :  [-1.5881535850656585]
step  4 :  [-1.5440809026955]
step  5 :  [-1.4710323984747704]
step  6 :  [-1.371387756228357]
step  7 :  [-1.249419916420054]
step  8 :  [-1.1095141633372547]
step  9 :  [-0.9555494690637452]
step  10 :  [-0.7907579151980282]
step  11 :  [-0.617788575560771]
step  12 :  [-0.43892170629188465]
step  13 :  [-0.25683732829078715]
step  14 :  [-0.08460995155343617]
step  15 :  [-0.068005350882792]
step  16 :  [-0.08144841011560731]
step  17 :  [-0.06384706928643405]
step  18 :  [-0.07945032212657648]
step  19 :  [-0.07888383853870745]
step  20 :  [-0.04708685236843928]
step  21 :  [-0.0038699133661076234]
step  22 :  [-0.032186991336796617]
step  23 :  [-0.04859670573278463]
step  24 :  [-0.043079376132078205]
episode  119 : steps 25 , return [-17.08]
step  0 :  [-1.7613158422456856]
step  1 :  [-1.7294637895713694]
step  2 :  [-1.693400032833545]
step  3 :  [-1.6601634748602083]
step  4 :  [-1.59281750633013]
step  5 :  [-1.4961883946014367]
step  6 :  [-1.375799713955928]
step  7 :  [-1.2366865933823958]
step  8 :  [-1.083067538531794]
step  9 :  [-0.9183427750629611]
step  10 :  [-0.7452118816834498]
step  11 :  [-0.5658462836122693]
step  12 :  [-0.3821851914360849]
step  13 :  [-0.19721717196015012]
step  14 :  [-0.0499137887640026]
step  15 :  [-0.030284400106817506]
step  16 :  [-0.05450262142719062]
step  17 :  [-0.024295836209062453]
step  18 :  [-0.06183703114288332]
step  19 :  [-0.05564930046741947]
step  20 :  [-0.031504026231305146]
step  21 :  [-0.047716594944541946]
step  22 :  [-0.07965629112434006]
step  23 :  [-0.058938447765266695]
step  24 :  [-0.05001101384934065]
episode  120 : steps 25 , return [-16.98]
step  0 :  [-1.5896628933787675]
step  1 :  [-1.5552666231614654]
step  2 :  [-1.5163761364404071]
step  3 :  [-1.48075861361347]
step  4 :  [-1.4124747725840932]
step  5 :  [-1.3155660030014245]
step  6 :  [-1.1952104153007272]
step  7 :  [-1.0562929289697436]
step  8 :  [-0.9029789806714442]
step  9 :  [-0.7386822825231694]
step  10 :  [-0.5662082823336454]
step  11 :  [-0.38810966891102594]
step  12 :  [-0.2083048529680925]
step  13 :  [-0.0633326017820302]
step  14 :  [-0.018304509812230328]
step  15 :  [-0.04390093971464484]
step  16 :  [-0.025438322296065706]
step  17 :  [-0.02598045689595299]
step  18 :  [-0.05651414676917326]
step  19 :  [-0.049643159012038814]
step  20 :  [-0.013330839781669702]
step  21 :  [-0.049319299080016185]
step  22 :  [-0.04144743416438284]
step  23 :  [-0.00686689686170095]
step  24 :  [-0.021217983214354405]
episode  121 : steps 25 , return [-14.34]
step  0 :  [-1.6716668282127587]
step  1 :  [-1.6281104953190815]
step  2 :  [-1.5761682037482316]
step  3 :  [-1.5238126977516553]
step  4 :  [-1.478190323489593]
step  5 :  [-1.4043940954314609]
step  6 :  [-1.3043945481696968]
step  7 :  [-1.1822718284105314]
step  8 :  [-1.0430616024823143]
step  9 :  [-0.8899937495527169]
step  10 :  [-0.726237198761181]
step  11 :  [-0.5545438049415483]
step  12 :  [-0.37766509808534976]
step  13 :  [-0.2008017691771458]
step  14 :  [-0.057483837225729466]
step  15 :  [-0.0043929081785336705]
step  16 :  [-0.025873115703873267]
step  17 :  [-0.015203733484755554]
step  18 :  [-0.025474185488138897]
step  19 :  [-0.026223656261571495]
step  20 :  [-0.02876066051681091]
step  21 :  [-0.03242249941113462]
step  22 :  [-0.03142417608963215]
step  23 :  [-0.03590936698042074]
step  24 :  [-0.04444815711259274]
episode  122 : steps 25 , return [-15.89]
step  0 :  [-1.4297023439092431]
step  1 :  [-1.4264318045656474]
step  2 :  [-1.4133288324633677]
step  3 :  [-1.3999747151745958]
step  4 :  [-1.3491449326679579]
step  5 :  [-1.2657205956445878]
step  6 :  [-1.1558214999968506]
step  7 :  [-1.025161057096952]
step  8 :  [-0.8786224490414374]
step  9 :  [-0.7203181625839631]
step  10 :  [-0.5539621710352757]
step  11 :  [-0.383992199830944]
step  12 :  [-0.22125636984827204]
step  13 :  [-0.0936413954247014]
step  14 :  [-0.05076545281951369]
step  15 :  [-0.026455529550944223]
step  16 :  [-0.04114020823407653]
step  17 :  [-0.022625586073669084]
step  18 :  [-0.017149330569821864]
step  19 :  [-0.027620187874823454]
step  20 :  [-0.013299145417742715]
step  21 :  [-0.0482441653329229]
step  22 :  [-0.030193061337213747]
step  23 :  [-0.0604813430617594]
step  24 :  [-0.03972738832943348]
episode  123 : steps 25 , return [-13.69]
step  0 :  [-1.6125026982632462]
step  1 :  [-1.5778026291772846]
step  2 :  [-1.538395358905873]
step  3 :  [-1.5019842499546148]
step  4 :  [-1.4330323701676408]
step  5 :  [-1.3355715309925893]
step  6 :  [-1.2147517393804437]
step  7 :  [-1.0754263917170006]
step  8 :  [-0.921726198877723]
step  9 :  [-0.7570180806043192]
step  10 :  [-0.5840207164400504]
step  11 :  [-0.4050507563934807]
step  12 :  [-0.26884891280908313]
step  13 :  [-0.1680250766921589]
step  14 :  [-0.0941454731281377]
step  15 :  [-0.03470468055381282]
step  16 :  [-0.031097183786312845]
step  17 :  [-0.040308868689705964]
step  18 :  [-0.02084484566369147]
step  19 :  [-0.053736247339202084]
step  20 :  [-0.06814669045351894]
step  21 :  [-0.051789431772188074]
step  22 :  [-0.014493151110693093]
step  23 :  [-0.040287891341779306]
step  24 :  [-0.024881950567984014]
episode  124 : steps 25 , return [-14.87]
step  0 :  [-1.4400302899278525]
step  1 :  [-1.4113173002996988]
step  2 :  [-1.3809839064566205]
step  3 :  [-1.3149255176089711]
step  4 :  [-1.2200975813677148]
step  5 :  [-1.1189422783650884]
step  6 :  [-0.9963436750904217]
step  7 :  [-0.8567234680988945]
step  8 :  [-0.7041858066608875]
step  9 :  [-0.54265233570217]
step  10 :  [-0.3769775965856832]
step  11 :  [-0.219154104289561]
step  12 :  [-0.09755652155210912]
step  13 :  [-0.05886892227568467]
step  14 :  [-0.03629286962241114]
step  15 :  [-0.07053483644740159]
step  16 :  [-0.10045269247062315]
step  17 :  [-0.09164258125638157]
step  18 :  [-0.0571533094089288]
step  19 :  [-0.07500231713685625]
step  20 :  [-0.045700950840512386]
step  21 :  [-0.025420952017782196]
step  22 :  [-0.02899491623215156]
step  23 :  [-0.04747759264556896]
step  24 :  [-0.03730378909994594]
episode  125 : steps 25 , return [-12.35]
step  0 :  [-1.6440577569867274]
step  1 :  [-1.605566109569339]
step  2 :  [-1.5607818916553717]
step  3 :  [-1.5175204961747832]
step  4 :  [-1.443662198141464]
step  5 :  [-1.342608796056183]
step  6 :  [-1.262372125746665]
step  7 :  [-1.15739565844882]
step  8 :  [-1.0319131833869442]
step  9 :  [-0.8902697881896406]
step  10 :  [-0.73650458992653]
step  11 :  [-0.5745533437143281]
step  12 :  [-0.4094248050581571]
step  13 :  [-0.2529071318984964]
step  14 :  [-0.128739011871706]
step  15 :  [-0.08129475848482984]
step  16 :  [-0.06348935667989304]
step  17 :  [-0.09403745711509813]
step  18 :  [-0.15033730884563348]
step  19 :  [-0.15390931745156722]
step  20 :  [-0.12504675843253835]
step  21 :  [-0.0679770105404884]
step  22 :  [-0.05892635215932099]
step  23 :  [-0.02817048889839722]
step  24 :  [-0.022582752127892174]
episode  126 : steps 25 , return [-16.4]
step  0 :  [-1.5674691586088225]
step  1 :  [-1.523645311450561]
step  2 :  [-1.4717250644750992]
step  3 :  [-1.4200642444749298]
step  4 :  [-1.3762363730431737]
step  5 :  [-1.3043883284691025]
step  6 :  [-1.213072655207074]
step  7 :  [-1.1020402369225866]
step  8 :  [-0.9717478635795788]
step  9 :  [-0.8263710542816062]
step  10 :  [-0.6698116015687032]
step  11 :  [-0.5060550158951536]
step  12 :  [-0.341004465492118]
step  13 :  [-0.20435066150463915]
step  14 :  [-0.14030525818865303]
step  15 :  [-0.0802048968148503]
step  16 :  [-0.055034697596219706]
step  17 :  [-0.013784430892413362]
step  18 :  [-0.016102657869197307]
step  19 :  [-0.018164157136594927]
step  20 :  [-0.0198349011250532]
step  21 :  [-0.04195604138032965]
step  22 :  [-0.08112855178870929]
step  23 :  [-0.0864647300473658]
step  24 :  [-0.09826520060731532]
episode  127 : steps 25 , return [-15.15]
step  0 :  [-1.3859689060557263]
step  1 :  [-1.3631991536423396]
step  2 :  [-1.338365511046052]
step  3 :  [-1.2766141769066304]
step  4 :  [-1.202875623991388]
step  5 :  [-1.1021576533283868]
step  6 :  [-0.9786370650616426]
step  7 :  [-0.8374788323703038]
step  8 :  [-0.683062561765655]
step  9 :  [-0.5192720501906962]
step  10 :  [-0.3505466230424729]
step  11 :  [-0.18804567971708477]
step  12 :  [-0.06606362663672058]
step  13 :  [-0.045027037494653054]
step  14 :  [-0.02263970663221724]
step  15 :  [-0.042812511418164174]
step  16 :  [-0.0166115484081322]
step  17 :  [-0.04600132784534373]
step  18 :  [-0.019071007897451708]
step  19 :  [-0.048986314591586776]
step  20 :  [-0.021976077244903004]
step  21 :  [-0.05097505126488743]
step  22 :  [-0.023919311474388232]
step  23 :  [-0.052179652769613304]
step  24 :  [-0.025085776133788918]
episode  128 : steps 25 , return [-11.71]
step  0 :  [-1.5077765801727492]
step  1 :  [-1.4792359382927147]
step  2 :  [-1.4487828842544546]
step  3 :  [-1.3823970981148828]
step  4 :  [-1.2858222356814641]
step  5 :  [-1.16973109323503]
step  6 :  [-1.0344638731296305]
step  7 :  [-0.8848559225700687]
step  8 :  [-0.7240820150401087]
step  9 :  [-0.5550398090938264]
step  10 :  [-0.38082912065448643]
step  11 :  [-0.2078265760441648]
step  12 :  [-0.06812833892570157]
step  13 :  [-0.012405205724244686]
step  14 :  [-0.014414360282613952]
step  15 :  [-0.03029529854151]
step  16 :  [-0.024076703572141818]
step  17 :  [-0.04172768010908098]
step  18 :  [-0.057257506736404444]
step  19 :  [-0.05787997680937034]
step  20 :  [-0.03002658120136548]
step  21 :  [-0.03181773889255664]
step  22 :  [-0.0034432325111098086]
step  23 :  [-0.03543241811934296]
step  24 :  [-0.019692240686123467]
episode  129 : steps 25 , return [-12.49]
step  0 :  [-1.6203918464571139]
step  1 :  [-1.588412270121293]
step  2 :  [-1.5527201597378628]
step  3 :  [-1.4824359762002097]
step  4 :  [-1.3830184461024204]
step  5 :  [-1.2602423556757276]
step  6 :  [-1.1715719502820852]
step  7 :  [-1.0575627460789576]
step  8 :  [-0.9289684180815967]
step  9 :  [-0.7880984470767042]
step  10 :  [-0.6385175237590359]
step  11 :  [-0.48554266152501024]
step  12 :  [-0.34013540248851276]
step  13 :  [-0.22048922967945928]
step  14 :  [-0.10386282470051662]
step  15 :  [-0.04429360446499489]
step  16 :  [-0.048017830755471565]
step  17 :  [-0.0117709328419487]
step  18 :  [-0.03089513922629892]
step  19 :  [-0.03219542015295565]
step  20 :  [-0.035728181495016005]
step  21 :  [-0.04637148606833425]
step  22 :  [-0.04242628788741651]
step  23 :  [-0.048789779341182345]
step  24 :  [-0.05735921871734657]
episode  130 : steps 25 , return [-15.02]
step  0 :  [-1.5985702973772686]
step  1 :  [-1.5705973888003408]
step  2 :  [-1.5404923679404277]
step  3 :  [-1.4740534552576372]
step  4 :  [-1.3772933919417827]
step  5 :  [-1.2563209947191796]
step  6 :  [-1.1212250228343692]
step  7 :  [-0.9702238409525732]
step  8 :  [-0.8074675739835171]
step  9 :  [-0.6357074510414933]
step  10 :  [-0.45711043346595853]
step  11 :  [-0.27341963874498065]
step  12 :  [-0.08676287342648964]
step  13 :  [-0.021412732532084453]
step  14 :  [-0.03466432870866588]
step  15 :  [-0.04244662991447706]
step  16 :  [-0.047525273145138415]
step  17 :  [-0.007565972575210963]
step  18 :  [-0.06977178895027729]
step  19 :  [-0.07727990885447053]
step  20 :  [-0.05685681756936762]
step  21 :  [-0.06716835624942176]
step  22 :  [-0.0639751034194392]
step  23 :  [-0.07894288057155756]
step  24 :  [-0.042645775978607955]
episode  131 : steps 25 , return [-13.78]
step  0 :  [-1.6113821593817632]
step  1 :  [-1.5808810157796733]
step  2 :  [-1.5472577946700843]
step  3 :  [-1.4783857792712414]
step  4 :  [-1.3799252622404166]
step  5 :  [-1.2577711870913428]
step  6 :  [-1.1513745876471553]
step  7 :  [-1.0201468355558443]
step  8 :  [-0.8752638196094406]
step  9 :  [-0.7195652906944152]
step  10 :  [-0.5562609095809588]
step  11 :  [-0.3898498991524262]
step  12 :  [-0.2320337831139727]
step  13 :  [-0.11031413505051665]
step  14 :  [-0.06916985273929802]
step  15 :  [-0.050928158136684186]
step  16 :  [-0.04026910916896435]
step  17 :  [-0.03827760829148416]
step  18 :  [-0.03907290117670159]
step  19 :  [-0.04628997782948873]
step  20 :  [-0.04260172873437992]
step  21 :  [-0.04139970349752417]
step  22 :  [-0.06987761755267417]
step  23 :  [-0.0901846561434463]
step  24 :  [-0.07865803340064843]
episode  132 : steps 25 , return [-14.52]
step  0 :  [-1.4957677411931651]
step  1 :  [-1.4558002961247014]
step  2 :  [-1.4095943921834966]
step  3 :  [-1.3656151009547035]
step  4 :  [-1.2919649125164154]
step  5 :  [-1.2286503086090717]
step  6 :  [-1.182482518261185]
step  7 :  [-1.1031928604025232]
step  8 :  [-0.9970317009483102]
step  9 :  [-0.8700093091903148]
step  10 :  [-0.7274869693169879]
step  11 :  [-0.5744981664677329]
step  12 :  [-0.41711923566556136]
step  13 :  [-0.2683387290500107]
step  14 :  [-0.14849830906711525]
step  15 :  [-0.05278997166959034]
step  16 :  [-0.050034659466569285]
step  17 :  [-0.060029593111357145]
step  18 :  [-0.04167823996090381]
step  19 :  [-0.031745697475067745]
step  20 :  [-0.040980997379736366]
step  21 :  [-0.015513580267881442]
step  22 :  [-0.021406617203601066]
step  23 :  [-0.06955310425100401]
step  24 :  [-0.06464072437627609]
episode  133 : steps 25 , return [-14.98]
step  0 :  [-1.5906748779093371]
step  1 :  [-1.5494522292990296]
step  2 :  [-1.50107863489467]
step  3 :  [-1.4537026448116277]
step  4 :  [-1.3772648134138612]
step  5 :  [-1.2745421935349865]
step  6 :  [-1.2022365160602075]
step  7 :  [-1.1495381056349852]
step  8 :  [-1.0673701154241608]
step  9 :  [-0.9605432169079035]
step  10 :  [-0.8344723710271243]
step  11 :  [-0.6945229910274956]
step  12 :  [-0.5464910406566549]
step  13 :  [-0.39898381702906316]
step  14 :  [-0.272966526113368]
step  15 :  [-0.15045506005585066]
step  16 :  [-0.09648882756337693]
step  17 :  [-0.08999136693044192]
step  18 :  [-0.07540205518840351]
step  19 :  [-0.07194811752352548]
step  20 :  [-0.021491047927394064]
step  21 :  [-0.03375609579782713]
step  22 :  [-0.021496334689003298]
step  23 :  [-0.02283720943271125]
step  24 :  [-0.03216902156634725]
episode  134 : steps 25 , return [-16.49]
step  0 :  [-1.6528289530529099]
step  1 :  [-1.6255301479261812]
step  2 :  [-1.5961118261905594]
step  3 :  [-1.529986180937882]
step  4 :  [-1.4333673444021442]
step  5 :  [-1.3124548199603996]
step  6 :  [-1.172607363100644]
step  7 :  [-1.018821134340676]
step  8 :  [-0.8541146312702368]
step  9 :  [-0.6809908076361416]
step  10 :  [-0.5014617492696116]
step  11 :  [-0.3171999361160942]
step  12 :  [-0.13031062021745285]
step  13 :  [-0.04664191182463296]
step  14 :  [-0.03520034919788278]
step  15 :  [-0.059595062070355316]
step  16 :  [-0.04171162172715057]
step  17 :  [-0.06586831149703863]
step  18 :  [-0.045699790444731374]
step  19 :  [-0.017960400347705463]
step  20 :  [-0.00544391888789564]
step  21 :  [-0.034614379387887896]
step  22 :  [-0.019535227754966713]
step  23 :  [-0.030053770551707108]
step  24 :  [-0.07262385180963515]
episode  135 : steps 25 , return [-14.3]
step  0 :  [-1.7030957742254378]
step  1 :  [-1.6670921649405557]
step  2 :  [-1.6255281867428526]
step  3 :  [-1.5858817504091818]
step  4 :  [-1.514276013616336]
step  5 :  [-1.4146871092928561]
step  6 :  [-1.2921542561726294]
step  7 :  [-1.1514213407285174]
step  8 :  [-0.9952290856244436]
step  9 :  [-0.8290925251896977]
step  10 :  [-0.6552321155017643]
step  11 :  [-0.47558984388933134]
step  12 :  [-0.29220618729327635]
step  13 :  [-0.15160039870377998]
step  14 :  [-0.05029654298736814]
step  15 :  [-0.037926974243324404]
step  16 :  [-0.0056890180265544675]
step  17 :  [-0.023624711664162027]
step  18 :  [-0.038273126945411545]
step  19 :  [-0.0442098617606664]
step  20 :  [-0.016915141769616438]
step  21 :  [-0.0364429873354791]
step  22 :  [-0.03904440588415713]
step  23 :  [-0.04838254083441251]
step  24 :  [-0.022178637715609024]
episode  136 : steps 25 , return [-15.72]
step  0 :  [-1.7906461121233512]
step  1 :  [-1.755959931649437]
step  2 :  [-1.7159026261799781]
step  3 :  [-1.6776104959607372]
step  4 :  [-1.6066110819449864]
step  5 :  [-1.507280525922335]
step  6 :  [-1.3848420521256644]
step  7 :  [-1.2441272146758904]
step  8 :  [-1.0893138638204078]
step  9 :  [-0.9235590523776402]
step  10 :  [-0.7494528509369587]
step  11 :  [-0.569008452571483]
step  12 :  [-0.3837889628790467]
step  13 :  [-0.19508188692472142]
step  14 :  [-0.08241074697350388]
step  15 :  [-0.09665397329001742]
step  16 :  [-0.08479326041572068]
step  17 :  [-0.05923156323173773]
step  18 :  [-0.05306292320125255]
step  19 :  [-0.044277923847956514]
step  20 :  [-0.026283261451685077]
step  21 :  [-0.0151175224741813]
step  22 :  [-0.05950734387088246]
step  23 :  [-0.04450280140407395]
step  24 :  [-0.03453969438500019]
episode  137 : steps 25 , return [-17.19]
step  0 :  [-1.6231512079249433]
step  1 :  [-1.5994885601673772]
step  2 :  [-1.5751453502573594]
step  3 :  [-1.5126461376319809]
step  4 :  [-1.4186932092329319]
step  5 :  [-1.299798770464253]
step  6 :  [-1.161529195299225]
step  7 :  [-1.008395893193702]
step  8 :  [-0.8439678868919408]
step  9 :  [-0.6710555900690537]
step  10 :  [-0.49194417832983783]
step  11 :  [-0.30887457905300786]
step  12 :  [-0.16692418041755294]
step  13 :  [-0.06549168283833688]
step  14 :  [-0.024012289089085124]
step  15 :  [-0.05204422788133762]
step  16 :  [-0.034629506696574774]
step  17 :  [-0.08503098751254431]
step  18 :  [-0.07889952099738365]
step  19 :  [-0.07124789057124557]
step  20 :  [-0.046959092097104]
step  21 :  [-0.031294715374723246]
step  22 :  [-0.009721367896244417]
step  23 :  [-0.028831685342501846]
step  24 :  [-0.017474767170786134]
episode  138 : steps 25 , return [-14.23]
step  0 :  [-1.4514326380003661]
step  1 :  [-1.428563636415987]
step  2 :  [-1.3982160164882884]
step  3 :  [-1.3694228229883567]
step  4 :  [-1.307117300872057]
step  5 :  [-1.2164029118355943]
step  6 :  [-1.105572022320859]
step  7 :  [-0.9747903726167855]
step  8 :  [-0.8284573621432282]
step  9 :  [-0.6704590729630983]
step  10 :  [-0.5044553548637959]
step  11 :  [-0.335206679866358]
step  12 :  [-0.19683598697615698]
step  13 :  [-0.140894793255962]
step  14 :  [-0.11770485410687308]
step  15 :  [-0.07921538102430874]
step  16 :  [-0.08100835975198022]
step  17 :  [-0.0491118708003691]
step  18 :  [-0.06769919935780398]
step  19 :  [-0.037854407574393095]
step  20 :  [-0.0643545458044509]
step  21 :  [-0.03549702229063267]
step  22 :  [-0.050035626811325534]
step  23 :  [-0.09562559255569211]
step  24 :  [-0.09403931608681008]
episode  139 : steps 25 , return [-13.7]
step  0 :  [-1.7347782918330845]
step  1 :  [-1.7032935952912323]
step  2 :  [-1.6678294828131508]
step  3 :  [-1.6354788018172604]
step  4 :  [-1.5688653473654033]
step  5 :  [-1.4728349766231505]
step  6 :  [-1.3529440007843112]
step  7 :  [-1.2142605514824947]
step  8 :  [-1.0610359325172842]
step  9 :  [-0.8967083723946809]
step  10 :  [-0.7240347492238051]
step  11 :  [-0.5453051155310435]
step  12 :  [-0.3628139747332525]
step  13 :  [-0.1814743049571176]
step  14 :  [-0.034655873587213164]
step  15 :  [-0.030903762845189156]
step  16 :  [-0.04277124033009093]
step  17 :  [-0.015681050196556766]
step  18 :  [-0.06790551998637526]
step  19 :  [-0.07260759661140823]
step  20 :  [-0.026474748463676725]
step  21 :  [-0.04160070625924789]
step  22 :  [-0.07349304722597927]
step  23 :  [-0.0880644321225407]
step  24 :  [-0.06742916023645976]
episode  140 : steps 25 , return [-16.68]
step  0 :  [-1.6569087620699798]
step  1 :  [-1.632215443430395]
step  2 :  [-1.6063274749211782]
step  3 :  [-1.5426405239211354]
step  4 :  [-1.4477618585301704]
step  5 :  [-1.3281257363333654]
step  6 :  [-1.189236863096279]
step  7 :  [-1.0355537718978103]
step  8 :  [-0.8705904343613144]
step  9 :  [-0.6970790481249735]
step  10 :  [-0.5171423268165962]
step  11 :  [-0.3324958785574588]
step  12 :  [-0.1451400363452528]
step  13 :  [-0.05865596632476507]
step  14 :  [-0.04549077929978781]
step  15 :  [-0.045832993913163964]
step  16 :  [-0.04609913433520567]
step  17 :  [-0.03006547993895492]
step  18 :  [-0.026245652142722592]
step  19 :  [-0.04618835662494989]
step  20 :  [-0.030840327131727487]
step  21 :  [-0.05853982686699245]
step  22 :  [-0.03791154510861372]
step  23 :  [-0.0659166562312489]
step  24 :  [-0.04263674000122708]
episode  141 : steps 25 , return [-14.54]
step  0 :  [-1.7345261825163973]
step  1 :  [-1.6962694869723796]
step  2 :  [-1.651477460983136]
step  3 :  [-1.6076595978657084]
step  4 :  [-1.5714194545483051]
step  5 :  [-1.5039168527464695]
step  6 :  [-1.4083876382576432]
step  7 :  [-1.2896500946534821]
step  8 :  [-1.1524627407952046]
step  9 :  [-1.0010015532631793]
step  10 :  [-0.8388041601297243]
step  11 :  [-0.6689621577033946]
step  12 :  [-0.49466597927704914]
step  13 :  [-0.32122113098431654]
step  14 :  [-0.16966898678393916]
step  15 :  [-0.09300357054850762]
step  16 :  [-0.10444925398065392]
step  17 :  [-0.08664649779067644]
step  18 :  [-0.027895756759164076]
step  19 :  [-0.03362836132109007]
step  20 :  [-0.054364971671706896]
step  21 :  [-0.04729473651818794]
step  22 :  [-0.003057658758900874]
step  23 :  [-0.05507521657599087]
step  24 :  [-0.07070081850215759]
episode  142 : steps 25 , return [-17.69]
step  0 :  [-1.5463972475453747]
step  1 :  [-1.5051586819564946]
step  2 :  [-1.456948197456356]
step  3 :  [-1.410085590445083]
step  4 :  [-1.334201186123566]
step  5 :  [-1.236727915864262]
step  6 :  [-1.2003469228685835]
step  7 :  [-1.1510745480496782]
step  8 :  [-1.0707288552655632]
step  9 :  [-0.9648988474242266]
step  10 :  [-0.8394061420636463]
step  11 :  [-0.6998393703645359]
step  12 :  [-0.552125098257766]
step  13 :  [-0.4049230860540034]
step  14 :  [-0.2786993041307556]
step  15 :  [-0.16229695909309297]
step  16 :  [-0.12551526038280708]
step  17 :  [-0.11153601713922513]
step  18 :  [-0.0539484617240266]
step  19 :  [-0.058950287875924635]
step  20 :  [-0.05999059708378121]
step  21 :  [-0.0587515308761403]
step  22 :  [-0.08013054905126776]
step  23 :  [-0.07821832395499582]
step  24 :  [-0.04679614476029975]
episode  143 : steps 25 , return [-16.49]
step  0 :  [-1.413726768835658]
step  1 :  [-1.3849453327197399]
step  2 :  [-1.3546656755689301]
step  3 :  [-1.2887466630470863]
step  4 :  [-1.2146848734208695]
step  5 :  [-1.1229250745163033]
step  6 :  [-1.0072744533820805]
step  7 :  [-0.8728068734002956]
step  8 :  [-0.7240998804317338]
step  9 :  [-0.5653885649262376]
step  10 :  [-0.4015775190327231]
step  11 :  [-0.24323685605233467]
step  12 :  [-0.11581987952128392]
step  13 :  [-0.033928606865576194]
step  14 :  [-0.07378531993855716]
step  15 :  [-0.08695630142317484]
step  16 :  [-0.05553337814255589]
step  17 :  [-0.020991488893634124]
step  18 :  [-0.07069939975014652]
step  19 :  [-0.07537313183659619]
step  20 :  [-0.03904864231953451]
step  21 :  [-0.05945828797516888]
step  22 :  [-0.027744558135401245]
step  23 :  [-0.007914266123148923]
step  24 :  [-0.040787486553485595]
episode  144 : steps 25 , return [-12.3]
step  0 :  [-1.4114769979893769]
step  1 :  [-1.3804208556956603]
step  2 :  [-1.34702329621305]
step  3 :  [-1.2789835224415569]
step  4 :  [-1.2264947681358012]
step  5 :  [-1.1759154488019925]
step  6 :  [-1.0923125936248994]
step  7 :  [-0.9822980546936673]
step  8 :  [-0.8519002046409314]
step  9 :  [-0.7063455709805699]
step  10 :  [-0.5504289893248988]
step  11 :  [-0.3898742637931244]
step  12 :  [-0.237724713662624]
step  13 :  [-0.11815465287295354]
step  14 :  [-0.07482027782348719]
step  15 :  [-0.05396219692344028]
step  16 :  [-0.08184719844206001]
step  17 :  [-0.07184436310604835]
step  18 :  [-0.018618486132971304]
step  19 :  [-0.02400768989993586]
step  20 :  [-0.019500627898994254]
step  21 :  [-0.005098737630168142]
step  22 :  [-0.0620439487316643]
step  23 :  [-0.05988635333147129]
step  24 :  [-0.06868179935595858]
episode  145 : steps 25 , return [-13.29]
step  0 :  [-1.4946895158663254]
step  1 :  [-1.458746510678734]
step  2 :  [-1.4181505478404355]
step  3 :  [-1.381142401951276]
step  4 :  [-1.3123686844963678]
step  5 :  [-1.2155251922208714]
step  6 :  [-1.1021349578142676]
step  7 :  [-0.9697665285145279]
step  8 :  [-0.8225238133048934]
step  9 :  [-0.664161266110304]
step  10 :  [-0.4983893009868081]
step  11 :  [-0.3304685813889246]
step  12 :  [-0.19244920104097754]
step  13 :  [-0.07788547908621]
step  14 :  [-0.012979340410349142]
step  15 :  [-0.019291055404241975]
step  16 :  [-0.025072058833333067]
step  17 :  [-0.04658200039698518]
step  18 :  [-0.0755046225064006]
step  19 :  [-0.07418303817260034]
step  20 :  [-0.04485311042261798]
step  21 :  [-0.0691264138507209]
step  22 :  [-0.1081448156076579]
step  23 :  [-0.11918096407153446]
step  24 :  [-0.145154881984105]
episode  146 : steps 25 , return [-13.68]
step  0 :  [-1.5112788824104009]
step  1 :  [-1.4829427023624286]
step  2 :  [-1.4527522298065654]
step  3 :  [-1.3865355012315252]
step  4 :  [-1.2900748211292186]
step  5 :  [-1.1702766453497717]
step  6 :  [-1.0321717597745796]
step  7 :  [-0.8802952508950116]
step  8 :  [-0.7176984619679617]
step  9 :  [-0.5471438085945742]
step  10 :  [-0.3715611798794702]
step  11 :  [-0.19707923941809227]
step  12 :  [-0.05662592661928607]
step  13 :  [-0.011010755365303795]
step  14 :  [-0.016222709126233748]
step  15 :  [-0.018914968648428815]
step  16 :  [-0.015365039305348256]
step  17 :  [-0.029366799553159354]
step  18 :  [-0.02073303502140603]
step  19 :  [-0.035550456974997514]
step  20 :  [-0.02459654367304793]
step  21 :  [-0.03907476253405151]
step  22 :  [-0.026915167104246344]
step  23 :  [-0.04106757867749343]
step  24 :  [-0.056572072195398344]
episode  147 : steps 25 , return [-12.43]
step  0 :  [-1.4059119886892415]
step  1 :  [-1.3845414139267953]
step  2 :  [-1.3589302494716233]
step  3 :  [-1.2968337528838543]
step  4 :  [-1.2298346620254699]
step  5 :  [-1.1641151832990237]
step  6 :  [-1.0687036899366669]
step  7 :  [-0.9496164727734446]
step  8 :  [-0.8123009441150252]
step  9 :  [-0.6615207925719637]
step  10 :  [-0.5018155345648931]
step  11 :  [-0.33930955282531666]
step  12 :  [-0.20404092738368043]
step  13 :  [-0.06891359221781983]
step  14 :  [-0.044521223650221105]
step  15 :  [-0.029286129193884104]
step  16 :  [-0.061300038438572124]
step  17 :  [-0.040124331350111744]
step  18 :  [-0.03186398279863319]
step  19 :  [-0.0310004908913991]
step  20 :  [-0.04826794086383525]
step  21 :  [-0.03921746128097641]
step  22 :  [-0.0335490729976498]
step  23 :  [-0.06787638108797514]
step  24 :  [-0.09700909557763274]
episode  148 : steps 25 , return [-12.97]
step  0 :  [-1.4400332369726956]
step  1 :  [-1.4133541264543281]
step  2 :  [-1.3858071146778868]
step  3 :  [-1.3216901956827307]
step  4 :  [-1.2268892097024013]
step  5 :  [-1.1098891627661922]
step  6 :  [-0.9734051426245076]
step  7 :  [-0.8218961547401238]
step  8 :  [-0.6590002347724222]
step  9 :  [-0.48775337585366385]
step  10 :  [-0.3112117173627839]
step  11 :  [-0.13697739144083396]
step  12 :  [-0.07673722294327177]
step  13 :  [-0.04041029508329615]
step  14 :  [-0.03339933820342414]
step  15 :  [-0.03548314200302976]
step  16 :  [-0.04668901110273755]
step  17 :  [-0.031634861908054694]
step  18 :  [-0.03800732754891784]
step  19 :  [-0.033460006054383054]
step  20 :  [-0.034343854042330806]
step  21 :  [-0.035636533863167195]
step  22 :  [-0.03282391186791642]
step  23 :  [-0.03531595944194014]
step  24 :  [-0.05644422332831591]
episode  149 : steps 25 , return [-11.82]
step  0 :  [-1.5114314299285383]
step  1 :  [-1.482874704650452]
step  2 :  [-1.4523813416566353]
step  3 :  [-1.385955276817126]
step  4 :  [-1.2893454377114923]
step  5 :  [-1.1715631362096537]
step  6 :  [-1.0353758047042032]
step  7 :  [-0.8851666305164083]
step  8 :  [-0.7240159756750827]
step  9 :  [-0.5547767328579459]
step  10 :  [-0.3805689239346277]
step  11 :  [-0.20802241305404057]
step  12 :  [-0.06904633259551875]
step  13 :  [-0.015194503726635899]
step  14 :  [-0.01174731741816775]
step  15 :  [-0.032169298023405624]
step  16 :  [-0.05901214871238331]
step  17 :  [-0.06405508274601801]
step  18 :  [-0.03539446691063085]
step  19 :  [-0.03864837460254096]
step  20 :  [-0.08681253757907963]
step  21 :  [-0.08646972078131791]
step  22 :  [-0.0676939260966903]
step  23 :  [-0.04258555278742667]
step  24 :  [-0.012859251708153035]
episode  150 : steps 25 , return [-12.7]
step  0 :  [-1.4113977542753928]
step  1 :  [-1.383002390939412]
step  2 :  [-1.3532661295421062]
step  3 :  [-1.2877336487581295]
step  4 :  [-1.2115009879077847]
step  5 :  [-1.1151060205441912]
step  6 :  [-0.9956523033287441]
step  7 :  [-0.8581251821551685]
step  8 :  [-0.7069625985272595]
step  9 :  [-0.5462626540878125]
step  10 :  [-0.3808751468898035]
step  11 :  [-0.22216423766709514]
step  12 :  [-0.0978029047196656]
step  13 :  [-0.055186656973980695]
step  14 :  [-0.03357987018309687]
step  15 :  [-0.0677873659496617]
step  16 :  [-0.046623097156127946]
step  17 :  [-0.07689614927860658]
step  18 :  [-0.09688358146474538]
step  19 :  [-0.08231497365225529]
step  20 :  [-0.04832607045459247]
step  21 :  [-0.043223366268426]
step  22 :  [-0.10552360840492785]
step  23 :  [-0.11389082748118218]
step  24 :  [-0.10553905397655454]
episode  151 : steps 25 , return [-12.45]
step  0 :  [-1.6643883666142307]
step  1 :  [-1.623651418529593]
step  2 :  [-1.5756687137471665]
step  3 :  [-1.5283044233651697]
step  4 :  [-1.4885590407330935]
step  5 :  [-1.4189683640660724]
step  6 :  [-1.3221126452139347]
step  7 :  [-1.202473514091272]
step  8 :  [-1.0646282684590984]
step  9 :  [-0.9126521375957833]
step  10 :  [-0.7500338963338152]
step  11 :  [-0.5798868345111644]
step  12 :  [-0.4056861467007782]
step  13 :  [-0.23493542731806963]
step  14 :  [-0.09607707671718221]
step  15 :  [-0.037868042298461115]
step  16 :  [-0.0652704993769472]
step  17 :  [-0.062426035004843346]
step  18 :  [-0.028361227553036165]
step  19 :  [-0.04196844663015668]
step  20 :  [-0.07816467701247261]
step  21 :  [-0.0759605371521577]
step  22 :  [-0.038694978458928865]
step  23 :  [-0.045987608285908185]
step  24 :  [-0.018291329311453098]
episode  152 : steps 25 , return [-16.36]
step  0 :  [-1.609270861540726]
step  1 :  [-1.5735468088648656]
step  2 :  [-1.5327378451241491]
step  3 :  [-1.4946221108477011]
step  4 :  [-1.4244885764347026]
step  5 :  [-1.3261730548810358]
step  6 :  [-1.2047057502015277]
step  7 :  [-1.067065503495535]
step  8 :  [-0.9149306828917944]
step  9 :  [-0.7516084501538608]
step  10 :  [-0.5798467866162517]
step  11 :  [-0.4020877171234551]
step  12 :  [-0.2216232164674412]
step  13 :  [-0.07819825435798615]
step  14 :  [-0.03256188607647434]
step  15 :  [-0.05628923949218576]
step  16 :  [-0.04285691166876791]
step  17 :  [-0.05994993514446754]
step  18 :  [-0.05108753382571446]
step  19 :  [-0.06342408513121463]
step  20 :  [-0.05613675912268073]
step  21 :  [-0.06575407585526905]
step  22 :  [-0.05907248479878104]
step  23 :  [-0.0671703060318834]
step  24 :  [-0.060749214291654814]
episode  153 : steps 25 , return [-14.8]
step  0 :  [-1.4677942258961463]
step  1 :  [-1.4409717880547164]
step  2 :  [-1.4063478764984598]
step  3 :  [-1.3729094359643061]
step  4 :  [-1.307198210615318]
step  5 :  [-1.2266975837729452]
step  6 :  [-1.1398621587895852]
step  7 :  [-1.0288263010006145]
step  8 :  [-0.8984353279980973]
step  9 :  [-0.7533030557701768]
step  10 :  [-0.5978290550759762]
step  11 :  [-0.43713033401460466]
step  12 :  [-0.28133225987240856]
step  13 :  [-0.15328632051697316]
step  14 :  [-0.0998639536781041]
step  15 :  [-0.06496066664511897]
step  16 :  [-0.013066982514449692]
step  17 :  [-0.03405027059054664]
step  18 :  [-0.07214555351661757]
step  19 :  [-0.07328778378625646]
step  20 :  [-0.03630989277332457]
step  21 :  [-0.024701599286630512]
step  22 :  [-0.02412621045474595]
step  23 :  [-0.018426536455638028]
step  24 :  [-0.0858580968436182]
episode  154 : steps 25 , return [-14.06]
step  0 :  [-1.4208993035067092]
step  1 :  [-1.392703852774225]
step  2 :  [-1.3631875703000373]
step  3 :  [-1.2977702855176514]
step  4 :  [-1.213029222424861]
step  5 :  [-1.1112570214870925]
step  6 :  [-0.9876848728369685]
step  7 :  [-0.847006535877516]
step  8 :  [-0.6934192313772677]
step  9 :  [-0.5308378942402493]
step  10 :  [-0.364046515236616]
step  11 :  [-0.20527612987790383]
step  12 :  [-0.08545128177045538]
step  13 :  [-0.05418606861152435]
step  14 :  [-0.02918056447430331]
step  15 :  [-0.039743337483072204]
step  16 :  [-0.04003719432354304]
step  17 :  [-0.04087125690978652]
step  18 :  [-0.015537945184611327]
step  19 :  [-0.014796262839839355]
step  20 :  [-0.04135724501672099]
step  21 :  [-0.025681810950905087]
step  22 :  [-0.056954861114844726]
step  23 :  [-0.0361270753749631]
step  24 :  [-0.06580389041742833]
episode  155 : steps 25 , return [-11.97]
step  0 :  [-1.5804808466834102]
step  1 :  [-1.5374733139287573]
step  2 :  [-1.4866448376915098]
step  3 :  [-1.4362659044665786]
step  4 :  [-1.3578439233324013]
step  5 :  [-1.2538024204321927]
step  6 :  [-1.2478735933886456]
step  7 :  [-1.2309064965385872]
step  8 :  [-1.1742025543439045]
step  9 :  [-1.0853402566499826]
step  10 :  [-0.9715508474577277]
step  11 :  [-0.8391482897645957]
step  12 :  [-0.6937445578903462]
step  13 :  [-0.5411233740497938]
step  14 :  [-0.389909875322962]
step  15 :  [-0.2601626677682087]
step  16 :  [-0.13405982328262803]
step  17 :  [-0.08486614763552246]
step  18 :  [-0.07021558543109731]
step  19 :  [-0.05337258987833283]
step  20 :  [-0.04079245831763117]
step  21 :  [-0.03490745726762657]
step  22 :  [-0.03366862608465994]
step  23 :  [-0.034006054290750244]
step  24 :  [-0.02167541361061774]
episode  156 : steps 25 , return [-17.59]
step  0 :  [-1.809250567343452]
step  1 :  [-1.769809919972007]
step  2 :  [-1.7231308750408123]
step  3 :  [-1.6765702812195131]
step  4 :  [-1.6365824943869323]
step  5 :  [-1.5660085577545286]
step  6 :  [-1.4679520495401677]
step  7 :  [-1.3470664603853428]
step  8 :  [-1.2079481451751262]
step  9 :  [-1.0546022871281202]
step  10 :  [-0.8903452722747073]
step  11 :  [-0.7178915169446699]
step  12 :  [-0.5395685724561782]
step  13 :  [-0.35789601995132714]
step  14 :  [-0.17909335496881096]
step  15 :  [-0.10758289811839405]
step  16 :  [-0.035246065231982204]
step  17 :  [-0.0019068481829569378]
step  18 :  [-0.02584195032737878]
step  19 :  [-0.0057393125617792775]
step  20 :  [-0.020650619820925278]
step  21 :  [-0.06553875207020879]
step  22 :  [-0.06785354415994099]
step  23 :  [-0.03447026038517389]
step  24 :  [-0.04396055396478988]
episode  157 : steps 25 , return [-18.35]
step  0 :  [-1.6675061468497991]
step  1 :  [-1.642767738825168]
step  2 :  [-1.6167743159902432]
step  3 :  [-1.5529828551448868]
step  4 :  [-1.4580120567023482]
step  5 :  [-1.338297267280325]
step  6 :  [-1.1993409871175882]
step  7 :  [-1.0455983989522446]
step  8 :  [-0.8805792316663285]
step  9 :  [-0.7070093972304219]
step  10 :  [-0.5269988428223173]
step  11 :  [-0.342223218396345]
step  12 :  [-0.15441120901326677]
step  13 :  [-0.028834679375679573]
step  14 :  [-0.0748214481357573]
step  15 :  [-0.09359486509621252]
step  16 :  [-0.07027898787746173]
step  17 :  [-0.07609555730253634]
step  18 :  [-0.053464353192761674]
step  19 :  [-0.0872458428470544]
step  20 :  [-0.06791888419406114]
step  21 :  [-0.010226194797745237]
step  22 :  [-0.017757761446918752]
step  23 :  [-0.029115959970742837]
step  24 :  [-0.014692133707504386]
episode  158 : steps 25 , return [-14.76]
step  0 :  [-1.6238900574316442]
step  1 :  [-1.5988679202139073]
step  2 :  [-1.5726743363178322]
step  3 :  [-1.5088718511541799]
step  4 :  [-1.4139611776960943]
step  5 :  [-1.294330608064617]
step  6 :  [-1.1554646071585595]
step  7 :  [-1.0018133487255005]
step  8 :  [-0.8368889915368501]
step  9 :  [-0.6634278009425152]
step  10 :  [-0.4835687091284911]
step  11 :  [-0.2990968120438696]
step  12 :  [-0.11274805103204337]
step  13 :  [-0.03716787858267927]
step  14 :  [-0.10273804902794238]
step  15 :  [-0.11210350715000797]
step  16 :  [-0.08807892846890089]
step  17 :  [-0.03127165332897498]
step  18 :  [-0.02212240979967626]
step  19 :  [-0.006474461519873678]
step  20 :  [-0.03630382080965888]
step  21 :  [-0.027639208453423526]
step  22 :  [-0.01806623933327432]
step  23 :  [-0.011968263119368532]
step  24 :  [-0.04085720218020732]
episode  159 : steps 25 , return [-14.1]
step  0 :  [-1.5472559936930255]
step  1 :  [-1.5147047327455283]
step  2 :  [-1.4785496500903939]
step  3 :  [-1.4465976442525317]
step  4 :  [-1.381132899438526]
step  5 :  [-1.2864564197021966]
step  6 :  [-1.167957090902887]
step  7 :  [-1.0306964056836587]
step  8 :  [-0.8790162281159847]
step  9 :  [-0.716567101610767]
step  10 :  [-0.5466052569330652]
step  11 :  [-0.37292201961916166]
step  12 :  [-0.2049502082190598]
step  13 :  [-0.07344871120299717]
step  14 :  [-0.036283296428747745]
step  15 :  [-0.011279391629162203]
step  16 :  [-0.04024764394164398]
step  17 :  [-0.015060630934761825]
step  18 :  [-0.04574772010696256]
step  19 :  [-0.0780224005814932]
step  20 :  [-0.08164260953576116]
step  21 :  [-0.0512448387580922]
step  22 :  [-0.05313540703163246]
step  23 :  [-0.024837501230218967]
step  24 :  [-0.04688925793566965]
episode  160 : steps 25 , return [-14.13]
step  0 :  [-1.4418633904107705]
step  1 :  [-1.4175307614729056]
step  2 :  [-1.3866869739920082]
step  3 :  [-1.3582361068111783]
step  4 :  [-1.2961437927797046]
step  5 :  [-1.2048630447845026]
step  6 :  [-1.0890593465522678]
step  7 :  [-0.9538754802020053]
step  8 :  [-0.8037695339324527]
step  9 :  [-0.6425200132063884]
step  10 :  [-0.4735781440199657]
step  11 :  [-0.3014302516964551]
step  12 :  [-0.14228610411114165]
step  13 :  [-0.06408749853981621]
step  14 :  [-0.09049363087028099]
step  15 :  [-0.07789717591664821]
step  16 :  [-0.07714708286562495]
step  17 :  [-0.06535160840204976]
step  18 :  [-0.017984026152392762]
step  19 :  [-0.03638066078092394]
step  20 :  [-0.04886347501399625]
step  21 :  [-0.018393060220907035]
step  22 :  [-0.04788759075235414]
step  23 :  [-0.028733862062400514]
step  24 :  [-0.05315988238997606]
episode  161 : steps 25 , return [-13.14]
step  0 :  [-1.627950046739097]
step  1 :  [-1.5830022253917335]
step  2 :  [-1.529270017596013]
step  3 :  [-1.4749337644248757]
step  4 :  [-1.4273845572696304]
step  5 :  [-1.3525047348028736]
step  6 :  [-1.2518648740452913]
step  7 :  [-1.1533840688693628]
step  8 :  [-1.0330040905906208]
step  9 :  [-0.8950947040664123]
step  10 :  [-0.7437404595350328]
step  11 :  [-0.5827522758163405]
step  12 :  [-0.41643097838418147]
step  13 :  [-0.25347058781769377]
step  14 :  [-0.12050585090113976]
step  15 :  [-0.0650858282773618]
step  16 :  [-0.01738570470311298]
step  17 :  [-0.038235680667190616]
step  18 :  [-0.023970703988175857]
step  19 :  [-0.0298598199271119]
step  20 :  [-0.03489409763327849]
step  21 :  [-0.06716770138238265]
step  22 :  [-0.061611210582944734]
step  23 :  [-0.01766707468303986]
step  24 :  [-0.028629448151457227]
episode  162 : steps 25 , return [-15.83]
step  0 :  [-1.6617886462692553]
step  1 :  [-1.6219010653812875]
step  2 :  [-1.5751097556979297]
step  3 :  [-1.5292442740601169]
step  4 :  [-1.4535313492584756]
step  5 :  [-1.3511579034706613]
step  6 :  [-1.2267136147825792]
step  7 :  [-1.149050370355294]
step  8 :  [-1.0429075929300478]
step  9 :  [-0.9183717563263355]
step  10 :  [-0.7792008383369426]
step  11 :  [-0.6296428890881561]
step  12 :  [-0.4750960156679862]
step  13 :  [-0.3472044746391033]
step  14 :  [-0.2080736712426039]
step  15 :  [-0.0813196239793992]
step  16 :  [-0.03855402819410538]
step  17 :  [-0.015825599717899604]
step  18 :  [-0.03391071025253747]
step  19 :  [-0.02148415709630078]
step  20 :  [-0.05561057324105727]
step  21 :  [-0.042184111993550946]
step  22 :  [-0.013094087371997215]
step  23 :  [-0.008307901395564985]
step  24 :  [-0.035202187414164074]
episode  163 : steps 25 , return [-16.31]
step  0 :  [-1.505749388897791]
step  1 :  [-1.469114596562427]
step  2 :  [-1.4275048452067667]
step  3 :  [-1.3891560187689842]
step  4 :  [-1.3193770983942001]
step  5 :  [-1.2216869755833772]
step  6 :  [-1.1144851660763577]
step  7 :  [-0.987513480178328]
step  8 :  [-0.844846796748117]
step  9 :  [-0.6903865194951225]
step  10 :  [-0.5280778262591058]
step  11 :  [-0.3634013631323529]
step  12 :  [-0.21184262729550318]
step  13 :  [-0.10362593990415392]
step  14 :  [-0.07815019995758467]
step  15 :  [-0.053860209461993415]
step  16 :  [-0.05098612815674656]
step  17 :  [-0.03826617002827379]
step  18 :  [-0.046406465323190524]
step  19 :  [-0.03973973410437434]
step  20 :  [-0.07582002971347918]
step  21 :  [-0.10877094312536967]
step  22 :  [-0.10489750731149881]
step  23 :  [-0.0788087820737118]
step  24 :  [-0.09497490584885383]
episode  164 : steps 25 , return [-13.95]
step  0 :  [-1.7052246781647484]
step  1 :  [-1.6692250794378884]
step  2 :  [-1.6276587749441025]
step  3 :  [-1.587996701097102]
step  4 :  [-1.5163715627999685]
step  5 :  [-1.416764420389441]
step  6 :  [-1.2942159236560495]
step  7 :  [-1.153470122957999]
step  8 :  [-0.9972021939730052]
step  9 :  [-0.8310469992226907]
step  10 :  [-0.6572060886495141]
step  11 :  [-0.4776203512451595]
step  12 :  [-0.2943626386182446]
step  13 :  [-0.11374199896313603]
step  14 :  [-0.05733931861160824]
step  15 :  [-0.06312959604389778]
step  16 :  [-0.07384781578336481]
step  17 :  [-0.06027675927250656]
step  18 :  [-0.08496264634016079]
step  19 :  [-0.10370198984677095]
step  20 :  [-0.07790842861779343]
step  21 :  [-0.02765753681446695]
step  22 :  [-0.030900237928984994]
step  23 :  [-0.015160715773763534]
step  24 :  [-0.030615987942390826]
episode  165 : steps 25 , return [-15.97]
step  0 :  [-1.559915096608677]
step  1 :  [-1.5154428778055173]
step  2 :  [-1.4626429197715796]
step  3 :  [-1.4099274592232387]
step  4 :  [-1.3649421972157567]
step  5 :  [-1.2923285460028087]
step  6 :  [-1.2145384235406047]
step  7 :  [-1.1154716842567225]
step  8 :  [-0.9946482240280246]
step  9 :  [-0.8567055393930278]
step  10 :  [-0.7059950083035221]
step  11 :  [-0.5468478696329215]
step  12 :  [-0.3850827739008562]
step  13 :  [-0.2505632526938122]
step  14 :  [-0.11137591709178449]
step  15 :  [-0.06096086810491804]
step  16 :  [-0.04860044237580261]
step  17 :  [-0.0407816357747767]
step  18 :  [-0.03629324937599401]
step  19 :  [-0.0733551418512282]
step  20 :  [-0.05863323162543792]
step  21 :  [-0.08963559754103197]
step  22 :  [-0.07501413577605788]
step  23 :  [-0.09292688020989956]
step  24 :  [-0.07534488542878082]
episode  166 : steps 25 , return [-15.44]
step  0 :  [-1.5486795517206537]
step  1 :  [-1.5117514157722378]
step  2 :  [-1.469536010268868]
step  3 :  [-1.430111774205693]
step  4 :  [-1.3593550771234229]
step  5 :  [-1.2607449827676345]
step  6 :  [-1.1554818962640228]
step  7 :  [-1.028812619791556]
step  8 :  [-0.8852981379763651]
step  9 :  [-0.7288552641060547]
step  10 :  [-0.5628583565177262]
step  11 :  [-0.39063904241367553]
step  12 :  [-0.21810509607182985]
step  13 :  [-0.07737053589341719]
step  14 :  [-0.01696353904273797]
step  15 :  [-0.04390599093992577]
step  16 :  [-0.05461404897296945]
step  17 :  [-0.030461038160445056]
step  18 :  [-0.01871137300583405]
step  19 :  [-0.05843276955158973]
step  20 :  [-0.06634143312516648]
step  21 :  [-0.03648075754310533]
step  22 :  [-0.02377936155929878]
step  23 :  [-0.04548824467010961]
step  24 :  [-0.0229907627659054]
episode  167 : steps 25 , return [-14.05]
step  0 :  [-1.5515685514549986]
step  1 :  [-1.5071187499027676]
step  2 :  [-1.4543845472100818]
step  3 :  [-1.4018099322917448]
step  4 :  [-1.3570758398259561]
step  5 :  [-1.284700247592877]
step  6 :  [-1.2117386194571516]
step  7 :  [-1.1141510675912532]
step  8 :  [-0.9942016985496321]
step  9 :  [-0.856745095086938]
step  10 :  [-0.7062414265403734]
step  11 :  [-0.5470447228773543]
step  12 :  [-0.3848658291626417]
step  13 :  [-0.2341118491544675]
step  14 :  [-0.11972575240057336]
step  15 :  [-0.08252041462924699]
step  16 :  [-0.0598606044613752]
step  17 :  [-0.058209290914989546]
step  18 :  [-0.036724813469082705]
step  19 :  [-0.029443710146438273]
step  20 :  [-0.023730952167724657]
step  21 :  [-0.03314078414557956]
step  22 :  [-0.028084993828962294]
step  23 :  [-0.06816695764269091]
step  24 :  [-0.05327710182056641]
episode  168 : steps 25 , return [-15.2]
step  0 :  [-1.7242869341835163]
step  1 :  [-1.6859840460732554]
step  2 :  [-1.6411639974282273]
step  3 :  [-1.597370211068364]
step  4 :  [-1.52282506486985]
step  5 :  [-1.4211343727635923]
step  6 :  [-1.2970963075945017]
step  7 :  [-1.169369221852182]
step  8 :  [-1.0240609103540825]
step  9 :  [-0.8703832106053488]
step  10 :  [-0.7097515472059319]
step  11 :  [-0.544902739751856]
step  12 :  [-0.3813851059509654]
step  13 :  [-0.24795790526863376]
step  14 :  [-0.1269803263506494]
step  15 :  [-0.06106642391740434]
step  16 :  [-0.055257006671087176]
step  17 :  [-0.0904268603078391]
step  18 :  [-0.0757199254163591]
step  19 :  [-0.03932778267236067]
step  20 :  [-0.046028431404233655]
step  21 :  [-0.07965834949450369]
step  22 :  [-0.05679711506121124]
step  23 :  [-0.020550611544033662]
step  24 :  [-0.025312847704677243]
episode  169 : steps 25 , return [-16.51]
step  0 :  [-1.7154369932526714]
step  1 :  [-1.6881322960047382]
step  2 :  [-1.6584547291411011]
step  3 :  [-1.5919808699366742]
step  4 :  [-1.495033679232046]
step  5 :  [-1.3738463863425798]
step  6 :  [-1.233785768262389]
step  7 :  [-1.0846512993627153]
step  8 :  [-0.9232652023557426]
step  9 :  [-0.7524969417614424]
step  10 :  [-0.5745803828077141]
step  11 :  [-0.3912424096342499]
step  12 :  [-0.20381948343735606]
step  13 :  [-0.08418883299339547]
step  14 :  [-0.08869601390455215]
step  15 :  [-0.0712765205886765]
step  16 :  [-0.04604223809100964]
step  17 :  [-0.07917270274694406]
step  18 :  [-0.056740470075373764]
step  19 :  [-0.050071403225297295]
step  20 :  [-0.028745723923463192]
step  21 :  [-0.05215005754802492]
step  22 :  [-0.028102341696269784]
step  23 :  [-0.05345760271707862]
step  24 :  [-0.036052115305572494]
episode  170 : steps 25 , return [-15.36]
step  0 :  [-1.658469901150865]
step  1 :  [-1.6324981649732286]
step  2 :  [-1.6048648665552812]
step  3 :  [-1.5399567333875601]
step  4 :  [-1.4441944363361672]
step  5 :  [-1.323898322124881]
step  6 :  [-1.184500229509541]
step  7 :  [-1.030408811821089]
step  8 :  [-0.8650997297008337]
step  9 :  [-0.6912682899008987]
step  10 :  [-0.5109837624198662]
step  11 :  [-0.32582490298223993]
step  12 :  [-0.13699472186233236]
step  13 :  [-0.04554292754713228]
step  14 :  [-0.02762913862085076]
step  15 :  [-0.0423724922125211]
step  16 :  [-0.025942277834600666]
step  17 :  [-0.046835804820854296]
step  18 :  [-0.02684713430127924]
step  19 :  [-0.052036749202635395]
step  20 :  [-0.03353313884876733]
step  21 :  [-0.04866660476112785]
step  22 :  [-0.028006847618614536]
step  23 :  [-0.05513507219245483]
step  24 :  [-0.03594039842923408]
episode  171 : steps 25 , return [-14.42]
step  0 :  [-1.6814184790436166]
step  1 :  [-1.656189307769668]
step  2 :  [-1.6294718023666144]
step  3 :  [-1.5651353870144782]
step  4 :  [-1.469749966328814]
step  5 :  [-1.3497137986710435]
step  6 :  [-1.2105021310344433]
step  7 :  [-1.056549395790872]
step  8 :  [-0.8913477316569678]
step  9 :  [-0.7176043095757363]
step  10 :  [-0.5373995810552216]
step  11 :  [-0.35233122236454345]
step  12 :  [-0.16368652478020046]
step  13 :  [-0.07279043147380694]
step  14 :  [-0.06417918503274943]
step  15 :  [-0.07258395368617442]
step  16 :  [-0.05967831141972971]
step  17 :  [-0.046902442101421554]
step  18 :  [-0.040575468010527964]
step  19 :  [-0.01920280493674215]
step  20 :  [-0.009430599618643317]
step  21 :  [-0.04811068310355355]
step  22 :  [-0.029779395970653856]
step  23 :  [-0.05083881598418892]
step  24 :  [-0.037297425428112284]
episode  172 : steps 25 , return [-14.83]
step  0 :  [-1.6015276864515764]
step  1 :  [-1.5712626768896079]
step  2 :  [-1.5380062319466037]
step  3 :  [-1.4694102929766248]
step  4 :  [-1.371150790356598]
step  5 :  [-1.2922620704412022]
step  6 :  [-1.1873325408540956]
step  7 :  [-1.0611929975751477]
step  8 :  [-0.9184189439720699]
step  9 :  [-0.7630299659851019]
step  10 :  [-0.5986352852935916]
step  11 :  [-0.4291556886212331]
step  12 :  [-0.2621504990419521]
step  13 :  [-0.12482214279037249]
step  14 :  [-0.06573860657059066]
step  15 :  [-0.025452293926985038]
step  16 :  [-0.037570601676206246]
step  17 :  [-0.032788313036782084]
step  18 :  [-0.029292481837011896]
step  19 :  [-0.05145515169691626]
step  20 :  [-0.044335574670365]
step  21 :  [-0.010753570920108672]
step  22 :  [-0.05046145106201602]
step  23 :  [-0.07577923246443205]
step  24 :  [-0.09595417157009374]
episode  173 : steps 25 , return [-14.71]
step  0 :  [-1.6028940425870695]
step  1 :  [-1.5647073917091021]
step  2 :  [-1.520511568763598]
step  3 :  [-1.4782511316211548]
step  4 :  [-1.4052636169911186]
step  5 :  [-1.3049155289554593]
step  6 :  [-1.190121340577373]
step  7 :  [-1.0668531078165888]
step  8 :  [-0.9289515631433521]
step  9 :  [-0.7791986679215384]
step  10 :  [-0.6209114811513323]
step  11 :  [-0.4585060192589086]
step  12 :  [-0.3011944307665251]
step  13 :  [-0.17254814534082172]
step  14 :  [-0.049982472694575245]
step  15 :  [-0.012515155841752792]
step  16 :  [-0.021778572917663882]
step  17 :  [-0.014223126452687123]
step  18 :  [-0.010861179893635291]
step  19 :  [-0.04897777728607928]
step  20 :  [-0.04768828650218468]
step  21 :  [-0.014796011688120099]
step  22 :  [-0.030923371480192512]
step  23 :  [-0.0028310415938004657]
step  24 :  [-0.03259657804926167]
episode  174 : steps 25 , return [-14.68]
step  0 :  [-1.5307197951788603]
step  1 :  [-1.4939360856721209]
step  2 :  [-1.452002676505647]
step  3 :  [-1.413061274987774]
step  4 :  [-1.342734239496302]
step  5 :  [-1.2444871474307704]
step  6 :  [-1.1399590714329577]
step  7 :  [-1.0143572770695473]
step  8 :  [-0.8720846610705569]
step  9 :  [-0.7170959738752314]
step  10 :  [-0.553004870603199]
step  11 :  [-0.3839049052865572]
step  12 :  [-0.21891859938015976]
step  13 :  [-0.0871327400643214]
step  14 :  [-0.038511713551227095]
step  15 :  [-0.02063142946212133]
step  16 :  [-0.020989920528821947]
step  17 :  [-0.045732511265983704]
step  18 :  [-0.03500363882568229]
step  19 :  [-0.05986212692550267]
step  20 :  [-0.11450901291897604]
step  21 :  [-0.1204540824024931]
step  22 :  [-0.10841991791684316]
step  23 :  [-0.07157689980514895]
step  24 :  [-0.038415841579226284]
episode  175 : steps 25 , return [-14.14]
step  0 :  [-1.6901056586623777]
step  1 :  [-1.6639244760687062]
step  2 :  [-1.635876852421288]
step  3 :  [-1.570593004480701]
step  4 :  [-1.4745174822116869]
step  5 :  [-1.3539684927752123]
step  6 :  [-1.2143692590171176]
step  7 :  [-1.060119978116489]
step  8 :  [-0.8946886169948826]
step  9 :  [-0.7207659940635185]
step  10 :  [-0.5404214573520968]
step  11 :  [-0.35524664679913515]
step  12 :  [-0.16653642242526925]
step  13 :  [-0.07499507714544372]
step  14 :  [-0.008617348923831977]
step  15 :  [-0.005598641522570826]
step  16 :  [-0.051799073977591883]
step  17 :  [-0.03772861031024415]
step  18 :  [-0.0771475348704079]
step  19 :  [-0.05674173855825646]
step  20 :  [-0.06548248473209704]
step  21 :  [-0.04834235646184228]
step  22 :  [-0.0767820468602756]
step  23 :  [-0.05651610536692134]
step  24 :  [-0.019732701804242195]
episode  176 : steps 25 , return [-14.92]
step  0 :  [-1.5451268344757343]
step  1 :  [-1.5077452310629196]
step  2 :  [-1.4649160132338934]
step  3 :  [-1.4247580799755466]
step  4 :  [-1.3535067670734258]
step  5 :  [-1.25454762174943]
step  6 :  [-1.1558784779810616]
step  7 :  [-1.0346254194842865]
step  8 :  [-0.8954990553996536]
step  9 :  [-0.7426346255811249]
step  10 :  [-0.5796680288116067]
step  11 :  [-0.41028157780318586]
step  12 :  [-0.24095965555618262]
step  13 :  [-0.10217853772105158]
step  14 :  [-0.042817209397262745]
step  15 :  [-0.053682707549718225]
step  16 :  [-0.07156004321773937]
step  17 :  [-0.04212762769770644]
step  18 :  [-0.014419076713017646]
step  19 :  [-0.01787503754852922]
step  20 :  [-0.044165722453877176]
step  21 :  [-0.045118808876368204]
step  22 :  [-0.0660051366630133]
step  23 :  [-0.06359733467688052]
step  24 :  [-0.08562500242840376]
episode  177 : steps 25 , return [-14.26]
step  0 :  [-1.7775412709505276]
step  1 :  [-1.745272564463535]
step  2 :  [-1.7085804297458422]
step  3 :  [-1.674484530900675]
step  4 :  [-1.6064698551304124]
step  5 :  [-1.5093167275884487]
step  6 :  [-1.3885080641909486]
step  7 :  [-1.2490459626210835]
step  8 :  [-1.0951207725121348]
step  9 :  [-0.9301046535731459]
step  10 :  [-0.7566605043181367]
step  11 :  [-0.5768918091917026]
step  12 :  [-0.39255114116817624]
step  13 :  [-0.20571812667398798]
step  14 :  [-0.06232465863365724]
step  15 :  [-0.04413555959271381]
step  16 :  [-0.04135088751384835]
step  17 :  [-0.018474166077807896]
step  18 :  [-0.047526066041067426]
step  19 :  [-0.049836609016093915]
step  20 :  [-0.044985578343497104]
step  21 :  [-0.04038996372119139]
step  22 :  [-0.018436937738887486]
step  23 :  [-0.054521964431327674]
step  24 :  [-0.07746268247287581]
episode  178 : steps 25 , return [-17.12]
step  0 :  [-1.7225954323504082]
step  1 :  [-1.690227994838482]
step  2 :  [-1.6535979728286585]
step  3 :  [-1.6198940794278112]
step  4 :  [-1.5523717998727804]
step  5 :  [-1.4556976430038175]
step  6 :  [-1.3353249337418784]
step  7 :  [-1.1962580863792573]
step  8 :  [-1.0427040724033962]
step  9 :  [-0.8780634776276558]
step  10 :  [-0.70504952592872]
step  11 :  [-0.5258783824816916]
step  12 :  [-0.3426637944588597]
step  13 :  [-0.15973623049871236]
step  14 :  [-0.08288932600581657]
step  15 :  [-0.015121226635213512]
step  16 :  [-0.024642209359257185]
step  17 :  [-0.0119643364742634]
step  18 :  [-0.06583883067646898]
step  19 :  [-0.06109093901242877]
step  20 :  [-0.04224654538105397]
step  21 :  [-0.03803027439220768]
step  22 :  [-0.035621402034080714]
step  23 :  [-0.061749763021462414]
step  24 :  [-0.09279955143072341]
episode  179 : steps 25 , return [-16.41]
step  0 :  [-1.6816030425141781]
step  1 :  [-1.6400873470156967]
step  2 :  [-1.590957199985788]
step  3 :  [-1.5420582373246325]
step  4 :  [-1.5003792687052504]
step  5 :  [-1.4293089134113894]
step  6 :  [-1.3312865886043421]
step  7 :  [-1.210681209652963]
step  8 :  [-1.0719772786842117]
step  9 :  [-0.9191598069851078]
step  10 :  [-0.7556011567160137]
step  11 :  [-0.5842040295134132]
step  12 :  [-0.4079051771277986]
step  13 :  [-0.23212526656202387]
step  14 :  [-0.08855133587910541]
step  15 :  [-0.026259143097434545]
step  16 :  [-0.041690310899822065]
step  17 :  [-0.047990060992190144]
step  18 :  [-0.024683425274791025]
step  19 :  [-0.018813430799413392]
step  20 :  [-0.016834536126321034]
step  21 :  [-0.03672057759442499]
step  22 :  [-0.0357237843173868]
step  23 :  [-0.05068858016779996]
step  24 :  [-0.04697609436921843]
episode  180 : steps 25 , return [-16.33]
step  0 :  [-1.4940632080973577]
step  1 :  [-1.4648886174424909]
step  2 :  [-1.4336356132422434]
step  3 :  [-1.3667467892850977]
step  4 :  [-1.2698393274674944]
step  5 :  [-1.167220291734438]
step  6 :  [-1.042285312451081]
step  7 :  [-0.9008003419410388]
step  8 :  [-0.7464409279587568]
step  9 :  [-0.5825876753783577]
step  10 :  [-0.41283400833403616]
step  11 :  [-0.2438733049479491]
step  12 :  [-0.10584237919728069]
step  13 :  [-0.04710667910660972]
step  14 :  [-0.04801005815955858]
step  15 :  [-0.07004892071187177]
step  16 :  [-0.06911412666315352]
step  17 :  [-0.04268753619787188]
step  18 :  [-0.014625203130667772]
step  19 :  [-0.05211237978789699]
step  20 :  [-0.043164476108850075]
step  21 :  [-0.07093376367039914]
step  22 :  [-0.06173233811409573]
step  23 :  [-0.013380251390698183]
step  24 :  [-0.03126024948573316]
episode  181 : steps 25 , return [-12.8]
step  0 :  [-1.5055290780215436]
step  1 :  [-1.4937041609291073]
step  2 :  [-1.4690143219106666]
step  3 :  [-1.4412129276703227]
step  4 :  [-1.3800763337355675]
step  5 :  [-1.2890177165504986]
step  6 :  [-1.2053707027679186]
step  7 :  [-1.12336783863539]
step  8 :  [-1.0174836034573562]
step  9 :  [-0.8920408846406004]
step  10 :  [-0.7516397595317199]
step  11 :  [-0.6010149411899545]
step  12 :  [-0.4461249504889682]
step  13 :  [-0.2991382477130387]
step  14 :  [-0.17889027094862242]
step  15 :  [-0.06738409609721771]
step  16 :  [-0.09051630702384941]
step  17 :  [-0.09160899895846891]
step  18 :  [-0.07896536409523458]
step  19 :  [-0.052865673285576564]
step  20 :  [-0.022568337560956497]
step  21 :  [-0.02258325672386382]
step  22 :  [-0.011409570624712524]
step  23 :  [-0.07058409910260773]
step  24 :  [-0.10491372590554224]
episode  182 : steps 25 , return [-15.71]
step  0 :  [-1.5003728151133477]
step  1 :  [-1.4874189184664546]
step  2 :  [-1.4620878313894008]
step  3 :  [-1.4340689217304863]
step  4 :  [-1.3727181270091442]
step  5 :  [-1.2814744102349354]
step  6 :  [-1.2010167960387477]
step  7 :  [-1.1121525172704076]
step  8 :  [-1.000712970496268]
step  9 :  [-0.8709449923183034]
step  10 :  [-0.7273094789189383]
step  11 :  [-0.5744942042113084]
step  12 :  [-0.4188050049303789]
step  13 :  [-0.2746361747115356]
step  14 :  [-0.16090891927212655]
step  15 :  [-0.11780308705326864]
step  16 :  [-0.0470902404265807]
step  17 :  [-0.010875625817776046]
step  18 :  [-0.023496627613071787]
step  19 :  [-0.08613168703334191]
step  20 :  [-0.08366086776793503]
step  21 :  [-0.0357183295729662]
step  22 :  [-0.028576889455089596]
step  23 :  [-0.04104515329443631]
step  24 :  [-0.011455328268270955]
episode  183 : steps 25 , return [-15.36]
step  0 :  [-1.7330757090600226]
step  1 :  [-1.6943248913028368]
step  2 :  [-1.6488535986935389]
step  3 :  [-1.6042027717896374]
step  4 :  [-1.567013177966991]
step  5 :  [-1.4988393617404454]
step  6 :  [-1.4028089042455438]
step  7 :  [-1.2836720415686738]
step  8 :  [-1.146140614262732]
step  9 :  [-0.9943527511330594]
step  10 :  [-0.8318061739886671]
step  11 :  [-0.661534666865046]
step  12 :  [-0.48661634613333965]
step  13 :  [-0.31208703745403843]
step  14 :  [-0.16816885554671845]
step  15 :  [-0.10616193892320686]
step  16 :  [-0.08849973054091029]
step  17 :  [-0.04609644431499612]
step  18 :  [-0.056354684490684426]
step  19 :  [-0.0888050926874637]
step  20 :  [-0.08305510185449091]
step  21 :  [-0.04370614696501458]
step  22 :  [-0.04799016985992115]
step  23 :  [-0.08405683760216688]
step  24 :  [-0.08802373877840572]
episode  184 : steps 25 , return [-17.77]
step  0 :  [-1.5528312889984999]
step  1 :  [-1.5133844344278973]
step  2 :  [-1.4676473003955117]
step  3 :  [-1.4238227883337153]
step  4 :  [-1.3499907371513915]
step  5 :  [-1.2491666360179996]
step  6 :  [-1.1798599960692773]
step  7 :  [-1.0853516905777285]
step  8 :  [-0.9692010892866134]
step  9 :  [-0.8358091642051187]
step  10 :  [-0.6897013221150246]
step  11 :  [-0.5358246181273165]
step  12 :  [-0.3816436920526774]
step  13 :  [-0.24695685237736298]
step  14 :  [-0.15151921691247272]
step  15 :  [-0.12345931233893385]
step  16 :  [-0.10062950685474496]
step  17 :  [-0.03417101067711842]
step  18 :  [-0.034496828012564984]
step  19 :  [-0.06664600434006014]
step  20 :  [-0.05948409818888414]
step  21 :  [-0.043799683020608896]
step  22 :  [-0.03638631333552583]
step  23 :  [-0.08296100034364257]
step  24 :  [-0.06891388040282462]
episode  185 : steps 25 , return [-15.28]
step  0 :  [-1.559624836061436]
step  1 :  [-1.5346811912975868]
step  2 :  [-1.508887175499834]
step  3 :  [-1.4455697069500362]
step  4 :  [-1.3511237269569143]
step  5 :  [-1.231913127711503]
step  6 :  [-1.093427613697617]
step  7 :  [-0.9401363383487372]
step  8 :  [-0.7755840362872314]
step  9 :  [-0.6025695618207558]
step  10 :  [-0.42339391480446836]
step  11 :  [-0.2405215015683549]
step  12 :  [-0.09867038809594685]
step  13 :  [-0.057856372317285396]
step  14 :  [-0.012085071850349445]
step  15 :  [-0.049837447173194736]
step  16 :  [-0.051576073632611984]
step  17 :  [-0.017007254525666617]
step  18 :  [-0.031265843594972]
step  19 :  [-0.02757800132430178]
step  20 :  [-0.014832515047996828]
step  21 :  [-0.0284628502402136]
step  22 :  [-0.0342581772679057]
step  23 :  [-0.04399878918065049]
step  24 :  [-0.02039054504071251]
episode  186 : steps 25 , return [-13.2]
step  0 :  [-1.6102166115252654]
step  1 :  [-1.5786373953331359]
step  2 :  [-1.5435389536559392]
step  3 :  [-1.4736794731430785]
step  4 :  [-1.4152265552545564]
step  5 :  [-1.3269719690243116]
step  6 :  [-1.2138403465053602]
step  7 :  [-1.0808437007822458]
step  8 :  [-0.9324091939932815]
step  9 :  [-0.7722712865888617]
step  10 :  [-0.6036435753729168]
step  11 :  [-0.4297714143265487]
step  12 :  [-0.25636091584339776]
step  13 :  [-0.11390609898976893]
step  14 :  [-0.05223138753667251]
step  15 :  [-0.051020062115908996]
step  16 :  [-0.03134187102864573]
step  17 :  [-0.004319595314442169]
step  18 :  [-0.03981888225582929]
step  19 :  [-0.05709836909637062]
step  20 :  [-0.11393877607342313]
step  21 :  [-0.1284897563101991]
step  22 :  [-0.10973013405696064]
step  23 :  [-0.10379453402251303]
step  24 :  [-0.05488532088838696]
episode  187 : steps 25 , return [-15.1]
step  0 :  [-1.6821401802069136]
step  1 :  [-1.645322804493414]
step  2 :  [-1.6027124778295223]
step  3 :  [-1.5619023477809901]
step  4 :  [-1.4895753966101437]
step  5 :  [-1.3895185927283304]
step  6 :  [-1.2666708035383256]
step  7 :  [-1.136863651683062]
step  8 :  [-0.9896062415823491]
step  9 :  [-0.8304790017733259]
step  10 :  [-0.6621634483342375]
step  11 :  [-0.48707213758109374]
step  12 :  [-0.3079164669332339]
step  13 :  [-0.1677854920508533]
step  14 :  [-0.07344950471612159]
step  15 :  [-0.011940472812088253]
step  16 :  [-0.0310878230279735]
step  17 :  [-0.026174528965422165]
step  18 :  [-0.0851076770656839]
step  19 :  [-0.08499812805527869]
step  20 :  [-0.06421122961058133]
step  21 :  [-0.06695903621353214]
step  22 :  [-0.05034887340163168]
step  23 :  [-0.0642322074408568]
step  24 :  [-0.07786057555703324]
episode  188 : steps 25 , return [-15.86]
step  0 :  [-1.5588967659518909]
step  1 :  [-1.530991348659224]
step  2 :  [-1.5011599398570514]
step  3 :  [-1.435033054193093]
step  4 :  [-1.338555953883996]
step  5 :  [-1.217820263272404]
step  6 :  [-1.0851027486250422]
step  7 :  [-0.9367069466474011]
step  8 :  [-0.7761664106928814]
step  9 :  [-0.6063882782238874]
step  10 :  [-0.42983490640258576]
step  11 :  [-0.24920161340360278]
step  12 :  [-0.10866082300108632]
step  13 :  [-0.020035161984625047]
step  14 :  [-0.04009595681638217]
step  15 :  [-0.04221780208923007]
step  16 :  [-0.03517528323970516]
step  17 :  [-0.01986679422161604]
step  18 :  [-0.018740067335600276]
step  19 :  [-0.039683981462637394]
step  20 :  [-0.05189902771897239]
step  21 :  [-0.027236137255911976]
step  22 :  [-0.018806390854793416]
step  23 :  [-0.0354976218936793]
step  24 :  [-0.02656094723862043]
episode  189 : steps 25 , return [-13.15]
step  0 :  [-1.422171007226764]
step  1 :  [-1.389824448765635]
step  2 :  [-1.354586014529434]
step  3 :  [-1.2852439309347734]
step  4 :  [-1.2303389360082124]
step  5 :  [-1.198606132636305]
step  6 :  [-1.1322345361442874]
step  7 :  [-1.0358253824043873]
step  8 :  [-0.9159436602633781]
step  9 :  [-0.778349831534952]
step  10 :  [-0.6281507274660176]
step  11 :  [-0.4706463098223889]
step  12 :  [-0.314505989116483]
step  13 :  [-0.18313704435454384]
step  14 :  [-0.056408560137967426]
step  15 :  [-0.039751184729585824]
step  16 :  [-0.04020140972178762]
step  17 :  [-0.01666387174908227]
step  18 :  [-0.07404121906888839]
step  19 :  [-0.08282578701848729]
step  20 :  [-0.05098999311893965]
step  21 :  [-0.07074532692015355]
step  22 :  [-0.0887004313707723]
step  23 :  [-0.053615721375954446]
step  24 :  [-0.07666287609751757]
episode  190 : steps 25 , return [-13.99]
step  0 :  [-1.4565848860687651]
step  1 :  [-1.4296616621547846]
step  2 :  [-1.4016898602452326]
step  3 :  [-1.3372116526537894]
step  4 :  [-1.2421106593831894]
step  5 :  [-1.1253167738287906]
step  6 :  [-0.9889190020384049]
step  7 :  [-0.8373914205118361]
step  8 :  [-0.6743567578011447]
step  9 :  [-0.5027721063715256]
step  10 :  [-0.32537396949153335]
step  11 :  [-0.1474116827906216]
step  12 :  [-0.07668829129587011]
step  13 :  [-0.021159289667273148]
step  14 :  [-0.025600452019652664]
step  15 :  [-0.01646144004795701]
step  16 :  [-0.06963551919028267]
step  17 :  [-0.10367147319024733]
step  18 :  [-0.0900707053218316]
step  19 :  [-0.06519283636221748]
step  20 :  [-0.06417031294510384]
step  21 :  [-0.04360825899799351]
step  22 :  [-0.051045172709564116]
step  23 :  [-0.03152902863333728]
step  24 :  [-0.027317614650951356]
episode  191 : steps 25 , return [-12.15]
step  0 :  [-1.6093373518112672]
step  1 :  [-1.5698110954474092]
step  2 :  [-1.5237265847989412]
step  3 :  [-1.4790775262931204]
step  4 :  [-1.4044174314543685]
step  5 :  [-1.302880284378173]
step  6 :  [-1.1982938930056513]
step  7 :  [-1.099069328233351]
step  8 :  [-0.9811428224426663]
step  9 :  [-0.8475734208219096]
step  10 :  [-0.7022504500100955]
step  11 :  [-0.5499165100208555]
step  12 :  [-0.39814818827875664]
step  13 :  [-0.26648414834783024]
step  14 :  [-0.171050403068658]
step  15 :  [-0.10938145040508825]
step  16 :  [-0.09384956294781598]
step  17 :  [-0.05824423031554585]
step  18 :  [-0.05457486701107718]
step  19 :  [-0.023871929512610537]
step  20 :  [-0.005226858150734921]
step  21 :  [-0.03301711076201008]
step  22 :  [-0.015559759512147059]
step  23 :  [-0.03307869752447608]
step  24 :  [-0.026480605321458694]
episode  192 : steps 25 , return [-15.56]
step  0 :  [-1.4364152081829586]
step  1 :  [-1.414431738251904]
step  2 :  [-1.3858696516377502]
step  3 :  [-1.3596788404180082]
step  4 :  [-1.299262222312337]
step  5 :  [-1.2086895286439479]
step  6 :  [-1.0934329984769495]
step  7 :  [-0.9587213689036224]
step  8 :  [-0.8090813290329758]
step  9 :  [-0.6483741874337617]
step  10 :  [-0.4802046160792217]
step  11 :  [-0.30947672315098185]
step  12 :  [-0.1694873436802745]
step  13 :  [-0.09776992290505239]
step  14 :  [-0.04685698254328346]
step  15 :  [-0.02959930302260266]
step  16 :  [-0.021172949536053764]
step  17 :  [-0.0175340789113208]
step  18 :  [-0.050915140075896564]
step  19 :  [-0.07228199718815559]
step  20 :  [-0.061794902420210344]
step  21 :  [-0.027800122423262484]
step  22 :  [-0.04891873965638762]
step  23 :  [-0.02261812184351909]
step  24 :  [-0.053411505541390694]
episode  193 : steps 25 , return [-13.12]
step  0 :  [-1.4079434122046033]
step  1 :  [-1.378633572369654]
step  2 :  [-1.3476610599585288]
step  3 :  [-1.2812853946517735]
step  4 :  [-1.216509318030622]
step  5 :  [-1.134070185547686]
step  6 :  [-1.025778275748485]
step  7 :  [-0.897049603643412]
step  8 :  [-0.7528036547349494]
step  9 :  [-0.5975470681467512]
step  10 :  [-0.43624754364659235]
step  11 :  [-0.2782161781768828]
step  12 :  [-0.14757388837556212]
step  13 :  [-0.09231119044884757]
step  14 :  [-0.08580757017765427]
step  15 :  [-0.04480815510947072]
step  16 :  [-0.022631740757967395]
step  17 :  [-0.028187427147292186]
step  18 :  [-0.06284124219545553]
step  19 :  [-0.07055845863454827]
step  20 :  [-0.07444073389921455]
step  21 :  [-0.08123946788837509]
step  22 :  [-0.03723381871526066]
step  23 :  [-0.05429640153659995]
step  24 :  [-0.08615182346557569]
episode  194 : steps 25 , return [-12.64]
step  0 :  [-1.744985721149249]
step  1 :  [-1.7039826857954155]
step  2 :  [-1.6553456758639349]
step  3 :  [-1.6066967755721417]
step  4 :  [-1.5647810113005782]
step  5 :  [-1.4931794097291793]
step  6 :  [-1.3945555412772492]
step  7 :  [-1.2733485483862057]
step  8 :  [-1.1340474629605604]
step  9 :  [-0.9806043003020338]
step  10 :  [-0.8163151789514864]
step  11 :  [-0.6439085816464689]
step  12 :  [-0.46581275131030725]
step  13 :  [-0.28510754843708913]
step  14 :  [-0.14093104279624796]
step  15 :  [-0.05420851021106629]
step  16 :  [-0.055971363212744984]
step  17 :  [-0.021382961569409678]
step  18 :  [-0.0472227792868643]
step  19 :  [-0.041630811905418785]
step  20 :  [-0.056788760205132176]
step  21 :  [-0.05741201036801091]
step  22 :  [-0.0652696730337959]
step  23 :  [-0.06665433569382889]
step  24 :  [-0.038125291866784136]
episode  195 : steps 25 , return [-17.41]
step  0 :  [-1.473247524383536]
step  1 :  [-1.4417739082063248]
step  2 :  [-1.4074665870521843]
step  3 :  [-1.3385672814623497]
step  4 :  [-1.2402941906241107]
step  5 :  [-1.1753481137286033]
step  6 :  [-1.0828271017288122]
step  7 :  [-0.9680688250169033]
step  8 :  [-0.8356224567106948]
step  9 :  [-0.690100241169817]
step  10 :  [-0.5364644016183803]
step  11 :  [-0.3820531435667288]
step  12 :  [-0.24612427239104256]
step  13 :  [-0.1488416115921602]
step  14 :  [-0.09890115748466104]
step  15 :  [-0.09834840264643561]
step  16 :  [-0.07594418694003117]
step  17 :  [-0.04792092896813489]
step  18 :  [-0.023592494673305785]
step  19 :  [-0.023699854505847936]
step  20 :  [-0.045514320925239146]
step  21 :  [-0.031839112758612786]
step  22 :  [-0.02698612661557173]
step  23 :  [-0.013477106643222115]
step  24 :  [-0.047285841321965984]
episode  196 : steps 25 , return [-13.5]
step  0 :  [-1.6238266817672042]
step  1 :  [-1.5908651870304602]
step  2 :  [-1.553807714510765]
step  3 :  [-1.5202057073295001]
step  4 :  [-1.4531861948232532]
step  5 :  [-1.3571241997777572]
step  6 :  [-1.2373754899454994]
step  7 :  [-1.0989272477518366]
step  8 :  [-0.9460112097858994]
step  9 :  [-0.7820935015786933]
step  10 :  [-0.6100349684094423]
step  11 :  [-0.43246009718746836]
step  12 :  [-0.25319470191540977]
step  13 :  [-0.10819531996334775]
step  14 :  [-0.05070990450512049]
step  15 :  [-0.024297442171284312]
step  16 :  [-0.02198604434959035]
step  17 :  [-0.04720945396219351]
step  18 :  [-0.04078957755186536]
step  19 :  [-0.015146113807993427]
step  20 :  [-0.043692828494336484]
step  21 :  [-0.046888493392086804]
step  22 :  [-0.032030504365506036]
step  23 :  [-0.06039964198441728]
step  24 :  [-0.06589612103068017]
episode  197 : steps 25 , return [-15.02]
step  0 :  [-1.7969720045710658]
step  1 :  [-1.7616518476366443]
step  2 :  [-1.7207009268749673]
step  3 :  [-1.6812764113787018]
step  4 :  [-1.609469146667995]
step  5 :  [-1.5095548494396605]
step  6 :  [-1.3866908834370966]
step  7 :  [-1.2456662745999099]
step  8 :  [-1.0964656617055804]
step  9 :  [-0.9350396017418603]
step  10 :  [-0.7643278475489634]
step  11 :  [-0.5865056131323431]
step  12 :  [-0.4032693739738207]
step  13 :  [-0.2159361932747373]
step  14 :  [-0.08851174433072141]
step  15 :  [-0.08052656854454042]
step  16 :  [-0.05594630935060345]
step  17 :  [-0.0322741876981924]
step  18 :  [-0.06854868012764823]
step  19 :  [-0.049439518866075366]
step  20 :  [-0.04035077257478041]
step  21 :  [-0.01876668345535344]
step  22 :  [-0.0706056562500569]
step  23 :  [-0.08589092276313304]
step  24 :  [-0.05582033957862315]
episode  198 : steps 25 , return [-17.36]
step  0 :  [-1.4833017432317988]
step  1 :  [-1.4446535959257385]
step  2 :  [-1.3996498493835712]
step  3 :  [-1.3567544307056432]
step  4 :  [-1.2840079881694961]
step  5 :  [-1.2285751428071505]
step  6 :  [-1.1848038634108446]
step  7 :  [-1.1072996272613835]
step  8 :  [-1.0024758073238482]
step  9 :  [-0.8764661192913771]
step  10 :  [-0.7347220317741329]
step  11 :  [-0.5823355955494273]
step  12 :  [-0.4253752188609219]
step  13 :  [-0.2764377948775614]
step  14 :  [-0.155341871685296]
step  15 :  [-0.10616557326075246]
step  16 :  [-0.02795148004176037]
step  17 :  [-0.038565940495142705]
step  18 :  [-0.02034734303370405]
step  19 :  [-0.03481676098036343]
step  20 :  [-0.01607177771172185]
step  21 :  [-0.04084287939832345]
step  22 :  [-0.043757102015054256]
step  23 :  [-0.05992984866014384]
step  24 :  [-0.06465636267470183]
episode  199 : steps 25 , return [-15.]
step  0 :  [-1.4642612843596252]
step  1 :  [-1.431870371365776]
step  2 :  [-1.3963445336309537]
step  3 :  [-1.3266540667019289]
step  4 :  [-1.2331884173537138]
step  5 :  [-1.1865867987933834]
step  6 :  [-1.1131007844664182]
step  7 :  [-1.0135104077030284]
step  8 :  [-0.8928980374661172]
step  9 :  [-0.7564451517676207]
step  10 :  [-0.6094090851782339]
step  11 :  [-0.458371553197871]
step  12 :  [-0.31634207560776273]
step  13 :  [-0.1991717173210902]
step  14 :  [-0.08823057540216858]
step  15 :  [-0.1002034441108514]
step  16 :  [-0.09923508601683781]
step  17 :  [-0.07179133363945059]
step  18 :  [-0.07493855481835505]
step  19 :  [-0.06254752042984389]
step  20 :  [-0.06389890397398965]
step  21 :  [-0.03737314772339417]
step  22 :  [-0.05244210261311574]
step  23 :  [-0.03003265157774698]
step  24 :  [-0.02758908815826735]
episode  200 : steps 25 , return [-14.11]
step  0 :  [-1.502599148481336]
step  1 :  [-1.491999186694899]
step  2 :  [-1.468461558353171]
step  3 :  [-1.4417716121776134]
step  4 :  [-1.3814482642229142]
step  5 :  [-1.2909841292555704]
step  6 :  [-1.2038702990701833]
step  7 :  [-1.1145541752399213]
step  8 :  [-1.002882267788183]
step  9 :  [-0.8729766384620761]
step  10 :  [-0.7292222274879521]
step  11 :  [-0.5762394621094703]
step  12 :  [-0.4202182260166961]
step  13 :  [-0.2752073097715389]
step  14 :  [-0.1604302807499544]
step  15 :  [-0.06809639065984589]
step  16 :  [-0.04967041955433065]
step  17 :  [-0.06939343246484227]
step  18 :  [-0.08890494429011606]
step  19 :  [-0.09474053912567218]
step  20 :  [-0.051454471303605295]
step  21 :  [-0.020208015694325256]
step  22 :  [-0.039055594160467624]
step  23 :  [-0.030303337811492647]
step  24 :  [-0.01712374240023472]
episode  201 : steps 25 , return [-15.46]
step  0 :  [-1.5361538497812974]
step  1 :  [-1.5095629866772222]
step  2 :  [-1.481636448427624]
step  3 :  [-1.416904911114086]
step  4 :  [-1.321467757155245]
step  5 :  [-1.2015239570025722]
step  6 :  [-1.062465753523266]
step  7 :  [-0.9086899916045815]
step  8 :  [-0.7436813383449773]
step  9 :  [-0.5701625050119719]
step  10 :  [-0.3902776965917774]
step  11 :  [-0.205937653252848]
step  12 :  [-0.07137837689863033]
step  13 :  [-0.059949735772528996]
step  14 :  [-0.08594183934094579]
step  15 :  [-0.059050286896149336]
step  16 :  [-0.0887262942433697]
step  17 :  [-0.0764223268639467]
step  18 :  [-0.01969790706168894]
step  19 :  [-0.04312123315702526]
step  20 :  [-0.0666912095071235]
step  21 :  [-0.04007210144061646]
step  22 :  [-0.03708370142404196]
step  23 :  [-0.0439402716868343]
step  24 :  [-0.04059276590092284]
episode  202 : steps 25 , return [-13.08]
step  0 :  [-1.4410461257984208]
step  1 :  [-1.4114515314979883]
step  2 :  [-1.379901707230724]
step  3 :  [-1.3130001801675983]
step  4 :  [-1.223739812740022]
step  5 :  [-1.1352325088188238]
step  6 :  [-1.0227108749832536]
step  7 :  [-0.8909710308310168]
step  8 :  [-0.744529485857369]
step  9 :  [-0.5876232136781228]
step  10 :  [-0.4250548053832234]
step  11 :  [-0.26629633951603454]
step  12 :  [-0.1361823370259198]
step  13 :  [-0.08196383768922846]
step  14 :  [-0.07398436497400947]
step  15 :  [-0.034930553352360345]
step  16 :  [-0.040243375387536244]
step  17 :  [-0.009779600767845417]
step  18 :  [-0.02363496433265941]
step  19 :  [-0.06302152544772158]
step  20 :  [-0.08165483377592522]
step  21 :  [-0.06147493198873528]
step  22 :  [-0.038680223406698695]
step  23 :  [-0.07933144348402281]
step  24 :  [-0.10155539651434818]
episode  203 : steps 25 , return [-12.67]
step  0 :  [-1.4336462422153482]
step  1 :  [-1.4041814087184568]
step  2 :  [-1.3728506938979814]
step  3 :  [-1.3061279422316354]
step  4 :  [-1.22232270162499]
step  5 :  [-1.1345151343067772]
step  6 :  [-1.0224153922345047]
step  7 :  [-0.8909372556975166]
step  8 :  [-0.7446643321023529]
step  9 :  [-0.587874224741692]
step  10 :  [-0.4253978119184882]
step  11 :  [-0.2667315113119365]
step  12 :  [-0.13660472253320735]
step  13 :  [-0.08230340897173938]
step  14 :  [-0.07425587518619908]
step  15 :  [-0.03511367951321385]
step  16 :  [-0.04046338879302612]
step  17 :  [-0.00976606964129448]
step  18 :  [-0.026468513546850855]
step  19 :  [-0.0043348097218960805]
step  20 :  [-0.07650337510803416]
step  21 :  [-0.08115457375300862]
step  22 :  [-0.09253589264951916]
step  23 :  [-0.08318615552322425]
step  24 :  [-0.051697596649403287]
episode  204 : steps 25 , return [-12.61]
step  0 :  [-1.8641190250065611]
step  1 :  [-1.8248800433912378]
step  2 :  [-1.778311930896346]
step  3 :  [-1.73161443640975]
step  4 :  [-1.6910768112881571]
step  5 :  [-1.619846460386967]
step  6 :  [-1.5211563769100958]
step  7 :  [-1.3996909275128206]
step  8 :  [-1.2600389073768066]
step  9 :  [-1.1061793028909261]
step  10 :  [-0.941384460216274]
step  11 :  [-0.7682893689809944]
step  12 :  [-0.5890417140229107]
step  13 :  [-0.40559211530011685]
step  14 :  [-0.2209124031355906]
step  15 :  [-0.07347928780908401]
step  16 :  [-0.028323214719909794]
step  17 :  [-0.02559270802663306]
step  18 :  [-0.06367771960882627]
step  19 :  [-0.05992654556193622]
step  20 :  [-0.02179507633991582]
step  21 :  [-0.046568341317003256]
step  22 :  [-0.03300116398545668]
step  23 :  [-0.013164249436285642]
step  24 :  [-0.013505866192005708]
episode  205 : steps 25 , return [-19.1]
step  0 :  [-1.6467556434769797]
step  1 :  [-1.6124456659570614]
step  2 :  [-1.5734360753581837]
step  3 :  [-1.5372861056695166]
step  4 :  [-1.4683619512716461]
step  5 :  [-1.3708359070840264]
step  6 :  [-1.2499149782457983]
step  7 :  [-1.1104737091048487]
step  8 :  [-0.9566463166803134]
step  9 :  [-0.7917900653515503]
step  10 :  [-0.6185925887439145]
step  11 :  [-0.4392705963368236]
step  12 :  [-0.2561146551807778]
step  13 :  [-0.11491658908043102]
step  14 :  [-0.07139518686836861]
step  15 :  [-0.02315220157154636]
step  16 :  [-0.04293846885270826]
step  17 :  [-0.036059700998721245]
step  18 :  [-0.06672551007537011]
step  19 :  [-0.06501524618857665]
step  20 :  [-0.023058433988921375]
step  21 :  [-0.030673165034533087]
step  22 :  [-0.030900471263131828]
step  23 :  [-0.04912758881460004]
step  24 :  [-0.028273941838694736]
episode  206 : steps 25 , return [-15.21]
step  0 :  [-1.7041926785133528]
step  1 :  [-1.6777475512997408]
step  2 :  [-1.6492847238278447]
step  3 :  [-1.5836758832177324]
step  4 :  [-1.4873508012759626]
step  5 :  [-1.3666117978214098]
step  6 :  [-1.2268693823782117]
step  7 :  [-1.0725307844387206]
step  8 :  [-0.9070392180774396]
step  9 :  [-0.7330853232968355]
step  10 :  [-0.5527466756794901]
step  11 :  [-0.367648820235958]
step  12 :  [-0.17927260653155372]
step  13 :  [-0.08822352250935038]
step  14 :  [-0.06921320624854929]
step  15 :  [-0.013361113836599067]
step  16 :  [-0.01213232272523945]
step  17 :  [-0.057680299328009534]
step  18 :  [-0.04627365560826745]
step  19 :  [-0.03772898855862322]
step  20 :  [-0.05309818735383275]
step  21 :  [-0.04063057876437161]
step  22 :  [-0.07569615381775507]
step  23 :  [-0.05658014449324484]
step  24 :  [-0.0903728759169759]
episode  207 : steps 25 , return [-15.15]
step  0 :  [-1.6849800184113537]
step  1 :  [-1.6590115158275889]
step  2 :  [-1.6312739577241417]
step  3 :  [-1.5662188963965544]
step  4 :  [-1.4703134086232104]
step  5 :  [-1.3498918534237005]
step  6 :  [-1.21038858279443]
step  7 :  [-1.0562108805753117]
step  8 :  [-0.8908320164455498]
step  9 :  [-0.7169450920485254]
step  10 :  [-0.536618142713974]
step  11 :  [-0.35143157424518395]
step  12 :  [-0.16260714327261053]
step  13 :  [-0.070926851530206]
step  14 :  [-0.05212029227408719]
step  15 :  [-0.06145602474849096]
step  16 :  [-0.04353014333658164]
step  17 :  [-0.03010512552774086]
step  18 :  [-0.06600600607386954]
step  19 :  [-0.046851077061802915]
step  20 :  [-0.0645283407612783]
step  21 :  [-0.09546721357509623]
step  22 :  [-0.1000113547008869]
step  23 :  [-0.07624664003564802]
step  24 :  [-0.03640753441829161]
episode  208 : steps 25 , return [-15.03]
step  0 :  [-1.5762397151337064]
step  1 :  [-1.5430670690264514]
step  2 :  [-1.5059238407038344]
step  3 :  [-1.4725477966214582]
step  4 :  [-1.4059187313650474]
step  5 :  [-1.3102789544841096]
step  6 :  [-1.190947831063449]
step  7 :  [-1.052916543023518]
step  8 :  [-0.9004458197125411]
step  9 :  [-0.7370643612322301]
step  10 :  [-0.5657787447797601]
step  11 :  [-0.38965986556978]
step  12 :  [-0.21478226404424489]
step  13 :  [-0.07223545064896551]
step  14 :  [-0.011222880624153522]
step  15 :  [-0.019755735974450427]
step  16 :  [-0.028264044048282522]
step  17 :  [-0.02769508896046366]
step  18 :  [-0.038466679452481]
step  19 :  [-0.04894267982125351]
step  20 :  [-0.053277330671290694]
step  21 :  [-0.030194536660169205]
step  22 :  [-0.022788460036509642]
step  23 :  [-0.006694485134597561]
step  24 :  [-0.02740845726201484]
episode  209 : steps 25 , return [-14.25]
step  0 :  [-1.5346420473688522]
step  1 :  [-1.5092536546113895]
step  2 :  [-1.4829745192555952]
step  3 :  [-1.4194006941259816]
step  4 :  [-1.3248117719817156]
step  5 :  [-1.2055178347586235]
step  6 :  [-1.066982033630146]
step  7 :  [-0.913660077563457]
step  8 :  [-0.7490907102393791]
step  9 :  [-0.5760741412727352]
step  10 :  [-0.39693406933700076]
step  11 :  [-0.21432719881699214]
step  12 :  [-0.07224913832318504]
step  13 :  [-0.041608048039688615]
step  14 :  [-0.025489117165502992]
step  15 :  [-0.007760289595037832]
step  16 :  [-0.030786569142643157]
step  17 :  [-0.023383663070025366]
step  18 :  [-0.02256605258862885]
step  19 :  [-0.056275099613678686]
step  20 :  [-0.04243370761092987]
step  21 :  [-0.008358103666068956]
step  22 :  [-0.015344849540932022]
step  23 :  [-0.03417798441729548]
step  24 :  [-0.03086688538678334]
episode  210 : steps 25 , return [-12.8]
step  0 :  [-1.5386944655419315]
step  1 :  [-1.5105743492883752]
step  2 :  [-1.4805452547494742]
step  3 :  [-1.41434775224633]
step  4 :  [-1.3178538464892267]
step  5 :  [-1.1971237369499763]
step  6 :  [-1.063160277404847]
step  7 :  [-0.9142302950782051]
step  8 :  [-0.7536506077085807]
step  9 :  [-0.5842955325726762]
step  10 :  [-0.40888554366327334]
step  11 :  [-0.23157291443493586]
step  12 :  [-0.08859562301613745]
step  13 :  [-0.0326287683066759]
step  14 :  [-0.050610938681955736]
step  15 :  [-0.050353463787061896]
step  16 :  [-0.031200535889809106]
step  17 :  [-0.027424783424178378]
step  18 :  [-0.0241396241089334]
step  19 :  [-0.018524788483059045]
step  20 :  [-0.03801072549796502]
step  21 :  [-0.05108153535387012]
step  22 :  [-0.025626773989764897]
step  23 :  [-0.05055356659100804]
step  24 :  [-0.05480464396042885]
episode  211 : steps 25 , return [-12.96]
step  0 :  [-1.475119014036493]
step  1 :  [-1.4380993117711707]
step  2 :  [-1.3961033433008492]
step  3 :  [-1.357521839995952]
step  4 :  [-1.2877488235406904]
step  5 :  [-1.2146517742227498]
step  6 :  [-1.1210609021637195]
step  7 :  [-1.0042877339949123]
step  8 :  [-0.8692533551713378]
step  9 :  [-0.7204931986805617]
step  10 :  [-0.5623554626788262]
step  11 :  [-0.4002342405698904]
step  12 :  [-0.2465820714218434]
step  13 :  [-0.12525715530732395]
step  14 :  [-0.08000039567193185]
step  15 :  [-0.06156042754266166]
step  16 :  [-0.044682056412607626]
step  17 :  [-0.028278179279904697]
step  18 :  [-0.03434776631693878]
step  19 :  [-0.03601587677199762]
step  20 :  [-0.04406212625330837]
step  21 :  [-0.04393489748517225]
step  22 :  [-0.05798361003409779]
step  23 :  [-0.0563745046974403]
step  24 :  [-0.055765098765753154]
episode  212 : steps 25 , return [-13.76]
step  0 :  [-1.5277829572632549]
step  1 :  [-1.4929497197359558]
step  2 :  [-1.4537338031124296]
step  3 :  [-1.4181691970746773]
step  4 :  [-1.3502366729050852]
step  5 :  [-1.2537652064306988]
step  6 :  [-1.133864217754332]
step  7 :  [-0.9954104303276189]
step  8 :  [-0.842597404603934]
step  9 :  [-0.6789122702934085]
step  10 :  [-0.5073483105498265]
step  11 :  [-0.33110659882193894]
step  12 :  [-0.19142902979318954]
step  13 :  [-0.09914772465861653]
step  14 :  [-0.08648375744416935]
step  15 :  [-0.048064239336336974]
step  16 :  [-0.05080174817719447]
step  17 :  [-0.019352147621138197]
step  18 :  [-0.0334056466365272]
step  19 :  [-0.0034137070465333095]
step  20 :  [-0.02646307408873678]
step  21 :  [-0.00610304678991179]
step  22 :  [-0.024406973442933078]
step  23 :  [-0.044681123721456224]
step  24 :  [-0.013985266428662577]
episode  213 : steps 25 , return [-13.63]
step  0 :  [-1.7560332810047403]
step  1 :  [-1.7271689562058188]
step  2 :  [-1.695211530131156]
step  3 :  [-1.6270838662355622]
step  4 :  [-1.5289502306712595]
step  5 :  [-1.4069320960740959]
step  6 :  [-1.266325294777796]
step  7 :  [-1.1290537698160388]
step  8 :  [-0.9733883480391968]
step  9 :  [-0.8087919933273054]
step  10 :  [-0.6371320529419909]
step  11 :  [-0.460549890746748]
step  12 :  [-0.2826357430765523]
step  13 :  [-0.14045809651554597]
step  14 :  [-0.082905952428102]
step  15 :  [-0.05895689383886256]
step  16 :  [-0.07486992153135397]
step  17 :  [-0.09498145054613485]
step  18 :  [-0.0715693042754389]
step  19 :  [-0.02063688510682362]
step  20 :  [-0.05130248607969417]
step  21 :  [-0.06840464459513458]
step  22 :  [-0.04115190242701565]
step  23 :  [-0.016861498493347102]
step  24 :  [-0.057628653730808]
episode  214 : steps 25 , return [-16.08]
step  0 :  [-1.7735146337275056]
step  1 :  [-1.73479888406291]
step  2 :  [-1.68923883263711]
step  3 :  [-1.6442534121174825]
step  4 :  [-1.606356592360696]
step  5 :  [-1.537455315222076]
step  6 :  [-1.4407490302866968]
step  7 :  [-1.3209891670402565]
step  8 :  [-1.182860428019793]
step  9 :  [-1.0304543964169983]
step  10 :  [-0.8671914682058363]
step  11 :  [-0.6959525966578282]
step  12 :  [-0.5194285518064188]
step  13 :  [-0.34126563333975785]
step  14 :  [-0.1964842915184688]
step  15 :  [-0.11204683633803854]
step  16 :  [-0.038075014454597565]
step  17 :  [-0.01078124171102258]
step  18 :  [-0.041317549463881845]
step  19 :  [-0.018306803317193667]
step  20 :  [-0.045341016211407584]
step  21 :  [-0.02393626294507281]
step  22 :  [-0.0294913566685715]
step  23 :  [-0.06850653192208538]
step  24 :  [-0.092965915009907]
episode  215 : steps 25 , return [-18.06]
step  0 :  [-1.690085779693321]
step  1 :  [-1.6644074820811445]
step  2 :  [-1.637044229083338]
step  3 :  [-1.5722346729631853]
step  4 :  [-1.4764972917468917]
step  5 :  [-1.3561947703411301]
step  6 :  [-1.2167779268352514]
step  7 :  [-1.0626640410242418]
step  8 :  [-0.8973326232301533]
step  9 :  [-0.7234805417010439]
step  10 :  [-0.5431774604451676]
step  11 :  [-0.35800165012464813]
step  12 :  [-0.1691522438003856]
step  13 :  [-0.07751230661176126]
step  14 :  [-0.05892396496768308]
step  15 :  [-0.09502338697287084]
step  16 :  [-0.07227568996941956]
step  17 :  [-0.06803980972111744]
step  18 :  [-0.049614053162817334]
step  19 :  [-0.02458239572024146]
step  20 :  [-0.01567054840646079]
step  21 :  [-0.05399102605480971]
step  22 :  [-0.03691531093236468]
step  23 :  [-0.07390990243125084]
step  24 :  [-0.051894779464612226]
episode  216 : steps 25 , return [-15.05]
step  0 :  [-1.7162483781023796]
step  1 :  [-1.6907982641417407]
step  2 :  [-1.6636419054888738]
step  3 :  [-1.5989049456118454]
step  4 :  [-1.5031830763696767]
step  5 :  [-1.3828723167072343]
step  6 :  [-1.2434383743791557]
step  7 :  [-1.0893052870730595]
step  8 :  [-0.9239556301834972]
step  9 :  [-0.7500876956077651]
step  10 :  [-0.5697720541100112]
step  11 :  [-0.3845885814251473]
step  12 :  [-0.19574412255715676]
step  13 :  [-0.10406720434332523]
step  14 :  [-0.0353306497259547]
step  15 :  [-0.03392550543417644]
step  16 :  [-0.05596677008223053]
step  17 :  [-0.044714671566300275]
step  18 :  [-0.042731896696470116]
step  19 :  [-0.039363567225234146]
step  20 :  [-0.04193642285552689]
step  21 :  [-0.035610682335801974]
step  22 :  [-0.06843283643248879]
step  23 :  [-0.0526889908342846]
step  24 :  [-0.08523675530377475]
episode  217 : steps 25 , return [-15.35]
step  0 :  [-1.6493922270572048]
step  1 :  [-1.6201871147431406]
step  2 :  [-1.5881786652499346]
step  3 :  [-1.5202922480901133]
step  4 :  [-1.422453479340117]
step  5 :  [-1.300693047883517]
step  6 :  [-1.1604190827404495]
step  7 :  [-1.0014026458413565]
step  8 :  [-0.8348882372460813]
step  9 :  [-0.6623267987950795]
step  10 :  [-0.4857285260969262]
step  11 :  [-0.3089351032644906]
step  12 :  [-0.16705842542308258]
step  13 :  [-0.10846797581290728]
step  14 :  [-0.08841999985829976]
step  15 :  [-0.04860129554305954]
step  16 :  [-0.06292776586581555]
step  17 :  [-0.08141325942866909]
step  18 :  [-0.10467359267865714]
step  19 :  [-0.10992465427916971]
step  20 :  [-0.06694055747460546]
step  21 :  [-0.0680492804904959]
step  22 :  [-0.05553684488166824]
step  23 :  [-0.06826751689612776]
step  24 :  [-0.05287890169581692]
episode  218 : steps 25 , return [-14.64]
step  0 :  [-1.5172162508777078]
step  1 :  [-1.4753158122277488]
step  2 :  [-1.4263068574341686]
step  3 :  [-1.378659851148226]
step  4 :  [-1.302382629285148]
step  5 :  [-1.2362127249559927]
step  6 :  [-1.2225853768898824]
step  7 :  [-1.1923275295715088]
step  8 :  [-1.124161923188128]
step  9 :  [-1.0258148039728285]
step  10 :  [-0.904235109334872]
step  11 :  [-0.7653420476633007]
step  12 :  [-0.6143618328012794]
step  13 :  [-0.456875263326205]
step  14 :  [-0.30266363219298315]
step  15 :  [-0.17321119752526667]
step  16 :  [-0.11750639492151489]
step  17 :  [-0.04171199066303367]
step  18 :  [-0.01669879108132566]
step  19 :  [-0.0405394046873998]
step  20 :  [-0.013410407086982065]
step  21 :  [-0.04063093680675479]
step  22 :  [-0.08208068107462516]
step  23 :  [-0.08802170085367593]
step  24 :  [-0.05041218929744062]
episode  219 : steps 25 , return [-16.61]
step  0 :  [-1.7112347530024756]
step  1 :  [-1.6811067276203604]
step  2 :  [-1.647589191809516]
step  3 :  [-1.617753582407569]
step  4 :  [-1.5530292712906753]
step  5 :  [-1.458464497998474]
step  6 :  [-1.3397627373479806]
step  7 :  [-1.2021038624370135]
step  8 :  [-1.0498362182929006]
step  9 :  [-0.8865044958281785]
step  10 :  [-0.7150243744927169]
step  11 :  [-0.5380132293715573]
step  12 :  [-0.35871984688530245]
step  13 :  [-0.1866360624072844]
step  14 :  [-0.12424769157593846]
step  15 :  [-0.05926832206360784]
step  16 :  [-0.02523510606454222]
step  17 :  [-0.04951484279200704]
step  18 :  [-0.018381191573590094]
step  19 :  [-0.04413386694285757]
step  20 :  [-0.014898619890788382]
step  21 :  [-0.04115502717027585]
step  22 :  [-0.013164708506670413]
step  23 :  [-0.03949844068485574]
step  24 :  [-0.012295127331890926]
episode  220 : steps 25 , return [-16.39]
step  0 :  [-1.5951582315625714]
step  1 :  [-1.5705361797253075]
step  2 :  [-1.5450146573333041]
step  3 :  [-1.481773045210828]
step  4 :  [-1.3873203892310755]
step  5 :  [-1.2680675526552536]
step  6 :  [-1.1295229257775767]
step  7 :  [-0.9761606346552248]
step  8 :  [-0.8115206861209728]
step  9 :  [-0.6383826402110879]
step  10 :  [-0.45898328266877025]
step  11 :  [-0.2754635090978326]
step  12 :  [-0.13479951947781746]
step  13 :  [-0.09044860472801611]
step  14 :  [-0.04292725800357102]
step  15 :  [-0.05961789234150058]
step  16 :  [-0.07631118751605427]
step  17 :  [-0.04533761233845904]
step  18 :  [-0.01468108415996995]
step  19 :  [-0.016734625185918797]
step  20 :  [-0.04475532118487928]
step  21 :  [-0.04540033592548194]
step  22 :  [-0.0676177997293463]
step  23 :  [-0.06279044726329519]
step  24 :  [-0.016501043244107328]
episode  221 : steps 25 , return [-13.86]
step  0 :  [-1.5151616433972759]
step  1 :  [-1.4790276657311894]
step  2 :  [-1.4380685673022882]
step  3 :  [-1.4004507738186618]
step  4 :  [-1.3311355907936382]
step  5 :  [-1.2336767467148133]
step  6 :  [-1.1227736680172538]
step  7 :  [-0.9921391537165698]
step  8 :  [-0.8460012276910812]
step  9 :  [-0.6881431900217996]
step  10 :  [-0.5221076326167081]
step  11 :  [-0.3523008605001309]
step  12 :  [-0.19082624577087315]
step  13 :  [-0.07276210929554063]
step  14 :  [-0.05324987356333237]
step  15 :  [-0.030235506125693454]
step  16 :  [-0.05339787611418645]
step  17 :  [-0.08489366232323463]
step  18 :  [-0.0989215897482721]
step  19 :  [-0.06296948314068913]
step  20 :  [-0.07656238361679493]
step  21 :  [-0.12046367132840866]
step  22 :  [-0.11495534675863074]
step  23 :  [-0.10024267385854888]
step  24 :  [-0.07387398255522427]
episode  222 : steps 25 , return [-14.05]
step  0 :  [-1.4256652813812396]
step  1 :  [-1.4188448362827561]
step  2 :  [-1.4032051983547529]
step  3 :  [-1.3490392778611877]
step  4 :  [-1.2620956658440752]
step  5 :  [-1.2020841598503427]
step  6 :  [-1.1309296541359497]
step  7 :  [-1.0327790885869075]
step  8 :  [-0.9127810391464379]
step  9 :  [-0.7760670923333846]
step  10 :  [-0.6275999305979352]
step  11 :  [-0.4730361185895805]
step  12 :  [-0.3224463558168631]
step  13 :  [-0.19632492144608152]
step  14 :  [-0.07316099720790363]
step  15 :  [-0.06230483377437924]
step  16 :  [-0.060573548616567434]
step  17 :  [-0.042552980697179346]
step  18 :  [-0.056651349109911056]
step  19 :  [-0.07634837891393538]
step  20 :  [-0.050044830683933665]
step  21 :  [-0.022224799689712405]
step  22 :  [-0.006979951869585136]
step  23 :  [-0.03368588253831954]
step  24 :  [-0.01447856223688612]
episode  223 : steps 25 , return [-14.03]
step  0 :  [-1.6083409021457256]
step  1 :  [-1.568932116273103]
step  2 :  [-1.5230150936688238]
step  3 :  [-1.478580943385217]
step  4 :  [-1.404072575563915]
step  5 :  [-1.3026433137601223]
step  6 :  [-1.197658658468484]
step  7 :  [-1.0960300583395097]
step  8 :  [-0.9761469148408296]
step  9 :  [-0.8410354761472122]
step  10 :  [-0.6945327547976585]
step  11 :  [-0.5413668147804175]
step  12 :  [-0.3892807092596937]
step  13 :  [-0.2617148698325974]
step  14 :  [-0.14352710708724933]
step  15 :  [-0.07452279114229365]
step  16 :  [-0.07798452066271407]
step  17 :  [-0.05934517207011632]
step  18 :  [-0.034027522907966304]
step  19 :  [-0.0699695627435961]
step  20 :  [-0.05115498250724032]
step  21 :  [-0.03445722822235387]
step  22 :  [-0.01586460938703239]
step  23 :  [-0.035490355344738524]
step  24 :  [-0.011632420974002633]
episode  224 : steps 25 , return [-15.49]
step  0 :  [-1.5570318980013118]
step  1 :  [-1.5285396647470368]
step  2 :  [-1.4979141075623645]
step  3 :  [-1.4312466579590846]
step  4 :  [-1.3343901691416846]
step  5 :  [-1.2133822468098414]
step  6 :  [-1.0845167856521383]
step  7 :  [-0.9395853590901164]
step  8 :  [-0.7820892275287927]
step  9 :  [-0.6150638265041721]
step  10 :  [-0.44129876649224214]
step  11 :  [-0.2644992179654659]
step  12 :  [-0.12289513700513695]
step  13 :  [-0.06830827034930109]
step  14 :  [-0.0372806695960331]
step  15 :  [-0.005414746159306633]
step  16 :  [-0.03857137846528046]
step  17 :  [-0.048899166891794035]
step  18 :  [-0.034985989447180316]
step  19 :  [-0.011591888750938422]
step  20 :  [-0.029395274220601335]
step  21 :  [-0.04343461633492176]
step  22 :  [-0.035952961801841606]
step  23 :  [-0.015352861361020589]
step  24 :  [-0.02655287488046239]
episode  225 : steps 25 , return [-13.21]
step  0 :  [-1.6575203578061206]
step  1 :  [-1.625391393135633]
step  2 :  [-1.5893406729635742]
step  3 :  [-1.5567491046016275]
step  4 :  [-1.4902931971840718]
step  5 :  [-1.3945642062219537]
step  6 :  [-1.2750233467877152]
step  7 :  [-1.1367116945618416]
step  8 :  [-0.983889018320557]
step  9 :  [-0.8200336538330532]
step  10 :  [-0.6480004455636323]
step  11 :  [-0.4703508522931219]
step  12 :  [-0.2904548156677092]
step  13 :  [-0.1225501282797821]
step  14 :  [-0.08620863596199854]
step  15 :  [-0.07895306116541781]
step  16 :  [-0.0695364303205405]
step  17 :  [-0.028138658811004195]
step  18 :  [-0.01983369080982768]
step  19 :  [-0.03493619090086394]
step  20 :  [-0.02316634004931603]
step  21 :  [-0.0448920865978887]
step  22 :  [-0.045418797886047836]
step  23 :  [-0.05723190951901833]
step  24 :  [-0.05812691493566672]
episode  226 : steps 25 , return [-15.61]
step  0 :  [-1.410834898040267]
step  1 :  [-1.382577463834318]
step  2 :  [-1.3530337204463643]
step  3 :  [-1.2876374011579075]
step  4 :  [-1.2104067307325912]
step  5 :  [-1.1123675428243918]
step  6 :  [-0.9915635266395714]
step  7 :  [-0.8529458144170285]
step  8 :  [-0.7009000858455958]
step  9 :  [-0.5394703384156202]
step  10 :  [-0.3734730504944464]
step  11 :  [-0.21454315707845903]
step  12 :  [-0.09156019218415559]
step  13 :  [-0.053021771398266054]
step  14 :  [-0.029266516580832975]
step  15 :  [-0.03865991817369387]
step  16 :  [-0.04073407227785922]
step  17 :  [-0.022997640796589724]
step  18 :  [-0.023213073288595447]
step  19 :  [-0.047509618813672314]
step  20 :  [-0.0344429638441226]
step  21 :  [-0.05326451138258341]
step  22 :  [-0.05268085464081266]
step  23 :  [-0.03235873292483035]
step  24 :  [-0.04984933378737976]
episode  227 : steps 25 , return [-12.]
step  0 :  [-1.5127518806169404]
step  1 :  [-1.4731711578398397]
step  2 :  [-1.4255470170750428]
step  3 :  [-1.3785277893962955]
step  4 :  [-1.3399172535723847]
step  5 :  [-1.272232258921916]
step  6 :  [-1.1858118274277312]
step  7 :  [-1.0751589647428437]
step  8 :  [-0.9450658829734796]
step  9 :  [-0.8000921166723746]
step  10 :  [-0.6445128825919848]
step  11 :  [-0.48301404452124613]
step  12 :  [-0.3236527048938062]
step  13 :  [-0.19052829669848598]
step  14 :  [-0.06335957579915398]
step  15 :  [-0.03322919297033689]
step  16 :  [-0.016510586373174638]
step  17 :  [-0.06097733882619582]
step  18 :  [-0.04814333780182728]
step  19 :  [-0.031135150091164587]
step  20 :  [-0.03471098571731373]
step  21 :  [-0.017479811004835418]
step  22 :  [-0.009245661462056227]
step  23 :  [-0.03661036585686593]
step  24 :  [-0.015746267898239644]
episode  228 : steps 25 , return [-14.42]
step  0 :  [-1.7831486547737612]
step  1 :  [-1.7424561534905603]
step  2 :  [-1.6941251809680227]
step  3 :  [-1.6456506691248125]
step  4 :  [-1.603640167649006]
step  5 :  [-1.5317681235052794]
step  6 :  [-1.432830316159195]
step  7 :  [-1.3113101662382312]
step  8 :  [-1.1717040598079533]
step  9 :  [-1.0179523433597726]
step  10 :  [-0.8533217132053995]
step  11 :  [-0.6804766234203851]
step  12 :  [-0.5016746395831645]
step  13 :  [-0.3193200268086224]
step  14 :  [-0.14012426665022165]
step  15 :  [-0.07558229892272862]
step  16 :  [-0.04039582687804294]
step  17 :  [-0.03736443940051687]
step  18 :  [-0.039687015193084506]
step  19 :  [-0.05052839308959048]
step  20 :  [-0.03233514760458195]
step  21 :  [-0.019079767390964543]
step  22 :  [-0.009969341134332373]
step  23 :  [-0.023950229907482183]
step  24 :  [-0.019434255380842376]
episode  229 : steps 25 , return [-17.78]
step  0 :  [-1.6125829932647222]
step  1 :  [-1.584471536835211]
step  2 :  [-1.55411534124489]
step  3 :  [-1.4874619924036165]
step  4 :  [-1.3905302888306004]
step  5 :  [-1.2694249196183438]
step  6 :  [-1.1319945897185772]
step  7 :  [-0.9783013084337301]
step  8 :  [-0.813793512409752]
step  9 :  [-0.6409292146732455]
step  10 :  [-0.46173674222356703]
step  11 :  [-0.27805780560439136]
step  12 :  [-0.14062091984238836]
step  13 :  [-0.03547086994026856]
step  14 :  [-0.017094736666100636]
step  15 :  [-0.026749514085984184]
step  16 :  [-0.02880961958855414]
step  17 :  [-0.01658965537554158]
step  18 :  [-0.02797554123496621]
step  19 :  [-0.08491087788482465]
step  20 :  [-0.08734832003889918]
step  21 :  [-0.076859800981999]
step  22 :  [-0.04613144556807542]
step  23 :  [-0.01728128559249624]
step  24 :  [-0.011760492083810511]
episode  230 : steps 25 , return [-13.82]
step  0 :  [-1.5283239449902009]
step  1 :  [-1.487737294113529]
step  2 :  [-1.4384444699766947]
step  3 :  [-1.3891112921696414]
step  4 :  [-1.3475649817726805]
step  5 :  [-1.277676672619545]
step  6 :  [-1.2032183371566891]
step  7 :  [-1.1018622816296915]
step  8 :  [-0.9787418996436907]
step  9 :  [-0.8387518210436722]
step  10 :  [-0.6863273054531192]
step  11 :  [-0.5258543623610356]
step  12 :  [-0.3634337948223468]
step  13 :  [-0.2161792000064608]
step  14 :  [-0.11261761799815644]
step  15 :  [-0.08794058205142313]
step  16 :  [-0.0628497197192422]
step  17 :  [-0.05384200461836302]
step  18 :  [-0.08320380396278276]
step  19 :  [-0.06373599227947914]
step  20 :  [-0.07815115768586733]
step  21 :  [-0.05814395771098499]
step  22 :  [-0.04335498954362759]
step  23 :  [-0.032008826741138426]
step  24 :  [-0.02073875907675271]
episode  231 : steps 25 , return [-15.08]
step  0 :  [-1.6286853759769695]
step  1 :  [-1.587112324971601]
step  2 :  [-1.5380992766747104]
step  3 :  [-1.4896741464794665]
step  4 :  [-1.449022356678561]
step  5 :  [-1.3790133569343859]
step  6 :  [-1.2819776171336954]
step  7 :  [-1.162283283877091]
step  8 :  [-1.0244589179130474]
step  9 :  [-0.8725682151150258]
step  10 :  [-0.7101251299686661]
step  11 :  [-0.5403482394052754]
step  12 :  [-0.3671385362019449]
step  13 :  [-0.22677647939678733]
step  14 :  [-0.12153066798457883]
step  15 :  [-0.09237656184623602]
step  16 :  [-0.09352344100481849]
step  17 :  [-0.08249181680057968]
step  18 :  [-0.047853995116073696]
step  19 :  [-0.04407823685527305]
step  20 :  [-0.03840434984182258]
step  21 :  [-0.05512758696721138]
step  22 :  [-0.06708092633430747]
step  23 :  [-0.04365753661637805]
step  24 :  [-0.047845958446337315]
episode  232 : steps 25 , return [-15.99]
step  0 :  [-1.7032241260704508]
step  1 :  [-1.6699912343171268]
step  2 :  [-1.632244669252503]
step  3 :  [-1.597289851830401]
step  4 :  [-1.5289644618544767]
step  5 :  [-1.4317442709355885]
step  6 :  [-1.3109786382841546]
step  7 :  [-1.1716111906838909]
step  8 :  [-1.0178095606863147]
step  9 :  [-0.8529441364158628]
step  10 :  [-0.6796971352601903]
step  11 :  [-0.5002375779637207]
step  12 :  [-0.3165754840688226]
step  13 :  [-0.13291378575242982]
step  14 :  [-0.05931137196108437]
step  15 :  [-0.05496474895635378]
step  16 :  [-0.006162463709545028]
step  17 :  [-0.022642242942047395]
step  18 :  [-0.03614091042237071]
step  19 :  [-0.024514024649180212]
step  20 :  [-0.028557430112424058]
step  21 :  [-0.08366369013281841]
step  22 :  [-0.07808834974810604]
step  23 :  [-0.06334294319671716]
step  24 :  [-0.05811380528615434]
episode  233 : steps 25 , return [-16.06]
step  0 :  [-1.7820931233751984]
step  1 :  [-1.747886671974586]
step  2 :  [-1.7085181240699323]
step  3 :  [-1.67111831413059]
step  4 :  [-1.6007710890278104]
step  5 :  [-1.5019220178747679]
step  6 :  [-1.3798429315889986]
step  7 :  [-1.2393984700155722]
step  8 :  [-1.0846840536860536]
step  9 :  [-0.91899898091537]
step  10 :  [-0.7449375626501987]
step  11 :  [-0.5645102727178986]
step  12 :  [-0.3792607987837256]
step  13 :  [-0.1903676524719039]
step  14 :  [-0.07055652794903698]
step  15 :  [-0.06689470491395033]
step  16 :  [-0.0897367852118653]
step  17 :  [-0.06054382661891982]
step  18 :  [-0.012576892723487602]
step  19 :  [-0.014653056080156473]
step  20 :  [-0.017526340180223147]
step  21 :  [-0.046660734108174944]
step  22 :  [-0.034435552188348297]
step  23 :  [-0.07305048952093499]
step  24 :  [-0.05993015464574565]
episode  234 : steps 25 , return [-17.06]
step  0 :  [-1.4218124683643254]
step  1 :  [-1.4170731325422627]
step  2 :  [-1.4033852057913574]
step  3 :  [-1.3506503289194232]
step  4 :  [-1.2647516667282959]
step  5 :  [-1.197820849787647]
step  6 :  [-1.1146265342476354]
step  7 :  [-1.0069001168227236]
step  8 :  [-0.8794722203145863]
step  9 :  [-0.7371123937191819]
step  10 :  [-0.584552674322148]
step  11 :  [-0.4276707900065237]
step  12 :  [-0.27890929764320654]
step  13 :  [-0.15852402878499455]
step  14 :  [-0.05439135511349111]
step  15 :  [-0.036492351734232]
step  16 :  [-0.05482729306867292]
step  17 :  [-0.08208625133595857]
step  18 :  [-0.08443971687995286]
step  19 :  [-0.10992720767121299]
step  20 :  [-0.10366402841928755]
step  21 :  [-0.0559260188791718]
step  22 :  [-0.06577526138640342]
step  23 :  [-0.02663741624144154]
step  24 :  [-0.046784855543305755]
episode  235 : steps 25 , return [-13.96]
step  0 :  [-1.793563511326918]
step  1 :  [-1.7594101390643078]
step  2 :  [-1.7200756530518084]
step  3 :  [-1.6826551030503896]
step  4 :  [-1.6122514986055856]
step  5 :  [-1.5133402141565413]
step  6 :  [-1.3912036743953209]
step  7 :  [-1.2507096766890378]
step  8 :  [-1.0959539636073627]
step  9 :  [-0.9302352330042887]
step  10 :  [-0.7561470450368373]
step  11 :  [-0.5756995207588393]
step  12 :  [-0.390437439440968]
step  13 :  [-0.20154817104391085]
step  14 :  [-0.10982559331520766]
step  15 :  [-0.06481928752094405]
step  16 :  [-0.0359462196063949]
step  17 :  [-0.022608877405023688]
step  18 :  [-0.04278406532889027]
step  19 :  [-0.02275368413256516]
step  20 :  [-0.05263381755242697]
step  21 :  [-0.03600813233633485]
step  22 :  [-0.026184836506909063]
step  23 :  [-0.06679158696546839]
step  24 :  [-0.050110257606689274]
episode  236 : steps 25 , return [-17.2]
step  0 :  [-1.6140015538735117]
step  1 :  [-1.582105345192193]
step  2 :  [-1.5465549920081003]
step  3 :  [-1.476383033480346]
step  4 :  [-1.4174356876744145]
step  5 :  [-1.328800509794376]
step  6 :  [-1.2153601702796155]
step  7 :  [-1.082094640178211]
step  8 :  [-0.9334022941039734]
step  9 :  [-0.772983327146103]
step  10 :  [-0.6039936105345668]
step  11 :  [-0.4295403699787814]
step  12 :  [-0.254839872931556]
step  13 :  [-0.1116807738006278]
step  14 :  [-0.050456491974958564]
step  15 :  [-0.009971037034224224]
step  16 :  [-0.03650634813212385]
step  17 :  [-0.04449175849389941]
step  18 :  [-0.04083843588057612]
step  19 :  [-0.02772689567811494]
step  20 :  [-0.010905791229345888]
step  21 :  [-0.0333397004164766]
step  22 :  [-0.04925355327097054]
step  23 :  [-0.10880172377279798]
step  24 :  [-0.12300702185127185]
episode  237 : steps 25 , return [-14.9]
step  0 :  [-1.7987260736453567]
step  1 :  [-1.763389041200297]
step  2 :  [-1.7224090616852605]
step  3 :  [-1.6829394126864488]
step  4 :  [-1.6110946825484396]
step  5 :  [-1.5111507925630001]
step  6 :  [-1.3882640876779735]
step  7 :  [-1.2472224975047934]
step  8 :  [-1.0980567961530303]
step  9 :  [-0.9365750623452002]
step  10 :  [-0.7658429811838804]
step  11 :  [-0.5880198397890382]
step  12 :  [-0.40479508233010086]
step  13 :  [-0.21749016315401587]
step  14 :  [-0.1272592747799441]
step  15 :  [-0.07083999184330571]
step  16 :  [-0.023379293581641994]
step  17 :  [-0.06607280312611177]
step  18 :  [-0.0874866812680944]
step  19 :  [-0.05865389174230003]
step  20 :  [-0.04149619647591246]
step  21 :  [-0.035273735935669175]
step  22 :  [-0.06800888503403006]
step  23 :  [-0.05456894230312914]
step  24 :  [-0.04891449651019897]
episode  238 : steps 25 , return [-17.42]
step  0 :  [-1.6020525336403817]
step  1 :  [-1.562444519281378]
step  2 :  [-1.5162757270988385]
step  3 :  [-1.4715706970417703]
step  4 :  [-1.396904617125173]
step  5 :  [-1.2953795249865476]
step  6 :  [-1.1976986750247074]
step  7 :  [-1.1018098864100172]
step  8 :  [-0.9863182123334996]
step  9 :  [-0.8544979035022935]
step  10 :  [-0.7103803126104702]
step  11 :  [-0.558746442579499]
step  12 :  [-0.4069583029260744]
step  13 :  [-0.27331744049460976]
step  14 :  [-0.17364127539807298]
step  15 :  [-0.1398236077670343]
step  16 :  [-0.08015169198552233]
step  17 :  [-0.024977830852387056]
step  18 :  [-0.028370643570019696]
step  19 :  [-0.017098822568283708]
step  20 :  [-0.019922615570404093]
step  21 :  [-0.03041822149603875]
step  22 :  [-0.02988639006132346]
step  23 :  [-0.0678095406626728]
step  24 :  [-0.0691075273418894]
episode  239 : steps 25 , return [-15.62]
step  0 :  [-1.610742611900607]
step  1 :  [-1.5652163414613054]
step  2 :  [-1.51073615822741]
step  3 :  [-1.4555664398195751]
step  4 :  [-1.407199362285931]
step  5 :  [-1.3318567733933275]
step  6 :  [-1.2309452448047993]
step  7 :  [-1.1395387568774276]
step  8 :  [-1.0261527200053975]
step  9 :  [-0.8948150946454131]
step  10 :  [-0.7497758006318251]
step  11 :  [-0.595437491776461]
step  12 :  [-0.43747414946350544]
step  13 :  [-0.2880691324411466]
step  14 :  [-0.16708178136907822]
step  15 :  [-0.059519820556252004]
step  16 :  [-0.0300313451480695]
step  17 :  [-0.04970343692549479]
step  18 :  [-0.018430910993643863]
step  19 :  [-0.03625685628928266]
step  20 :  [-0.03819749945840312]
step  21 :  [-0.007208422862445049]
step  22 :  [-0.027762177776804665]
step  23 :  [-0.008368181812843921]
step  24 :  [-0.04506116405272403]
episode  240 : steps 25 , return [-15.73]
step  0 :  [-1.537484033827073]
step  1 :  [-1.4929580546358896]
step  2 :  [-1.4401641898323212]
step  3 :  [-1.3875976112991508]
step  4 :  [-1.343000681833619]
step  5 :  [-1.2708746081052904]
step  6 :  [-1.2076057455056566]
step  7 :  [-1.1153499078166376]
step  8 :  [-0.9992717425214237]
step  9 :  [-0.8646329554044273]
step  10 :  [-0.7161700817407621]
step  11 :  [-0.5583956304529863]
step  12 :  [-0.39696882947270573]
step  13 :  [-0.24520465365908833]
step  14 :  [-0.12647822608322443]
step  15 :  [-0.08336337938799833]
step  16 :  [-0.06307852337355319]
step  17 :  [-0.05027034720773701]
step  18 :  [-0.031796322434585106]
step  19 :  [-0.06277280310720121]
step  20 :  [-0.058909329460283266]
step  21 :  [-0.011023041751678085]
step  22 :  [-0.05534267897562075]
step  23 :  [-0.0709882458499801]
step  24 :  [-0.04352781194294033]
episode  241 : steps 25 , return [-15.23]
step  0 :  [-1.5467519470874336]
step  1 :  [-1.5188738082391848]
step  2 :  [-1.4891371598091014]
step  3 :  [-1.4231149775661478]
step  4 :  [-1.326732312587289]
step  5 :  [-1.2060761229702983]
step  6 :  [-1.0721616950468258]
step  7 :  [-0.9229703497782996]
step  8 :  [-0.7619367307915327]
step  9 :  [-0.5919312336114549]
step  10 :  [-0.4154835076548048]
step  11 :  [-0.2357938716019106]
step  12 :  [-0.07303547521771599]
step  13 :  [-0.08147061730645178]
step  14 :  [-0.09701504767630688]
step  15 :  [-0.08299869801467274]
step  16 :  [-0.04001341341217893]
step  17 :  [-0.0178577587376684]
step  18 :  [-0.021231066839065147]
step  19 :  [-0.03164833708233354]
step  20 :  [-0.03001356343581511]
step  21 :  [-0.035779149123926025]
step  22 :  [-0.03327793877003594]
step  23 :  [-0.015678179634420548]
step  24 :  [-0.04366429912385499]
episode  242 : steps 25 , return [-13.11]
step  0 :  [-1.7541363604549993]
step  1 :  [-1.7128136452561586]
step  2 :  [-1.6637019111577471]
step  3 :  [-1.614411812110267]
step  4 :  [-1.571678439757744]
step  5 :  [-1.4994492885495896]
step  6 :  [-1.4003353265972478]
step  7 :  [-1.2787322809231887]
step  8 :  [-1.1390942767557932]
step  9 :  [-0.9853421906536918]
step  10 :  [-0.8207372668003451]
step  11 :  [-0.6479537238956615]
step  12 :  [-0.46929759516200575]
step  13 :  [-0.2874243408805446]
step  14 :  [-0.14419925817142143]
step  15 :  [-0.09169875565281692]
step  16 :  [-0.0496866235142107]
step  17 :  [-0.0292593372733619]
step  18 :  [-0.006483145625189221]
step  19 :  [-0.03226145052008629]
step  20 :  [-0.03421345238467748]
step  21 :  [-0.025449526099251857]
step  22 :  [-0.042531564916805466]
step  23 :  [-0.028224252623920566]
step  24 :  [-0.028568859035757344]
episode  243 : steps 25 , return [-17.36]
step  0 :  [-1.589812317660195]
step  1 :  [-1.5577625186870507]
step  2 :  [-1.5221057170553651]
step  3 :  [-1.4519312222406635]
step  4 :  [-1.3526251167054097]
step  5 :  [-1.2299353598390557]
step  6 :  [-1.1533115933916327]
step  7 :  [-1.0460063528755243]
step  8 :  [-0.9209296603310029]
step  9 :  [-0.781563800589045]
step  10 :  [-0.6320160811832755]
step  11 :  [-0.47762134502314846]
step  12 :  [-0.3286775456674865]
step  13 :  [-0.20529884774059062]
step  14 :  [-0.08510704899133019]
step  15 :  [-0.025912953049942157]
step  16 :  [-0.025305285690012537]
step  17 :  [-0.022442921543092343]
step  18 :  [-0.022818435362120706]
step  19 :  [-0.02253621614219804]
step  20 :  [-0.02086325548574928]
step  21 :  [-0.025249623827971298]
step  22 :  [-0.023073404424783815]
step  23 :  [-0.05077333528082377]
step  24 :  [-0.040465376670996984]
episode  244 : steps 25 , return [-14.61]
step  0 :  [-1.5740430741270706]
step  1 :  [-1.5495523422995146]
step  2 :  [-1.5243066107017142]
step  3 :  [-1.4613273804330438]
step  4 :  [-1.3671049288781323]
step  5 :  [-1.2480521865795975]
step  6 :  [-1.109686368873145]
step  7 :  [-0.9564939570293353]
step  8 :  [-0.7920328758885914]
step  9 :  [-0.6191156392436591]
step  10 :  [-0.4400633418984451]
step  11 :  [-0.2573638206663432]
step  12 :  [-0.1149983055251828]
step  13 :  [-0.06932362374119665]
step  14 :  [-0.021739757398674786]
step  15 :  [-0.039629895397737154]
step  16 :  [-0.03475519845550748]
step  17 :  [-0.008666579913793536]
step  18 :  [-0.03606945757819828]
step  19 :  [-0.04333733168309829]
step  20 :  [-0.01705729960688246]
step  21 :  [-0.02903721588783464]
step  22 :  [-0.040285428926186785]
step  23 :  [-0.06388189782285818]
step  24 :  [-0.0672372066650102]
episode  245 : steps 25 , return [-13.49]
step  0 :  [-1.5695229255161771]
step  1 :  [-1.5255534083978142]
step  2 :  [-1.4734203817945222]
step  3 :  [-1.4214779838749367]
step  4 :  [-1.3772999273648663]
step  5 :  [-1.3051891717617798]
step  6 :  [-1.2143991808708974]
step  7 :  [-1.1049835891548743]
step  8 :  [-0.9761070381096894]
step  9 :  [-0.8319416053522156]
step  10 :  [-0.6764326835404229]
step  11 :  [-0.5136368101703436]
step  12 :  [-0.34953264165699616]
step  13 :  [-0.20245070291753933]
step  14 :  [-0.10575119143818715]
step  15 :  [-0.09043530374058628]
step  16 :  [-0.0662258854149586]
step  17 :  [-0.041772432482628186]
step  18 :  [-0.0973139171349835]
step  19 :  [-0.11214582376491002]
step  20 :  [-0.08039740090755414]
step  21 :  [-0.022074674954999575]
step  22 :  [-0.014671161377613678]
step  23 :  [-0.055178235183410466]
step  24 :  [-0.04431850117831348]
episode  246 : steps 25 , return [-15.27]
step  0 :  [-1.6319946412909374]
step  1 :  [-1.5999322007667738]
step  2 :  [-1.5640774826131576]
step  3 :  [-1.4936533176738989]
step  4 :  [-1.3941292755232353]
step  5 :  [-1.2712809557400502]
step  6 :  [-1.1759456392034793]
step  7 :  [-1.0612724022461986]
step  8 :  [-0.9328715890385976]
step  9 :  [-0.792661397499619]
step  10 :  [-0.6440623004134484]
step  11 :  [-0.49242345009326005]
step  12 :  [-0.3488492978599233]
step  13 :  [-0.230655083120411]
step  14 :  [-0.11493783506916946]
step  15 :  [-0.05593757801011577]
step  16 :  [-0.0592942486091292]
step  17 :  [-0.016758348405130633]
step  18 :  [-0.037284494977148176]
step  19 :  [-0.02346446028607674]
step  20 :  [-0.03657729269400186]
step  21 :  [-0.053991856717996646]
step  22 :  [-0.08383312986316546]
step  23 :  [-0.09747326054636185]
step  24 :  [-0.06538784897245895]
episode  247 : steps 25 , return [-15.28]
step  0 :  [-1.5420823889647164]
step  1 :  [-1.5163704328085164]
step  2 :  [-1.4896140621170613]
step  3 :  [-1.4256800683499835]
step  4 :  [-1.3308132206700014]
step  5 :  [-1.2112971546998832]
step  6 :  [-1.0725746672354206]
step  7 :  [-0.9190837276670353]
step  8 :  [-0.754343160507802]
step  9 :  [-0.5811207171957122]
step  10 :  [-0.40165861668512337]
step  11 :  [-0.21825380233925748]
step  12 :  [-0.07835418437656452]
step  13 :  [-0.027142623282340645]
step  14 :  [-0.057577752692570545]
step  15 :  [-0.07905054225838398]
step  16 :  [-0.0670545625475944]
step  17 :  [-0.02982958041488234]
step  18 :  [-0.04688157281147041]
step  19 :  [-0.08002527472763052]
step  20 :  [-0.07502023812608102]
step  21 :  [-0.03689627053642724]
step  22 :  [-0.062105458320228416]
step  23 :  [-0.03771338625133984]
step  24 :  [-0.02224735402411621]
episode  248 : steps 25 , return [-13.16]
step  0 :  [-1.5124052135071064]
step  1 :  [-1.4741188142921708]
step  2 :  [-1.4301804668286686]
step  3 :  [-1.3888937885499988]
step  4 :  [-1.3170237722014004]
step  5 :  [-1.2254749477825824]
step  6 :  [-1.1412124134501838]
step  7 :  [-1.032972930233439]
step  8 :  [-0.9052547757142759]
step  9 :  [-0.7626133924973086]
step  10 :  [-0.6095539224336456]
step  11 :  [-0.45145320209548084]
step  12 :  [-0.29880886125772593]
step  13 :  [-0.17283906668573232]
step  14 :  [-0.05305831023698025]
step  15 :  [-0.011680098396873692]
step  16 :  [-0.02755648483173547]
step  17 :  [-0.009145975581415965]
step  18 :  [-0.05568660235809911]
step  19 :  [-0.06222756859503392]
step  20 :  [-0.02653235195239851]
step  21 :  [-0.058083062578099]
step  22 :  [-0.04618481215913015]
step  23 :  [-0.026890480039130808]
step  24 :  [-0.07402053945897974]
episode  249 : steps 25 , return [-14.17]
step  0 :  [-1.6950536397260194]
step  1 :  [-1.6618976208542637]
step  2 :  [-1.624287807595304]
step  3 :  [-1.5895505166041644]
step  4 :  [-1.5214125661070685]
step  5 :  [-1.4243484590422708]
step  6 :  [-1.3037134275832918]
step  7 :  [-1.1644585447638334]
step  8 :  [-1.010759472505094]
step  9 :  [-0.8459963406326255]
step  10 :  [-0.6728667481543831]
step  11 :  [-0.49357390448529487]
step  12 :  [-0.3102446759000507]
step  13 :  [-0.12798631288795123]
step  14 :  [-0.02274892325346618]
step  15 :  [-0.08434217129241668]
step  16 :  [-0.08977687303958186]
step  17 :  [-0.06916501596643708]
step  18 :  [-0.010516536147772404]
step  19 :  [-0.026237899311720648]
step  20 :  [-0.032921732865664056]
step  21 :  [-0.03187441915015397]
step  22 :  [-0.024474131678932493]
step  23 :  [-0.03241928016164518]
step  24 :  [-0.014969014738912843]
episode  250 : steps 25 , return [-15.89]
step  0 :  [-1.616058552492552]
step  1 :  [-1.581876594491665]
step  2 :  [-1.5431695644773233]
step  3 :  [-1.5075954083447909]
step  4 :  [-1.439216738311184]
step  5 :  [-1.3421682601409024]
step  6 :  [-1.2216613630978563]
step  7 :  [-1.082588940458829]
step  8 :  [-0.9291109380581029]
step  9 :  [-0.7646221511623668]
step  10 :  [-0.591880313197265]
step  11 :  [-0.4132870975357296]
step  12 :  [-0.23194479557169276]
step  13 :  [-0.08798558817600492]
step  14 :  [-0.04077165993519793]
step  15 :  [-0.0076320740457824455]
step  16 :  [-0.04635412365898115]
step  17 :  [-0.06022855633256142]
step  18 :  [-0.03405730932540575]
step  19 :  [-0.014600946096712907]
step  20 :  [-0.01854592273699484]
step  21 :  [-0.03427031197388532]
step  22 :  [-0.04120925503272774]
step  23 :  [-0.019854878198613556]
step  24 :  [-0.039047756107108644]
episode  251 : steps 25 , return [-14.71]
step  0 :  [-1.6998737769124523]
step  1 :  [-1.6591873399813224]
step  2 :  [-1.6111460689903858]
step  3 :  [-1.5634956562457254]
step  4 :  [-1.5231100906697357]
step  5 :  [-1.452849553973928]
step  6 :  [-1.3553674355840655]
step  7 :  [-1.235148021926809]
step  8 :  [-1.096742194010156]
step  9 :  [-0.9441772827423592]
step  10 :  [-0.7808571764748999]
step  11 :  [-0.6097120206008996]
step  12 :  [-0.4336890259515382]
step  13 :  [-0.25792146995283516]
step  14 :  [-0.11394675857548216]
step  15 :  [-0.0519615009752925]
step  16 :  [-0.05823250537520529]
step  17 :  [-0.07077219151267855]
step  18 :  [-0.07047946281040332]
step  19 :  [-0.08138325796685292]
step  20 :  [-0.06235168881159561]
step  21 :  [-0.02459387628953716]
step  22 :  [-0.015781278668273765]
step  23 :  [-0.045187058567153965]
step  24 :  [-0.054247357839416574]
episode  252 : steps 25 , return [-16.87]
step  0 :  [-1.6919297932655117]
step  1 :  [-1.6593162131420183]
step  2 :  [-1.6224640502035044]
step  3 :  [-1.5886741355663814]
step  4 :  [-1.5212185129890476]
step  5 :  [-1.4246638966496086]
step  6 :  [-1.3044259906290332]
step  7 :  [-1.16549772187529]
step  8 :  [-1.0120874312200772]
step  9 :  [-0.8476070848942423]
step  10 :  [-0.6747976298487434]
step  11 :  [-0.49594957746296076]
step  12 :  [-0.31345962382878445]
step  13 :  [-0.13405001857823556]
step  14 :  [-0.07061144061486677]
step  15 :  [-0.04384776284821811]
step  16 :  [-0.043992280507255566]
step  17 :  [-0.043178256566406566]
step  18 :  [-0.05087753493795978]
step  19 :  [-0.04473636549691575]
step  20 :  [-0.046222691082449266]
step  21 :  [-0.030976396462261174]
step  22 :  [-0.0439190087313492]
step  23 :  [-0.017171997034601073]
step  24 :  [-0.03304380373814605]
episode  253 : steps 25 , return [-15.92]
step  0 :  [-1.6001559994099963]
step  1 :  [-1.5663429954026942]
step  2 :  [-1.5282123147183602]
step  3 :  [-1.4934553657608207]
step  4 :  [-1.425729364549794]
step  5 :  [-1.329205359046911]
step  6 :  [-1.209133026589221]
step  7 :  [-1.070440221166509]
step  8 :  [-0.9173219677106381]
step  9 :  [-0.7532179638900736]
step  10 :  [-0.5809664244761836]
step  11 :  [-0.4031798898284025]
step  12 :  [-0.22388240558561343]
step  13 :  [-0.07885202483102396]
step  14 :  [-0.024204868599669745]
step  15 :  [-0.024473389032229797]
step  16 :  [-0.035476889123325146]
step  17 :  [-0.01561233427978563]
step  18 :  [-0.035692225490872406]
step  19 :  [-0.09446848185678632]
step  20 :  [-0.09574788007228698]
step  21 :  [-0.07530698544103533]
step  22 :  [-0.07836767679230973]
step  23 :  [-0.06767517246595023]
step  24 :  [-0.0696762937403829]
episode  254 : steps 25 , return [-14.8]
step  0 :  [-1.6967166199886679]
step  1 :  [-1.655270340336958]
step  2 :  [-1.6061829306203883]
step  3 :  [-1.557247790029381]
step  4 :  [-1.5153969637999933]
step  5 :  [-1.444115020568926]
step  6 :  [-1.3458838648669378]
step  7 :  [-1.2250813367383009]
step  8 :  [-1.0861869127098713]
step  9 :  [-0.9331717751385954]
step  10 :  [-0.7693818934749146]
step  11 :  [-0.5976618485265697]
step  12 :  [-0.42077778449277276]
step  13 :  [-0.2433422337651908]
step  14 :  [-0.09879225601080684]
step  15 :  [-0.0381123461853336]
step  16 :  [-0.050392457753718554]
step  17 :  [-0.05624051548121907]
step  18 :  [-0.040341019501808906]
step  19 :  [-0.025069576218748214]
step  20 :  [-0.01631899222616646]
step  21 :  [-0.025217897157411982]
step  22 :  [-0.03503845672451741]
step  23 :  [-0.04864800936596312]
step  24 :  [-0.05234140890905582]
episode  255 : steps 25 , return [-16.58]
step  0 :  [-1.6559222065391077]
step  1 :  [-1.626867016989263]
step  2 :  [-1.5950366878712094]
step  3 :  [-1.527253222348381]
step  4 :  [-1.4294765412893855]
step  5 :  [-1.3077542339400539]
step  6 :  [-1.1673553202538915]
step  7 :  [-1.0116935205810125]
step  8 :  [-0.8476059101812105]
step  9 :  [-0.6767468140280838]
step  10 :  [-0.5012043738138391]
step  11 :  [-0.3245367976844148]
step  12 :  [-0.1830898565378508]
step  13 :  [-0.034395999809408835]
step  14 :  [-0.04294795907440982]
step  15 :  [-0.04144039495015916]
step  16 :  [-0.018775525348924637]
step  17 :  [-0.054853266353019264]
step  18 :  [-0.06405003468144727]
step  19 :  [-0.03379376311166613]
step  20 :  [-0.05023679900147478]
step  21 :  [-0.09319843721706701]
step  22 :  [-0.11085432947153177]
step  23 :  [-0.11455139619474733]
step  24 :  [-0.08575649278558095]
episode  256 : steps 25 , return [-14.6]
step  0 :  [-1.4751084638202883]
step  1 :  [-1.443566276387901]
step  2 :  [-1.4091548449503928]
step  3 :  [-1.3401786637076198]
step  4 :  [-1.2418496654753686]
step  5 :  [-1.1775415742028665]
step  6 :  [-1.0862643024550211]
step  7 :  [-0.9726026558655346]
step  8 :  [-0.8410799655290346]
step  9 :  [-0.6963215062279804]
step  10 :  [-0.5433022869502264]
step  11 :  [-0.38929153395055605]
step  12 :  [-0.2528629474530907]
step  13 :  [-0.15315295380378488]
step  14 :  [-0.12146050796467044]
step  15 :  [-0.09949106015334527]
step  16 :  [-0.034162721525415884]
step  17 :  [-0.03653273769880804]
step  18 :  [-0.02348225956177243]
step  19 :  [-0.021673173755424813]
step  20 :  [-0.04927711742214225]
step  21 :  [-0.03512442892453984]
step  22 :  [-0.050212030998588675]
step  23 :  [-0.04973775093962374]
step  24 :  [-0.09414788684301817]
episode  257 : steps 25 , return [-13.64]
step  0 :  [-1.5191577707997026]
step  1 :  [-1.4836195066792501]
step  2 :  [-1.4434676690048625]
step  3 :  [-1.4068156234576767]
step  4 :  [-1.3381600967760765]
step  5 :  [-1.2411772048493486]
step  6 :  [-1.124641505442095]
step  7 :  [-0.9890651798173336]
step  8 :  [-0.8386682331101596]
step  9 :  [-0.6770463714494349]
step  10 :  [-0.5073801271636258]
step  11 :  [-0.33328406567020613]
step  12 :  [-0.16459552025360424]
step  13 :  [-0.043974398145280695]
step  14 :  [-0.052707781833838334]
step  15 :  [-0.042712248111387685]
step  16 :  [-0.032349896587240475]
step  17 :  [-0.05959328701902131]
step  18 :  [-0.05494851165003216]
step  19 :  [-0.028772185911441803]
step  20 :  [-0.06950606029904118]
step  21 :  [-0.0996746233004704]
step  22 :  [-0.08294289607433963]
step  23 :  [-0.051390283559528974]
step  24 :  [-0.05221630479798169]
episode  258 : steps 25 , return [-13.74]
step  0 :  [-1.7025070043215895]
step  1 :  [-1.6740679866390042]
step  2 :  [-1.6428931259155]
step  3 :  [-1.5754305377356161]
step  4 :  [-1.4778147352189395]
step  5 :  [-1.3561736128196544]
step  6 :  [-1.215814539944533]
step  7 :  [-1.0762447537168827]
step  8 :  [-0.9230048481345784]
step  9 :  [-0.7590319320517693]
step  10 :  [-0.5868503189751304]
step  11 :  [-0.40872640060146]
step  12 :  [-0.22759745846281781]
step  13 :  [-0.08517454346281]
step  14 :  [-0.04003371634802852]
step  15 :  [-0.009387602161369496]
step  16 :  [-0.026221881420339297]
step  17 :  [-0.02779534062094897]
step  18 :  [-0.03936663286211634]
step  19 :  [-0.048700684485469464]
step  20 :  [-0.052131171439362245]
step  21 :  [-0.028384701787570788]
step  22 :  [-0.02879832512112192]
step  23 :  [-0.03422399874935366]
step  24 :  [-0.015628328935589766]
episode  259 : steps 25 , return [-15.06]
step  0 :  [-1.5747430145724597]
step  1 :  [-1.540243113591167]
step  2 :  [-1.501274655777904]
step  3 :  [-1.4656670737975508]
step  4 :  [-1.3974633099157003]
step  5 :  [-1.3006546012138192]
step  6 :  [-1.1804024281325642]
step  7 :  [-1.0415891514541484]
step  8 :  [-0.8883855227838506]
step  9 :  [-0.7242195128767903]
step  10 :  [-0.5519318793476443]
step  11 :  [-0.37419004360415686]
step  12 :  [-0.19557659458416712]
step  13 :  [-0.11904255192328654]
step  14 :  [-0.03926197737091405]
step  15 :  [-0.03161663849615411]
step  16 :  [-0.03486753588325312]
step  17 :  [-0.040562585609965354]
step  18 :  [-0.0568551818181823]
step  19 :  [-0.04425350094922096]
step  20 :  [-0.018719365100129903]
step  21 :  [-0.05045196860647037]
step  22 :  [-0.058244412550495665]
step  23 :  [-0.03834274292114733]
step  24 :  [-0.0448157927972946]
episode  260 : steps 25 , return [-14.31]
step  0 :  [-1.505628576276762]
step  1 :  [-1.496272010530056]
step  2 :  [-1.4735851497441421]
step  3 :  [-1.4474113655272816]
step  4 :  [-1.3875084323132]
step  5 :  [-1.2973739859371216]
step  6 :  [-1.2062733685633587]
step  7 :  [-1.1196059691524463]
step  8 :  [-1.0101038551770967]
step  9 :  [-0.8818891316640961]
step  10 :  [-0.7393816884417801]
step  11 :  [-0.5871975407656461]
step  12 :  [-0.43133831617535906]
step  13 :  [-0.2847919168178682]
step  14 :  [-0.16679829221647638]
step  15 :  [-0.06412346082014116]
step  16 :  [-0.035614057454218896]
step  17 :  [-0.055303705367235896]
step  18 :  [-0.024782865183920953]
step  19 :  [-0.022487139856725076]
step  20 :  [-0.03143259079997121]
step  21 :  [-0.05025357813979104]
step  22 :  [-0.028896648995883473]
step  23 :  [-0.04508155101025743]
step  24 :  [-0.02940826948476368]
episode  261 : steps 25 , return [-15.42]
step  0 :  [-1.7635494493765516]
step  1 :  [-1.7241160890657612]
step  2 :  [-1.6775953188826722]
step  3 :  [-1.6314735566753529]
step  4 :  [-1.5923406260653563]
step  5 :  [-1.522612419821203]
step  6 :  [-1.42531983492359]
step  7 :  [-1.3051169653283858]
step  8 :  [-1.166627917169346]
step  9 :  [-1.0139013092903082]
step  10 :  [-0.8503197167345158]
step  11 :  [-0.6787190366194706]
step  12 :  [-0.5017174898840828]
step  13 :  [-0.3228312783499535]
step  14 :  [-0.1547133423257411]
step  15 :  [-0.05450054424373808]
step  16 :  [-0.07749780585777445]
step  17 :  [-0.06769207099204926]
step  18 :  [-0.06657876007678064]
step  19 :  [-0.05708118009700217]
step  20 :  [-0.061313935213692175]
step  21 :  [-0.05130838304916912]
step  22 :  [-0.01825999738006918]
step  23 :  [-0.04277999744276145]
step  24 :  [-0.04632872314207782]
episode  262 : steps 25 , return [-17.87]
step  0 :  [-1.7340989448975404]
step  1 :  [-1.7036903605075324]
step  2 :  [-1.6697027483892621]
step  3 :  [-1.639157491729203]
step  4 :  [-1.573831207430044]
step  5 :  [-1.4787606394944672]
step  6 :  [-1.3596230033036656]
step  7 :  [-1.221568804484347]
step  8 :  [-1.068913618203076]
step  9 :  [-0.9051586294657069]
step  10 :  [-0.7331453038415325]
step  11 :  [-0.5553238705246869]
step  12 :  [-0.374417450249889]
step  13 :  [-0.1970967034284385]
step  14 :  [-0.05491783275671098]
step  15 :  [-0.02194175685751618]
step  16 :  [-0.02062200957461389]
step  17 :  [-0.01621588261908892]
step  18 :  [-0.01181249653710626]
step  19 :  [-0.018541348493222556]
step  20 :  [-0.009664680329993302]
step  21 :  [-0.021300388031486]
step  22 :  [-0.01018416162431322]
step  23 :  [-0.0231502658567767]
step  24 :  [-0.01099952799479525]
episode  263 : steps 25 , return [-16.43]
step  0 :  [-1.6597470593965942]
step  1 :  [-1.6214359125648976]
step  2 :  [-1.5768415905818867]
step  3 :  [-1.533716100964705]
step  4 :  [-1.4598852152982864]
step  5 :  [-1.3588177265975303]
step  6 :  [-1.2352751662043304]
step  7 :  [-1.1291984288397259]
step  8 :  [-1.0022285924398366]
step  9 :  [-0.8593342076010879]
step  10 :  [-0.7041551648446789]
step  11 :  [-0.5401797600316689]
step  12 :  [-0.37160285944039123]
step  13 :  [-0.20864329602563036]
step  14 :  [-0.08190032012368315]
step  15 :  [-0.04297583807900492]
step  16 :  [-0.020096800348970226]
step  17 :  [-0.05865687117535749]
step  18 :  [-0.11033746759274708]
step  19 :  [-0.11008004737101203]
step  20 :  [-0.09401930186703669]
step  21 :  [-0.06276774855067115]
step  22 :  [-0.03366676786000983]
step  23 :  [-0.06274920250807295]
step  24 :  [-0.03684965262518381]
episode  264 : steps 25 , return [-15.98]
step  0 :  [-1.4222589801753824]
step  1 :  [-1.4061250972955848]
step  2 :  [-1.3833181055931496]
step  3 :  [-1.3628794426968491]
step  4 :  [-1.3067273625526195]
step  5 :  [-1.219407396244148]
step  6 :  [-1.106740931489975]
step  7 :  [-0.9742261407138613]
step  8 :  [-0.8266330484656972]
step  9 :  [-0.6681128749870354]
step  10 :  [-0.5027631454960141]
step  11 :  [-0.3366551121297321]
step  12 :  [-0.19826380100228064]
step  13 :  [-0.0758459698438083]
step  14 :  [-0.0027334197353388566]
step  15 :  [-0.008711381681267791]
step  16 :  [-0.039102552713538165]
step  17 :  [-0.07985659451153382]
step  18 :  [-0.08417574586024769]
step  19 :  [-0.053796681421308154]
step  20 :  [-0.044984731466643786]
step  21 :  [-0.0362445232934998]
step  22 :  [-0.05618365054113045]
step  23 :  [-0.05156175180607794]
step  24 :  [-0.04284333216444132]
episode  265 : steps 25 , return [-13.29]
step  0 :  [-1.629071280661062]
step  1 :  [-1.6004021239427544]
step  2 :  [-1.569212264752244]
step  3 :  [-1.5019403904552384]
step  4 :  [-1.4045534533161157]
step  5 :  [-1.2831167087838946]
step  6 :  [-1.145769049836728]
step  7 :  [-0.9906568751011893]
step  8 :  [-0.8258771242703322]
step  9 :  [-0.6535035420209396]
step  10 :  [-0.47556190609224613]
step  11 :  [-0.29467339897289935]
step  12 :  [-0.15279386382824367]
step  13 :  [-0.06166073660294968]
step  14 :  [-0.059236132025759676]
step  15 :  [-0.018496454274106636]
step  16 :  [-0.04366179703660288]
step  17 :  [-0.06170023348432073]
step  18 :  [-0.06993900913511876]
step  19 :  [-0.03276187208134997]
step  20 :  [-0.05562198186362439]
step  21 :  [-0.038054876985913394]
step  22 :  [-0.044266731084058014]
step  23 :  [-0.033000230060832296]
step  24 :  [-0.03642039583655298]
episode  266 : steps 25 , return [-14.08]
step  0 :  [-1.5579269236531312]
step  1 :  [-1.5133773258288414]
step  2 :  [-1.4604767394310116]
step  3 :  [-1.407648317353456]
step  4 :  [-1.3625511081711117]
step  5 :  [-1.2898725542220688]
step  6 :  [-1.2144086542197268]
step  7 :  [-1.117049475943128]
step  8 :  [-0.9975385267748104]
step  9 :  [-0.8605981288221907]
step  10 :  [-0.7106492438638455]
step  11 :  [-0.5520674222779642]
step  12 :  [-0.3906460710785632]
step  13 :  [-0.24082377336674982]
step  14 :  [-0.12640779969558277]
step  15 :  [-0.08776095633379846]
step  16 :  [-0.0661032040433866]
step  17 :  [-0.059852461521001515]
step  18 :  [-0.06658897539235088]
step  19 :  [-0.0892026358933864]
step  20 :  [-0.056679871855813226]
step  21 :  [-0.019062385492909176]
step  22 :  [-0.07407138900740552]
step  23 :  [-0.06585066630711969]
step  24 :  [-0.07951459557924483]
episode  267 : steps 25 , return [-15.47]
step  0 :  [-1.759976413077796]
step  1 :  [-1.7227699144795428]
step  2 :  [-1.6793423533484073]
step  3 :  [-1.6370680693270463]
step  4 :  [-1.563430697415483]
step  5 :  [-1.4623026669731767]
step  6 :  [-1.338619671145205]
step  7 :  [-1.1970464106603311]
step  8 :  [-1.0580036525383079]
step  9 :  [-0.9071405286101677]
step  10 :  [-0.7466885720196068]
step  11 :  [-0.5792503684809508]
step  12 :  [-0.40837318647733994]
step  13 :  [-0.24271082298858132]
step  14 :  [-0.11058182571642315]
step  15 :  [-0.058791354982789194]
step  16 :  [-0.04764107157666116]
step  17 :  [-0.09243568362140742]
step  18 :  [-0.08389582275167223]
step  19 :  [-0.028301057082956653]
step  20 :  [-0.014208120556178138]
step  21 :  [-0.011860356928385407]
step  22 :  [-0.041478701131868405]
step  23 :  [-0.03739507433362706]
step  24 :  [-0.07130725889480526]
episode  268 : steps 25 , return [-16.9]
step  0 :  [-1.6877626370668215]
step  1 :  [-1.656390721685611]
step  2 :  [-1.6212594428537408]
step  3 :  [-1.589599799919964]
step  4 :  [-1.523673927501306]
step  5 :  [-1.4282653543074082]
step  6 :  [-1.3089300704000484]
step  7 :  [-1.1707583594538258]
step  8 :  [-1.0180364072098576]
step  9 :  [-0.8542555452403217]
step  10 :  [-0.6822698885358083]
step  11 :  [-0.504601749013969]
step  12 :  [-0.3243434927393407]
step  13 :  [-0.15173060995261]
step  14 :  [-0.09604484708875527]
step  15 :  [-0.05518812979492941]
step  16 :  [-0.03639212329558841]
step  17 :  [-0.0495765399941748]
step  18 :  [-0.03715215682602353]
step  19 :  [-0.047117308309925304]
step  20 :  [-0.038261992633486966]
step  21 :  [-0.04599648118915878]
step  22 :  [-0.05981076101974277]
step  23 :  [-0.06179307896920352]
step  24 :  [-0.0723147685805024]
episode  269 : steps 25 , return [-16.12]
step  0 :  [-1.697286689120702]
step  1 :  [-1.662711442351191]
step  2 :  [-1.6231394451385273]
step  3 :  [-1.5859800856044093]
step  4 :  [-1.5161312627210235]
step  5 :  [-1.417815440556784]
step  6 :  [-1.2962287287720984]
step  7 :  [-1.156216859815018]
step  8 :  [-1.0018787257936344]
step  9 :  [-0.8365272871093556]
step  10 :  [-0.6627794028613516]
step  11 :  [-0.48268890242659074]
step  12 :  [-0.29793023787000456]
step  13 :  [-0.11066411432391984]
step  14 :  [-0.030534826407729206]
step  15 :  [-0.055231120148156614]
step  16 :  [-0.07609063127253927]
step  17 :  [-0.06192157048545735]
step  18 :  [-0.013167851394277811]
step  19 :  [-0.017901947042503127]
step  20 :  [-0.04731689132712895]
step  21 :  [-0.039510903517530116]
step  22 :  [-0.040737375378435525]
step  23 :  [-0.009831639939429345]
step  24 :  [-0.05164674533493159]
episode  270 : steps 25 , return [-15.79]
step  0 :  [-1.4643302528048647]
step  1 :  [-1.4314714492752016]
step  2 :  [-1.392214318540712]
step  3 :  [-1.355278920287739]
step  4 :  [-1.286906769897453]
step  5 :  [-1.2216771539174645]
step  6 :  [-1.1408300468655577]
step  7 :  [-1.034234088632566]
step  8 :  [-0.9071603584156196]
step  9 :  [-0.7645381880726256]
step  10 :  [-0.6109938723848871]
step  11 :  [-0.45176227634850685]
step  12 :  [-0.29662172269666]
step  13 :  [-0.16786101529072023]
step  14 :  [-0.04433869082754169]
step  15 :  [-0.01977304596923954]
step  16 :  [-0.027978919348188122]
step  17 :  [-0.014245580050008972]
step  18 :  [-0.012942781536628383]
step  19 :  [-0.02125356354339298]
step  20 :  [-0.004565108754355398]
step  21 :  [-0.026529841606663884]
step  22 :  [-0.0011988600011603697]
step  23 :  [-0.029684070053782548]
step  24 :  [-0.07393300815237008]
episode  271 : steps 25 , return [-13.8]
step  0 :  [-1.4817448150405619]
step  1 :  [-1.4431518431761368]
step  2 :  [-1.3989317756555029]
step  3 :  [-1.3575365634281633]
step  4 :  [-1.285755743139979]
step  5 :  [-1.2240438938596563]
step  6 :  [-1.1561769662125505]
step  7 :  [-1.0600441702086685]
step  8 :  [-0.9411814593349164]
step  9 :  [-0.8048898836232184]
step  10 :  [-0.6560868143389336]
step  11 :  [-0.49997242557736243]
step  12 :  [-0.3447628431151601]
step  13 :  [-0.213934211846288]
step  14 :  [-0.08864050523160986]
step  15 :  [-0.04125887600413584]
step  16 :  [-0.03540215954711882]
step  17 :  [-0.050425979985849384]
step  18 :  [-0.0364731263396812]
step  19 :  [-0.043884945671056635]
step  20 :  [-0.03962437240331994]
step  21 :  [-0.042140680352978126]
step  22 :  [-0.0333257098298278]
step  23 :  [-0.025488129066284452]
step  24 :  [-0.012722308136566924]
episode  272 : steps 25 , return [-14.32]
step  0 :  [-1.5981250089927943]
step  1 :  [-1.5645380947818177]
step  2 :  [-1.526727947247744]
step  3 :  [-1.4923787038341776]
step  4 :  [-1.4249512034987857]
step  5 :  [-1.3286543708195366]
step  6 :  [-1.208763877335599]
step  7 :  [-1.0702266680011467]
step  8 :  [-0.9172543352032871]
step  9 :  [-0.7533057355662502]
step  10 :  [-0.5812511952827067]
step  11 :  [-0.40378279566418995]
step  12 :  [-0.26522742448564907]
step  13 :  [-0.16785910180901753]
step  14 :  [-0.06553927723318845]
step  15 :  [-0.06554691940010376]
step  16 :  [-0.07431835254825507]
step  17 :  [-0.03734960931611124]
step  18 :  [-0.056898286009141104]
step  19 :  [-0.06142315310927209]
step  20 :  [-0.0703567193764037]
step  21 :  [-0.08310977218333818]
step  22 :  [-0.08321176812361092]
step  23 :  [-0.0380280708947136]
step  24 :  [-0.05681679947350108]
episode  273 : steps 25 , return [-15.]
step  0 :  [-1.801805997986611]
step  1 :  [-1.7668178958188263]
step  2 :  [-1.7263079263011887]
step  3 :  [-1.687399596241181]
step  4 :  [-1.6159325838730643]
step  5 :  [-1.5162498344187603]
step  6 :  [-1.3935467854690222]
step  7 :  [-1.2526345889942392]
step  8 :  [-1.0989361654376724]
step  9 :  [-0.9338321677755788]
step  10 :  [-0.7602816944901135]
step  11 :  [-0.5802855350485046]
step  12 :  [-0.39539981254136375]
step  13 :  [-0.20685317120232877]
step  14 :  [-0.11532515256975971]
step  15 :  [-0.07122614300957865]
step  16 :  [-0.037945251427809946]
step  17 :  [-0.02626692682435741]
step  18 :  [-0.022296485096656635]
step  19 :  [-0.029764570589992264]
step  20 :  [-0.01168745662653583]
step  21 :  [-0.052105268474406656]
step  22 :  [-0.049429509811235804]
step  23 :  [-0.09742210427544515]
step  24 :  [-0.08350825063100152]
episode  274 : steps 25 , return [-17.33]
step  0 :  [-1.5372469257069517]
step  1 :  [-1.5066364771930054]
step  2 :  [-1.473199299532716]
step  3 :  [-1.4046767682115422]
step  4 :  [-1.3065605106156777]
step  5 :  [-1.1934741740808104]
step  6 :  [-1.0774726842394855]
step  7 :  [-0.9454050144706401]
step  8 :  [-0.8001774416412317]
step  9 :  [-0.6452388185282151]
step  10 :  [-0.48492819199274345]
step  11 :  [-0.32732309350635574]
step  12 :  [-0.19703171220541438]
step  13 :  [-0.0724494431446946]
step  14 :  [-0.033109306837084844]
step  15 :  [-0.012900420657161267]
step  16 :  [-0.04610181975789078]
step  17 :  [-0.03133416805541399]
step  18 :  [-0.03427394493314796]
step  19 :  [-0.013492583625709608]
step  20 :  [-0.04796961784265062]
step  21 :  [-0.025817862661918455]
step  22 :  [-0.04068076765586312]
step  23 :  [-0.024845625690233804]
step  24 :  [-0.03764764872784991]
episode  275 : steps 25 , return [-13.32]
step  0 :  [-1.6763993743659285]
step  1 :  [-1.643410606982746]
step  2 :  [-1.6061029230492454]
step  3 :  [-1.5718518636604508]
step  4 :  [-1.5041366635417501]
step  5 :  [-1.407427341680338]
step  6 :  [-1.2870919872000988]
step  7 :  [-1.1480988132841725]
step  8 :  [-0.994642724675418]
step  9 :  [-0.8301283752689623]
step  10 :  [-0.6572941175080358]
step  11 :  [-0.4784377856958879]
step  12 :  [-0.2960239344283816]
step  13 :  [-0.11796931461956613]
step  14 :  [-0.04063488618907679]
step  15 :  [-0.09672468582885956]
step  16 :  [-0.0976911263582278]
step  17 :  [-0.07066941722892267]
step  18 :  [-0.02972489379876312]
step  19 :  [-0.007483512928959754]
step  20 :  [-0.03709707419891228]
step  21 :  [-0.03191964606752752]
step  22 :  [-0.020889709741168595]
step  23 :  [-0.034652302715998444]
step  24 :  [-0.05344978990291021]
episode  276 : steps 25 , return [-15.74]
step  0 :  [-1.4304285546963151]
step  1 :  [-1.3987553121482632]
step  2 :  [-1.3644010753838667]
step  3 :  [-1.2956232136820747]
step  4 :  [-1.2290343854451904]
step  5 :  [-1.1813253445639011]
step  6 :  [-1.1008223785080062]
step  7 :  [-0.9935862619043181]
step  8 :  [-0.8655488746378496]
step  9 :  [-0.7219634192758171]
step  10 :  [-0.5676849435646738]
step  11 :  [-0.4084209575863151]
step  12 :  [-0.25634279184856285]
step  13 :  [-0.13390428375087823]
step  14 :  [-0.08555094163181041]
step  15 :  [-0.0695054373880732]
step  16 :  [-0.043569471036063324]
step  17 :  [-0.0335377178953066]
step  18 :  [-0.04056210289870833]
step  19 :  [-0.04589706448194267]
step  20 :  [-0.05656469874968851]
step  21 :  [-0.05776748301084559]
step  22 :  [-0.016289767926314917]
step  23 :  [-0.02587121602073125]
step  24 :  [-0.014390965949845198]
episode  277 : steps 25 , return [-13.44]
step  0 :  [-1.673006279232248]
step  1 :  [-1.630111316924145]
step  2 :  [-1.5790882955748489]
step  3 :  [-1.5278759315326809]
step  4 :  [-1.483577135851055]
step  5 :  [-1.4107052821536863]
step  6 :  [-1.311379775512608]
step  7 :  [-1.1897745079738673]
step  8 :  [-1.0502460480116371]
step  9 :  [-0.8966813048150492]
step  10 :  [-0.7323539911487558]
step  11 :  [-0.5600217665948715]
step  12 :  [-0.38230618715392367]
step  13 :  [-0.20367945300499923]
step  14 :  [-0.058999601681880315]
step  15 :  [-0.010280264302444308]
step  16 :  [-0.035147185902453824]
step  17 :  [-0.017725705733571455]
step  18 :  [-0.03516406065668244]
step  19 :  [-0.027338213094432667]
step  20 :  [-0.033851779452638904]
step  21 :  [-0.055510111115992994]
step  22 :  [-0.04354841629625574]
step  23 :  [-0.060184961252511125]
step  24 :  [-0.08755970980941809]
episode  278 : steps 25 , return [-16.1]
step  0 :  [-1.5864093263293706]
step  1 :  [-1.5604786570258375]
step  2 :  [-1.5332156374996593]
step  3 :  [-1.4687822623112987]
step  4 :  [-1.3734747391538398]
step  5 :  [-1.2535794918659122]
step  6 :  [-1.1145264229238623]
step  7 :  [-0.9607339991353725]
step  8 :  [-0.7956936361597697]
step  9 :  [-0.6221246869231395]
step  10 :  [-0.44214589348447425]
step  11 :  [-0.25750805744526806]
step  12 :  [-0.12203252045737582]
step  13 :  [-0.018823063418718037]
step  14 :  [-0.01372425107232737]
step  15 :  [-0.05250197085689171]
step  16 :  [-0.05414943396806646]
step  17 :  [-0.013183121796993219]
step  18 :  [-0.04646265261280587]
step  19 :  [-0.04403679361398588]
step  20 :  [-0.007993267431710452]
step  21 :  [-0.050123458512361524]
step  22 :  [-0.07454405609335311]
step  23 :  [-0.055942038483227194]
step  24 :  [-0.02411541519416534]
episode  279 : steps 25 , return [-13.55]
step  0 :  [-1.559928259332732]
step  1 :  [-1.521117437720423]
step  2 :  [-1.476235385758255]
step  3 :  [-1.4334230151125493]
step  4 :  [-1.3602552478725478]
step  5 :  [-1.2598836104311495]
step  6 :  [-1.178064027188412]
step  7 :  [-1.0727775324622622]
step  8 :  [-0.9478638043326668]
step  9 :  [-0.8074218611750267]
step  10 :  [-0.6556081780956114]
step  11 :  [-0.49707122695520145]
step  12 :  [-0.3394952894926056]
step  13 :  [-0.2073838681563217]
step  14 :  [-0.13085205766267724]
step  15 :  [-0.12175010342583874]
step  16 :  [-0.09785248456407751]
step  17 :  [-0.06315429020369703]
step  18 :  [-0.06756458167573881]
step  19 :  [-0.07743120620268891]
step  20 :  [-0.10151267911976193]
step  21 :  [-0.06986409371704973]
step  22 :  [-0.07168877804751332]
step  23 :  [-0.052974860547695526]
step  24 :  [-0.05108429796649247]
episode  280 : steps 25 , return [-15.22]
step  0 :  [-1.5590962773859418]
step  1 :  [-1.5313950182689007]
step  2 :  [-1.501841825610075]
step  3 :  [-1.435906275545157]
step  4 :  [-1.339564884878197]
step  5 :  [-1.2189278754299606]
step  6 :  [-1.0848140371880763]
step  7 :  [-0.9352067127137539]
step  8 :  [-0.7736341669002565]
step  9 :  [-0.6029572105083877]
step  10 :  [-0.4255412722925995]
step  11 :  [-0.24379538888398927]
step  12 :  [-0.10435531967091677]
step  13 :  [-0.06431230336408912]
step  14 :  [-0.01668325386046541]
step  15 :  [-0.03192388802210264]
step  16 :  [-0.0536243295616285]
step  17 :  [-0.05750184250006288]
step  18 :  [-0.09201752701384505]
step  19 :  [-0.09726414650571924]
step  20 :  [-0.0711391421033078]
step  21 :  [-0.017739484362015764]
step  22 :  [-0.027255202052256695]
step  23 :  [-0.03605756471535007]
step  24 :  [-0.017978299336795917]
episode  281 : steps 25 , return [-13.34]
step  0 :  [-1.5936002208769444]
step  1 :  [-1.5544413308455258]
step  2 :  [-1.508932284975135]
step  3 :  [-1.4651049198225872]
step  4 :  [-1.391079490295875]
step  5 :  [-1.2900214210378238]
step  6 :  [-1.1937199633746736]
step  7 :  [-1.0898783935006149]
step  8 :  [-0.9676469785446676]
step  9 :  [-0.8303298081056677]
step  10 :  [-0.6818303435726835]
step  11 :  [-0.5268614302856957]
step  12 :  [-0.373258832846819]
step  13 :  [-0.2431126548825884]
step  14 :  [-0.15617334811629238]
step  15 :  [-0.1340319604885144]
step  16 :  [-0.11144648315355006]
step  17 :  [-0.04679494206331937]
step  18 :  [-0.04563445069561151]
step  19 :  [-0.07321063332040972]
step  20 :  [-0.06172693495471068]
step  21 :  [-0.030358028940739617]
step  22 :  [-0.022676183047154252]
step  23 :  [-0.03496775868360865]
step  24 :  [-0.015292626321995932]
episode  282 : steps 25 , return [-15.44]
step  0 :  [-1.5564853848243703]
step  1 :  [-1.5362441871950618]
step  2 :  [-1.502185882643628]
step  3 :  [-1.4639198175185677]
step  4 :  [-1.4296824194351738]
step  5 :  [-1.365180486239255]
step  6 :  [-1.2724557680432338]
step  7 :  [-1.1621645492025208]
step  8 :  [-1.0315464808343793]
step  9 :  [-0.8849578804597277]
step  10 :  [-0.7261351508779628]
step  11 :  [-0.5582912233132264]
step  12 :  [-0.38462196873576765]
step  13 :  [-0.2110122291629289]
step  14 :  [-0.06967106225254424]
step  15 :  [-0.008925474429570694]
step  16 :  [-0.037258269585755954]
step  17 :  [-0.03616305155944978]
step  18 :  [-0.004003618426925407]
step  19 :  [-0.04806038257658932]
step  20 :  [-0.05437552206915961]
step  21 :  [-0.017794184229890028]
step  22 :  [-0.043763016023720513]
step  23 :  [-0.023406487288459725]
step  24 :  [-0.04571737118152027]
episode  283 : steps 25 , return [-15.47]
step  0 :  [-1.4732920779565484]
step  1 :  [-1.441975149279481]
step  2 :  [-1.4078834858662892]
step  3 :  [-1.339130075986912]
step  4 :  [-1.2409571804749295]
step  5 :  [-1.1735459731878766]
step  6 :  [-1.078518748785037]
step  7 :  [-0.961650292983361]
step  8 :  [-0.8274653200974806]
step  9 :  [-0.6805094642686162]
step  10 :  [-0.5256826863634695]
step  11 :  [-0.37037696983661034]
step  12 :  [-0.23991947721491563]
step  13 :  [-0.11752386206922184]
step  14 :  [-0.05612534543007168]
step  15 :  [-0.024842685202020716]
step  16 :  [-0.052003095582284144]
step  17 :  [-0.03188999436667571]
step  18 :  [-0.04994892038824392]
step  19 :  [-0.038772576635990076]
step  20 :  [-0.01839019157233601]
step  21 :  [-0.013454234749700613]
step  22 :  [-0.046712640569687276]
step  23 :  [-0.04007219061958285]
step  24 :  [-0.043797289218632726]
episode  284 : steps 25 , return [-13.29]
step  0 :  [-1.4596375729159938]
step  1 :  [-1.4233940422638909]
step  2 :  [-1.3825553194882076]
step  3 :  [-1.345534377018648]
step  4 :  [-1.2769515273115084]
step  5 :  [-1.2036921535461649]
step  6 :  [-1.1030208117246738]
step  7 :  [-0.9799507247485019]
step  8 :  [-0.8395185917443725]
step  9 :  [-0.686125715073362]
step  10 :  [-0.5238683865696531]
step  11 :  [-0.3578866042292006]
step  12 :  [-0.22119717415671036]
step  13 :  [-0.07592280401631207]
step  14 :  [-0.026625882550784116]
step  15 :  [-0.010617916392955395]
step  16 :  [-0.0487371473664756]
step  17 :  [-0.027818955927893282]
step  18 :  [-0.06148267136241461]
step  19 :  [-0.03753329578735751]
step  20 :  [-0.06868941833644483]
step  21 :  [-0.0995961061428809]
step  22 :  [-0.11241972184375948]
step  23 :  [-0.07447687903387186]
step  24 :  [-0.09557651564340539]
episode  285 : steps 25 , return [-13.54]
step  0 :  [-1.5784436706271656]
step  1 :  [-1.53683050890376]
step  2 :  [-1.4879613864174417]
step  3 :  [-1.4400497622477058]
step  4 :  [-1.4004812015627333]
step  5 :  [-1.3315867220619666]
step  6 :  [-1.2355960209749295]
step  7 :  [-1.1168864787833943]
step  8 :  [-0.9800451436920975]
step  9 :  [-0.8292407166633248]
step  10 :  [-0.6681877112994551]
step  11 :  [-0.5005850666804423]
step  12 :  [-0.3319214346076074]
step  13 :  [-0.18088693612235135]
step  14 :  [-0.09080461726645299]
step  15 :  [-0.08992328721972917]
step  16 :  [-0.06853092086547291]
step  17 :  [-0.06079298340203064]
step  18 :  [-0.05669071199546054]
step  19 :  [-0.034055471181929725]
step  20 :  [-0.050933116461034364]
step  21 :  [-0.060851844980892765]
step  22 :  [-0.034558900830282444]
step  23 :  [-0.04956546901538613]
step  24 :  [-0.0430701073984598]
episode  286 : steps 25 , return [-15.26]
step  0 :  [-1.5819275270278386]
step  1 :  [-1.5446699042269016]
step  2 :  [-1.5018517808460328]
step  3 :  [-1.4614427491162143]
step  4 :  [-1.3898366148754397]
step  5 :  [-1.2905253752201595]
step  6 :  [-1.1769351743597396]
step  7 :  [-1.0458138470426293]
step  8 :  [-0.9001429304596124]
step  9 :  [-0.743063996786438]
step  10 :  [-0.5777026083921233]
step  11 :  [-0.4077899788881368]
step  12 :  [-0.2414769471976857]
step  13 :  [-0.10717270825190608]
step  14 :  [-0.05237588888483382]
step  15 :  [-0.0437050250226401]
step  16 :  [-0.07377250871915887]
step  17 :  [-0.08516813606390623]
step  18 :  [-0.06388422634240971]
step  19 :  [-0.032521188255332824]
step  20 :  [-0.06514018183317549]
step  21 :  [-0.09225549335714381]
step  22 :  [-0.0772342521454277]
step  23 :  [-0.040118278234499725]
step  24 :  [-0.03423094755346616]
episode  287 : steps 25 , return [-14.63]
step  0 :  [-1.4268785345577029]
step  1 :  [-1.3974641218619221]
step  2 :  [-1.3662403877889346]
step  3 :  [-1.2996172536684225]
step  4 :  [-1.2210887593929505]
step  5 :  [-1.1348195397671412]
step  6 :  [-1.0238150424790458]
step  7 :  [-0.8931265635880042]
step  8 :  [-0.7474296879914389]
step  9 :  [-0.5910618939992909]
step  10 :  [-0.4288787381850798]
step  11 :  [-0.2702664353553286]
step  12 :  [-0.13983061652776954]
step  13 :  [-0.08510742663365921]
step  14 :  [-0.07773425361907516]
step  15 :  [-0.10784764146510062]
step  16 :  [-0.09603614846709363]
step  17 :  [-0.05036347731069402]
step  18 :  [-0.025386980816775352]
step  19 :  [-0.03519293975229412]
step  20 :  [-0.022217043042044932]
step  21 :  [-0.030090618768743426]
step  22 :  [-0.021231215613249046]
step  23 :  [-0.04347966737855231]
step  24 :  [-0.06903810020592858]
episode  288 : steps 25 , return [-12.6]
step  0 :  [-1.4671651981688298]
step  1 :  [-1.4385964112724667]
step  2 :  [-1.408314162383184]
step  3 :  [-1.3421900184602025]
step  4 :  [-1.2458755316253571]
step  5 :  [-1.1433135393164902]
step  6 :  [-1.0185312093834282]
step  7 :  [-0.8763231909521088]
step  8 :  [-0.7207724465340942]
step  9 :  [-0.5553517839865769]
step  10 :  [-0.38342913623426833]
step  11 :  [-0.21087959330977046]
step  12 :  [-0.0701540950154574]
step  13 :  [-0.009776834392977246]
step  14 :  [-0.026557280114705272]
step  15 :  [-0.03132933185823482]
step  16 :  [-0.035474940065477585]
step  17 :  [-0.043455462704189804]
step  18 :  [-0.04421103200359298]
step  19 :  [-0.04434078007677839]
step  20 :  [-0.02348052292134948]
step  21 :  [-0.018143002129201113]
step  22 :  [-0.05645331696555687]
step  23 :  [-0.06605085195003532]
step  24 :  [-0.038735670436258876]
episode  289 : steps 25 , return [-12.32]
step  0 :  [-1.5014418509006204]
step  1 :  [-1.4801148055665152]
step  2 :  [-1.4479227817677527]
step  3 :  [-1.4142434582677978]
step  4 :  [-1.3486149041871838]
step  5 :  [-1.2541727795279063]
step  6 :  [-1.197126397876144]
step  7 :  [-1.1231264678396786]
step  8 :  [-1.0233522645904285]
step  9 :  [-0.9026495954920561]
step  10 :  [-0.7660535440034473]
step  11 :  [-0.6186713186521401]
step  12 :  [-0.4667829705963473]
step  13 :  [-0.32245718485886365]
step  14 :  [-0.22307840555055278]
step  15 :  [-0.18220979298320414]
step  16 :  [-0.18233568714546236]
step  17 :  [-0.15835713800142429]
step  18 :  [-0.1097363117251141]
step  19 :  [-0.040570088722237746]
step  20 :  [-0.014614972421523468]
step  21 :  [-0.029288707320217974]
step  22 :  [-0.03635996717333841]
step  23 :  [-0.03633204982465168]
step  24 :  [-0.04954687418105964]
episode  290 : steps 25 , return [-15.93]
step  0 :  [-1.52999328697291]
step  1 :  [-1.4982551586586152]
step  2 :  [-1.4633014417481818]
step  3 :  [-1.4329511112998252]
step  4 :  [-1.3687269758053766]
step  5 :  [-1.275049519249333]
step  6 :  [-1.1574050429897647]
step  7 :  [-1.0209400620617617]
step  8 :  [-0.8700881765502145]
step  9 :  [-0.7086341285610116]
step  10 :  [-0.5401050470213749]
step  11 :  [-0.36905066773663137]
step  12 :  [-0.2080515215499918]
step  13 :  [-0.08807034042482251]
step  14 :  [-0.05898336958479401]
step  15 :  [-0.03362621123246001]
step  16 :  [-0.040539368430017375]
step  17 :  [-0.0820032815521748]
step  18 :  [-0.11997124555147161]
step  19 :  [-0.11080808307064771]
step  20 :  [-0.07932108326021306]
step  21 :  [-0.08768441828394742]
step  22 :  [-0.059561237941300554]
step  23 :  [-0.0782711899275566]
step  24 :  [-0.05076825625837794]
episode  291 : steps 25 , return [-14.33]
step  0 :  [-1.6635675315314287]
step  1 :  [-1.6298224517283053]
step  2 :  [-1.591524317338368]
step  3 :  [-1.556139848276358]
step  4 :  [-1.4876805272999232]
step  5 :  [-1.3904545410451077]
step  6 :  [-1.2697394102759494]
step  7 :  [-1.1304487440545796]
step  8 :  [-0.9767404102994941]
step  9 :  [-0.8119881974928905]
step  10 :  [-0.6388944974488562]
step  11 :  [-0.45969381232508383]
step  12 :  [-0.2766867132406614]
step  13 :  [-0.09764871016396107]
step  14 :  [-0.054264731800947194]
step  15 :  [-0.07567771109917694]
step  16 :  [-0.08103418850961536]
step  17 :  [-0.058765428638145906]
step  18 :  [-0.02278027077721455]
step  19 :  [-0.013855947860109257]
step  20 :  [-0.027394010591212117]
step  21 :  [-0.032799199295929726]
step  22 :  [-0.02587837487499657]
step  23 :  [-0.04052743930663745]
step  24 :  [-0.05611727420273564]
episode  292 : steps 25 , return [-15.47]
step  0 :  [-1.6238644470197652]
step  1 :  [-1.5796362891882363]
step  2 :  [-1.526928489302449]
step  3 :  [-1.4739060407078124]
step  4 :  [-1.4279352412651876]
step  5 :  [-1.354191091598385]
step  6 :  [-1.2543978723283054]
step  7 :  [-1.1461703462599127]
step  8 :  [-1.017842572466435]
step  9 :  [-0.8735807688565377]
step  10 :  [-0.7171703952817008]
step  11 :  [-0.5521249092223123]
step  12 :  [-0.38254956720337296]
step  13 :  [-0.21800553808193837]
step  14 :  [-0.08764438380074202]
step  15 :  [-0.04168648318094097]
step  16 :  [-0.021379203324838073]
step  17 :  [-0.06693578863451279]
step  18 :  [-0.11742937284052077]
step  19 :  [-0.11533727442357931]
step  20 :  [-0.08905224463208222]
step  21 :  [-0.09745026933803255]
step  22 :  [-0.07383344996913888]
step  23 :  [-0.08840332428633399]
step  24 :  [-0.06569228230891293]
episode  293 : steps 25 , return [-16.01]
step  0 :  [-1.812275273420978]
step  1 :  [-1.7734844503652187]
step  2 :  [-1.7276949625461484]
step  3 :  [-1.6822204774158604]
step  4 :  [-1.6434663257787598]
step  5 :  [-1.5737531232809976]
step  6 :  [-1.4763257025291037]
step  7 :  [-1.3559246997261858]
step  8 :  [-1.2172038369686853]
step  9 :  [-1.0642110508056484]
step  10 :  [-0.9003022261167948]
step  11 :  [-0.7282416960169418]
step  12 :  [-0.550446563583809]
step  13 :  [-0.36966132319217737]
step  14 :  [-0.19286552502735613]
step  15 :  [-0.052427135213287984]
step  16 :  [-0.026639898410904056]
step  17 :  [-0.022749222153869736]
step  18 :  [-0.0199465814886621]
step  19 :  [-0.011814912760623169]
step  20 :  [-0.020833837326740833]
step  21 :  [-0.0067836342309598625]
step  22 :  [-0.022833021391875135]
step  23 :  [-0.005571248265818614]
step  24 :  [-0.02432352696871482]
episode  294 : steps 25 , return [-18.28]
step  0 :  [-1.3927170635478674]
step  1 :  [-1.3807856879224205]
step  2 :  [-1.3638413212425673]
step  3 :  [-1.308182283664815]
step  4 :  [-1.22283728384883]
step  5 :  [-1.1224325822768941]
step  6 :  [-0.9995949423165262]
step  7 :  [-0.8591852816357191]
step  8 :  [-0.7054393879862354]
step  9 :  [-0.5421396341526159]
step  10 :  [-0.3734759907995415]
step  11 :  [-0.20880377880559142]
step  12 :  [-0.07810136818102156]
step  13 :  [-0.0341797326620534]
step  14 :  [-0.011518193956433281]
step  15 :  [-0.06280482251742925]
step  16 :  [-0.11060553110178477]
step  17 :  [-0.1066586661588086]
step  18 :  [-0.08386638005644902]
step  19 :  [-0.0500532629821479]
step  20 :  [-0.020704128409637965]
step  21 :  [-0.05057298912909246]
step  22 :  [-0.02663354827826004]
step  23 :  [-0.05642525091756365]
step  24 :  [-0.08001162036677481]
episode  295 : steps 25 , return [-12.25]
step  0 :  [-1.4967729971947217]
step  1 :  [-1.4660829727750775]
step  2 :  [-1.4327344310369867]
step  3 :  [-1.3644047856867916]
step  4 :  [-1.2664853647769105]
step  5 :  [-1.1814623691624466]
step  6 :  [-1.0752903910488933]
step  7 :  [-0.9498709180828625]
step  8 :  [-0.8090989634718229]
step  9 :  [-0.6569980626870275]
step  10 :  [-0.49808553757391283]
step  11 :  [-0.3397907367371768]
step  12 :  [-0.20586146949152068]
step  13 :  [-0.12730714473986526]
step  14 :  [-0.11787514536694339]
step  15 :  [-0.09412907645632031]
step  16 :  [-0.06058139114417455]
step  17 :  [-0.10900082883144523]
step  18 :  [-0.11057909633717956]
step  19 :  [-0.08123406249831663]
step  20 :  [-0.05090173500286831]
step  21 :  [-0.043008274333019986]
step  22 :  [-0.025271522220929248]
step  23 :  [-0.021835337851391672]
step  24 :  [-0.030096033246913716]
episode  296 : steps 25 , return [-13.61]
step  0 :  [-1.4346335985059937]
step  1 :  [-1.4004110108538175]
step  2 :  [-1.3625070596677875]
step  3 :  [-1.329319160112817]
step  4 :  [-1.2636391146052675]
step  5 :  [-1.1762774913068754]
step  6 :  [-1.0641547998348533]
step  7 :  [-0.9324091828866627]
step  8 :  [-0.7856877103698658]
step  9 :  [-0.628183175656603]
step  10 :  [-0.46430150228508826]
step  11 :  [-0.3014886911238854]
step  12 :  [-0.16860578028783182]
step  13 :  [-0.11548224532765694]
step  14 :  [-0.12750297598882288]
step  15 :  [-0.10700124096318686]
step  16 :  [-0.04900447061343679]
step  17 :  [-0.03251337703886216]
step  18 :  [-0.04766862408572762]
step  19 :  [-0.029888149266142194]
step  20 :  [-0.04971331284143015]
step  21 :  [-0.0699964830555896]
step  22 :  [-0.0712939668089911]
step  23 :  [-0.0429104351801719]
step  24 :  [-0.04750365391219957]
episode  297 : steps 25 , return [-13.1]
step  0 :  [-1.5601270680630661]
step  1 :  [-1.522428029081567]
step  2 :  [-1.4790912943370695]
step  3 :  [-1.4381950642019468]
step  4 :  [-1.3663550234962987]
step  5 :  [-1.2669314376615128]
step  6 :  [-1.168821581234555]
step  7 :  [-1.0482609696823277]
step  8 :  [-0.9103874382506887]
step  9 :  [-0.7590554029346703]
step  10 :  [-0.5978832738317444]
step  11 :  [-0.4308175329634997]
step  12 :  [-0.2651753871787044]
step  13 :  [-0.12919252583350097]
step  14 :  [-0.07146054270103358]
step  15 :  [-0.028137355775683808]
step  16 :  [-0.03045956563206969]
step  17 :  [-0.046220468566529005]
step  18 :  [-0.03162629859914079]
step  19 :  [-0.029150141853479576]
step  20 :  [-0.053924150960431766]
step  21 :  [-0.04335632339740105]
step  22 :  [-0.013887674230360792]
step  23 :  [-0.05742647681055244]
step  24 :  [-0.053271161318710354]
episode  298 : steps 25 , return [-14.4]
step  0 :  [-1.72024609613687]
step  1 :  [-1.690966726485028]
step  2 :  [-1.6585755763124372]
step  3 :  [-1.5902430330894122]
step  4 :  [-1.4920117031333604]
step  5 :  [-1.3699475734988176]
step  6 :  [-1.2293202997053445]
step  7 :  [-1.1022691181087747]
step  8 :  [-0.958044281121162]
step  9 :  [-0.8015909471925655]
step  10 :  [-0.6357038426640129]
step  11 :  [-0.463098832956022]
step  12 :  [-0.2874686482510074]
step  13 :  [-0.14701648908014223]
step  14 :  [-0.06206801430445933]
step  15 :  [-0.06388886220913235]
step  16 :  [-0.07284509445109562]
step  17 :  [-0.06409321355707083]
step  18 :  [-0.040035162643824264]
step  19 :  [-0.020878226255496183]
step  20 :  [-0.0097148316801994]
step  21 :  [-0.0339035742108323]
step  22 :  [-0.03214084558753105]
step  23 :  [-0.05055786805864423]
step  24 :  [-0.04611392233296878]
episode  299 : steps 25 , return [-15.64]
Averaged episode return over  300  episodes:  [-14.97]
Total number of samples:  7500

Process finished with exit code 0


