mirror of
https://github.com/gryf/coach.git
synced 2026-03-10 03:25:49 +01:00
new traces
This commit is contained in:
@@ -1,26 +1,26 @@
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,486.0,486.0,486.0,486.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,5.0,55.0,0.0,,,,3.931745547874301,1.1304143308005733e-05,3.9317700862884517,3.9316890239715576,0.00025,0.0,0.00025,0.00025,0.0015866637,0.0023147496,0.009720516,0.0007565144,,,,
|
||||
6,70.0,0.0,1335.0,1335.0,75.0,1335.0,0.999724780000006,2.0,15.0,0.0,,,,3.931735929689909,7.235250669185713e-06,3.9317455291748047,3.931711912155152,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.001755927,0.0026373637,0.009641058000000001,0.0007148395500000001,,,,
|
||||
7,91.0,0.0,1422.0,1422.0,87.0,1422.0,0.9996386500000078,1.0,15.0,0.0,,,,3.931701206025623,5.099185273705093e-05,3.93173623085022,3.931553602218628,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.00282516,0.0035993564000000003,0.009418896999999999,0.00070036505,,,,
|
||||
8,159.0,0.0,1693.0,1693.0,271.0,1693.0,0.9993703600000136,5.0,55.0,0.0,,,,3.931656876606728,9.226522325134514e-05,3.931716203689575,3.9311599731445312,0.00025,0.0,0.00025,0.00025,0.0017165048,0.0027771054,0.012550428999999998,0.00063557597,,,,
|
||||
9,201.0,0.0,1861.0,1861.0,168.0,1861.0,0.9992040400000172,3.0,50.0,0.0,,,,3.93158137230646,0.00010474746316658029,3.93165135383606,3.931158781051636,0.00025,0.0,0.00025,0.00025,0.0017799592,0.002852903,0.009889938000000001,0.0006321495,,,,
|
||||
10,279.0,0.0,2172.0,2172.0,311.0,2172.0,0.998896150000024,4.0,65.0,0.0,,,,3.9314154325387416,0.00022279076273676361,3.931581258773804,3.930070638656616,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0026444625,0.004101368,0.019448647,0.00062298455,,,,
|
||||
11,407.0,0.0,2683.0,2683.0,511.0,2683.0,0.9983902600000351,9.0,320.0,0.0,,,,3.931240767240524,0.00015854553450050932,3.931373834609986,3.9305694103240967,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.0017362889000000002,0.0029191163,0.011232911000000002,0.0005518816,0.024129094928503625,0.00904320207528025,0.04169573485851341,0.012993395328522341
|
||||
12,424.0,0.0,2754.0,2754.0,71.0,2754.0,0.9983199700000364,1.0,15.0,0.0,,,,3.9310134579153617,0.000358822446065362,3.9312620162963863,3.93019700050354,0.00025,0.0,0.00025,0.00025,0.0032191304,0.0045680365999999995,0.011846525,0.0005631294,,,,
|
||||
13,457.0,0.0,2886.0,2886.0,132.0,2886.0,0.9981892900000392,2.0,25.0,0.0,,,,3.931020930409432,0.00018348520436412824,3.93116307258606,3.9301931858062735,0.00025,0.0,0.00025,0.00025,0.0016074966000000001,0.002708108,0.012189938999999999,0.00064319023,,,,
|
||||
14,504.0,0.0,3074.0,3074.0,188.0,3074.0,0.9980031700000432,3.0,35.0,0.0,,,,3.931025738301485,0.00015399033015145469,3.9311008453369136,3.9300034046173096,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0009836307000000001,0.0015528154999999999,0.011335916000000001,0.0005281837,0.021890531852842,0.014466196029404797,0.03762449622154298,-0.00010702610015811408
|
||||
15,528.0,0.0,3167.0,3167.0,93.0,3167.0,0.9979111000000452,1.0,15.0,0.0,,,,3.931034368017445,6.681329033129075e-05,3.9310910701751713,3.9308130741119385,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0016258046,0.0031157003000000004,0.011724828999999999,0.0004990724,,,,
|
||||
16,598.0,0.0,3449.0,3449.0,282.0,3449.0,0.9976319200000514,2.0,55.0,0.0,,,,3.930865437643869,0.0002831683814269127,3.9310925006866455,3.9296932220458975,0.00025,0.0,0.00025,0.00025,0.0021639192000000003,0.0036756303,0.012480825,0.00047580682,0.0305326876540985,0.00923045073371262,0.0438561670482166,0.021990178897977525
|
||||
17,668.0,0.0,3729.0,3729.0,280.0,3729.0,0.9973547200000574,4.0,45.0,0.0,,,,3.930601644515991,0.0003480949830888473,3.9308652877807617,3.9292240142822266,0.00025,0.0,0.00025,0.00025,0.0027047140000000004,0.0042121527,0.013903748,0.0006515036,0.029686454000572925,0.01902240661079521,0.058909925818443724,-0.002814809605478502
|
||||
18,738.0,0.0,4008.0,4008.0,279.0,4008.0,0.9970785100000634,3.0,45.0,0.0,,,,3.930277814183917,0.0005110864544539217,3.930636167526245,3.9281198978424072,0.00025,0.0,0.00025,0.00025,0.0036887865999999997,0.0051101656,0.02086526,0.0008114038499999999,,,,
|
||||
19,792.0,0.0,4223.0,4223.0,215.0,4223.0,0.9968656600000679,4.0,90.0,0.0,,,,3.930134093319928,0.00047399490243328624,3.930522918701172,3.9284942150115967,0.00025,0.0,0.00025,0.00025,0.0037553142999999997,0.004891396,0.0151908295,0.0010129308999999999,0.030484313207368687,0.012861465171913404,0.04339803867042122,0.011251759901643564
|
||||
20,893.0,0.0,4630.0,4630.0,407.0,4630.0,0.9964627300000768,10.0,115.0,0.0,,,,3.929736850285294,0.000766311293002325,3.930368661880493,3.926426649093628,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.004180377,0.006044741700000001,0.031209853,0.0009457401,0.0355303921426342,0.014215304187277478,0.05135452747345026,0.012931596487761264
|
||||
21,937.0,0.0,4805.0,4805.0,175.0,4805.0,0.9962894800000806,1.0,5.0,0.0,,,,3.930479177208834,0.00023689537153461093,3.930684328079224,3.929489135742188,0.00025,0.0,0.00025,0.00025,0.0021777323,0.0034656142999999998,0.014414535,0.00058991817,,,,
|
||||
22,1022.0,0.0,5146.0,5146.0,341.0,5146.0,0.995951890000088,3.0,65.0,0.0,,,,3.93046441078186,0.00035790579075833815,3.9307262897491455,3.929075956344605,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0024591651999999998,0.0041425275,0.014986968,0.00047587089999999996,,,,
|
||||
23,1120.0,0.0,5538.0,5538.0,392.0,5538.0,0.9955638100000964,6.0,80.0,0.0,,,,3.9300818811986864,0.0004955548155674863,3.930469751358032,3.928221464157105,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0027119769,0.0042804847,0.020022545,0.00057932467,0.035476823337376714,0.014014476077534626,0.04927191920578547,0.007030519843102157
|
||||
24,1165.0,0.0,5718.0,5718.0,180.0,5718.0,0.9953856100001002,3.0,55.0,0.0,,,,3.9300585714253513,0.00053408662096811,3.9305152893066406,3.928401231765747,0.00025,0.0,0.00025,0.00025,0.0033172776,0.004863477299999999,0.016010353,0.0006072133999999999,,,,
|
||||
25,1190.0,0.0,5815.0,5815.0,97.0,5815.0,0.9952895800001024,0.0,0.0,0.0,,,,3.9299856324990587,0.0004047671393024133,3.9302456378936768,3.9285967350006095,0.00025,0.0,0.00025,0.00025,0.0030563176,0.004401815999999999,0.016188376,0.0011075826,,,,
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Discounted Return/Mean,Discounted Return/Stdev,Discounted Return/Max,Discounted Return/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,486.0,486.0,486.0,486.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.027285241237078,0.8961037725396955,3.502959469093688,0.0,,,,
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,0.2991949731169189,0.4147830569909918,1.0,0.0,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.089942054123867,0.6773639260883686,1.9560606270183023,0.0,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.6150170189100268,1.2171006279541683,4.3034191502088746,0.0,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,5.0,55.0,0.0,,,,3.9317551453908286,2.292077088878397e-05,3.9318559169769287,3.931660890579224,0.00025,0.0,0.00025,0.00025,0.0015475523,0.0022671083,0.0094129415,0.00074411946,1.5742518458459676,1.1031375801910266,3.252515696371334,0.0,,,,
|
||||
6,70.0,0.0,1335.0,1335.0,75.0,1335.0,0.999724780000006,2.0,15.0,0.0,,,,3.9317470851697416,8.424885298854481e-06,3.931761503219605,3.931729078292847,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0017113253,0.002546734,0.009262785,0.0007195934299999999,0.630055465573955,0.7534012288320482,1.886384871716129,0.0,,,,
|
||||
7,91.0,0.0,1422.0,1422.0,87.0,1422.0,0.9996386500000078,1.0,15.0,0.0,,,,3.9317100615728466,5.73015255981599e-05,3.9317591190338135,3.9315671920776367,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0028099740000000002,0.0035779825,0.009782379,0.0007102792,0.2731692938539037,0.40901966584690697,1.0,0.0,,,,
|
||||
8,159.0,0.0,1693.0,1693.0,271.0,1693.0,0.9993703600000136,5.0,55.0,0.0,,,,3.9316700857077067,9.248268140292744e-05,3.9317350387573238,3.931163787841797,0.00025,0.0,0.00025,0.00025,0.001684011,0.0027150003999999997,0.012804485,0.00063920295,1.3777471984624352,0.8115021837176055,3.11412900057984,0.0,,,,
|
||||
9,201.0,0.0,1861.0,1861.0,168.0,1861.0,0.9992040400000172,3.0,50.0,0.0,,,,3.9315996056511286,9.955738611988931e-05,3.9316680431365967,3.9312312602996826,0.00025,0.0,0.00025,0.00025,0.0017370107999999998,0.0027744581,0.00984679,0.0006291246,0.9971291228971556,0.7740837108535874,2.18976824447548,0.0,,,,
|
||||
10,279.0,0.0,2172.0,2172.0,311.0,2172.0,0.998896150000024,4.0,65.0,0.0,,,,3.9314646445787873,0.00019119701493129832,3.9316132068634033,3.930314779281616,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0025327114999999997,0.0038908190000000002,0.018312562,0.00061634305,1.0234306140936356,0.5002579938176909,2.1008995427938943,0.0,,,,
|
||||
11,406.0,0.0,2681.0,2681.0,509.0,2681.0,0.9983922400000348,9.0,320.0,0.0,,,,3.9312957084085065,0.00013851087435505692,3.931442260742188,3.9306914806365967,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.0016393426,0.0027615533,0.0106354095,0.0005250634,1.5487425802799972,0.9434112651663112,4.0430534797383535,0.0,0.01474813409149705,0.015984256512372744,0.036521559953690115,-0.011005972325801331
|
||||
12,471.0,0.0,2941.0,2941.0,260.0,2941.0,0.9981348400000404,7.0,110.0,0.0,,,,3.9310575301830575,0.00023637919856646093,3.9313013553619385,3.930120706558228,0.00025,0.0,0.00025,0.00025,0.0020334235999999997,0.0033391896000000004,0.011399643999999999,0.0005310598999999999,1.9247686125714616,1.4763974008694143,4.5174296147906645,0.0,,,,
|
||||
13,506.0,0.0,3082.0,3082.0,141.0,3082.0,0.9979952500000436,0.0,0.0,0.0,,,,3.9310955728803365,8.378595812170304e-05,3.9311645030975337,3.930620193481445,0.00025,0.0,0.00025,0.00025,0.0009987707,0.0018234361,0.011586366,0.000476817,0.0,0.0,0.0,0.0,0.02083865366876189,0.01069188830135163,0.04244580939412188,0.008185749500990408
|
||||
14,569.0,0.0,3331.0,3331.0,249.0,3331.0,0.9977487400000488,7.0,110.0,0.0,,,,3.931051877237136,0.0001388172588925505,3.931135892868042,3.9301624298095694,0.00025,0.0,0.00025,0.00025,0.0013598388,0.0028366724,0.015576748999999999,0.00043305519999999997,2.0098751682981617,1.1093871734323564,4.000165956499947,0.0,,,,
|
||||
15,655.0,0.0,3677.0,3677.0,346.0,3677.0,0.9974062000000564,0.0,0.0,0.0,,,,3.9305763106013454,0.0004229571946597187,3.9310512542724614,3.929146051406861,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0033595173,0.004646675,0.017301217,0.0005054546,0.0,0.0,0.0,0.0,0.020163115051886026,0.012127614312752187,0.04591513723135063,9.343400598105234e-06
|
||||
16,674.0,0.0,3753.0,3753.0,76.0,3753.0,0.997330960000058,1.0,10.0,0.0,,,,3.930436598627191,0.00020568950037311564,3.9305925369262695,3.9297053813934326,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0025036198,0.0035149802,0.013321203,0.0009690778,0.42667230386804816,0.4209997414589432,1.0,0.0,,,,
|
||||
17,723.0,0.0,3948.0,3948.0,195.0,3948.0,0.997137910000062,0.0,0.0,0.0,,,,3.9302857554688746,0.0006425071196169863,3.9306602478027344,3.927115440368652,0.00025,0.0,0.00025,0.00025,0.0037492486,0.005678748199999999,0.027824294,0.0008326736999999999,0.0,0.0,0.0,0.0,,,,
|
||||
18,754.0,0.0,4073.0,4073.0,125.0,4073.0,0.9970141600000648,2.0,15.0,0.0,,,,3.9300805368731098,0.000519938183415399,3.930445909500122,3.9286279678344727,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0035371382,0.004576198,0.014512276000000001,0.0012743992,0.4379218073475659,0.6904045765467619,1.886384871716129,0.0,0.02993758823722658,0.0171674576394353,0.0622341979295021,0.008454913645983247
|
||||
19,831.0,0.0,4381.0,4381.0,308.0,4381.0,0.9967092400000714,4.0,90.0,0.0,,,,3.930233079117614,0.0004857963882875383,3.930583238601685,3.927547216415405,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0025181014,0.0042537,0.026507894,0.0006471519,1.0691845626589795,0.8498240160885151,2.745451683091903,0.0,,,,
|
||||
20,929.0,0.0,4773.0,4773.0,392.0,4773.0,0.99632116000008,7.0,100.0,0.0,,,,3.9304481428496687,0.0003446659266870426,3.9306659698486333,3.9285593032836914,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0021123014999999998,0.003783748,0.020173741999999998,0.0005579767,1.4393231985989243,0.8717358172149811,3.0489377308973795,0.0,0.02544347631434653,0.0052816174871664155,0.03427363783121165,0.018676988035440902
|
||||
21,961.0,0.0,4902.0,4902.0,129.0,4902.0,0.9961934500000826,3.0,30.0,0.0,,,,3.9304565042257313,0.00026678316530055285,3.930674314498901,3.929453611373901,0.00025,0.0,0.00025,0.00025,0.0023043063,0.003955795,0.014118321000000001,0.0005571415,1.0833967298409597,0.9363232923629204,2.6221126076070793,0.0,,,,
|
||||
22,992.0,0.0,5026.0,5026.0,124.0,5026.0,0.9960706900000852,4.0,80.0,0.0,,,,3.930458211898804,0.0003279377866550192,3.930619239807129,3.929210662841797,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0016615093,0.0029473716999999997,0.01272093,0.0005844951999999999,1.3451618537673,1.1096991653941397,3.0898896329640837,0.0,,,,
|
||||
23,1044.0,0.0,5234.0,5234.0,208.0,5234.0,0.9958647700000898,2.0,20.0,0.0,,,,3.930192166683721,0.000400778065029482,3.930548429489136,3.928762674331665,0.00025,0.0,0.00025,0.00025,0.0028158217,0.00422772,0.014383723999999999,0.00077200204,0.5169876369665919,0.4173632077926255,1.3411660615140424,0.0,0.02365245558321531,0.011359249617777177,0.042664456740022255,0.00812225602567257
|
||||
24,1128.0,0.0,5570.0,5570.0,336.0,5570.0,0.995532130000097,7.0,110.0,0.0,,,,3.9301167712154164,0.00047407734783713377,3.930419206619263,3.92802357673645,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0026047395,0.004166825999999999,0.020599874,0.00068073766,1.4823424347747136,0.9778507351487692,3.63911799654736,0.0,,,,
|
||||
25,1170.0,0.0,5736.0,5736.0,166.0,5736.0,0.9953677900001006,3.0,55.0,0.0,,,,3.929852037895016,0.000608486381348064,3.930378675460816,3.927333116531372,0.00025,0.0,0.00025,0.00025,0.0033983607000000002,0.005062349,0.022029048,0.00085253065,0.9847135286993404,0.6559788450535955,2.041006253056759,0.0,,,,
|
||||
|
||||
|
Reference in New Issue
Block a user