mirror of
https://github.com/gryf/coach.git
synced 2026-04-05 03:53:32 +02:00
new traces
This commit is contained in:
@@ -1,26 +1,21 @@
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,486.0,486.0,486.0,486.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,5.0,55.0,0.0,,,,0.011159177685519406,0.014670889632016437,0.05586982890963554,0.00014776474563404918,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.06980593,0.04550845,0.23672238,0.012701003,,,,
|
||||
6,70.0,0.0,1335.0,1335.0,75.0,1335.0,0.999724780000006,2.0,15.0,0.0,,,,0.011363721369937258,0.01113743869358625,0.02980226650834084,0.00037189509021118283,0.0001,0.0,0.0001,0.0001,0.061391924,0.02929353,0.110355645,0.014809295,,,,
|
||||
7,91.0,0.0,1422.0,1422.0,87.0,1422.0,0.9996386500000078,1.0,15.0,0.0,,,,0.011624419426966813,0.013655546794886331,0.04332234337925911,0.0002809247234836221,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.065822564,0.03866646,0.16192491,0.021505926,,,,
|
||||
8,159.0,0.0,1693.0,1693.0,271.0,1693.0,0.9993703600000136,5.0,55.0,0.0,,,,0.008774163406046885,0.01056874345135505,0.042830634862184525,0.0001717623672448099,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.05377827,0.032895934,0.16196515,0.00941183,,,,
|
||||
9,201.0,0.0,1861.0,1861.0,168.0,1861.0,0.9992040400000172,3.0,50.0,0.0,,,,0.005785983745660079,0.00916921106544553,0.04197276383638382,0.00021147351071704182,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.04083436,0.028236978,0.14960715,0.012452139499999999,,,,
|
||||
10,279.0,0.0,2172.0,2172.0,311.0,2172.0,0.998896150000024,4.0,65.0,0.0,,,,0.009643888652461987,0.012217253908083524,0.056894369423389435,0.00016667474119458348,0.00010000000000000003,4.0657581468206416e-20,0.0001,0.0001,0.0560394,0.039682023,0.1913731,0.008496345,,,,
|
||||
11,440.0,0.0,2815.0,2815.0,643.0,2815.0,0.9982595800000378,10.0,335.0,0.0,,,,0.00861433394022231,0.010348496102126023,0.04432229697704315,0.0001522430102340877,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.05220816,0.03156275,0.16941099999999998,0.009055335999999999,0.023975812000000003,0.012025122,0.040999293,0.0039341394
|
||||
12,458.0,0.0,2888.0,2888.0,73.0,2888.0,0.9981873100000394,2.0,45.0,0.0,,,,0.009530787179957971,0.010701133845478595,0.03999783843755722,0.00031216014758683736,0.0001,0.0,0.0001,0.0001,0.062311728,0.026771976,0.14921491,0.02184285,,,,
|
||||
13,478.0,0.0,2969.0,2969.0,81.0,2969.0,0.9981071200000412,0.0,0.0,0.0,,,,0.006778308925277089,0.00818221383451154,0.02816874161362648,0.0002485926379449665,0.0001,0.0,0.0001,0.0001,0.044908725,0.026523566000000002,0.117372274,0.016029207,-0.012888752,0.011372567,-0.0004688017,-0.031455092000000004
|
||||
14,532.0,0.0,3183.0,3183.0,214.0,3183.0,0.9978952600000456,4.0,50.0,0.0,,,,0.0069169835669863795,0.009669208516406907,0.030461043119430545,0.0002085747983073816,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.047045134,0.03206875,0.123922676,0.010909475,,,,
|
||||
15,551.0,0.0,3262.0,3262.0,79.0,3262.0,0.9978170500000474,2.0,15.0,0.0,,,,0.008465479291963243,0.01222064269286522,0.04136095941066742,0.00024427170865237713,0.0001,0.0,0.0001,0.0001,0.051463115999999996,0.036649507000000005,0.14754368,0.013367546000000001,,,,
|
||||
16,626.0,0.0,3560.0,3560.0,298.0,3560.0,0.9975220300000538,6.0,145.0,0.0,,,,0.00915405042571758,0.00990793648084188,0.038579311221838,0.0002719838812481612,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.055197,0.029597567,0.14903925,0.010181868,-0.011365135,0.013168923,0.013799908,-0.025668386
|
||||
17,916.0,0.0,4719.0,4719.0,1159.0,4719.0,0.9963746200000788,22.0,340.0,0.0,,,,0.00762058505652962,0.009529140287309196,0.04469184204936028,0.00013019611651543528,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.049977854,0.031034742999999997,0.15861663,0.008030025,0.016384887,0.018671772,0.056820348,-0.0064531965
|
||||
18,943.0,0.0,4830.0,4830.0,111.0,4830.0,0.9962647300000812,3.0,45.0,0.0,,,,0.009809370868390907,0.011517441918305206,0.04567621275782585,0.0002561989240348339,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.058472212,0.027904749,0.13957499,0.021250565,,,,
|
||||
19,1006.0,0.0,5081.0,5081.0,251.0,5081.0,0.9960162400000864,0.0,0.0,0.0,,,,0.011435095637646171,0.011009362492248348,0.04369494318962097,0.0002374518953729421,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.06413252,0.03206017,0.17680877,0.015071165,,,,
|
||||
20,1062.0,0.0,5304.0,5304.0,223.0,5304.0,0.9957954700000912,6.0,105.0,0.0,,,,0.008425145343997948,0.010476737255273365,0.04278689250349999,0.0002318604965694249,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.05528172,0.033389688,0.16662869,0.013080816,0.02990371,0.01963076,0.059646500000000005,0.005463021
|
||||
21,1081.0,0.0,5379.0,5379.0,75.0,5379.0,0.9957212200000928,2.0,15.0,0.0,,,,0.007715215652225245,0.010669677149893777,0.03837666660547257,0.00035348522942513233,0.0001,0.0,0.0001,0.0001,0.055993587000000004,0.030775022000000003,0.13761143,0.023046900000000002,,,,
|
||||
22,1125.0,0.0,5556.0,5556.0,177.0,5556.0,0.9955459900000968,2.0,35.0,0.0,,,,0.007088124197418272,0.007553918383053855,0.02735380455851555,0.00016635317297186702,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.046250745999999995,0.027780753,0.12917177,0.009924813000000001,,,,
|
||||
23,1169.0,0.0,5733.0,5733.0,177.0,5733.0,0.9953707600001004,3.0,30.0,0.0,,,,0.007776185804686975,0.009135069977912141,0.03013703227043152,0.0002250532270409167,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.051641665,0.030256712999999998,0.13535246,0.012026708,,,,
|
||||
24,1190.0,0.0,5815.0,5815.0,82.0,5815.0,0.9952895800001024,1.0,5.0,0.0,,,,0.011108649816984931,0.010548835692936798,0.042301006615161896,0.00035882263910025364,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.06612081,0.03200974,0.15909933,0.027230294,,,,
|
||||
25,1212.0,0.0,5904.0,5904.0,89.0,5904.0,0.9952014700001042,1.0,10.0,0.0,,,,0.004195408909502227,0.007376560022200305,0.025709044188261032,0.00019116624025627968,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.03334951,0.028961857999999997,0.10913753,0.008333857,,,,
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Discounted Return/Mean,Discounted Return/Stdev,Discounted Return/Max,Discounted Return/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,486.0,486.0,486.0,486.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.027285241237078,0.8961037725396955,3.502959469093688,0.0,,,,
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,0.2991949731169189,0.4147830569909918,1.0,0.0,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.089942054123867,0.6773639260883686,1.9560606270183023,0.0,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.6150170189100268,1.2171006279541683,4.3034191502088746,0.0,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,5.0,55.0,0.0,,,,0.01115525748330173,0.01482958817978088,0.05945311859250069,9.304942068411036e-05,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.06464555,0.044470195,0.23793462,0.007608571999999999,1.5742518458459676,1.1031375801910266,3.252515696371334,0.0,,,,
|
||||
6,70.0,0.0,1335.0,1335.0,75.0,1335.0,0.999724780000006,2.0,15.0,0.0,,,,0.011412088440633131,0.011330222103483587,0.030992994084954262,0.00042172591201961035,0.0001,0.0,0.0001,0.0001,0.05938535599999999,0.02777386,0.11668128,0.020656634,0.630055465573955,0.7534012288320482,1.886384871716129,0.0,,,,
|
||||
7,91.0,0.0,1422.0,1422.0,87.0,1422.0,0.9996386500000078,1.0,15.0,0.0,,,,0.011660500895231962,0.013899003705844034,0.04478336870670319,0.0002201012684963644,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.06497177,0.03783021,0.16582458,0.011831452,0.2731692938539037,0.40901966584690697,1.0,0.0,,,,
|
||||
8,159.0,0.0,1693.0,1693.0,271.0,1693.0,0.9993703600000136,5.0,55.0,0.0,,,,0.008784510728463516,0.010676103421827277,0.044153913855552666,0.00017267921066377312,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.052586783,0.03147318,0.16514115,0.01360802,1.3777471984624352,0.8115021837176055,3.11412900057984,0.0,,,,
|
||||
9,201.0,0.0,1861.0,1861.0,168.0,1861.0,0.9992040400000172,3.0,50.0,0.0,,,,0.0057493484051693005,0.009297238709482698,0.04292438179254532,0.0001674733939580619,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.038713556,0.02916971,0.15294549,0.012743682,0.9971291228971556,0.7740837108535874,2.18976824447548,0.0,,,,
|
||||
10,279.0,0.0,2172.0,2172.0,311.0,2172.0,0.998896150000024,4.0,65.0,0.0,,,,0.009585858937032008,0.012244045271861657,0.05662017315626144,8.848439028952271e-05,0.00010000000000000003,4.0657581468206416e-20,0.0001,0.0001,0.053857964,0.037834246,0.18018270000000003,0.0054985806000000005,1.0234306140936356,0.5002579938176909,2.1008995427938943,0.0,,,,
|
||||
11,406.0,0.0,2681.0,2681.0,509.0,2681.0,0.9983922400000348,9.0,320.0,0.0,,,,0.008271162704208052,0.010108575283067541,0.04325417801737785,0.00013097573537379503,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.051466412999999996,0.02947413,0.15955271,0.007228236,1.5487425802799972,0.9434112651663112,4.0430534797383535,0.0,0.010711596,0.012882838,0.024684543,-0.014303938
|
||||
12,471.0,0.0,2941.0,2941.0,260.0,2941.0,0.9981348400000404,7.0,110.0,0.0,,,,0.009526190986910548,0.01270130936938865,0.0587114579975605,0.0002338076883461326,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.054751746,0.034732427,0.20657991,0.011495937,1.9247686125714616,1.4763974008694143,4.5174296147906645,0.0,,,,
|
||||
13,506.0,0.0,3082.0,3082.0,141.0,3082.0,0.9979952500000436,0.0,0.0,0.0,,,,0.008103997894379844,0.010146384256501963,0.02888230979442596,0.00016939456691034138,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.054213032,0.03339996,0.123893134,0.00751579,0.0,0.0,0.0,0.0,0.021964371,0.014109812,0.037105702000000004,-0.004680969
|
||||
14,569.0,0.0,3331.0,3331.0,249.0,3331.0,0.9977487400000488,7.0,110.0,0.0,,,,0.007924241924727892,0.009418823926395129,0.04199397563934326,0.00015404188889078796,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.04968934,0.028010858,0.16092885,0.010448261,2.0098751682981617,1.1093871734323564,4.000165956499947,0.0,,,,
|
||||
15,655.0,0.0,3677.0,3677.0,346.0,3677.0,0.9974062000000564,0.0,0.0,0.0,,,,0.009106423050980084,0.010111300667633431,0.03859076648950577,0.00029026111587882037,9.999999999999998e-05,2.7105054312137605e-20,0.0001,0.0001,0.05579937,0.029248272999999998,0.14688299999999999,0.014692408,0.0,0.0,0.0,0.0,0.0037893213,0.013087699,0.021280576000000002,-0.02601921
|
||||
16,674.0,0.0,3753.0,3753.0,76.0,3753.0,0.997330960000058,1.0,10.0,0.0,,,,0.005520004818160822,0.006733671599695406,0.015792973339557648,0.00023233161482494327,0.0001,0.0,0.0001,0.0001,0.038671996,0.022766063,0.07300336,0.007988145,0.42667230386804816,0.4209997414589432,1.0,0.0,,,,
|
||||
17,723.0,0.0,3948.0,3948.0,195.0,3948.0,0.997137910000062,0.0,0.0,0.0,,,,0.006315292267554097,0.009919354506782935,0.03862195461988449,0.000192232575500384,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,0.044760402000000005,0.03878928,0.16543822,0.006780449,0.0,0.0,0.0,0.0,,,,
|
||||
18,754.0,0.0,4073.0,4073.0,125.0,4073.0,0.9970141600000648,2.0,15.0,0.0,,,,0.005961802070810189,0.007226799990202231,0.025835121050477028,0.0001774366246536374,9.999999999999996e-05,4.0657581468206416e-20,0.0001,0.0001,0.045393094,0.024198316,0.12546872,0.009217705,0.4379218073475659,0.6904045765467619,1.886384871716129,0.0,0.028437674,0.010936578999999998,0.04250892,0.011872215
|
||||
19,831.0,0.0,4381.0,4381.0,308.0,4381.0,0.9967092400000714,4.0,90.0,0.0,,,,0.006491211289842311,0.00892109273291234,0.038520261645317085,7.680161797907203e-05,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,0.046867255,0.03352056,0.15879646,0.0045105475,1.0691845626589795,0.8498240160885151,2.745451683091903,0.0,,,,
|
||||
20,933.0,0.0,4789.0,4789.0,408.0,4789.0,0.9963053200000802,5.0,35.0,0.0,,,,0.007263708718728237,0.009710189245773595,0.05345397442579269,0.0001070786820491776,0.0001,1.3552527156068802e-20,0.0001,0.0001,0.046955697000000005,0.031957038,0.18837799,0.0063061723,0.9497113318517078,0.5665372653893023,1.841181516831549,0.0,0.049459755,0.012578323999999998,0.07545762,0.038475648
|
||||
|
||||
|
Reference in New Issue
Block a user