mirror of
https://github.com/gryf/coach.git
synced 2026-01-29 11:35:51 +01:00
7 lines
2.3 KiB
CSV
7 lines
2.3 KiB
CSV
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Discounted Return/Mean,Discounted Return/Stdev,Discounted Return/Max,Discounted Return/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
|
1,0.0,1.0,1117.0,1117.0,1117.0,1117.0,1.0,,,0.0,,,,,,,,,,,,,,,,-1.5180229894995567,0.6998808293377133,-0.08930329112720292,-3.148474706421977,,,,
|
|
2,205.0,0.0,1937.0,1937.0,820.0,1937.0,0.9991882000000176,-21.0,-21.0,0.0,,,,3.9304792799600734,0.0010089336974329131,3.931626558303833,3.92692494392395,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.0020478016,0.0020630334,0.012544215,0.00089145615,-2.3361342922088504,0.784322378590693,-0.38878391807422696,-3.369599601005491,,,,
|
|
3,413.0,0.0,2768.0,2768.0,831.0,2768.0,0.9983655100000356,-21.0,-21.0,0.0,,,,3.929040307035813,0.0010817403254347628,3.9303982257843018,3.922320127487183,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.0013938454,0.0020394863,0.01589611,0.0005865627,-2.320394201181889,0.6047235028955231,-0.7105532272722921,-3.350537576335216,0.06064815086623099,0.017702449170361085,0.09529060125351008,0.03914397135377001
|
|
4,667.0,0.0,3783.0,3783.0,1015.0,3783.0,0.9973606600000572,-20.0,-20.0,0.0,,,,3.928387508617611,0.000912089578133192,3.9293906688690186,3.925499677658081,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0011918317,0.0023538542000000003,0.01751554,0.00031032125,-1.7531357837449677,0.7448577440634202,-0.1288331810939122,-3.2971074888190803,0.06327697044859387,0.00742494439575548,0.0744991898536688,0.055326233059168416
|
|
5,867.0,0.0,4585.0,4585.0,802.0,4585.0,0.9965666800000744,-21.0,-21.0,0.0,,,,3.9282448422908782,0.0009522609916870672,3.929300546646118,3.924246072769165,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.00093484356,0.0019195807,0.016940815,0.00020796485,-2.406465837413259,0.5636980823469648,-0.7105532272722921,-3.36383697254212,0.0616140041810777,0.007093012206363309,0.07764012068510129,0.048625472933054525
|