mirror of
https://github.com/gryf/coach.git
synced 2026-02-14 21:15:53 +01:00
7 lines
2.5 KiB
CSV
7 lines
2.5 KiB
CSV
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Discounted Return/Mean,Discounted Return/Stdev,Discounted Return/Max,Discounted Return/Min,Entropy/Mean,Entropy/Stdev,Entropy/Max,Entropy/Min,Advantages/Mean,Advantages/Stdev,Advantages/Max,Advantages/Min,Values/Mean,Values/Stdev,Values/Max,Values/Min,Value Loss/Mean,Value Loss/Stdev,Value Loss/Max,Value Loss/Min,Policy Loss/Mean,Policy Loss/Stdev,Policy Loss/Max,Policy Loss/Min
|
|
1,0.0,1.0,881.0,1.0,881.0,881.0,0.0,,,0.0,,,,,,,,,,,,,,,,-2.041213323423532,0.9183659584454216,0.4796594773496936,-3.352701688899176,,,,,,,,,,,,,,,,,,,,
|
|
2,0.0,1.0,1043.0,1.0,1043.0,1924.0,0.0,,,0.0,,,,,,,,,,,,,,,,-1.7995206029952229,0.6440801924897366,-0.3927560490055896,-3.2471439401326068,,,,,,,,,,,,,,,,,,,,
|
|
3,38.0,0.0,763.0,1.0,763.0,2687.0,0.0,-21.0,-21.0,0.0,,,,,,,,,,,,1.3813618,1.3755096000000002,5.5379830000000005,0.0015163413000000001,-2.5178046202451694,0.5843148195084643,-0.7105532272722921,-3.3699982440767453,1.7471887,0.055258866,1.7901558999999998,1.5866796,-0.1592098490531115,0.4154601793782861,0.5181965827941895,-1.0076508522033691,-1.0213921000000001,0.9139581,0.05576827400000001,-2.8376002000000002,0.09897748,0.11257933,0.3836943,2.9006495999999997e-06,-0.28488272,0.5594197,0.49081215,-1.4856113000000002
|
|
4,75.0,0.0,740.0,1.0,740.0,3427.0,0.0,-21.0,-21.0,0.0,,,,,,,,,,,,3.2764843,1.857115,7.888277499999999,0.25566658,-2.533184641659896,0.5861942513660167,-0.7105532272722921,-3.3699982440767453,1.1448658,0.26420638,1.5718536,0.75876945,-0.053371320168177284,0.4283249731162562,0.6155099868774414,-0.9759833812713624,-2.7395887,0.34059632,-2.3099797000000004,-3.3791809999999995,0.09315539,0.06426737,0.24503651,0.033598172999999995,-0.07731818,0.43035093,0.41724620000000007,-1.0952158
|
|
5,113.0,0.0,755.0,1.0,755.0,4182.0,0.0,-21.0,-21.0,0.0,,,,,,,,,,,,2.9129169999999998,1.8344038,7.434381,0.2987832,-2.5246431129611286,0.5835765895797549,-0.7105532272722921,-3.3699982440767453,0.9606895000000001,0.09958161,1.0971520000000001,0.79424876,-0.08736807929502953,0.4281761045632924,0.5726819038391113,-0.9797717332839966,-2.3036256,0.30664575,-1.9442793999999999,-3.1548097,0.09548396599999999,0.0768301,0.26862615,0.023751104,-0.08123907,0.3593619,0.44418138,-0.9607479999999999
|