1
0
mirror of https://github.com/gryf/coach.git synced 2026-01-09 15:24:13 +01:00
Files
coach/rl_coach/traces/Atari_NStepQ_space_invaders/trace.csv
itaicaspi-intel fa4895f840 new traces
2018-09-13 11:47:36 +03:00

6.3 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/MinDiscounted Return/MeanDiscounted Return/StdevDiscounted Return/MaxDiscounted Return/MinEntropy/MeanEntropy/StdevEntropy/MaxEntropy/MinQ/MeanQ/StdevQ/MaxQ/MinQ Values/MeanQ Values/StdevQ Values/MaxQ Values/MinValue Loss/MeanValue Loss/StdevValue Loss/MaxValue Loss/Min
210.01.0486.01.0486.0486.00.50.01.0272852412370780.89610377253969553.5029594690936880.0
320.01.087.01.087.0573.00.50.00.29919497311691890.41478305699099181.00.0
430.01.0149.01.0149.0722.00.50.01.0899420541238670.67736392608836861.95606062701830230.0
540.01.0335.01.0335.01057.00.50.01.61501701891002681.21710062795416834.30341915020887460.0
6549.00.0250.01.0250.01307.00.49754999999999893.060.00.00.96196607160120520.52718403700284621.98772143488902490.00.065232970.0391327930.16515993-0.046982630.037158470.160621640.99862235.2241390000000005e-06
76105.00.0278.01.0278.01585.00.49482559999999782.025.00.00.65044350802126370.49903601981055541.8775210229989680.00.061059250.0289138129999999970.22512950.000310584730.0250285510.128002820.88603484.704531e-05
87215.00.0547.01.0547.02132.00.48946499999999549.070.00.01.16682192048686081.1397742862280713.9811722920312480.00.092917740.0419091170.294346060.0163877250.062406510.199667950.90468930.00021752282999999999
98256.00.0202.01.0202.02334.00.48748539999999463.030.00.01.1432544076388880.76517394732338982.68220343440795130.00.08120660.0346993470.220752150.0339637140.068269390.230264710.89685580000000015.273441e-06
109271.00.076.01.076.02410.00.48674059999999432.045.00.00.60406992504742940.67700465749463131.80972786822125830.00.082233150.0420129820000000040.200473470.00484124760.04092740.099796760.365583799999999960.0012286354
1110330.00.0292.01.0292.02702.00.4838789999999932.035.00.00.51884249874010790.32055452849231691.19827425658891440.00.071798690.0288911829999999970.1457309-0.00054408970.0201155410.1140677260.858063341.0554600499999999e-05
1211368.00.0189.01.0189.02891.00.48202679999999225.055.00.01.65141303626981121.03404721825900573.3389282128664690.00.103574090.0380707830.190727350.0131367280.071655250.209341530.966376669.3623305e-05
1312385.00.085.01.085.02976.00.48119379999999182.055.00.00.66447402524762460.64458780339492421.75471928720363260.00.085594710.0363825260.191907810.0387430640.092004580.24593150.920603330.001493881
1413439.00.0271.01.0271.03247.00.47853799999999073.030.00.00.98053522116089880.72250093158219392.69006021581602270.00.072577190.0366232620000000040.224498880.0170267020.0516127650.191617090.939021476.006258000000001e-05
1514489.00.0247.01.0247.03494.00.47611739999998963.030.00.00.72393307932373150.68667795511915872.25984915217039850.00.096246640.0284584479999999970.181221050.041366440.045211840.173297270.935282350.00010959508
1615554.00.0322.01.0322.03816.00.47296179999998837.075.00.01.70270147451351450.87854151299900723.36468158696265450.00.088180490.032326970.192984760.018026680.065667820.200025980.932025850.000119806835
1716591.00.0185.01.0185.04001.00.47114879999998753.035.00.00.9068802766263580.53051607689961531.86874581276897780.00.106462820.0308837570.196817310.0520967360.0621617770.189774890.770372570.0006098728
1817628.00.0186.01.0186.04187.00.46932599999998670.00.00.00.00.00.00.00.105036170.026369080.175136910.0581631250.00407085570.00189350910.0085545850.0012393859
1918644.00.080.01.080.04267.00.46854199999998642.015.00.00.7024102957407660.75988379781895771.8863848717161290.00.0880577340.0149628389999999990.138396220.063810060.0776885750.208103420.76853115.7868005e-05
2019663.00.093.01.093.04360.00.4676305999999862.035.00.00.78779259628821790.67710860011016791.80163058953904560.00.072378114000000010.031771110.153466640.0275093729999999970.073170080.220934170.923135040.00035924176
2120705.00.0210.01.0210.04570.00.4655725999999853.030.00.01.12642118966764880.69637002345511272.51432015564680440.00.077457340.035694840.17048967-0.00180161980.0331466979999999950.113874340.542829639.045503e-05
2221724.00.094.01.094.04664.00.46465139999998472.045.00.00.74871429775873850.65857624202900131.7700431458051550.00.0855812950.0313171930.160332860.039459910.0318897250.091075670.370298920.00048189453
2322846.00.0608.01.0608.05272.00.458692999999982112.0340.00.01.78425223779460131.25960949538376844.99279301489311860.00.1040085550.0400398040.204781530.0080270650.065217280.188979160.820460265.0944614e-05
2423885.00.0194.01.0194.05466.00.45679179999998136.080.00.02.06447943240277841.06344261042956313.980520880292830.00.1194644050.0341195580.184608950.0392332520.066161990.169747890.85552180000000010.0008571786999999999
2524904.00.095.01.095.05561.00.45586079999998091.030.00.00.217248122480362520.38550222388885411.00.00.097626550.0296755940.17338550.062558420.0315562340.118385960.51964320.0013286468
2625923.00.094.01.094.05655.00.45493959999998050.00.00.00.00.00.00.00.063507390.0140134960.102996499999999990.031822980.000332424800000000060.000192094320000000020.00074635365000000010.000114553884