1
0
mirror of https://github.com/gryf/coach.git synced 2026-01-08 23:04:15 +01:00
Files
coach/rl_coach/traces/Atari_NStepQ_space_invaders/trace.csv
2018-08-20 13:01:30 +03:00

4.0 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/MinEntropy/MeanEntropy/StdevEntropy/MaxEntropy/MinQ/MeanQ/StdevQ/MaxQ/MinQ Values/MeanQ Values/StdevQ Values/MaxQ Values/MinValue Loss/MeanValue Loss/StdevValue Loss/MaxValue Loss/Min
210.01.0486.01.0486.0486.00.50.0
320.01.087.01.087.0573.00.50.0
430.01.0149.01.0149.0722.00.50.0
540.01.0335.01.0335.01057.00.50.0
6536.00.0180.01.0180.01237.00.49823599999999923.030.00.00.07098280.028847680.14847249-0.0250732450.155365110.677425564.07636740.00025629386
7651.00.074.01.074.01311.00.49751079999999892.015.00.00.091549960.0348548780.171960070.0297620350.063003210.14260230.494944840.0034788419
8777.00.0131.01.0131.01442.00.49622699999999842.035.00.00.076172020.0238978660.149186220.0351343079999999960.0165505150.049224390.189125120.00011201962
98118.00.0204.01.0204.01646.00.49422779999999752.015.00.00.0591036079999999950.0208528490.115871710.0068478854000000010.037765220.167416020.94840949999999997.4577442e-06
109137.00.092.01.092.01738.00.49332619999999711.05.00.00.073523630.0340355929999999960.151434720.00441058170.051406390.206718430.92840759999999990.00020915868000000003
1110201.00.0321.01.0321.02059.00.490180399999995710.0115.00.00.086821830.042597160.301257580.00205281870.083775680.184612380.69677970.00044282363
1211265.00.0317.01.0317.02376.00.48707379999999448.0130.00.00.1071656050.0367079860.231808770.013808320.092328980.225255710.873422860.0018040526999999998
1312310.00.0224.01.0224.02600.00.48487859999999343.020.00.00.0860897150.0276298820.197093640.0257831420000000020.0252148660000000020.080485480.397416539.443184499999999e-05
1413338.00.0138.01.0138.02738.00.48352619999999291.010.00.00.0566245170.0147420570.091845780.0230958440.0135570220.066710450.360113927.6326745e-05
1514378.00.0200.01.0200.02938.00.4815661999999921.05.00.00.0690437850.0307515640.164672880.00381359270.019711270.10511510.67585299999999994.7275649999999995e-05
1615422.00.0221.01.0221.03159.00.47940039999999113.030.00.00.069175300000000010.0278136020000000030.132012890.0169762560000000020.048627380.184986371.04391130000000026.747579e-05
1716460.00.0190.01.0190.03349.00.47753839999999032.045.00.00.0563442930.0236357790.10303167-0.0096497810.0328468529999999950.143941060.834435640.00015374989
1817511.00.0255.01.0255.03604.00.47503939999998926.075.00.00.079822380.037055710.15894309-0.0030642270.071160450.201188250.86395949999999990.00021242326000000001
1918583.00.0360.01.0360.03964.00.47151139999998774.050.00.00.07020580.033363750.18290229-0.00284839170.0274936220000000020.129534421.01797064.404120299999999e-06
2019623.00.0199.01.0199.04163.00.46956119999998682.035.00.00.065758280.0203134790.12968860.0317516620.028963620.147150280.9305239.032046999999998e-05
2120673.00.0247.01.0247.04410.00.46714059999998585.035.00.00.081917940.0255158380.167645770.023472380.0510371480.150771799999999980.69755030000000012.4204688e-05