1
0
mirror of https://github.com/gryf/coach.git synced 2026-02-13 04:15:45 +01:00
Files
coach/rl_coach/traces/Atari_DDQN_pong/trace.csv
itaicaspi-intel fa4895f840 new traces
2018-09-13 11:47:36 +03:00

2.2 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/MinDiscounted Return/MeanDiscounted Return/StdevDiscounted Return/MaxDiscounted Return/MinQ/MeanQ/StdevQ/MaxQ/Min
210.01.01117.01117.01117.01117.01.00.0-1.51802298949955670.6998808293377133-0.08930329112720292-3.148474706421977
32205.00.01937.01937.0820.01937.00.9991882000000176-21.0-21.00.00.0128763607443344410.0131699370799383720.0582447163760662153.0656796297989786e-050.00025000000000000011.0842021724855042e-190.000250.000250.084594910.071301370.59828750.0070038475-2.33613429220885040.784322378590693-0.38878391807422696-3.369599601005491
43413.00.02768.02768.0831.02768.00.9983655100000356-21.0-21.00.00.0132820825827785950.0134586195686780020.085882939398288730.000108494772575795640.00025000000000000011.0842021724855042e-190.000250.000250.055030540.0284249039999999970.14831460.009207340999999999-2.3203942011818890.6047235028955231-0.7105532272722921-3.350537576335216-0.0156216550.008273302-0.0005000639-0.026964545
54667.00.03783.03783.01015.03783.00.9973606600000572-20.0-20.00.00.0131943116085874240.0129476860047098870.0542734339833259657.553023169748485e-050.00025000000000000015.421010862427521e-200.000250.000250.0515578170.0262056829999999970.152920590.007897207-1.75313578374496770.7448577440634202-0.1288331810939122-3.2971074888190803-0.035975120.008356134-0.020397818-0.04812158
65867.00.04585.04585.0802.04585.00.9965666800000744-21.0-21.00.00.0129970630240495660.0123497339540713690.058523606508970263.451433076406829e-050.00025000000000000015.421010862427521e-200.000250.000250.0550030840.0413355380.286134660.0044473526-2.4064658374132590.5636980823469648-0.7105532272722921-3.36383697254212-0.078644610.018148461-0.04457518-0.106537335