1
0
mirror of https://github.com/gryf/coach.git synced 2026-02-16 05:55:46 +01:00
Files
coach/rl_coach/traces/Atari_QR_DQN_pong/trace.csv
itaicaspi-intel fa4895f840 new traces
2018-09-13 11:47:36 +03:00

2.2 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/MinDiscounted Return/MeanDiscounted Return/StdevDiscounted Return/MaxDiscounted Return/MinQ/MeanQ/StdevQ/MaxQ/Min
210.01.01117.01117.01117.01117.01.00.0-1.51802298949955670.6998808293377133-0.08930329112720292-3.148474706421977
32205.00.01937.01937.0820.01937.00.9991882000000176-21.0-21.00.036.3505545464957742.01083151839504200.26660156252.56333684921264655.000000000000001e-056.776263578034403e-215e-055e-0512.83259310.05785899999999967.4945453.6044636-2.33613429220885040.784322378590693-0.38878391807422696-3.369599601005491
43413.00.02768.02768.0831.02768.00.9983655100000356-21.0-21.00.038.1156401978089342.376735792713546272.3593752.47922849655151375.0000000000000016e-051.3552527156068802e-205e-055e-0534.64264334.25269297.73087.9129830000000005-2.3203942011818890.6047235028955231-0.7105532272722921-3.350537576335216-0.016137846485895960.007600676424319005-0.0064334499527467425-0.029101890049059883
54667.00.03783.03783.01015.03783.00.9973606600000572-20.0-20.00.035.28230247535104534.09448844961585136.958038330078122.9029393196105965.000000000000001e-056.776263578034403e-215e-055e-0554.84554300000000631.036062200.4751921.653633-1.75313578374496770.7448577440634202-0.1288331810939122-3.2971074888190803-0.048537609380437060.011840542664502246-0.034349839405913365-0.06640744950796945
65867.00.04585.04585.0802.04585.00.9965666800000744-21.0-21.00.033.230964983701733.90203852171519171.32331848144533.09047913551330575.000000000000001e-056.776263578034403e-215e-055e-0556.777434.80046265.0421427.841105-2.4064658374132590.5636980823469648-0.7105532272722921-3.36383697254212-0.0364136993611949360.009885933390973514-0.017495695663383236-0.05450057732872665