1
0
mirror of https://github.com/gryf/coach.git synced 2026-01-30 20:35:47 +01:00
Files
coach/rl_coach/traces/Atari_DQN_with_PER_pong/trace.csv
itaicaspi-intel fa4895f840 new traces
2018-09-13 11:47:36 +03:00

2.2 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/MinDiscounted Return/MeanDiscounted Return/StdevDiscounted Return/MaxDiscounted Return/MinQ/MeanQ/StdevQ/MaxQ/Min
210.01.01117.01117.01117.01117.01.00.0-1.51802298949955670.6998808293377133-0.08930329112720292-3.148474706421977
32197.00.01905.01905.0788.01905.00.9992908000000232-21.0-21.00.00.00674039618927866750.00432182675391287050.031044436618685724.4621716369874775e-050.00025000000000000015.421010862427521e-200.000250.000250.0238669870000000030.017431930.228154360.004472835-2.43123295645188180.5717677860635341-0.7105532272722921-3.3662833646890835
43436.00.02862.02862.0957.02862.00.9984295000000516-20.0-20.00.00.0067799847836559440.0033410043930959930.016288518905639650.000372040551155805640.00025000000000000011.0842021724855042e-190.000250.000250.017012290.00637941300000000040.0428165940000000060.0057905857-1.96512994964373360.7810357358559473-0.3655772928295825-3.2941461345643885-0.0318792050.019740151-0.0044416133-0.077873565
54627.00.03623.03623.0761.03623.00.9977446000000744-21.0-21.00.00.0067535874732512690.0032234895231069140.0141785107553005220.00042253875290043650.00025000000000000015.421010862427521e-200.000250.000250.0149213440.00526257140.0328783170000000040.0076742154-2.51964812682642720.5839729089128289-0.7105532272722921-3.3699982440767453
65855.00.04535.04535.0912.04535.00.9969238000001012-20.0-20.00.00.0065664660953763430.00325644657705614120.015960766002535820.000409813219448551540.00025000000000000011.0842021724855042e-190.000250.000250.0137286619999999990.004757780.040373580.00424472-1.94805571959019170.7908203737498453-0.21371412100620468-3.2726053764291825-0.0381362180.013395666-0.016326109-0.0594768