1
0
mirror of https://github.com/gryf/coach.git synced 2026-01-30 20:35:47 +01:00
Files
coach/rl_coach/traces/Atari_DDQN_with_PER_pong/trace.csv
itaicaspi-intel fa4895f840 new traces
2018-09-13 11:47:36 +03:00

2.2 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/MinDiscounted Return/MeanDiscounted Return/StdevDiscounted Return/MaxDiscounted Return/MinQ/MeanQ/StdevQ/MaxQ/Min
210.01.01117.01117.01117.01117.01.00.0-1.51802298949955670.6998808293377133-0.08930329112720292-3.148474706421977
32197.00.01905.01905.0788.01905.00.9992198800000168-21.0-21.00.00.00648663340397604650.0041318049225530680.031044436618685721.4448891306528823e-056.250000000000001e-051.3552527156068802e-206.25e-056.25e-050.038787650.0234844440.228154360.00323429-2.43123295645188180.5717677860635341-0.7105532272722921-3.3662833646890835
43436.00.02862.02862.0957.02862.00.9982724500000376-20.0-20.00.00.0057871305161749040.002609594320861060.014277644455432890.00015483902825508276.250000000000003e-052.7105054312137605e-206.25e-056.25e-050.0287592240.0117048760000000010.071632350.008223475-1.96512994964373360.7810357358559473-0.3655772928295825-3.2941461345643885-0.168238060.05095485599999999-0.08356075-0.26015088
54627.00.03623.03623.0761.03623.00.997519060000054-21.0-21.00.00.0059630453924527450.00285146009604270120.0143609466031193722.424295598757453e-056.250000000000001e-051.3552527156068802e-206.25e-056.25e-050.0272999960.0123759789999999990.073475620.0030203340000000004-2.51964812682642720.5839729089128289-0.7105532272722921-3.3699982440767453
65855.00.04535.04535.0912.04535.00.9966161800000736-20.0-20.00.00.0062358804033576970.0026864953187147790.0158764906227588620.000162674288731068376.250000000000003e-052.7105054312137605e-206.25e-056.25e-050.0281697530.010848090.077402430.011433218-1.94805571959019170.7908203737498453-0.21371412100620468-3.2726053764291825-0.193394680.031096203-0.15218829999999997-0.26763937