1
0
mirror of https://github.com/gryf/coach.git synced 2026-02-15 05:25:55 +01:00
Files
coach/rl_coach/traces/Atari_DDQN_with_PER_pong/trace.csv
2018-08-20 13:01:30 +03:00

1.7 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/MinQ/MeanQ/StdevQ/MaxQ/Min
210.01.01117.01117.01117.01117.01.00.0
32221.00.02002.02002.0885.02002.00.999123850000019-21.0-21.00.00.0066247951047143660.003945768119718490.018638413399457936.383289291989058e-056.250000000000003e-052.7105054312137605e-206.25e-056.25e-050.0321271350.0146033430000000010.128386970.005512589
43455.00.02938.02938.0936.02938.00.9981972100000392-20.0-20.00.00.0069939585235447460.00316274189369341020.018264940008521080.0006336648948490626.250000000000003e-052.7105054312137605e-206.25e-056.25e-050.0263826750.0100495410.060189440.009578557-0.081022580.054663535-0.0028564844-0.15667786
54659.00.03754.03754.0816.03754.00.9973893700000568-21.0-21.00.00.006532420617130650.00300143680761973250.0145973619073629383.4910688555100926e-056.250000000000001e-051.3552527156068802e-206.25e-056.25e-050.0199086480.00603361599999999950.037865780.003926692
65906.00.04739.04739.0985.04739.00.9964142200000778-20.0-20.00.00.0053253663984939890.002580318728543360.018239885568618776.391682836692779e-056.250000000000003e-052.7105054312137605e-206.25e-056.25e-050.0167084750.0064446460.0512274059999999960.0036940586-0.0422566420000000040.010646114-0.030611286-0.06712968