mirror of
https://github.com/gryf/coach.git
synced 2026-04-05 03:53:32 +02:00
new traces
This commit is contained in:
@@ -1,26 +1,26 @@
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,486.0,486.0,486.0,486.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,63.0,0.0,1310.0,1310.0,253.0,1310.0,0.9997495300000054,4.0,50.0,0.0,,,,0.007803874562153987,0.008763884069155965,0.04718368873000145,2.0029816369060427e-05,6.25e-05,0.0,6.25e-05,6.25e-05,0.021732036,0.022223754,0.1446681,0.0012787414999999999,,,,
|
||||
6,191.0,0.0,1821.0,1821.0,511.0,1821.0,0.9992436400000164,12.0,185.0,0.0,,,,0.0076840334204318905,0.00407478669790096,0.020887335762381557,0.0006209309794940053,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.024990046000000002,0.007374348,0.05583174,0.01457165,,,,
|
||||
7,296.0,0.0,2240.0,2240.0,419.0,2240.0,0.9988288300000254,5.0,100.0,0.0,,,,0.006064200656865503,0.0026079780747149924,0.013106426224112509,0.0005442567635327578,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.022204678999999998,0.0051587676,0.03801172,0.01337866,0.04552897400000001,0.014450824,0.06804762,0.022983871
|
||||
8,339.0,0.0,2414.0,2414.0,174.0,2414.0,0.9986565700000292,1.0,5.0,0.0,,,,0.0056167520910263245,0.003348133333552833,0.01847168803215027,0.0006152484565973282,6.25e-05,0.0,6.25e-05,6.25e-05,0.022583058,0.006212645699999999,0.04925069,0.014691319,0.117131494,0.075825356,0.25262827,0.034186434
|
||||
9,368.0,0.0,2529.0,2529.0,115.0,2529.0,0.9985427200000316,3.0,30.0,0.0,,,,0.00567412653721736,0.0029112874704095106,0.012542505748569964,0.0006649551214650272,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.02317206,0.005647781,0.034866843,0.014415748999999999,,,,
|
||||
10,411.0,0.0,2702.0,2702.0,173.0,2702.0,0.9983714500000354,3.0,75.0,0.0,,,,0.005447928440421386,0.0027157055388668696,0.011556550860404968,0.0005230194656178355,6.25e-05,0.0,6.25e-05,6.25e-05,0.022507405,0.0063080876,0.04279238,0.014129612,,,,
|
||||
11,465.0,0.0,2915.0,2915.0,213.0,2915.0,0.99816058000004,3.0,20.0,0.0,,,,0.006813380568516704,0.002953363187898618,0.018070373684167862,0.0024055785033851858,6.25e-05,0.0,6.25e-05,6.25e-05,0.024714846000000002,0.0069003645,0.053911198,0.013334683,,,,
|
||||
12,510.0,0.0,3097.0,3097.0,182.0,3097.0,0.9979804000000438,4.0,60.0,0.0,,,,0.0057438461899033035,0.0028426672841737203,0.013382650911808014,0.0006364500150084497,6.25e-05,0.0,6.25e-05,6.25e-05,0.023799596,0.0060355333,0.047333322000000004,0.012709315,,,,
|
||||
13,550.0,0.0,3258.0,3258.0,161.0,3258.0,0.9978210100000472,3.0,75.0,0.0,,,,0.0061742550285998725,0.002734396119005929,0.011426813900470734,0.0025493670254945755,6.25e-05,0.0,6.25e-05,6.25e-05,0.024373332,0.0076977109999999994,0.054041553,0.015785009,,,,
|
||||
14,594.0,0.0,3433.0,3433.0,175.0,3433.0,0.9976477600000512,4.0,50.0,0.0,,,,0.0054328095094777285,0.0027096778707884584,0.01172078587114811,0.0007941549411043526,6.25e-05,0.0,6.25e-05,6.25e-05,0.023894975,0.0066084154,0.04917719,0.01552412,,,,
|
||||
15,630.0,0.0,3578.0,3578.0,145.0,3578.0,0.9975042100000542,2.0,25.0,0.0,,,,0.005161296885085499,0.002379623212789025,0.011234099976718426,0.000592207710724324,6.25e-05,0.0,6.25e-05,6.25e-05,0.022190819,0.0047294693,0.033406414,0.014175736999999999,,,,
|
||||
16,675.0,0.0,3756.0,3756.0,178.0,3756.0,0.997327990000058,0.0,0.0,0.0,,,,0.005717846387679772,0.002502733532058393,0.011211811564862728,0.0006601698696613313,6.25e-05,0.0,6.25e-05,6.25e-05,0.025067486,0.006331243,0.04131097,0.016266715,,,,
|
||||
17,779.0,0.0,4171.0,4171.0,415.0,4171.0,0.9969171400000668,6.0,80.0,0.0,,,,0.004081658166307114,0.0020001996419927288,0.009709015488624571,0.0003917928552255034,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.018329315,0.0046630735,0.031186484,0.008738925,0.022281086000000002,0.02669226,0.06086207,-0.0070810173999999995
|
||||
18,802.0,0.0,4265.0,4265.0,94.0,4265.0,0.9968240800000692,1.0,30.0,0.0,,,,0.003856045330631668,0.002170383825603264,0.007952725514769554,0.0005409078439697623,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.018558994,0.0060107456999999994,0.033156354,0.012791273999999998,,,,
|
||||
19,859.0,0.0,4494.0,4494.0,229.0,4494.0,0.996597370000074,5.0,100.0,0.0,,,,0.003978008200647309,0.0016841297405167286,0.008312854915857315,0.0003705012204591185,6.25e-05,0.0,6.25e-05,6.25e-05,0.018162485,0.0049022716,0.03275322,0.010325382,0.035759527,0.035056762000000005,0.08535823,-0.008915286
|
||||
20,925.0,0.0,4758.0,4758.0,264.0,4758.0,0.9963360100000797,6.0,75.0,0.0,,,,0.002300493763714957,0.0010825562309593726,0.0046387091279029855,0.0002016235230257735,6.25e-05,0.0,6.25e-05,6.25e-05,0.010100276,0.0024906192,0.01585796,0.0059240386,0.048761707,0.05004603,0.15401264,-0.0024325964
|
||||
21,952.0,0.0,4866.0,4866.0,108.0,4866.0,0.996229090000082,0.0,0.0,0.0,,,,0.002475268014957412,0.0012914969110412403,0.00562380813062191,0.0003233719035051763,6.25e-05,0.0,6.25e-05,6.25e-05,0.01129343,0.0028471393,0.01932526,0.007399376500000001,,,,
|
||||
22,989.0,0.0,5012.0,5012.0,146.0,5012.0,0.9960845500000849,2.0,45.0,0.0,,,,0.002166505141455369,0.000924038288373833,0.004925021436065435,0.00027738657081499696,6.25e-05,0.0,6.25e-05,6.25e-05,0.010186652,0.0026935977,0.019467099999999998,0.007402484,,,,
|
||||
23,1033.0,0.0,5187.0,5187.0,175.0,5187.0,0.9959113000000888,0.0,0.0,0.0,,,,0.0021631214036791453,0.0010276500026280158,0.004965011961758137,0.00023919624800328165,6.25e-05,0.0,6.25e-05,6.25e-05,0.009726720999999999,0.0021573787,0.01670704,0.006440047,0.13069957,0.037176996000000004,0.19228284,0.08094616
|
||||
24,1089.0,0.0,5412.0,5412.0,225.0,5412.0,0.9956885500000936,3.0,30.0,0.0,,,,0.002553392111232305,0.0011096866629888736,0.005850483663380146,0.0003285239799879492,6.25e-05,0.0,6.25e-05,6.25e-05,0.011104784,0.002389212,0.017829941999999998,0.00757342,0.0682852,0.061801534000000005,0.18812282,-0.006229040999999999
|
||||
25,1136.0,0.0,5602.0,5602.0,190.0,5602.0,0.9955004500000976,2.0,45.0,0.0,,,,0.001876247199648555,0.0011046318131782585,0.004761672578752041,0.00023924620472826064,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.009521739,0.002407699,0.016262773,0.005831246700000001,0.035645377,0.06185295,0.17193483,-0.037299167
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Discounted Return/Mean,Discounted Return/Stdev,Discounted Return/Max,Discounted Return/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,486.0,486.0,486.0,486.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.027285241237078,0.8961037725396955,3.502959469093688,0.0,,,,
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,0.2991949731169189,0.4147830569909918,1.0,0.0,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.089942054123867,0.6773639260883686,1.9560606270183023,0.0,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,1.6150170189100268,1.2171006279541683,4.3034191502088746,0.0,,,,
|
||||
5,63.0,0.0,1310.0,1310.0,253.0,1310.0,0.9997495300000054,4.0,50.0,0.0,,,,0.004012163915961407,0.006262272993724664,0.04764580726623535,8.1564921856625e-06,6.25e-05,0.0,6.25e-05,6.25e-05,0.010623638999999999,0.014628718999999998,0.11750877,0.0006018049299999999,1.222244018436626,0.936837542398956,3.1882608013105234,0.0,,,,
|
||||
6,191.0,0.0,1821.0,1821.0,511.0,1821.0,0.9992436400000164,12.0,185.0,0.0,,,,0.004986882026675779,0.0024525258547375595,0.01212594285607338,0.00019069857080467043,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.012066028999999999,0.004054811,0.023936076,0.0052656345,2.2788441379494553,1.4480347036158143,5.334774783194502,0.0,,,,
|
||||
7,296.0,0.0,2240.0,2240.0,419.0,2240.0,0.9988288300000254,5.0,100.0,0.0,,,,0.002852302261384293,0.001423902026771749,0.006419077049940825,0.00032718142028898,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.008651931,0.0021564893,0.015036376,0.005514461,0.8555964976400694,1.0053707470132562,3.3749244373511424,0.0,0.045712102000000004,0.0046962714,0.051285498,0.037267745
|
||||
8,339.0,0.0,2414.0,2414.0,174.0,2414.0,0.9986565700000292,1.0,5.0,0.0,,,,0.0022072479261496906,0.0011851067892783525,0.005776813253760339,0.0002716210437938571,6.25e-05,0.0,6.25e-05,6.25e-05,0.007669631999999999,0.0017825919000000001,0.013650602,0.004986409,0.3973882352674416,0.32154192970544776,1.0,0.0,0.10220742,0.033463497,0.153544,0.06425184
|
||||
9,368.0,0.0,2529.0,2529.0,115.0,2529.0,0.9985427200000316,3.0,30.0,0.0,,,,0.0022113858742938775,0.0011680986343581435,0.004550112411379814,0.00028897859738208354,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.0072303605000000005,0.0016598894,0.010692931999999999,0.0048725903,0.6324934579648669,0.8584618010459154,2.5898325667156983,0.0,,,,
|
||||
10,411.0,0.0,2702.0,2702.0,173.0,2702.0,0.9983714500000354,3.0,75.0,0.0,,,,0.002077218892694408,0.0010814756493981728,0.004706204403191805,0.0002305081870872528,6.25e-05,0.0,6.25e-05,6.25e-05,0.007076809599999999,0.001648983,0.013651845,0.0049567529999999995,1.0608731055181009,0.7741962088105712,2.3536752936697938,0.0,,,,
|
||||
11,465.0,0.0,2915.0,2915.0,213.0,2915.0,0.99816058000004,3.0,20.0,0.0,,,,0.002422780042320912,0.0012927514366501244,0.005057375878095628,0.0002319362247362733,6.25e-05,0.0,6.25e-05,6.25e-05,0.007722950500000001,0.0019650976,0.013632878000000001,0.004534565999999999,0.9256049353481748,0.5663397851070973,1.7696505901309243,0.0,,,,
|
||||
12,510.0,0.0,3097.0,3097.0,182.0,3097.0,0.9979804000000438,4.0,60.0,0.0,,,,0.002710532541580809,0.001212259293564437,0.005337233189493418,0.00020097008382435888,6.25e-05,0.0,6.25e-05,6.25e-05,0.008514446,0.0022909213,0.014541608000000001,0.0045710043,1.3110499512651883,0.7061102045075827,2.617221396387248,0.0,,,,
|
||||
13,550.0,0.0,3258.0,3258.0,161.0,3258.0,0.9978210100000472,3.0,75.0,0.0,,,,0.002600164190880605,0.0014034534888808146,0.006483706180006266,0.00019826518837362528,6.25e-05,0.0,6.25e-05,6.25e-05,0.008385532,0.002349005,0.016131336,0.005278410999999999,1.0703466266135009,0.8490488659932097,2.503485520019768,0.0,,,,
|
||||
14,594.0,0.0,3433.0,3433.0,175.0,3433.0,0.9976477600000512,4.0,50.0,0.0,,,,0.0022486129387817885,0.0011733820626057582,0.004828908480703832,0.0002223936462542042,6.25e-05,0.0,6.25e-05,6.25e-05,0.008088347,0.0021400757,0.01399398,0.0054029343,1.3808433281553778,0.7416611931247653,2.5777888872395627,0.0,,,,
|
||||
15,630.0,0.0,3578.0,3578.0,145.0,3578.0,0.9975042100000542,2.0,25.0,0.0,,,,0.002595809635952012,0.0011731639916013946,0.004997591953724623,0.0002623785985633731,6.25e-05,0.0,6.25e-05,6.25e-05,0.008864019,0.0025098345,0.015585932,0.0048996774,0.3767929397358389,0.4664994895961535,1.5753547499769285,0.0,,,,
|
||||
16,675.0,0.0,3756.0,3756.0,178.0,3756.0,0.997327990000058,0.0,0.0,0.0,,,,0.0026418176857987423,0.0013215013550629145,0.007002991624176502,0.0002453049528412521,6.25e-05,0.0,6.25e-05,6.25e-05,0.009046442,0.0025474594,0.016441913,0.005280598,0.0,0.0,0.0,0.0,,,,
|
||||
17,779.0,0.0,4171.0,4171.0,415.0,4171.0,0.9969171400000668,6.0,80.0,0.0,,,,0.0023643675442424584,0.001207029356730382,0.005960710346698761,0.00019269902259111404,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.0085099405,0.002143361,0.016746926999999998,0.0045285644,1.2064564511640037,0.9581523932003888,3.7053456169634456,0.0,0.037320096000000004,0.03258535,0.10248235,0.008374133
|
||||
18,802.0,0.0,4265.0,4265.0,94.0,4265.0,0.9968240800000692,1.0,30.0,0.0,,,,0.0026463923555717843,0.0013860409596273074,0.005166415125131607,0.0002855767379514873,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.008782689,0.0024150796,0.0153460745,0.005183509,0.4758686413166112,0.3805813846183533,1.0,0.0,,,,
|
||||
19,859.0,0.0,4494.0,4494.0,229.0,4494.0,0.996597370000074,5.0,100.0,0.0,,,,0.002195212906052914,0.0012138090083981426,0.00528534222394228,0.00019210220489185306,6.25e-05,0.0,6.25e-05,6.25e-05,0.008517075,0.002382889,0.017914765,0.005308585,1.7352332608258287,0.8915224300531083,3.1694045534542283,0.0,0.06356255,0.03258758,0.11672841,0.028774487
|
||||
20,925.0,0.0,4758.0,4758.0,264.0,4758.0,0.9963360100000797,6.0,75.0,0.0,,,,0.0025167439267254213,0.0011864448561579714,0.005621550604701042,0.0002340352803003043,6.25e-05,0.0,6.25e-05,6.25e-05,0.008684341,0.0017787067000000001,0.014223633999999999,0.0059472983999999994,1.689846122458243,1.273814066516635,3.9579986855743465,0.0,0.04556285,0.030785719,0.098121285,0.012000842
|
||||
21,952.0,0.0,4866.0,4866.0,108.0,4866.0,0.996229090000082,0.0,0.0,0.0,,,,0.002560251447273633,0.0009665735161980654,0.004035839810967445,0.00024799819220788777,6.25e-05,0.0,6.25e-05,6.25e-05,0.008927823,0.0020366234,0.0152958,0.005353358000000001,0.0,0.0,0.0,0.0,,,,
|
||||
22,989.0,0.0,5012.0,5012.0,146.0,5012.0,0.9960845500000849,2.0,45.0,0.0,,,,0.002593663415205406,0.0011781043455332306,0.0047058621421456346,0.00024635010049678385,6.25e-05,0.0,6.25e-05,6.25e-05,0.009508743,0.0019255057000000001,0.01250373,0.006235984599999999,0.920688534667319,0.5000778477909199,1.8097278682212583,0.0,,,,
|
||||
23,1032.0,0.0,5184.0,5184.0,172.0,5184.0,0.9959142700000888,0.0,0.0,0.0,,,,0.002412760020761621,0.0012379089332650072,0.005492463242262603,0.00022076028108131143,6.25e-05,0.0,6.25e-05,6.25e-05,0.009503809,0.0025141584,0.017699867,0.0062589524,0.0,0.0,0.0,0.0,0.10933289,0.032549884,0.16467445,0.07506848
|
||||
24,1045.0,0.0,5236.0,5236.0,52.0,5236.0,0.9958627900000898,1.0,5.0,0.0,,,,0.0026766185809929785,0.0012504540423699385,0.005386156961321832,0.0011498613748699427,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.009200559,0.0022626007000000003,0.013827433,0.00582417,0.14856789533092288,0.3485317499642583,1.0,0.0,0.08756345,0.019930143,0.1093124,0.054611407
|
||||
25,1093.0,0.0,5428.0,5428.0,192.0,5428.0,0.995672710000094,3.0,45.0,0.0,,,,0.002222697652844848,0.0013756604614442107,0.005762553308159113,0.0001781654136721045,6.25e-05,0.0,6.25e-05,6.25e-05,0.008849018,0.0021958454000000002,0.014359153999999999,0.0046170973,0.59836742898907,0.5357145251150862,2.130812614153282,0.0,0.03703947,0.028580425,0.07965194,-0.014937886000000001
|
||||
|
||||
|
Reference in New Issue
Block a user