mirror of
https://github.com/gryf/coach.git
synced 2026-03-06 01:05:47 +01:00
new traces
This commit is contained in:
@@ -1,31 +1,26 @@
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,269.0,269.0,269.0,269.0,7.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
2,0.0,1.0,531.0,531.0,262.0,531.0,8.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,654.0,654.0,123.0,654.0,0.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1173.0,1173.0,519.0,1173.0,2.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,100.0,0.0,1572.0,1572.0,399.0,1572.0,8.0,10.0,310.0,0.0,,,,0.006223844418564113,0.008294042663087463,0.03155895695090294,9.275647607864812e-05,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.005592896,0.0043458864,0.015006336,0.0010827626,,,,
|
||||
6,160.0,0.0,1812.0,1812.0,240.0,1812.0,4.0,7.0,130.0,0.0,,,,0.008564803576276366,0.010985852447389552,0.04601012542843819,0.00010247386671835555,0.00025,0.0,0.00025,0.00025,0.0060127693999999995,0.005001401,0.020867711,0.0012939627,,,,
|
||||
7,185.0,0.0,1914.0,1914.0,102.0,1914.0,8.0,2.0,15.0,0.0,,,,0.005707002155832015,0.009575807855094808,0.03112555481493473,0.00017016606580000368,0.00025,0.0,0.00025,0.00025,0.0047362293,0.004079403,0.014057411,0.0019318176000000002,,,,
|
||||
8,229.0,0.0,2090.0,2090.0,176.0,2090.0,7.0,2.0,15.0,0.0,,,,0.00864216006702072,0.013155937701958298,0.061171818524599075,0.00018360336252953854,0.00025,0.0,0.00025,0.00025,0.0063004736,0.0053449036,0.02487476,0.0019890803,,,,
|
||||
9,244.0,0.0,2149.0,2149.0,59.0,2149.0,5.0,2.0,15.0,0.0,,,,0.006669382058524727,0.0073984037571708594,0.015499015338718891,0.0002397242496954277,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.0056597376,0.0035718853999999996,0.0101093175,0.0022593176,,,,
|
||||
10,267.0,0.0,2239.0,2239.0,90.0,2239.0,3.0,2.0,35.0,0.0,,,,0.0062163660673515714,0.008715943338641199,0.030871812254190445,0.00019301722932141277,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0052448297,0.003933181500000001,0.013718200000000002,0.0018610907000000002,,,,
|
||||
11,314.0,0.0,2430.0,2430.0,191.0,2430.0,8.0,3.0,30.0,0.0,,,,0.005064984451622722,0.009464219831212449,0.04566681012511253,0.00017265054339077324,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0042512245,0.0038818533000000003,0.016594999,0.0016967895000000002,0.027018031,0.010441347,0.0474995,0.016540313
|
||||
12,334.0,0.0,2508.0,2508.0,78.0,2508.0,0.0,2.0,45.0,0.0,,,,0.009793104943941887,0.011249256480204521,0.030716722831130024,0.0001681474968791008,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.006330653,0.0047096196,0.014098721000000002,0.0016581904999999999,,,,
|
||||
13,378.0,0.0,2684.0,2684.0,176.0,2684.0,5.0,0.0,0.0,0.0,,,,0.01011617302819187,0.013193202268065932,0.04607892408967018,0.00014670072414446622,0.00025,0.0,0.00025,0.00025,0.0067802290000000005,0.005344481,0.022279864,0.0016253429999999998,0.027286835,0.0073864055,0.03329719,0.016612418
|
||||
14,425.0,0.0,2872.0,2872.0,188.0,2872.0,0.0,0.0,0.0,0.0,,,,0.00757620267153896,0.010181129044846313,0.03055970929563045,0.00019950376008637252,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.005839123000000001,0.004426101,0.01861591,0.0021889664000000002,,,,
|
||||
15,449.0,0.0,2967.0,2967.0,95.0,2967.0,6.0,3.0,30.0,0.0,,,,0.0070000348653896545,0.011226164764985254,0.04456117376685143,0.00021107358043082056,0.00025,0.0,0.00025,0.00025,0.005659159,0.0046324306,0.021839907000000002,0.0021402768,,,,
|
||||
16,469.0,0.0,3049.0,3049.0,82.0,3049.0,3.0,0.0,0.0,0.0,,,,0.012940272329433357,0.009718707321816513,0.030684769153594967,0.0003000017604790628,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.008273507,0.0035852243,0.013593527,0.0028905305,,,,
|
||||
17,533.0,0.0,3306.0,3306.0,257.0,3306.0,1.0,5.0,55.0,0.0,,,,0.007539691670444881,0.009121751516234046,0.03060857020318508,0.00022119178902357817,0.00025,0.0,0.00025,0.00025,0.00609803,0.0035867486,0.013320565,0.002192039,,,,
|
||||
18,585.0,0.0,3511.0,3511.0,205.0,3511.0,7.0,0.0,0.0,0.0,,,,0.005838182990213253,0.007284520898622485,0.01573643647134304,0.00017755883163772523,0.00025,0.0,0.00025,0.00025,0.0050161253,0.0035143814,0.010200171999999999,0.0018448817,,,,
|
||||
19,632.0,0.0,3701.0,3701.0,190.0,3701.0,5.0,2.0,25.0,0.0,,,,0.006030775471020767,0.008624205468393242,0.030819704756140712,0.00014619529247283936,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0049460824,0.004009163499999999,0.014025801000000001,0.0014488354999999998,,,,
|
||||
20,680.0,0.0,3891.0,3891.0,190.0,3891.0,4.0,0.0,0.0,0.0,,,,0.0062177468741235024,0.009185724365931972,0.030945468693971637,0.00016168373986147344,0.00025,0.0,0.00025,0.00025,0.0048525543,0.0041472296999999995,0.014570421,0.0015842235999999998,,,,
|
||||
21,729.0,0.0,4090.0,4090.0,199.0,4090.0,9.0,4.0,50.0,0.0,,,,0.0066686894893717525,0.009633275859106637,0.03070710971951485,0.00016243076242972163,0.00025,0.0,0.00025,0.00025,0.005217642,0.0044929385,0.01947369,0.00170155,0.021158978,0.011703089,0.040702187,0.0043722745
|
||||
22,804.0,0.0,4390.0,4390.0,300.0,4390.0,9.0,5.0,60.0,0.0,,,,0.007745159575574075,0.010264969595287615,0.0457281582057476,0.0001735425612423569,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.005858070999999999,0.004608556,0.02206757,0.0016346257,,,,
|
||||
23,862.0,0.0,4619.0,4619.0,229.0,4619.0,6.0,3.0,30.0,0.0,,,,0.0073957111507249795,0.010238454419935428,0.045198917388916016,0.00018422666471451518,0.00025,0.0,0.00025,0.00025,0.005702048,0.0044779684,0.019911936,0.0017970852,,,,
|
||||
24,882.0,0.0,4699.0,4699.0,80.0,4699.0,6.0,0.0,0.0,0.0,,,,0.007019620326900622,0.010097406329511898,0.030556553974747658,0.00021815481886733326,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0058081313,0.0048652836,0.019417763,0.0023302154,,,,
|
||||
25,945.0,0.0,4951.0,4951.0,252.0,4951.0,5.0,4.0,50.0,0.0,,,,0.005672615208563262,0.007662691003304536,0.02989559806883335,0.00017223272880073634,0.00025,0.0,0.00025,0.00025,0.004905078,0.0036695688,0.013604815,0.0018130213,0.031090358,0.004259917,0.037605517000000005,0.025178626000000003
|
||||
26,995.0,0.0,5152.0,5152.0,201.0,5152.0,8.0,2.0,15.0,0.0,,,,0.006299167421530001,0.008046825175071413,0.030643418431282043,0.00017975828086491674,0.00025,0.0,0.00025,0.00025,0.005176335,0.003915025999999999,0.014020402,0.0017273452,0.026928194,0.009660842,0.041887067,0.010047999
|
||||
27,1017.0,0.0,5242.0,5242.0,90.0,5242.0,1.0,2.0,35.0,0.0,,,,0.005731220244011969,0.008559611287002292,0.03012747503817081,0.00019501463975757358,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0051502184999999995,0.004566707,0.01945674,0.0021261019,0.02149797,0.010033373,0.03370452,0.008069546
|
||||
28,1072.0,0.0,5462.0,5462.0,220.0,5462.0,3.0,2.0,55.0,0.0,,,,0.008864355713336004,0.011839999879392651,0.046134039759635925,0.0001610755716683343,0.00025,0.0,0.00025,0.00025,0.0062677735,0.0050042396999999995,0.020127073,0.0017192016,0.02061991,0.0075885756,0.034549624,0.010614768
|
||||
29,1118.0,0.0,5646.0,5646.0,184.0,5646.0,4.0,3.0,20.0,0.0,,,,0.0072352889821761185,0.008737181206568531,0.030466778203845024,0.00018102813919540492,0.00025,0.0,0.00025,0.00025,0.005792571999999999,0.004318339,0.019932609,0.0020496019,,,,
|
||||
30,1175.0,0.0,5874.0,5874.0,228.0,5874.0,4.0,5.0,85.0,0.0,,,,0.008313204468972149,0.011042285375825469,0.045756932348012924,0.00019610222079791129,0.00025,0.0,0.00025,0.00025,0.005883634,0.0046995464,0.022168385,0.001801039,0.0073951124,0.010906539,0.025537572999999997,-0.0070570237
|
||||
Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Discounted Return/Mean,Discounted Return/Stdev,Discounted Return/Max,Discounted Return/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min
|
||||
1,0.0,1.0,269.0,269.0,269.0,269.0,7.0,,,0.0,,,,,,,,,,,,,,,,1.1777548651006522,0.7953334800368667,3.04158102714528,0.0,,,,
|
||||
2,0.0,1.0,531.0,531.0,262.0,531.0,8.0,,,0.0,,,,,,,,,,,,,,,,0.3442313865024097,0.26731465870050863,1.0,0.0,,,,
|
||||
3,0.0,1.0,654.0,654.0,123.0,654.0,0.0,,,0.0,,,,,,,,,,,,,,,,1.1194499207617956,0.862098603062819,2.450733217907448,0.0,,,,
|
||||
4,0.0,1.0,1173.0,1173.0,519.0,1173.0,2.0,,,0.0,,,,,,,,,,,,,,,,1.1038465051213655,1.1369108437507858,4.161070816478141,0.0,,,,
|
||||
5,100.0,0.0,1572.0,1572.0,399.0,1572.0,8.0,10.0,310.0,0.0,,,,0.006273858311178628,0.008330142333180622,0.03179644048213959,0.0001070434009307064,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0057809628,0.00428058,0.015232059,0.0012842978,2.054682483279469,0.9981946272625823,4.353923952687973,0.0,,,,
|
||||
6,160.0,0.0,1812.0,1812.0,240.0,1812.0,4.0,7.0,130.0,0.0,,,,0.00858094445017438,0.011025487792674208,0.04672722890973091,0.00010337847197661175,0.00025,0.0,0.00025,0.00025,0.005872111,0.0049856184,0.020408265,0.0012264452000000001,1.83971605615766,1.54653748962161,4.492326630353285,0.0,,,,
|
||||
7,185.0,0.0,1914.0,1914.0,102.0,1914.0,8.0,2.0,15.0,0.0,,,,0.0057056179083883754,0.009566845016376965,0.030910406261682514,0.00015892417286522686,0.00025,0.0,0.00025,0.00025,0.0045871167,0.004069118,0.013834482,0.0016493909,0.8252216843886011,0.7249623919611342,1.8953382542587165,0.0,,,,
|
||||
8,229.0,0.0,2090.0,2090.0,176.0,2090.0,7.0,2.0,15.0,0.0,,,,0.008657716054585762,0.013191662302277632,0.060961790382862084,0.00018780565005727112,0.00025,0.0,0.00025,0.00025,0.006128102,0.0052965875,0.024218792000000003,0.0018669614000000002,0.8372836508642453,0.5450147907804874,1.886384871716129,0.0,,,,
|
||||
9,244.0,0.0,2149.0,2149.0,59.0,2149.0,5.0,2.0,15.0,0.0,,,,0.00667665019240563,0.007406433018503216,0.01548141520470381,0.00024485771427862346,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.005659986,0.0035369787,0.010256552,0.0024132975,0.46716053564921,0.6576401247022132,1.8687458127689778,0.0,,,,
|
||||
10,267.0,0.0,2239.0,2239.0,90.0,2239.0,3.0,2.0,35.0,0.0,,,,0.006187197646637365,0.008654079896911358,0.030595635995268818,0.00020239711739122868,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.005233875,0.0037543268,0.013406766,0.002017471,0.7963928061047579,0.6503180718510583,1.770043145805155,0.0,,,,
|
||||
11,401.0,0.0,2775.0,2775.0,536.0,2775.0,8.0,8.0,105.0,0.0,,,,0.0076730817593521185,0.01026273844391202,0.0459497831761837,0.00017323925567325205,0.00025,0.0,0.00025,0.00025,0.0056375875,0.004533787,0.021587799999999997,0.0016972864999999998,1.274149577263458,0.9814292642439238,3.909936321269157,0.0,0.020429587,0.009730016,0.04222724,-0.0036528922999999997
|
||||
12,442.0,0.0,2941.0,2941.0,166.0,2941.0,8.0,6.0,95.0,0.0,,,,0.009460052854392859,0.011893971040711302,0.0601826086640358,0.00024936438421718776,0.00025,0.0,0.00025,0.00025,0.006743224,0.004512203,0.020062562,0.0024123169,2.1739952594843905,1.247283866258882,3.8537544767205016,0.0,,,,
|
||||
13,496.0,0.0,3156.0,3156.0,215.0,3156.0,7.0,2.0,55.0,0.0,,,,0.008886155373787645,0.01211537698485043,0.06058269366621971,0.00024669029517099256,0.00025,0.0,0.00025,0.00025,0.0064274530000000005,0.0050618723,0.027024375,0.0023406029999999997,0.5393877770998244,0.6154190288564962,1.7856781408072189,0.0,0.032848313,0.008609116,0.040870699999999996,0.01987039
|
||||
14,541.0,0.0,3335.0,3335.0,179.0,3335.0,5.0,1.0,5.0,0.0,,,,0.009253808953669958,0.010618086101890231,0.03098195604979992,0.00024773561744950706,0.00025,0.0,0.00025,0.00025,0.006421773,0.00394707,0.01344751,0.0024552035999999998,0.1617021076691104,0.3359277220934725,1.0,0.0,0.03360373,0.007870216999999999,0.039596006,0.016850319
|
||||
15,593.0,0.0,3543.0,3543.0,208.0,3543.0,1.0,4.0,40.0,0.0,,,,0.00918442351954022,0.01275409618221497,0.04474706575274468,0.0002603356551844627,0.00025,0.0,0.00025,0.00025,0.006705689,0.0054350337,0.021499146,0.0024255246,0.9277385930791114,0.9300546476425536,2.827112112528587,0.0,,,,
|
||||
16,643.0,0.0,3743.0,3743.0,200.0,3743.0,7.0,2.0,35.0,0.0,,,,0.008653623021091334,0.01203271051514775,0.04561404511332512,0.00025741007993929094,0.00025,0.0,0.00025,0.00025,0.006199294,0.004773637,0.020930363,0.0022822001,0.6712173748129522,0.6092674326727069,1.8514577710948756,0.0,,,,
|
||||
17,769.0,0.0,4247.0,4247.0,504.0,4247.0,4.0,8.0,120.0,0.0,,,,0.007997047552115484,0.011587850390758431,0.0613202415406704,0.00022856102441437545,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.00598843,0.0047509655999999996,0.030977622000000003,0.0021550405999999998,1.385963941755423,0.9458111472215864,3.9015703845088727,0.0,0.030356152,0.008328333,0.045441985,0.019884652
|
||||
18,803.0,0.0,4383.0,4383.0,136.0,4383.0,7.0,0.0,0.0,0.0,,,,0.008612036458062529,0.010332630430020251,0.03037862852215767,0.0002405663690296933,0.00025,0.0,0.00025,0.00025,0.0061402004,0.003962394,0.013849353,0.0022057625,0.0,0.0,0.0,0.0,,,,
|
||||
19,828.0,0.0,4483.0,4483.0,100.0,4483.0,3.0,1.0,15.0,0.0,,,,0.008099889304721728,0.011316411439653937,0.04556084796786308,0.00023716632858850065,0.00025,0.0,0.00025,0.00025,0.0061904215,0.004684817,0.019425906,0.0021622777,0.4473165228376146,0.3859060679188835,1.0,0.0,,,,
|
||||
20,929.0,0.0,4889.0,4889.0,406.0,4889.0,0.0,7.0,80.0,0.0,,,,0.008402860848495902,0.011576927779356556,0.0453546978533268,0.00022958195768296719,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.006206388,0.004747717,0.020835804,0.0021647965,1.3430331078057811,1.0463286436371946,3.709441691234059,0.0,0.023571777999999998,0.010907986000000001,0.042958718,0.00632574
|
||||
21,1012.0,0.0,5221.0,5221.0,332.0,5221.0,8.0,2.0,30.0,0.0,,,,0.005650608528423661,0.008218237986471697,0.03046272695064545,0.0002068828180199489,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0050593624,0.0040467440000000006,0.019566683,0.0018410714,0.4718607999390638,0.5336089280183028,1.770043145805155,0.0,0.015006665,0.006017194599999999,0.026400073,0.0025955157
|
||||
22,1045.0,0.0,5351.0,5351.0,130.0,5351.0,0.0,1.0,30.0,0.0,,,,0.002537768723524289,0.006608280106071086,0.0305725522339344,0.0002002959663514048,0.00025,0.0,0.00025,0.00025,0.00334153,0.003618995,0.019435143000000002,0.0017342078,0.35671674984062657,0.3848848926286408,1.0,0.0,,,,
|
||||
23,1135.0,0.0,5711.0,5711.0,360.0,5711.0,2.0,3.0,20.0,0.0,,,,0.006407883726610129,0.008698550527715315,0.03079607151448727,0.00015418978000525382,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0050226753,0.0041869559999999995,0.01992405,0.0015568208999999999,0.674559103612383,0.5515052753627817,2.0483907280574467,0.0,,,,
|
||||
24,1152.0,0.0,5782.0,5782.0,71.0,5782.0,4.0,0.0,0.0,0.0,,,,0.007435832170920227,0.010654573019591494,0.031099731102585793,0.0002141469449270517,0.00025,0.0,0.00025,0.00025,0.0054329154,0.0044891206,0.014260428,0.0020032807,0.0,0.0,0.0,0.0,,,,
|
||||
25,1193.0,0.0,5946.0,5946.0,164.0,5946.0,0.0,3.0,65.0,0.0,,,,0.005160149779476342,0.009222892010527532,0.03091062419116497,0.00019036485173273834,0.00025,0.0,0.00025,0.00025,0.004480932,0.004335616699999999,0.01924327,0.0018914957999999998,1.0087524143851263,0.8821235128988212,2.4841851845494327,0.0,0.014996342,0.010180945,0.03520646,-0.0037689934999999997
|
||||
|
||||
|
Reference in New Issue
Block a user