mirror of
https://github.com/gryf/coach.git
synced 2025-12-18 11:40:18 +01:00
10 KiB
10 KiB
| 1 | Episode # | Training Iter | In Heatup | ER #Transitions | ER #Episodes | Episode Length | Total steps | Epsilon | Shaped Training Reward | Training Reward | Update Target Network | Evaluation Reward | Shaped Evaluation Reward | Success Rate | Loss/Mean | Loss/Stdev | Loss/Max | Loss/Min | Learning Rate/Mean | Learning Rate/Stdev | Learning Rate/Max | Learning Rate/Min | Grads (unclipped)/Mean | Grads (unclipped)/Stdev | Grads (unclipped)/Max | Grads (unclipped)/Min |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 1 | 0.0 | 1.0 | 65.0 | 1.0 | 65.0 | 65.0 | 0.5 | 0.0 | |||||||||||||||||
| 3 | 2 | 0.0 | 1.0 | 140.0 | 2.0 | 75.0 | 140.0 | 0.5 | 0.0 | |||||||||||||||||
| 4 | 3 | 0.0 | 1.0 | 187.0 | 3.0 | 47.0 | 187.0 | 0.5 | 0.0 | |||||||||||||||||
| 5 | 4 | 0.0 | 1.0 | 262.0 | 4.0 | 75.0 | 262.0 | 0.5 | 0.0 | |||||||||||||||||
| 6 | 5 | 0.0 | 1.0 | 265.0 | 5.0 | 3.0 | 265.0 | 0.5 | 0.0 | |||||||||||||||||
| 7 | 6 | 0.0 | 1.0 | 277.0 | 6.0 | 12.0 | 277.0 | 0.5 | 0.0 | |||||||||||||||||
| 8 | 7 | 0.0 | 1.0 | 343.0 | 7.0 | 66.0 | 343.0 | 0.5 | 0.0 | |||||||||||||||||
| 9 | 8 | 0.0 | 1.0 | 356.0 | 8.0 | 13.0 | 356.0 | 0.5 | 0.0 | |||||||||||||||||
| 10 | 9 | 0.0 | 1.0 | 366.0 | 9.0 | 10.0 | 366.0 | 0.5 | 0.0 | |||||||||||||||||
| 11 | 10 | 0.0 | 1.0 | 372.0 | 10.0 | 6.0 | 372.0 | 0.5 | 0.0 | |||||||||||||||||
| 12 | 11 | 0.0 | 1.0 | 447.0 | 11.0 | 75.0 | 447.0 | 0.5 | 0.0 | |||||||||||||||||
| 13 | 12 | 0.0 | 1.0 | 452.0 | 12.0 | 5.0 | 452.0 | 0.5 | 0.0 | |||||||||||||||||
| 14 | 13 | 0.0 | 1.0 | 456.0 | 13.0 | 4.0 | 456.0 | 0.5 | 0.0 | |||||||||||||||||
| 15 | 14 | 0.0 | 1.0 | 531.0 | 14.0 | 75.0 | 531.0 | 0.5 | 0.0 | |||||||||||||||||
| 16 | 15 | 0.0 | 1.0 | 535.0 | 15.0 | 4.0 | 535.0 | 0.5 | 0.0 | |||||||||||||||||
| 17 | 16 | 0.0 | 1.0 | 604.0 | 16.0 | 69.0 | 604.0 | 0.5 | 0.0 | |||||||||||||||||
| 18 | 17 | 0.0 | 1.0 | 634.0 | 17.0 | 30.0 | 634.0 | 0.5 | 0.0 | |||||||||||||||||
| 19 | 18 | 0.0 | 1.0 | 709.0 | 18.0 | 75.0 | 709.0 | 0.5 | 0.0 | |||||||||||||||||
| 20 | 19 | 0.0 | 1.0 | 746.0 | 19.0 | 37.0 | 746.0 | 0.5 | 0.0 | |||||||||||||||||
| 21 | 20 | 0.0 | 1.0 | 752.0 | 20.0 | 6.0 | 752.0 | 0.5 | 0.0 | |||||||||||||||||
| 22 | 21 | 0.0 | 1.0 | 761.0 | 21.0 | 9.0 | 761.0 | 0.5 | 0.0 | |||||||||||||||||
| 23 | 22 | 0.0 | 1.0 | 836.0 | 22.0 | 75.0 | 836.0 | 0.5 | 0.0 | |||||||||||||||||
| 24 | 23 | 0.0 | 1.0 | 902.0 | 23.0 | 66.0 | 902.0 | 0.5 | 0.0 | |||||||||||||||||
| 25 | 24 | 0.0 | 1.0 | 905.0 | 24.0 | 3.0 | 905.0 | 0.5 | 0.0 | |||||||||||||||||
| 26 | 25 | 0.0 | 1.0 | 909.0 | 25.0 | 4.0 | 909.0 | 0.5 | 0.0 | |||||||||||||||||
| 27 | 26 | 0.0 | 1.0 | 984.0 | 26.0 | 75.0 | 984.0 | 0.5 | 0.0 | |||||||||||||||||
| 28 | 27 | 0.0 | 1.0 | 993.0 | 27.0 | 9.0 | 993.0 | 0.5 | 0.0 | |||||||||||||||||
| 29 | 28 | 0.0 | 1.0 | 1000.0 | 28.0 | 7.0 | 1000.0 | 0.5 | 0.0 | |||||||||||||||||
| 30 | 29 | 0.0 | 1.0 | 1012.0 | 29.0 | 12.0 | 1012.0 | 0.5 | 0.0 | |||||||||||||||||
| 31 | 30 | 0.0 | 1.0 | 1058.0 | 30.0 | 46.0 | 1058.0 | 0.5 | 0.0 | |||||||||||||||||
| 32 | 31 | 74.0 | 0.0 | 1133.0 | 31.0 | 75.0 | 1133.0 | 0.4962500000000004 | -310.0 | -310.0 | 0.0 | 9862.112614812078 | 5108.627430680448 | 21896.46875 | 4428.638671875 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 19652.328 | 8994.96 | 52983.04 | 6429.6387 | |||
| 33 | 32 | 149.0 | 0.0 | 1208.0 | 32.0 | 75.0 | 1208.0 | 0.4925000000000008 | -330.0 | -330.0 | 0.0 | 3830.6351790364574 | 643.7340248125081 | 5340.5830078125 | 2646.113525390625 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 8379.321 | 5266.063 | 22653.16 | 1860.6244 | |||
| 34 | 33 | 194.0 | 0.0 | 1253.0 | 33.0 | 45.0 | 1253.0 | 0.4902500000000011 | -122.0 | -122.0 | 0.0 | 3059.363802083333 | 588.2946622227233 | 4644.080078125 | 1812.8056640625 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 8209.5625 | 4655.1914 | 19927.584 | 1891.3015 | |||
| 35 | 34 | 269.0 | 0.0 | 1328.0 | 34.0 | 75.0 | 1328.0 | 0.4865000000000015 | -350.0 | -350.0 | 0.0 | 2846.889031575521 | 476.7265607773383 | 4139.458984375 | 1698.8955078125 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 6443.3677 | 3683.1653 | 17744.254 | 1654.5441 | |||
| 36 | 35 | 344.0 | 0.0 | 1403.0 | 35.0 | 75.0 | 1403.0 | 0.4827500000000019 | -345.0 | -345.0 | 0.0 | 2482.868015950521 | 453.8919717206632 | 3878.35205078125 | 1454.6219482421875 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 7611.8936 | 3933.5952 | 19037.822 | 1435.7284 | |||
| 37 | 36 | 419.0 | 0.0 | 1478.0 | 36.0 | 75.0 | 1478.0 | 0.4790000000000023 | -320.0 | -320.0 | 0.0 | 2371.336440429688 | 465.8108835988031 | 3901.125244140625 | 1313.65380859375 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 9474.646 | 5553.234 | 24757.568 | 1271.4858 | |||
| 38 | 37 | 494.0 | 0.0 | 1553.0 | 37.0 | 75.0 | 1553.0 | 0.4752500000000027 | -325.0 | -325.0 | 0.0 | 2169.166463216146 | 425.75691268537287 | 3692.046630859375 | 1355.68359375 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 8821.158000000001 | 5241.8975 | 27872.492000000002 | 1564.2307 | |||
| 39 | 38 | 569.0 | 0.0 | 1628.0 | 38.0 | 75.0 | 1628.0 | 0.4715000000000032 | -340.0 | -340.0 | 0.0 | 2110.4203141276043 | 459.47185940817917 | 3180.8662109375 | 1098.3739013671877 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 8521.446 | 6072.1846 | 34998.13 | 1994.5767 | |||
| 40 | 39 | 644.0 | 0.0 | 1703.0 | 39.0 | 75.0 | 1703.0 | 0.4677500000000036 | -340.0 | -340.0 | 0.0 | 2034.7563606770834 | 460.3998665400683 | 3170.345947265625 | 1119.7576904296877 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 12934.934 | 7226.505 | 32803.66 | 792.9248 | |||
| 41 | 40 | 678.0 | 0.0 | 1737.0 | 40.0 | 34.0 | 1737.0 | 0.4660500000000037 | -48.0 | -48.0 | 0.0 | 1953.1156221277572 | 545.1958983368963 | 3336.509521484375 | 1179.089111328125 | 0.0001 | 1.3552527156068802e-20 | 0.0001 | 0.0001 | 12777.6875 | 7534.3335 | 28442.002 | 1934.1208 | |||
| 42 | 41 | 753.0 | 0.0 | 1812.0 | 41.0 | 75.0 | 1812.0 | 0.4623000000000042 | -335.0 | -335.0 | 0.0 | 2128.1311783854167 | 520.2510966435275 | 3962.064208984375 | 1156.8756103515625 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 9502.953000000001 | 5733.1 | 35032.797 | 1371.4753 | |||
| 43 | 42 | 828.0 | 0.0 | 1887.0 | 42.0 | 75.0 | 1887.0 | 0.4585500000000046 | -330.0 | -330.0 | 0.0 | 2020.592638346354 | 508.0626314771112 | 3320.949462890625 | 1051.14404296875 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 10068.6 | 5923.7305 | 25615.827999999998 | 1038.5610000000001 | |||
| 44 | 43 | 838.0 | 0.0 | 1897.0 | 43.0 | 10.0 | 1897.0 | 0.4580500000000046 | 58.0 | 58.0 | 0.0 | 1911.0807373046875 | 484.4154870198784 | 2693.1943359375 | 1030.531982421875 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 10108.119 | 6024.936 | 23948.987999999998 | 4229.723 | |||
| 45 | 44 | 913.0 | 0.0 | 1972.0 | 44.0 | 75.0 | 1972.0 | 0.454300000000005 | -320.0 | -320.0 | 0.0 | 1927.001064453125 | 514.9306701568819 | 3966.235595703125 | 1034.498046875 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 9262.863000000001 | 6342.0645 | 31713.102000000003 | 1045.8743 | |||
| 46 | 45 | 922.0 | 0.0 | 1981.0 | 45.0 | 9.0 | 1981.0 | 0.4538500000000051 | 63.0 | 63.0 | 0.0 | 1808.1862657335068 | 297.1387353146108 | 2182.508056640625 | 1355.8675537109375 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 10279.511999999999 | 4780.2217 | 17691.68 | 4316.143 | |||
| 47 | 46 | 997.0 | 0.0 | 2056.0 | 46.0 | 75.0 | 2056.0 | 0.4501000000000055 | -315.0 | -315.0 | 0.0 | 2032.1784993489584 | 475.90695176095335 | 3158.3447265625 | 1094.5611572265623 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 10441.543 | 6276.14 | 26625.377 | 1116.9589 | |||
| 48 | 47 | 1072.0 | 0.0 | 2131.0 | 47.0 | 75.0 | 2131.0 | 0.4463500000000059 | -335.0 | -335.0 | 0.0 | 1901.55345703125 | 414.601381621737 | 2863.72021484375 | 1102.75927734375 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 10468.1455 | 5887.8525 | 28733.54 | 1633.4474 | |||
| 49 | 48 | 1147.0 | 0.0 | 2206.0 | 48.0 | 75.0 | 2206.0 | 0.4426000000000063 | -325.0 | -325.0 | 0.0 | 1844.411834309896 | 443.70547118732435 | 3207.015380859375 | 854.2076416015625 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 9129.1 | 4776.86 | 23007.46 | 1170.9935 | |||
| 50 | 49 | 1222.0 | 0.0 | 2281.0 | 49.0 | 75.0 | 2281.0 | 0.4388500000000067 | -355.0 | -355.0 | 0.0 | 1776.5706233723959 | 471.82444062467584 | 3012.540283203125 | 1001.5508422851562 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 9043.123 | 5778.9585 | 33845.637 | 1300.7959 | |||
| 51 | 50 | 1230.0 | 0.0 | 2289.0 | 50.0 | 8.0 | 2289.0 | 0.4384500000000068 | 67.0 | 67.0 | 0.0 | 1590.4605712890625 | 280.995974030903 | 2036.3619384765625 | 1259.98388671875 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 15035.923999999999 | 5842.4980000000005 | 20706.568 | 3507.5747 | |||
| 52 | 51 | 1259.0 | 0.0 | 2318.0 | 51.0 | 29.0 | 2318.0 | 0.4370000000000069 | -28.0 | -28.0 | 0.0 | 1663.7892898033404 | 464.8343258797997 | 2668.75830078125 | 751.3123168945312 | 9.999999999999998e-05 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 12248.117 | 7167.755 | 30616.121 | 2583.2129999999997 | |||
| 53 | 52 | 1334.0 | 0.0 | 2393.0 | 52.0 | 75.0 | 2393.0 | 0.43325000000000735 | -340.0 | -340.0 | 0.0 | 1850.2906884765625 | 415.024752038264 | 3271.372314453125 | 1060.467041015625 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 7113.795999999999 | 4360.2896 | 23007.64 | 1550.2559 | |||
| 54 | 53 | 1409.0 | 0.0 | 2468.0 | 53.0 | 75.0 | 2468.0 | 0.42950000000000776 | -345.0 | -345.0 | 0.0 | 1730.308134765625 | 427.79760138333467 | 2762.183837890625 | 775.44775390625 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 8396.429 | 4558.9259999999995 | 23571.781000000003 | 1970.5563 | |||
| 55 | 54 | 1431.0 | 0.0 | 2490.0 | 54.0 | 22.0 | 2490.0 | 0.4284000000000079 | 0.0 | 0.0 | 0.0 | 1846.6991105513134 | 385.4605561709925 | 2543.722412109375 | 915.1123657226562 | 0.0001 | 1.3552527156068802e-20 | 0.0001 | 0.0001 | 8495.571 | 6709.9890000000005 | 33833.473 | 2038.4215 | |||
| 56 | 55 | 1473.0 | 0.0 | 2532.0 | 55.0 | 42.0 | 2532.0 | 0.4263000000000081 | -90.0 | -90.0 | 0.0 | 1890.0395827520458 | 446.4111479171437 | 2914.133056640625 | 755.6181640625 | 0.00010000000000000002 | 1.3552527156068802e-20 | 0.0001 | 0.0001 | 7235.0454 | 4041.2095 | 21379.494 | 1302.8073 | |||
| 57 | 56 | 1476.0 | 0.0 | 2535.0 | 56.0 | 3.0 | 2535.0 | 0.4261500000000081 | 91.0 | 91.0 | 0.0 | 1912.030314127604 | 342.86427285162813 | 2363.271728515625 | 1532.722412109375 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 7210.1055 | 2696.3638 | 10781.295 | 4266.702 | |||
| 58 | 57 | 1479.0 | 0.0 | 2538.0 | 57.0 | 3.0 | 2538.0 | 0.42600000000000815 | 91.0 | 91.0 | 0.0 | 2022.01904296875 | 359.73376536375997 | 2496.085693359375 | 1625.116455078125 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 4923.2085 | 1971.7198 | 6627.281 | 2159.7270000000003 | |||
| 59 | 58 | 1510.0 | 0.0 | 2569.0 | 58.0 | 31.0 | 2569.0 | 0.4244500000000083 | -31.0 | -31.0 | 0.0 | 1936.5541893743698 | 445.76280005387605 | 2937.03125 | 987.7350463867188 | 9.999999999999996e-05 | 4.0657581468206416e-20 | 0.0001 | 0.0001 | 8962.213 | 4653.1475 | 18630.568 | 2292.3245 | |||
| 60 | 59 | 1585.0 | 0.0 | 2644.0 | 59.0 | 75.0 | 2644.0 | 0.4207000000000087 | -345.0 | -345.0 | 0.0 | 2062.300531412761 | 461.74250925020425 | 3443.134521484375 | 908.7151489257812 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 10726.526000000002 | 6288.1504 | 34759.223 | 1402.5997 | |||
| 61 | 60 | 1594.0 | 0.0 | 2653.0 | 60.0 | 9.0 | 2653.0 | 0.4202500000000088 | 57.0 | 57.0 | 0.0 | 1937.900404188368 | 449.70101558453797 | 2752.651123046875 | 1147.4949951171875 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 9633.898000000001 | 6012.1284 | 24146.093999999997 | 3509.1484 | |||
| 62 | 61 | 1669.0 | 0.0 | 2728.0 | 61.0 | 75.0 | 2728.0 | 0.4165000000000092 | -335.0 | -335.0 | 0.0 | 2081.188806152344 | 489.54920371293326 | 3186.210205078125 | 793.710205078125 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 9517.860999999999 | 6173.943 | 25958.996 | 1470.1646 | |||
| 63 | 62 | 1714.0 | 0.0 | 2773.0 | 62.0 | 45.0 | 2773.0 | 0.41425000000000944 | -107.0 | -107.0 | 0.0 | 1979.9250569661456 | 444.95341455418776 | 3409.033203125 | 1067.50146484375 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 11889.282 | 7202.778 | 28449.816000000003 | 1965.8135 | |||
| 64 | 63 | 1755.0 | 0.0 | 2814.0 | 63.0 | 41.0 | 2814.0 | 0.4122000000000097 | -86.0 | -86.0 | 0.0 | 1949.386736613948 | 438.01420887891226 | 2898.2509765625 | 1162.8082275390625 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 8248.635 | 5983.8467 | 27771.922000000002 | 1338.8822 | |||
| 65 | 64 | 1766.0 | 0.0 | 2825.0 | 64.0 | 11.0 | 2825.0 | 0.4116500000000097 | 47.0 | 47.0 | 0.0 | 2142.1350430575285 | 338.90633193526367 | 2704.8408203125 | 1582.5853271484375 | 0.0001 | 0.0 | 0.0001 | 0.0001 | 6870.5347 | 3548.6636 | 14772.337 | 2794.1462 | |||
| 66 | 65 | 1841.0 | 0.0 | 2900.0 | 65.0 | 75.0 | 2900.0 | 0.4079000000000101 | -345.0 | -345.0 | 0.0 | 2000.6128336588545 | 430.99328281858436 | 2908.90380859375 | 960.3004150390624 | 0.00010000000000000003 | 2.7105054312137605e-20 | 0.0001 | 0.0001 | 10136.796 | 5358.4326 | 28253.752 | 1138.26 |