mirror of
https://github.com/gryf/coach.git
synced 2026-01-05 21:34:18 +01:00
12 KiB
12 KiB
| 1 | Episode # | Training Iter | In Heatup | ER #Transitions | ER #Episodes | Episode Length | Total steps | Epsilon | Shaped Training Reward | Training Reward | Update Target Network | Evaluation Reward | Shaped Evaluation Reward | Success Rate | Loss/Mean | Loss/Stdev | Loss/Max | Loss/Min | Learning Rate/Mean | Learning Rate/Stdev | Learning Rate/Max | Learning Rate/Min | Grads (unclipped)/Mean | Grads (unclipped)/Stdev | Grads (unclipped)/Max | Grads (unclipped)/Min | Discounted Return/Mean | Discounted Return/Stdev | Discounted Return/Max | Discounted Return/Min | Entropy/Mean | Entropy/Stdev | Entropy/Max | Entropy/Min | Advantages/Mean | Advantages/Stdev | Advantages/Max | Advantages/Min | Values/Mean | Values/Stdev | Values/Max | Values/Min | Value Loss/Mean | Value Loss/Stdev | Value Loss/Max | Value Loss/Min | Policy Loss/Mean | Policy Loss/Stdev | Policy Loss/Max | Policy Loss/Min |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 1 | 0.0 | 1.0 | 172.0 | 1.0 | 172.0 | 172.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 3 | 2 | 0.0 | 1.0 | 79.0 | 1.0 | 79.0 | 251.0 | 0.0 | 0.0 | 0.6655258513307333 | 0.7653968685057024 | 1.8953382542587165 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 4 | 3 | 0.0 | 1.0 | 96.0 | 1.0 | 96.0 | 347.0 | 0.0 | 0.0 | 0.31623623119836064 | 0.4117963273741081 | 1.0 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 5 | 4 | 0.0 | 1.0 | 371.0 | 1.0 | 371.0 | 718.0 | 0.0 | 0.0 | 1.3355309280324184 | 1.0180238538386663 | 3.6710632975826947 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 6 | 5 | 0.0 | 1.0 | 344.0 | 1.0 | 344.0 | 1062.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 7 | 6 | 12.0 | 0.0 | 254.0 | 1.0 | 254.0 | 1316.0 | 0.0 | 6.0 | 80.0 | 0.0 | 0.19509883 | 0.22113559 | 0.68123406 | 0.00047456394999999995 | 1.7433348660779522 | 1.0187142388712978 | 3.719695753907597 | 0.0 | 1.7915602 | 5.9631707999999995e-05 | 1.7916646 | 1.791353 | 0.2262918949804468 | 0.4052190032356826 | 1.0116755962371826 | -0.008910976350307466 | 0.0027322858000000004 | 0.015280201 | 0.03439149 | -0.017219357 | 0.10770521 | 0.12396591 | 0.38448063 | 1.8039241000000002e-06 | 0.40517464 | 0.47274828 | 1.4911206 | -0.0077848933 | |||||||||||
| 8 | 7 | 29.0 | 0.0 | 334.0 | 1.0 | 334.0 | 1650.0 | 0.0 | 1.0 | 30.0 | 0.0 | 0.04769252 | 0.15901159 | 0.6634372 | 0.0024216557000000002 | 0.27632160409284623 | 0.2705646117859804 | 1.0 | 0.0 | 1.7914505 | 8.707981e-05 | 1.7916372 | 1.7912288 | 0.0370550392428413 | 0.19677852680040736 | 0.9944062232971193 | -0.025336399674415592 | 0.068387836 | 0.015558312 | 0.09796308 | 0.043330245 | 0.020047436000000002 | 0.077496596 | 0.32019043 | 5.2523033e-06 | 0.06660683 | 0.30359715 | 1.2421792 | -0.023875023999999998 | |||||||||||
| 9 | 8 | 36.0 | 0.0 | 128.0 | 1.0 | 128.0 | 1778.0 | 0.0 | 1.0 | 10.0 | 0.0 | 0.09955869 | 0.20010683 | 0.54699177 | 0.0065239915 | 0.4682151148816086 | 0.332164510934488 | 1.0 | 0.0 | 1.7912488000000002 | 9.2632894e-05 | 1.7914296000000003 | 1.7911137 | 0.07758730097363392 | 0.2730298587990429 | 0.9900790452957152 | -0.029358670115470886 | 0.10313641 | 0.002745719 | 0.11594209 | 0.096130215 | 0.04028255 | 0.08992219 | 0.24135466 | 2.5576886e-05 | 0.13940988 | 0.35006684 | 0.92214614 | -0.022096004 | |||||||||||
| 10 | 9 | 50.0 | 0.0 | 266.0 | 1.0 | 266.0 | 2044.0 | 0.0 | 5.0 | 75.0 | 0.0 | 0.30262554 | 0.4104986 | 1.2076516000000002 | 0.013035316000000002 | 1.4932915031001632 | 0.8839031098458202 | 3.43323955603109 | 0.0 | 1.7913542000000002 | 0.00010127693499999999 | 1.791509 | 1.7908573 | 0.21927762378293733 | 0.4035228875160485 | 1.0002621412277222 | -0.04568234086036682 | 0.16175748 | 0.03333184 | 0.22182891 | 0.11903856 | 0.1054567 | 0.15073928 | 0.40956032 | 8.165229e-05 | 0.39360209999999995 | 0.60812014 | 1.6208212 | -0.041010122999999996 | |||||||||||
| 11 | 10 | 57.0 | 0.0 | 138.0 | 1.0 | 138.0 | 2182.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.044218402000000004 | 0.021266992999999998 | 0.07302858 | 0.0056792577 | 0.0 | 0.0 | 0.0 | 0.0 | 1.7911481 | 0.00010475656 | 1.7912874 | 1.7907011999999998 | -0.02400694030026595 | 0.02247906301502126 | 0.02803117036819458 | -0.10323163866996764 | 0.29870743 | 0.029791757000000002 | 0.37329957 | 0.2534129 | 0.0005408207 | 0.00035989028 | 0.001230922 | 8.2141574e-05 | -0.04310067 | 0.023800402999999998 | 0.005341789699999999 | -0.070361935 | |||||||||||
| 12 | 11 | 69.0 | 0.0 | 239.0 | 1.0 | 239.0 | 2421.0 | 0.0 | 2.0 | 35.0 | 0.0 | 0.2583665 | 0.4150833 | 1.228677 | 0.053808387 | 0.6221455698949666 | 0.3185701723427279 | 1.293422721525216 | 0.0 | 1.7907401 | 0.00031908086 | 1.7912133000000001 | 1.7899948 | 0.07805510989644311 | 0.3018230800532408 | 0.9786887168884276 | -0.08048233389854431 | 0.33094752 | 0.013372423 | 0.37411574 | 0.30098158 | 0.04859488 | 0.10169968 | 0.28043127 | 0.0005444438 | 0.13855815 | 0.42433950000000004 | 1.108467 | -0.072092846 | |||||||||||
| 13 | 12 | 80.0 | 0.0 | 221.0 | 1.0 | 221.0 | 2642.0 | 0.0 | 6.0 | 80.0 | 0.0 | 0.48391336 | 0.40221074 | 1.09942 | 0.05414404 | 1.6712583569698125 | 0.9098789672579484 | 3.118180163315916 | 0.0 | 1.7884991000000001 | 0.0013924551000000002 | 1.7902508000000001 | 1.785885 | 0.15834423065185546 | 0.38744492697489613 | 0.9535312056541444 | -0.1274641752243042 | 0.49976876 | 0.076539606 | 0.6220838000000001 | 0.40243104 | 0.08759322 | 0.08715160000000001 | 0.21323131 | 0.0010414098 | 0.28146607 | 0.3843692 | 0.8391149999999999 | -0.1258507 | |||||||||||
| 14 | 13 | 83.0 | 0.0 | 60.0 | 1.0 | 60.0 | 2702.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.19376102 | 0.025060445 | 0.21882147 | 0.16870058 | 0.0 | 0.0 | 0.0 | 0.0 | 1.7862084999999999 | 0.00020189301 | 1.7865493000000001 | 1.7855456000000003 | -0.07056967169046402 | 0.04169400167193667 | -0.005379676818847656 | -0.154371976852417 | 0.6437744000000001 | 0.015510267 | 0.7031798 | 0.6309234 | 0.0033592340000000004 | 0.0007790946400000001 | 0.0041383285999999995 | 0.0025801393 | -0.12886816 | 0.013793725500000001 | -0.11507443 | -0.14266188 | |||||||||||
| 15 | 14 | 95.0 | 0.0 | 236.0 | 1.0 | 236.0 | 2938.0 | 0.0 | 3.0 | 65.0 | 0.0 | 0.28904006 | 0.41236135 | 1.551084 | 0.020245053 | 1.0239121744153088 | 0.6185542465114561 | 2.431606479465901 | 0.0 | 1.7871317 | 0.0005855132499999999 | 1.7882346999999998 | 1.7852147 | 0.031784444505518136 | 0.2962424032667875 | 1.828610181808472 | -0.17417967319488525 | 0.49963024 | 0.052589532 | 0.6409774 | 0.4295168 | 0.0443849 | 0.11141221 | 0.38939828 | 0.00024282213 | 0.054969538 | 0.3765643 | 1.2040217 | -0.13643822 | |||||||||||
| 16 | 15 | 104.0 | 0.0 | 181.0 | 1.0 | 181.0 | 3119.0 | 0.0 | 1.0 | 15.0 | 0.0 | 0.17768285 | 0.13748805 | 0.5389735999999999 | 0.09483471 | 0.3967620466627271 | 0.3132963268665544 | 1.0 | 0.0 | 1.7848563999999998 | 0.000734798 | 1.785902 | 1.7817947 | -0.0141413239762187 | 0.18461536769689052 | 0.9462706446647644 | -0.12360873818397522 | 0.5192491 | 0.018901557 | 0.5768884 | 0.48201087 | 0.017141404 | 0.04088881 | 0.12531848 | 0.0010934995 | -0.023188977000000003 | 0.176302 | 0.44238847 | -0.10848155 | |||||||||||
| 17 | 16 | 108.0 | 0.0 | 81.0 | 1.0 | 81.0 | 3200.0 | 0.0 | 2.0 | 15.0 | 0.0 | 0.9549913000000001 | 0.6688843000000001 | 1.7542866000000001 | 0.11721748 | 0.5378888730513616 | 0.6003268067889761 | 1.7471720943315965 | 0.0 | 1.7850477999999999 | 0.0009660981 | 1.7860456999999998 | 1.7824031999999999 | 0.4184389670689901 | 0.4525963959264465 | 0.993053138256073 | -0.102097749710083 | 0.48676348 | 0.024071414 | 0.5483365 | 0.45547286 | 0.18996733 | 0.14617560000000002 | 0.3583228 | 0.0018988681 | 0.7654829000000001 | 0.6699951 | 1.5368868999999998 | -0.0967084 | |||||||||||
| 18 | 17 | 113.0 | 0.0 | 84.0 | 1.0 | 84.0 | 3284.0 | 0.0 | 1.0 | 15.0 | 0.0 | 0.08543899 | 0.020702211 | 0.111974046 | 0.055297795999999996 | 0.2265144425937397 | 0.3933013228697155 | 1.0 | 0.0 | 1.7873621 | 0.0006459787 | 1.7881534 | 1.7860596999999998 | -0.035667921975255014 | 0.10791921481185313 | 0.8904736042022705 | -0.1039191484451294 | 0.42321816 | 0.024867327999999998 | 0.46856302 | 0.39477540000000005 | 0.006459379 | 0.0090453075 | 0.022123277 | 0.0010923959 | -0.0633661 | 0.023147937 | -0.023805222999999997 | -0.08250186 | |||||||||||
| 19 | 18 | 129.0 | 0.0 | 309.0 | 1.0 | 309.0 | 3593.0 | 0.0 | 3.0 | 45.0 | 0.0 | 0.28026912 | 0.40053105 | 1.2491518 | 0.008425997 | 0.8662809768433286 | 0.4997214922619827 | 1.8429431933839264 | 0.0 | 1.7877631999999999 | 0.0007633192599999999 | 1.7885981 | 1.7846953999999997 | 0.07579533636569978 | 0.30580757261711344 | 0.9922432899475098 | -0.13300999999046326 | 0.4081396 | 0.045195244 | 0.49497452 | 0.32608187 | 0.0496316 | 0.09908927 | 0.30438307 | 0.000105443636 | 0.13531558 | 0.42330202 | 1.2120090000000001 | -0.114020035 | |||||||||||
| 20 | 19 | 134.0 | 0.0 | 96.0 | 1.0 | 96.0 | 3689.0 | 0.0 | 1.0 | 15.0 | 0.0 | 0.11922532 | 0.08307043 | 0.26265112 | 0.06485479 | 0.4886400594217567 | 0.3703259810860411 | 1.0 | 0.0 | 1.7871433 | 0.00057778653 | 1.7879406999999998 | 1.7862363999999997 | -0.001410536840558052 | 0.1778469306102961 | 0.9087549448013306 | -0.08837711811065674 | 0.41927390000000003 | 0.032013103 | 0.46018165 | 0.37253463 | 0.015815761 | 0.026164377000000003 | 0.06113352 | 0.0005858624 | -0.004888147 | 0.09434917599999999 | 0.15841892 | -0.06494608 | |||||||||||
| 21 | 20 | 141.0 | 0.0 | 126.0 | 1.0 | 126.0 | 3815.0 | 0.0 | 1.0 | 20.0 | 0.0 | 0.17892276 | 0.18974670000000002 | 0.5871076999999999 | 0.04061436 | 0.4626024762434755 | 0.3397468290721503 | 1.0 | 0.0 | 1.7869374 | 0.00034472987 | 1.787608 | 1.7855246999999999 | 0.010839956998825073 | 0.2223429244291402 | 0.938248872756958 | -0.12247949838638306 | 0.38885185 | 0.02215005 | 0.44878253 | 0.36568108 | 0.024776941 | 0.052067712 | 0.14116788 | 0.00035636208 | 0.02077537 | 0.22919169 | 0.5269510000000001 | -0.15487865 | |||||||||||
| 22 | 21 | 152.0 | 0.0 | 203.0 | 1.0 | 203.0 | 4018.0 | 0.0 | 3.0 | 35.0 | 0.0 | 0.16685398 | 0.15809304 | 0.565851 | 0.07342667 | 0.8076575260116894 | 0.7265305853352912 | 2.160057442743484 | 0.0 | 1.7862483 | 0.0014891494 | 1.7879581000000002 | 1.7839129 | 0.012410407960414888 | 0.21971669345542869 | 0.948024034500122 | -0.09016576409339903 | 0.43260628 | 0.026799481 | 0.4922334 | 0.3847252 | 0.02421472 | 0.042090252 | 0.12565623 | 0.00092638604 | 0.020757709 | 0.17696977 | 0.45546275 | -0.09430063 | |||||||||||
| 23 | 22 | 157.0 | 0.0 | 97.0 | 1.0 | 97.0 | 4115.0 | 0.0 | 3.0 | 45.0 | 0.0 | 0.6433711999999999 | 0.74553686 | 1.9088638 | 0.08321298 | 1.0345263904078872 | 0.8827487033376469 | 2.5157175752154317 | 0.0 | 1.7857674 | 0.0010410689 | 1.7868642 | 1.7825214 | 0.25182808451354505 | 0.4908840090309371 | 1.735175848007202 | -0.09291231632232666 | 0.38321668 | 0.042277128 | 0.46946734 | 0.33924907 | 0.15219225 | 0.20525712 | 0.50007224 | 0.0013484001 | 0.44017676 | 0.68656087 | 1.5864606 | -0.10410466 | |||||||||||
| 24 | 23 | 162.0 | 0.0 | 91.0 | 1.0 | 91.0 | 4206.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.075180575 | 0.006743745 | 0.085042305 | 0.06789072 | 0.0 | 0.0 | 0.0 | 0.0 | 1.7854391 | 0.00031607927000000004 | 1.7862240000000003 | 1.7842703000000002 | -0.03848295994102955 | 0.01893502871781908 | -0.003447979688644409 | -0.07869347929954529 | 0.33710825 | 0.0073817223 | 0.36435217 | 0.3281642 | 0.0009197367999999999 | 0.00021758883999999998 | 0.0012860488 | 0.0007166114500000001 | -0.06852996 | 0.007950632 | -0.06106282 | -0.080443725 | |||||||||||
| 25 | 24 | 169.0 | 0.0 | 137.0 | 1.0 | 137.0 | 4343.0 | 0.0 | 2.0 | 15.0 | 0.0 | 0.5252931 | 0.6227796 | 1.638133 | 0.08790696 | 0.5940129172438323 | 0.5756163697390285 | 1.6361854860638707 | 0.0 | 1.7834058000000002 | 0.0009344258599999999 | 1.7848165 | 1.7812016 | 0.18035456563035648 | 0.3982012769084963 | 0.9823999404907228 | -0.08917045593261719 | 0.41844782 | 0.014422988999999999 | 0.46660876 | 0.39491826 | 0.09554601 | 0.13599983 | 0.33183685 | 0.0010732922 | 0.31740478 | 0.5796393 | 1.311009 | -0.09464724 | |||||||||||
| 26 | 25 | 176.0 | 0.0 | 130.0 | 1.0 | 130.0 | 4473.0 | 0.0 | 2.0 | 30.0 | 0.0 | 0.34749827 | 0.49382079999999995 | 1.4496006000000001 | 0.09435476 | 0.7449354244527606 | 0.6153664699948187 | 1.7397003733882803 | 0.0 | 1.7757193 | 0.0032942689000000002 | 1.7810607 | 1.7697625 | 0.06231525068481762 | 0.3068518768533089 | 0.9816009998321532 | -0.1330496072769165 | 0.489879 | 0.026906582000000002 | 0.5650137 | 0.44547275 | 0.049020633 | 0.08931285 | 0.24614899 | 0.0010592983999999999 | 0.09891536 | 0.3640319 | 0.9037651 | -0.11826469 | |||||||||||
| 27 | 26 | 180.0 | 0.0 | 79.0 | 1.0 | 79.0 | 4552.0 | 0.0 | 1.0 | 10.0 | 0.0 | 0.5800049 | 0.621704 | 1.4584333 | 0.108442254 | 0.16614454079876162 | 0.35835325356793346 | 1.0 | 0.0 | 1.7717383999999998 | 0.0010083972 | 1.773361 | 1.768905 | 0.15509415070215862 | 0.3853514544991082 | 0.9301938414573668 | -0.1339915692806244 | 0.4517303 | 0.0311643 | 0.51715523 | 0.4147598 | 0.08627499 | 0.118677594 | 0.25410578 | 0.0012751152000000001 | 0.26702836 | 0.5228872 | 1.0059426 | -0.12734489 | |||||||||||
| 28 | 27 | 192.0 | 0.0 | 228.0 | 1.0 | 228.0 | 4780.0 | 0.0 | 6.0 | 45.0 | 0.0 | 0.71833307 | 0.8871537 | 2.6851700000000003 | 0.119784765 | 1.9557469594274288 | 1.2113299633522974 | 3.7691313416270273 | 0.0 | 1.7596832999999998 | 0.0061596609999999994 | 1.7667857 | 1.7383785 | 0.2066974406892603 | 0.5095305429054708 | 1.811464548110962 | -0.14315438270568848 | 0.5574998000000001 | 0.027793197000000002 | 0.64380324 | 0.51100904 | 0.15117261 | 0.24757883 | 0.6801178000000001 | 0.0013509541 | 0.3654783 | 0.7136764 | 1.7989216000000001 | -0.121857285 | |||||||||||
| 29 | 28 | 195.0 | 0.0 | 60.0 | 1.0 | 60.0 | 4840.0 | 0.0 | 2.0 | 15.0 | 0.0 | 0.49510857 | 0.43411818 | 0.92922676 | 0.060990404000000005 | 0.4458790622513688 | 0.6575192889449866 | 1.877521022998968 | 0.0 | 1.7597702000000002 | 0.0021079525 | 1.7620791 | 1.7530606 | 0.1326778046786785 | 0.3788317711032021 | 0.8848448395729065 | -0.13622477650642395 | 0.6043301 | 0.0271843 | 0.6559411999999999 | 0.561541 | 0.08055846400000001 | 0.059245005 | 0.13980347 | 0.021313457 | 0.21867141 | 0.27701040000000005 | 0.49568182 | -0.05833899 | |||||||||||
| 30 | 29 | 226.0 | 0.0 | 616.0 | 1.0 | 616.0 | 5456.0 | 0.0 | 15.0 | 240.0 | 0.0 | 1.1688551999999999 | 1.0896888 | 3.6118822 | 0.098014034 | 2.0852043638273967 | 1.3167636930818822 | 4.3404004764447 | 0.0 | 1.742934 | 0.014055208000000001 | 1.7623421000000001 | 1.7109525 | 0.1393659818172455 | 0.4412685325283971 | 1.6910160779953003 | -0.5255360603332521 | 1.0301913 | 0.383238 | 1.7467842 | 0.5466168 | 0.107070394 | 0.14446682 | 0.5526603 | 0.0011366851 | 0.25609398 | 0.60589725 | 1.4118645 | -0.44296303 | |||||||||||
| 31 | 30 | 236.0 | 0.0 | 193.0 | 1.0 | 193.0 | 5649.0 | 0.0 | 5.0 | 55.0 | 0.0 | 1.9328797999999998 | 1.0595886 | 4.5198774 | 0.44015956 | 1.4536560767783049 | 1.173902840773651 | 3.234511537329536 | 0.0 | 1.6939487000000002 | 0.016129734 | 1.7192296999999999 | 1.6532421000000002 | 0.08677296373579238 | 0.4301078412251611 | 0.9538357257843018 | -0.5215082168579102 | 2.209638 | 0.12871107 | 2.505245 | 1.9755584 | 0.096261166 | 0.07482098 | 0.26794806 | 0.025336777999999997 | 0.18479401 | 0.5860191 | 1.2836683999999998 | -0.5055494 |