mirror of
https://github.com/gryf/coach.git
synced 2026-01-07 14:24:16 +01:00
12 KiB
12 KiB
| 1 | Episode # | Training Iter | In Heatup | ER #Transitions | ER #Episodes | Episode Length | Total steps | Epsilon | Shaped Training Reward | Training Reward | Update Target Network | Evaluation Reward | Shaped Evaluation Reward | Success Rate | Loss/Mean | Loss/Stdev | Loss/Max | Loss/Min | Learning Rate/Mean | Learning Rate/Stdev | Learning Rate/Max | Learning Rate/Min | Grads (unclipped)/Mean | Grads (unclipped)/Stdev | Grads (unclipped)/Max | Grads (unclipped)/Min | Discounted Return/Mean | Discounted Return/Stdev | Discounted Return/Max | Discounted Return/Min | Entropy/Mean | Entropy/Stdev | Entropy/Max | Entropy/Min | Advantages/Mean | Advantages/Stdev | Advantages/Max | Advantages/Min | Values/Mean | Values/Stdev | Values/Max | Values/Min | Value Loss/Mean | Value Loss/Stdev | Value Loss/Max | Value Loss/Min | Policy Loss/Mean | Policy Loss/Stdev | Policy Loss/Max | Policy Loss/Min |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 1 | 0.0 | 1.0 | 248.0 | 1.0 | 248.0 | 248.0 | 0.0 | 0.0 | 0.8700310430476327 | 0.7405333778534565 | 2.2328769490220686 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 3 | 2 | 0.0 | 1.0 | 123.0 | 1.0 | 123.0 | 371.0 | 0.0 | 0.0 | 0.3899670547558481 | 0.3819119128698883 | 1.0 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 4 | 3 | 0.0 | 1.0 | 88.0 | 1.0 | 88.0 | 459.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 5 | 4 | 0.0 | 1.0 | 187.0 | 1.0 | 187.0 | 646.0 | 0.0 | 0.0 | 0.7890979761079344 | 0.4557561638352592 | 1.6825545950103868 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 6 | 5 | 0.0 | 1.0 | 86.0 | 1.0 | 86.0 | 732.0 | 0.0 | 0.0 | 0.6919135855443926 | 0.7222189379050715 | 1.8429431933839264 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 7 | 6 | 0.0 | 1.0 | 331.0 | 1.0 | 331.0 | 1063.0 | 0.0 | 0.0 | 1.274934530443537 | 0.6459615236299282 | 2.6500575414623486 | 0.0 | |||||||||||||||||||||||||||||||||||||
| 8 | 7 | 19.0 | 0.0 | 393.0 | 1.0 | 393.0 | 1456.0 | 0.0 | 6.0 | 75.0 | 0.0 | 0.11421088 | 0.21380013 | 0.59680337 | 0.0007558507000000001 | 1.2875349957019866 | 0.971210061310369 | 3.2939006486552924 | 0.0 | 1.7916838 | 2.6964899999999997e-05 | 1.7917563000000003 | 1.7916098000000003 | 0.14341006539700749 | 0.3535079829863394 | 1.8814263343811035 | -0.012832198292016985 | 0.026738504 | 0.01983405 | 0.06478101 | 0.0035744433 | 0.073494285 | 0.14081275 | 0.44342685 | 1.1059151000000002e-06 | 0.2566254 | 0.4923233 | 1.3469505 | -0.0116830645 | |||||||||||
| 9 | 8 | 28.0 | 0.0 | 176.0 | 1.0 | 176.0 | 1632.0 | 0.0 | 1.0 | 15.0 | 0.0 | 0.041054297000000003 | 0.09770801 | 0.29955843 | 0.0034954806 | 0.3311813182197609 | 0.3551902602002647 | 1.0 | 0.0 | 1.7914554 | 9.376556e-05 | 1.7917509999999999 | 1.7913146 | 0.033927604090422385 | 0.19766873338150195 | 0.9898095726966858 | -0.020439743995666504 | 0.09144559 | 0.012948282 | 0.109424695 | 0.06995269 | 0.021816997 | 0.057340953 | 0.17352688 | 8.623848e-05 | 0.060463965 | 0.20118664 | 0.5926347 | -0.02375073 | |||||||||||
| 10 | 9 | 40.0 | 0.0 | 230.0 | 1.0 | 230.0 | 1862.0 | 0.0 | 4.0 | 95.0 | 0.0 | 0.13237761 | 0.22048 | 0.6586441 | 0.0030599121999999998 | 1.072044354250264 | 0.6383021624195904 | 2.3444995076996524 | 0.0 | 1.7912047999999998 | 0.00016116806 | 1.7917396 | 1.7908642 | 0.1242723337289962 | 0.3330413540052279 | 0.9949659705162048 | -0.030232593417167664 | 0.13943788 | 0.016380336000000002 | 0.16490205 | 0.11253527599999999 | 0.06914418 | 0.11354548 | 0.33480042 | 0.00016573191 | 0.22288923 | 0.42013836 | 1.2402188 | -0.02921468 | |||||||||||
| 11 | 10 | 52.0 | 0.0 | 225.0 | 1.0 | 225.0 | 2087.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.012380877 | 0.004703414600000001 | 0.021775742999999997 | 0.0075669996 | 0.0 | 0.0 | 0.0 | 0.0 | 1.790831 | 0.00020312105 | 1.7917224999999999 | 1.7905108 | -0.022579368271610955 | 0.013048922208883124 | -0.001516878604888916 | -0.05166858434677124 | 0.23496416 | 0.033002004 | 0.29147413 | 0.19034456 | 0.000939706 | 0.00029336357999999995 | 0.0014079054999999998 | 0.0005678356 | -0.040449947 | 0.008927133 | -0.027699834 | -0.061478532999999995 | |||||||||||
| 12 | 11 | 55.0 | 0.0 | 61.0 | 1.0 | 61.0 | 2148.0 | 0.0 | 2.0 | 15.0 | 0.0 | 0.34558254 | 0.10964347 | 0.45522603 | 0.23593909 | 0.4908753215949722 | 0.6427284120931623 | 1.8429431933839264 | 0.0 | 1.7907859 | 0.00025409996 | 1.7917189999999998 | 1.7906520000000001 | 0.2867459513247013 | 0.44463848004967577 | 0.963326096534729 | -0.039502725005149834 | 0.26667840000000004 | 0.0025177263 | 0.27123266 | 0.2611343 | 0.17366691 | 0.032627106 | 0.20629402 | 0.1410398 | 0.5133227 | 0.121826604 | 0.6351493 | 0.39149609999999996 | |||||||||||
| 13 | 12 | 63.0 | 0.0 | 154.0 | 1.0 | 154.0 | 2302.0 | 0.0 | 2.0 | 15.0 | 0.0 | 0.17542875 | 0.39401492 | 1.14055 | 0.011324848 | 0.6548848943536648 | 0.6938572721285777 | 1.886384871716129 | 0.0 | 1.790846 | 0.00020264326 | 1.7917128 | 1.7904818 | 0.10235221503036362 | 0.3938365495483697 | 1.8367838859558103 | -0.06459653377532959 | 0.30300424 | 0.023851900000000002 | 0.34879282 | 0.2756737 | 0.09375900000000001 | 0.22594778 | 0.6472154 | 0.0012484822999999999 | 0.18546264 | 0.5920849 | 1.635689 | -0.06841414400000001 | |||||||||||
| 14 | 13 | 77.0 | 0.0 | 274.0 | 1.0 | 274.0 | 2576.0 | 0.0 | 2.0 | 25.0 | 0.0 | 0.15237926 | 0.36345005 | 1.3838784 | 0.017470764 | 0.5236986524949341 | 0.3926652750926971 | 1.3277227574378037 | 0.0 | 1.7904897000000002 | 0.00025717015 | 1.7916842 | 1.7899307 | 0.032115961382022266 | 0.2538612215988974 | 0.9805907011032104 | -0.10343283414840697 | 0.4437464 | 0.058837507000000004 | 0.56583196 | 0.36453107 | 0.043060284000000004 | 0.10292225 | 0.37266509999999997 | 0.0020458244 | 0.057298996 | 0.36375105 | 1.250245 | -0.101191714 | |||||||||||
| 15 | 14 | 83.0 | 0.0 | 103.0 | 1.0 | 103.0 | 2679.0 | 0.0 | 2.0 | 15.0 | 0.0 | 0.07037316 | 0.047356587 | 0.13836677 | 0.025409157999999998 | 0.7845364604064764 | 0.6820618892781382 | 1.8179069375972308 | 0.0 | 1.7897875 | 0.0005548012999999999 | 1.7916629000000002 | 1.7889906999999998 | -0.019784212410449985 | 0.1886624736866924 | 0.9033542275428772 | -0.11133238673210144 | 0.58218044 | 0.021696111 | 0.6264901999999999 | 0.5519036 | 0.03655105 | 0.038182367 | 0.08599932 | 0.004840155 | -0.03507611 | 0.08904675 | 0.079407215 | -0.1215153 | |||||||||||
| 16 | 15 | 88.0 | 0.0 | 92.0 | 1.0 | 92.0 | 2771.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.033596437 | 0.0029709726 | 0.03848647 | 0.030678531000000002 | 0.0 | 0.0 | 0.0 | 0.0 | 1.7880373 | 0.0009811816 | 1.7916303 | 1.7869519 | -0.054566520079970364 | 0.030518596589793445 | -0.0007356405258178711 | -0.11018291115760803 | 0.5583828000000001 | 0.004107872 | 0.5690894000000001 | 0.5528046 | 0.0047522154999999995 | 0.0002095685 | 0.004927455 | 0.004409475 | -0.096669495 | 0.00178767 | -0.09435672 | -0.09915057599999999 | |||||||||||
| 17 | 16 | 100.0 | 0.0 | 232.0 | 1.0 | 232.0 | 3003.0 | 0.0 | 2.0 | 10.0 | 0.0 | 0.16482343 | 0.35503832 | 1.2752326999999999 | 0.022478975 | 0.45029177267820303 | 0.4197177348117216 | 1.3310330883210135 | 0.0 | 1.7837206 | 0.0025686915 | 1.7915583 | 1.7788869999999999 | 0.005148372189565139 | 0.24196540373601536 | 0.9504172801971436 | -0.13010776042938232 | 0.6456753000000001 | 0.048038907 | 0.7289646 | 0.57959425 | 0.045316155999999996 | 0.092702776 | 0.31885064 | 0.0053946506 | 0.008588249000000001 | 0.3154728 | 0.9805802 | -0.13657857 | |||||||||||
| 18 | 17 | 114.0 | 0.0 | 263.0 | 1.0 | 263.0 | 3266.0 | 0.0 | 1.0 | 10.0 | 0.0 | 0.15859403 | 0.41664425 | 1.6014137 | 0.026942853 | 0.2030871577301164 | 0.3291722654404221 | 1.0 | 0.0 | 1.7763311999999998 | 0.004708352 | 1.7913265999999999 | 1.7676043999999997 | -0.008302561136392446 | 0.22270432322791744 | 0.968006670475006 | -0.14317667484283447 | 0.64081454 | 0.05134289 | 0.7383968000000001 | 0.57058036 | 0.033662584 | 0.09574595 | 0.36531943 | 0.0047015846 | -0.015162735 | 0.35005128 | 1.1956688999999998 | -0.14132895 | |||||||||||
| 19 | 18 | 119.0 | 0.0 | 90.0 | 1.0 | 90.0 | 3356.0 | 0.0 | 2.0 | 35.0 | 0.0 | 0.99584854 | 0.9705681999999999 | 2.135586 | 0.0327313 | 0.8124229268664929 | 0.6596524455289211 | 1.7856781408072189 | 0.0 | 1.7658342 | 0.0064437827 | 1.7909501 | 1.7576503 | 0.2908387087285519 | 0.4467877105109933 | 0.9755487442016602 | -0.1534261703491211 | 0.77051353 | 0.039883487 | 0.84487814 | 0.73211545 | 0.19243668 | 0.18527117 | 0.40972564 | 0.0074991053 | 0.5147201 | 0.6675354 | 1.3587703000000002 | -0.15439077 | |||||||||||
| 20 | 19 | 130.0 | 0.0 | 209.0 | 1.0 | 209.0 | 3565.0 | 0.0 | 4.0 | 50.0 | 0.0 | 0.5660963999999999 | 0.8534441999999999 | 2.868005 | 0.06250619 | 1.5178406757951433 | 0.8569879018324037 | 3.279881172665581 | 0.0 | 1.7593337 | 0.0056817230000000005 | 1.7906148000000002 | 1.7489371999999999 | 0.044801537096500386 | 0.34034919682818704 | 0.9900107383728028 | -0.2266418933868408 | 1.1287438 | 0.11789183 | 1.3896817 | 1.013916 | 0.12611601 | 0.14952904 | 0.4575872 | 0.015016868000000001 | 0.07396114599999999 | 0.43413877 | 1.215942 | -0.20843013 | |||||||||||
| 21 | 20 | 156.0 | 0.0 | 518.0 | 1.0 | 518.0 | 4083.0 | 0.0 | 7.0 | 130.0 | 0.0 | 0.9353090000000001 | 1.2858386 | 3.8660667 | 0.11725034 | 1.098791739364709 | 0.6320419503440284 | 2.523303015133401 | 0.0 | 1.6699091 | 0.055741128 | 1.7903702000000001 | 1.5692837 | -0.06757649946212768 | 0.3195450124164553 | 0.9396663904190063 | -0.5494513511657715 | 2.2210557 | 0.6047439 | 3.5003364 | 1.4445081 | 0.1674737 | 0.17189884 | 0.50756395 | 0.036066726 | -0.12177686 | 0.42073590000000005 | 1.1168726999999998 | -0.529899 | |||||||||||
| 22 | 21 | 162.0 | 0.0 | 103.0 | 1.0 | 103.0 | 4186.0 | 0.0 | 1.0 | 30.0 | 0.0 | 1.1245039 | 1.3816309 | 3.88741 | 0.40766072 | 0.28791485922371896 | 0.4044270844696768 | 1.0 | 0.0 | 1.5755019 | 0.038972553 | 1.7804282 | 1.5525216 | -0.20262039422988887 | 0.3420573312956313 | 0.7819786071777344 | -0.6609947681427002 | 3.3616974 | 0.16612557 | 3.6837413 | 3.15605 | 0.18570164 | 0.14099212 | 0.46655792 | 0.10048528 | -0.34885046 | 0.40083793 | 0.44589615 | -0.62824064 | |||||||||||
| 23 | 22 | 172.0 | 0.0 | 191.0 | 1.0 | 191.0 | 4377.0 | 0.0 | 4.0 | 35.0 | 0.0 | 1.0493082 | 0.8931684000000001 | 2.8788257 | 0.40921542 | 1.360820215871854 | 0.784373317174275 | 2.6276416239131137 | 0.0 | 1.5121492 | 0.036270477 | 1.7781756000000002 | 1.4913622 | -0.1084176672829522 | 0.38656666708586895 | 1.439842700958252 | -0.6016488075256348 | 2.8675182 | 0.25318608 | 3.2926830999999996 | 2.5298715 | 0.19097143 | 0.17252174 | 0.58011985 | 0.058588177000000005 | -0.16885796 | 0.43851078 | 0.66275233 | -0.52809024 | |||||||||||
| 24 | 23 | 177.0 | 0.0 | 84.0 | 1.0 | 84.0 | 4461.0 | 0.0 | 2.0 | 45.0 | 0.0 | 1.2559823 | 1.2462946000000001 | 3.4129782 | 0.46524242 | 0.7590341126385189 | 0.5714559904623038 | 1.6825545950103868 | 0.0 | 1.5744928 | 0.046586752 | 1.7830153000000002 | 1.5274831 | -0.0040334612131118774 | 0.41865952406709256 | 0.9548516273498536 | -0.4455758333206177 | 2.2548747000000002 | 0.117815435 | 2.422201 | 2.1072755 | 0.15494695 | 0.14008166 | 0.39015853 | 0.04275903 | 0.043876007 | 0.66575617 | 1.1958548 | -0.36775714 | |||||||||||
| 25 | 24 | 182.0 | 0.0 | 94.0 | 1.0 | 94.0 | 4555.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.43677402 | 0.022415543 | 0.47187870000000004 | 0.41241384 | 0.0 | 0.0 | 0.0 | 0.0 | 1.6601015 | 0.02886555 | 1.7863803 | 1.623586 | -0.19612670242786406 | 0.10077536524472708 | -0.017804980278015137 | -0.3609187602996826 | 1.8921119999999998 | 0.09945338 | 2.0795848 | 1.7547298999999998 | 0.035672493 | 0.0038337493 | 0.040968943 | 0.030137222 | -0.32919282 | 0.030663265 | -0.28128055 | -0.35991377 | |||||||||||
| 26 | 25 | 191.0 | 0.0 | 168.0 | 1.0 | 168.0 | 4723.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.34642940000000005 | 0.031286575 | 0.38121468 | 0.30028449999999995 | 0.0 | 0.0 | 0.0 | 0.0 | 1.711691 | 0.021477012 | 1.7870021 | 1.6728425 | -0.14421033672988415 | 0.0784776205445583 | -0.01166987419128418 | -0.3196219205856323 | 1.4310815000000001 | 0.1909281 | 1.7374218999999997 | 1.1538972 | 0.020933941 | 0.004734668 | 0.028576741 | 0.013943641000000001 | -0.2479685 | 0.03228178 | -0.19238672 | -0.2879433 | |||||||||||
| 27 | 26 | 197.0 | 0.0 | 111.0 | 1.0 | 111.0 | 4834.0 | 0.0 | 3.0 | 30.0 | 0.0 | 0.79219913 | 0.6585664000000001 | 1.8361028000000001 | 0.23683028 | 0.6851048481354731 | 0.8585430906034763 | 2.577892849269104 | 0.0 | 1.7532889999999999 | 0.007889994000000001 | 1.789348 | 1.7424953 | 0.198319748044014 | 0.41789017518559096 | 0.9343531131744384 | -0.19544732570648196 | 0.9423574 | 0.07165401 | 1.0466307 | 0.85023546 | 0.134664 | 0.11154076 | 0.27441356 | 0.0088588325 | 0.35140955 | 0.48767257 | 0.96400595 | -0.1610711 | |||||||||||
| 28 | 27 | 205.0 | 0.0 | 146.0 | 1.0 | 146.0 | 4980.0 | 0.0 | 2.0 | 50.0 | 0.0 | 0.3835866 | 0.29479313 | 0.8498258 | 0.17240569 | 0.7474950655330485 | 0.6391161056582584 | 1.8179069375972308 | 0.0 | 1.7678131000000001 | 0.0045808293 | 1.7901799999999999 | 1.7610288 | 0.05451156880174365 | 0.31425528117953666 | 0.9421547651290894 | -0.15150243043899536 | 0.7046019 | 0.06271613 | 0.8096890999999999 | 0.61898696 | 0.0591021 | 0.08257003 | 0.19253531 | 0.005577637 | 0.095768906 | 0.36126813 | 0.6872695 | -0.1504049 | |||||||||||
| 29 | 28 | 218.0 | 0.0 | 242.0 | 1.0 | 242.0 | 5222.0 | 0.0 | 6.0 | 80.0 | 0.0 | 0.7920397 | 0.79612815 | 2.63497 | 0.17391229 | 1.645187018776334 | 1.1888275486606186 | 3.7704337858175982 | 0.0 | 1.7655463 | 0.0030714702000000003 | 1.7900281000000002 | 1.7618682 | 0.2506444845348597 | 0.4905160603309943 | 1.8532297611236568 | -0.14203763008117676 | 0.62720054 | 0.027176457999999997 | 0.68468654 | 0.5817806 | 0.15193503 | 0.21912470000000003 | 0.7655721999999999 | 0.0058864880000000005 | 0.43411112 | 0.6935981999999999 | 1.8189167000000002 | -0.12550029999999998 | |||||||||||
| 30 | 29 | 235.0 | 0.0 | 338.0 | 1.0 | 338.0 | 5560.0 | 0.0 | 1.0 | 30.0 | 0.0 | 0.30830324 | 0.39548668 | 1.8343208 | 0.13877131 | 0.12902213300225207 | 0.2911176081952243 | 1.0 | 0.0 | 1.7481099999999998 | 0.009228752 | 1.7902348000000001 | 1.7353710999999998 | -0.027244952507317063 | 0.20766170336314208 | 0.965793788433075 | -0.15617334842681885 | 0.7521545999999999 | 0.05371476 | 0.86244637 | 0.68034315 | 0.02590205 | 0.07214319 | 0.3052665 | 0.005013725 | -0.049537443 | 0.32564682 | 1.2084311 | -0.17644764 | |||||||||||
| 31 | 30 | 240.0 | 0.0 | 85.0 | 1.0 | 85.0 | 5645.0 | 0.0 | 0.0 | 0.0 | 0.0 | 0.18760897 | 0.04284751 | 0.22613609 | 0.1154042 | 0.0 | 0.0 | 0.0 | 0.0 | 1.7366872 | 0.012117143 | 1.7896880000000002 | 1.7309592 | -0.06574315130710602 | 0.04403796497891437 | 0.013423502445220949 | -0.15937530994415286 | 0.7440799 | 0.01239285 | 0.7819453000000001 | 0.72635436 | 0.006604558000000001 | 0.00082349975 | 0.0074465787 | 0.005253814599999999 | -0.11371288 | 0.025646087 | -0.07066831 | -0.13479757 |