mirror of
https://github.com/gryf/coach.git
synced 2026-03-15 06:03:33 +01:00
Itaicaspi/episode reset refactoring (#105)
* reordering of the episode reset operation and allowing to store episodes only when they are terminated * reordering of the episode reset operation and allowing to store episodes only when they are terminated * revert tensorflow-gpu to 1.9.0 + bug fix in should_train() * tests readme file and refactoring of policy optimization agent train function * Update README.md * Update README.md * additional policy optimization train function simplifications * Updated the traces after the reordering of the environment reset * docker and jenkins files * updated the traces to the ones from within the docker container * updated traces and added control suite to the docker * updated jenkins file with the intel proxy + updated doom basic a3c test params * updated line breaks in jenkins file * added a missing line break in jenkins file * refining trace tests ignored presets + adding a configurable beta entropy value * switch the order of trace and golden tests in jenkins + fix golden tests processes not killed issue * updated benchmarks for dueling ddqn breakout and pong * allowing dynamic updates to the loss weights + bug fix in episode.update_returns * remove docker and jenkins file
This commit is contained in:
@@ -3,24 +3,24 @@ Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,To
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,3.0,30.0,0.0,,,,0.009506131430480666,0.013357074931555628,0.04922456666827202,0.00011823583918157964,0.00025,0.0,0.00025,0.00025,0.04541644,0.032187756,0.13184725,0.008537644,,,,
|
||||
6,116.0,0.0,1519.0,1519.0,259.0,1519.0,0.99954262000001,3.0,30.0,0.0,,,,0.009436892453007974,0.010444927167927037,0.044396519660949714,0.0002187119680456817,0.00025,0.0,0.00025,0.00025,0.043486382999999997,0.028469712999999997,0.1315432,0.010239484,,,,
|
||||
7,154.0,0.0,1673.0,1673.0,154.0,1673.0,0.9993901600000132,0.0,0.0,0.0,,,,0.006680036455739021,0.007691341664224352,0.028086043894290924,0.00016294234956149012,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.03525371,0.022364777000000002,0.08392369999999999,0.009258808,,,,
|
||||
8,188.0,0.0,1809.0,1809.0,136.0,1809.0,0.9992555200000162,0.0,0.0,0.0,,,,0.005725367511759567,0.009134182509519568,0.030434217303991318,0.0001105146948248148,0.00025,0.0,0.00025,0.00025,0.031003432,0.026752787000000004,0.11063196,0.008286015,,,,
|
||||
9,218.0,0.0,1927.0,1927.0,118.0,1927.0,0.9991387000000188,4.0,50.0,0.0,,,,0.005530147604683104,0.008635781810203545,0.029109837487339973,0.00016355639672838151,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.026989017,0.024766427,0.08535746,0.006113700600000001,,,,
|
||||
10,239.0,0.0,2013.0,2013.0,86.0,2013.0,0.9990535600000204,1.0,25.0,0.0,,,,0.007073877079944525,0.010856981851779086,0.040930863469839096,0.00027058221166953444,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.03715521,0.026002409,0.11184523,0.0153889125,,,,
|
||||
11,285.0,0.0,2197.0,2197.0,184.0,2197.0,0.9988714000000244,5.0,75.0,0.0,,,,0.0049696794215022865,0.008980699602831191,0.043269582092761986,0.00012109361705370249,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.025901955,0.02628609,0.11205949,0.006279965,,,,
|
||||
12,309.0,0.0,2293.0,2293.0,96.0,2293.0,0.9987763600000266,2.0,15.0,0.0,,,,0.005058763722142127,0.007785021317331955,0.027659159153699875,0.00018030928913503885,0.00025,0.0,0.00025,0.00025,0.027570038999999998,0.021486067999999997,0.08631482,0.008357895,,,,
|
||||
13,353.0,0.0,2467.0,2467.0,174.0,2467.0,0.9986041000000304,2.0,35.0,0.0,,,,0.0045628238068192405,0.007280793903160444,0.028272464871406555,9.907802450470626e-05,0.00025,0.0,0.00025,0.00025,0.025343232,0.02227741,0.07953325,0.0048882863,,,,
|
||||
14,400.0,0.0,2658.0,2658.0,191.0,2658.0,0.9984150100000344,1.0,25.0,0.0,,,,0.0097321032195357,0.01023961919664894,0.030154820531606674,0.00018444313900545242,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.04259975,0.028015751000000002,0.10317952,0.009026687,0.018213745,0.03228745,0.07245033,-0.01997892
|
||||
15,420.0,0.0,2737.0,2737.0,79.0,2737.0,0.998336800000036,3.0,30.0,0.0,,,,0.008781690090836491,0.00899884267405712,0.028885878622531887,0.00047134244232438505,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.04500962,0.024723325,0.10789993,0.017506445,,,,
|
||||
16,441.0,0.0,2822.0,2822.0,85.0,2822.0,0.998252650000038,1.0,20.0,0.0,,,,0.011111788584717685,0.00964176097294723,0.030850913375616074,0.0004762174794450402,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.050733815999999994,0.028628142999999998,0.12953582,0.018588755,,,,
|
||||
17,497.0,0.0,3045.0,3045.0,223.0,3045.0,0.9980318800000428,2.0,30.0,0.0,,,,0.00828668451010474,0.010699894323199828,0.04358338564634323,0.00020791786664631215,0.00025,0.0,0.00025,0.00025,0.039435297,0.027343287999999997,0.12071342,0.007059440500000001,0.014257256999999999,0.019365441,0.04348784,-0.0063439063
|
||||
18,519.0,0.0,3133.0,3133.0,88.0,3133.0,0.9979447600000446,1.0,10.0,0.0,,,,0.0074549241412155826,0.008195051001161512,0.028971081599593163,0.0003202491207048297,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.037259682999999995,0.021548636,0.073957734,0.01237885,,,,
|
||||
19,586.0,0.0,3399.0,3399.0,266.0,3399.0,0.9976814200000504,1.0,15.0,0.0,,,,0.006056426719257629,0.009519012818678223,0.043173693120479584,0.00011111447383882478,0.00025,0.0,0.00025,0.00025,0.030213887000000002,0.025259253,0.11475632,0.005044707,,,,
|
||||
20,644.0,0.0,3631.0,3631.0,232.0,3631.0,0.9974517400000552,3.0,30.0,0.0,,,,0.007892606775416864,0.009331413396285886,0.02925945073366165,0.00020737151498906317,0.00025,0.0,0.00025,0.00025,0.038149226,0.025099216,0.08682343,0.0064632813,-0.0009132011300000001,0.012333746999999999,0.009670014499999999,-0.025862066
|
||||
21,691.0,0.0,3822.0,3822.0,191.0,3822.0,0.9972626500000594,1.0,5.0,0.0,,,,0.0065839045484144074,0.010710195076304628,0.055450454354286194,0.00015095918206498027,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.03362562,0.03347708,0.17523270000000002,0.007759502,0.008254298,0.019461052,0.04853519,-0.01426878
|
||||
22,763.0,0.0,4107.0,4107.0,285.0,4107.0,0.9969805000000656,5.0,100.0,0.0,,,,0.006797392681821495,0.009432101821733327,0.04118099808692932,0.00019709108164533973,0.00025,0.0,0.00025,0.00025,0.03493503,0.025949332999999998,0.10501147,0.009826525,0.014940828,0.022241406000000002,0.05235735,-0.00962076
|
||||
23,842.0,0.0,4426.0,4426.0,319.0,4426.0,0.9966646900000724,7.0,90.0,0.0,,,,0.006717705090096975,0.009711801205322595,0.05458200722932816,0.0001975365012185648,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.035762466,0.028132005,0.17399962,0.007998915,,,,
|
||||
24,871.0,0.0,4540.0,4540.0,114.0,4540.0,0.9965518300000747,0.0,0.0,0.0,,,,0.004121708562236343,0.006990884078555905,0.0262324009090662,0.00016586761921644208,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.02528197,0.022645405,0.08977601,0.0065642386,0.02154913,0.01743115,0.038836032,-0.0025164383
|
||||
25,908.0,0.0,4687.0,4687.0,147.0,4687.0,0.9964063000000779,2.0,45.0,0.0,,,,0.005335816105110319,0.0065088615879247145,0.01545584015548229,0.00013705540914088488,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.030282034,0.02378779,0.06643725,0.0073994235,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,5.0,55.0,0.0,,,,0.011007826140734787,0.014603481057153478,0.05728723481297492,0.00017679380835033953,0.00025,0.0,0.00025,0.00025,0.05001448,0.03673725,0.18864875,0.012782556,,,,
|
||||
6,70.0,0.0,1335.0,1335.0,75.0,1335.0,0.999724780000006,2.0,15.0,0.0,,,,0.011499390747447154,0.010961000063645872,0.0315467044711113,0.0005441936664283277,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.05759323400000001,0.024992667000000003,0.11028934,0.022131458,,,,
|
||||
7,91.0,0.0,1422.0,1422.0,87.0,1422.0,0.9996386500000078,1.0,15.0,0.0,,,,0.01132884354696476,0.013429386203264964,0.04364541172981262,0.000340703729307279,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.055466358,0.03408065,0.13973257,0.016833907,,,,
|
||||
8,159.0,0.0,1693.0,1693.0,271.0,1693.0,0.9993703600000136,5.0,55.0,0.0,,,,0.008705972996627245,0.01046594152738398,0.04259247332811356,0.00026405457174405456,0.00025,0.0,0.00025,0.00025,0.04516968,0.027806934,0.12673344,0.0123512,,,,
|
||||
9,201.0,0.0,1861.0,1861.0,168.0,1861.0,0.9992040400000172,3.0,50.0,0.0,,,,0.005878299186449675,0.009437852632040231,0.04434124007821083,0.00013726821634918449,0.00025,0.0,0.00025,0.00025,0.031320102999999995,0.02600094,0.118447885,0.008186511,,,,
|
||||
10,279.0,0.0,2172.0,2172.0,311.0,2172.0,0.998896150000024,4.0,65.0,0.0,,,,0.009727142530699404,0.012268936533653787,0.05482503771781922,0.00013224119902588427,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.045818377,0.03322848,0.13469987,0.006579738000000001,,,,
|
||||
11,440.0,0.0,2815.0,2815.0,643.0,2815.0,0.9982595800000378,10.0,335.0,0.0,,,,0.008651261723684205,0.01035218743544492,0.0460522323846817,0.00012582635099533943,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.042565465,0.027683503999999998,0.13492820000000003,0.0055641527,0.010471878,0.016772145,0.03140713,-0.011288109
|
||||
12,458.0,0.0,2888.0,2888.0,73.0,2888.0,0.9981873100000394,2.0,45.0,0.0,,,,0.009507577900270313,0.010686165551315943,0.03972183912992477,0.0004233591898810118,0.00025,0.0,0.00025,0.00025,0.04721937,0.025519945,0.11107015,0.016729604,,,,
|
||||
13,478.0,0.0,2969.0,2969.0,81.0,2969.0,0.9981071200000412,0.0,0.0,0.0,,,,0.006916543132683728,0.008256373671042505,0.02793971076607704,0.00034270941978320485,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.03785228,0.023063693,0.090955265,0.014428139,-0.0006935441000000001,0.008459795,0.012772851000000002,-0.010573764
|
||||
14,532.0,0.0,3183.0,3183.0,214.0,3183.0,0.9978952600000456,4.0,50.0,0.0,,,,0.0069841391733562975,0.009727930525240285,0.030958421528339383,0.00019982327648904172,0.00025,0.0,0.00025,0.00025,0.03517378,0.028121071,0.09745253599999999,0.007200333000000001,,,,
|
||||
15,551.0,0.0,3262.0,3262.0,79.0,3262.0,0.9978170500000474,2.0,15.0,0.0,,,,0.008571460710587226,0.012479903064922505,0.043056368827819824,0.0001790421229088679,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.03861944,0.03349347,0.12367985,0.008007733000000001,,,,
|
||||
16,626.0,0.0,3560.0,3560.0,298.0,3560.0,0.9975220300000538,6.0,145.0,0.0,,,,0.00916061567428138,0.00985262607730402,0.03863134235143662,0.00022459866886492819,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.04501683,0.026303627000000003,0.10941381,0.010795511,-0.007507985,0.015376373999999998,0.009678967,-0.030438615
|
||||
17,885.0,0.0,4598.0,4598.0,1038.0,4598.0,0.996494410000076,12.0,210.0,0.0,,,,0.007690413830856681,0.009722273214587109,0.04484198987483978,0.00014540684060193598,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.040153995,0.028107608,0.13334101,0.007176003,0.01752627,0.018640606,0.05206203,-0.006777686
|
||||
18,903.0,0.0,4668.0,4668.0,70.0,4668.0,0.9964251100000776,2.0,15.0,0.0,,,,0.008374075151925139,0.00685058487549806,0.01695725508034229,0.00013643733109347522,0.00025,0.0,0.00025,0.00025,0.041769784,0.025388801000000003,0.0693266,0.006554181,,,,
|
||||
19,924.0,0.0,4754.0,4754.0,86.0,4754.0,0.9963399700000796,2.0,35.0,0.0,,,,0.006986255206616728,0.009138039512187723,0.029435122385621067,0.00023959197278600186,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.03765729,0.027741422999999998,0.09483457,0.009779892,,,,
|
||||
20,988.0,0.0,5007.0,5007.0,253.0,5007.0,0.9960895000000848,1.0,5.0,0.0,,,,0.008958109939518932,0.010352110018017849,0.04120930656790733,0.00026069089653901756,0.00025,0.0,0.00025,0.00025,0.044280123,0.027352182000000003,0.10559346,0.010518369,,,,
|
||||
21,1009.0,0.0,5092.0,5092.0,85.0,5092.0,0.9960053500000868,0.0,0.0,0.0,,,,0.009729027376687596,0.007417915393123158,0.026410818099975586,0.0005171290249563754,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.05305024,0.022927448,0.11149109,0.019090652,,,,
|
||||
22,1041.0,0.0,5221.0,5221.0,129.0,5221.0,0.9958776400000896,1.0,10.0,0.0,,,,0.0065109121378554855,0.009705144564042924,0.04230054095387459,0.0002464384888298809,0.00025,0.0,0.00025,0.00025,0.03857564,0.029652012999999998,0.13166025,0.008339129,0.022667855,0.029822525,0.073469676,-0.01822071
|
||||
23,1101.0,0.0,5461.0,5461.0,240.0,5461.0,0.9956400400000948,6.0,85.0,0.0,,,,0.007464758036803688,0.008871554942636414,0.04159108921885489,9.95906739262864e-05,0.00025,0.0,0.00025,0.00025,0.040631982999999997,0.027780425,0.1273076,0.0052087842,,,,
|
||||
24,1167.0,0.0,5724.0,5724.0,263.0,5724.0,0.9953796700001004,1.0,25.0,0.0,,,,0.007049951021944059,0.008145597856309148,0.029556380584836006,0.00024747068528085947,0.00025,0.0,0.00025,0.00025,0.03756183,0.025077598,0.10530927,0.010631736000000001,,,,
|
||||
25,1188.0,0.0,5808.0,5808.0,84.0,5808.0,0.995296510000102,0.0,0.0,0.0,,,,0.008849835848585437,0.008812960520326749,0.028190467506647113,0.00018663128139451146,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.04469130599999999,0.028627316,0.10585028,0.008268119,,,,
|
||||
|
||||
|
Reference in New Issue
Block a user