mirror of
https://github.com/gryf/coach.git
synced 2026-03-14 13:45:46 +01:00
Itaicaspi/episode reset refactoring (#105)
* reordering of the episode reset operation and allowing to store episodes only when they are terminated * reordering of the episode reset operation and allowing to store episodes only when they are terminated * revert tensorflow-gpu to 1.9.0 + bug fix in should_train() * tests readme file and refactoring of policy optimization agent train function * Update README.md * Update README.md * additional policy optimization train function simplifications * Updated the traces after the reordering of the environment reset * docker and jenkins files * updated the traces to the ones from within the docker container * updated traces and added control suite to the docker * updated jenkins file with the intel proxy + updated doom basic a3c test params * updated line breaks in jenkins file * added a missing line break in jenkins file * refining trace tests ignored presets + adding a configurable beta entropy value * switch the order of trace and golden tests in jenkins + fix golden tests processes not killed issue * updated benchmarks for dueling ddqn breakout and pong * allowing dynamic updates to the loss weights + bug fix in episode.update_returns * remove docker and jenkins file
This commit is contained in:
@@ -3,29 +3,24 @@ Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,To
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,3.0,30.0,0.0,,,,3.931728353687361,1.7148335424993695e-05,3.9317572116851807,3.931634187698364,0.00025,0.0,0.00025,0.00025,0.0015541904000000001,0.0023056455,0.009599385,0.0007559575999999999,,,,
|
||||
6,116.0,0.0,1519.0,1519.0,259.0,1519.0,0.99954262000001,3.0,30.0,0.0,,,,3.9316723786867582,5.269867767456892e-05,3.9317219257354736,3.9313907623291016,0.00025,0.0,0.00025,0.00025,0.001739312,0.0026554922,0.009864504,0.00067749363,,,,
|
||||
7,154.0,0.0,1673.0,1673.0,154.0,1673.0,0.9993901600000132,0.0,0.0,0.0,,,,3.931619857486925,6.473394968283058e-05,3.9316527843475337,3.931235074996948,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0012083224,0.0019307991,0.009499238,0.0006370891400000001,,,,
|
||||
8,188.0,0.0,1809.0,1809.0,136.0,1809.0,0.9992555200000162,0.0,0.0,0.0,,,,3.931548202739042,7.783996401137547e-05,3.9316082000732417,3.9312365055084233,0.00025,0.0,0.00025,0.00025,0.0022799673,0.0033626328000000002,0.01030305,0.0006125771299999999,,,,
|
||||
9,218.0,0.0,1927.0,1927.0,118.0,1927.0,0.9991387000000188,4.0,50.0,0.0,,,,3.9314806302388514,0.00010239504684735038,3.931550741195679,3.931047201156616,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0016353407000000001,0.002778357,0.01035096,0.0005981442500000001,,,,
|
||||
10,239.0,0.0,2013.0,2013.0,86.0,2013.0,0.9990535600000204,1.0,25.0,0.0,,,,3.9313772519429526,0.00020685918056109227,3.931517362594605,3.9308536052703857,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0034886056,0.004297202,0.010684523999999999,0.00061402726,,,,
|
||||
11,285.0,0.0,2197.0,2197.0,184.0,2197.0,0.9988714000000244,5.0,75.0,0.0,,,,3.9313522369965264,7.248832757213434e-05,3.931442975997925,3.931007385253906,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0017790395999999998,0.0030002112,0.011006265,0.0006065490000000001,,,,
|
||||
12,309.0,0.0,2293.0,2293.0,96.0,2293.0,0.9987763600000266,2.0,15.0,0.0,,,,3.931213736534119,0.0002593847407516344,3.93136215209961,3.9304351806640634,0.00025,0.0,0.00025,0.00025,0.0028233638,0.0041352687,0.011190076,0.0005888872,,,,
|
||||
13,353.0,0.0,2467.0,2467.0,174.0,2467.0,0.9986041000000304,2.0,35.0,0.0,,,,3.9310338009487498,0.0002957116497356457,3.9312725067138667,3.929877519607544,0.00025,0.0,0.00025,0.00025,0.0030289008,0.0042545744,0.012507513,0.0006166726000000001,,,,
|
||||
14,406.0,0.0,2680.0,2680.0,213.0,2680.0,0.9983932300000348,3.0,60.0,0.0,,,,3.930882449419993,0.00035235950786128846,3.9310703277587886,3.929490327835083,0.00025,0.0,0.00025,0.00025,0.0028729883,0.004979132,0.022557117,0.0007968402,0.012837511921922923,0.022259134634650783,0.040622540563345584,-0.024907390773295932
|
||||
15,422.0,0.0,2745.0,2745.0,65.0,2745.0,0.9983288800000364,2.0,15.0,0.0,,,,3.9306667894124985,0.0004889590223132316,3.9309356212615967,3.929192781448364,0.00025,0.0,0.00025,0.00025,0.003993525,0.005016152,0.013677783,0.00091032905,,,,
|
||||
16,442.0,0.0,2826.0,2826.0,81.0,2826.0,0.998248690000038,0.0,0.0,0.0,,,,3.930476784706116,0.0005833675931495567,3.9308347702026367,3.92863392829895,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0037356387,0.0048887976000000005,0.014913436,0.00089475035,,,,
|
||||
17,501.0,0.0,3060.0,3060.0,234.0,3060.0,0.9980170300000429,4.0,35.0,0.0,,,,3.9304699938176038,0.00041264778275723504,3.9306838512420654,3.928467988967896,0.00025,0.0,0.00025,0.00025,0.0030552953999999997,0.0041774893,0.01554886,0.0010523795,0.023353116586804973,0.020788514387939237,0.05141336545348224,-0.0014774784445756026
|
||||
18,526.0,0.0,3161.0,3161.0,101.0,3161.0,0.9979170400000452,1.0,20.0,0.0,,,,3.9306457805633546,0.00023956495978218428,3.930816650390625,3.929875612258911,0.00025,0.0,0.00025,0.00025,0.002464988,0.003725262,0.013498537,0.00077633635,,,,
|
||||
19,589.0,0.0,3413.0,3413.0,252.0,3413.0,0.9976675600000506,2.0,55.0,0.0,,,,3.9304992774176224,0.00034951799503506604,3.9307899475097656,3.9290616512298575,0.00025,0.0,0.00025,0.00025,0.0029548485999999997,0.0043363147,0.01425068,0.0007409669,,,,
|
||||
20,646.0,0.0,3642.0,3642.0,229.0,3642.0,0.9974408500000556,2.0,15.0,0.0,,,,3.930309973264996,0.0005540508390044677,3.930628061294556,3.928320169448853,0.00025,0.0,0.00025,0.00025,0.0032555721999999996,0.004834081,0.015668849,0.0008300698,0.026904297930499418,0.021589106230980433,0.05910116657614764,0.005408810079098325
|
||||
21,698.0,0.0,3849.0,3849.0,207.0,3849.0,0.99723592000006,4.0,50.0,0.0,,,,3.929926037788391,0.0006353061160591977,3.9303271770477295,3.9271233081817623,0.00025,0.0,0.00025,0.00025,0.004353328,0.006303993000000001,0.029395893,0.0010768827,0.02748812679201423,0.0217088123519984,0.057050981000066316,0.0017140418291097805
|
||||
22,738.0,0.0,4010.0,4010.0,161.0,4010.0,0.9970765300000636,4.0,90.0,0.0,,,,3.92977910041809,0.0005514096791911278,3.930201768875122,3.9283792972564697,0.00025,0.0,0.00025,0.00025,0.004639727,0.005436519,0.015939886,0.0013534969000000001,,,,
|
||||
23,789.0,0.0,4214.0,4214.0,204.0,4214.0,0.996874570000068,2.0,10.0,0.0,,,,3.929426656049841,0.0008124188909974342,3.929957151412964,3.925875425338745,0.00025,0.0,0.00025,0.00025,0.005286702,0.0059416015,0.024375048,0.0017462726,0.030502823988597175,0.02342976988309637,0.06656642369926036,0.0004357606172566697
|
||||
24,854.0,0.0,4474.0,4474.0,260.0,4474.0,0.9966171700000734,5.0,80.0,0.0,,,,3.929753776697012,0.0006802738781902477,3.9303853511810303,3.926770448684693,0.00025,0.0,0.00025,0.00025,0.0032921252,0.004323490399999999,0.018876718,0.0008184177999999999,0.030289770103991618,0.011228381833076877,0.046150057762861824,0.014975410327315919
|
||||
25,901.0,0.0,4662.0,4662.0,188.0,4662.0,0.9964310500000776,3.0,30.0,0.0,,,,3.929939036673688,0.0008579045062845213,3.9304828643798833,3.926759004592896,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0043313909999999995,0.0071201716,0.033504024,0.0006334899,,,,
|
||||
26,969.0,0.0,4934.0,4934.0,272.0,4934.0,0.9961617700000832,1.0,5.0,0.0,,,,3.929590607390684,0.0006133207352767329,3.930098295211792,3.927515745162964,0.00025,0.0,0.00025,0.00025,0.0038270776,0.005072999999999999,0.021740799999999998,0.0010850433,,,,
|
||||
27,1028.0,0.0,5168.0,5168.0,234.0,5168.0,0.9959301100000884,3.0,30.0,0.0,,,,3.930041709188688,0.0004330404189005426,3.9302978515625,3.927629232406616,0.00025,0.0,0.00025,0.00025,0.0031090009999999997,0.004790003,0.02229039,0.0008657125,,,,
|
||||
28,1047.0,0.0,5245.0,5245.0,77.0,5245.0,0.99585388000009,2.0,45.0,0.0,,,,3.9298872069308635,0.0005701280611071911,3.9302644729614262,3.9285831451416016,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0042041945,0.0059060673,0.016562391,0.0008514148599999999,0.03760540119061923,0.01643017217867538,0.05344712957739886,0.01295695789158402
|
||||
29,1107.0,0.0,5486.0,5486.0,241.0,5486.0,0.9956152900000952,6.0,105.0,0.0,,,,3.929187309741974,0.0007912253650240303,3.930028200149536,3.92718768119812,0.00025,0.0,0.00025,0.00025,0.0057351263,0.0060241455000000005,0.018669646,0.0012705077,,,,
|
||||
30,1170.0,0.0,5738.0,5738.0,252.0,5738.0,0.9953658100001006,0.0,0.0,0.0,,,,3.9288085188184474,0.0009372335274004561,3.929582357406616,3.926055908203125,0.00025,0.0,0.00025,0.00025,0.0061082826,0.006076769,0.019835133,0.001853791,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,5.0,55.0,0.0,,,,3.931745547874301,1.1304143308005733e-05,3.9317700862884517,3.9316890239715576,0.00025,0.0,0.00025,0.00025,0.0015866637,0.0023147496,0.009720516,0.0007565144,,,,
|
||||
6,70.0,0.0,1335.0,1335.0,75.0,1335.0,0.999724780000006,2.0,15.0,0.0,,,,3.931735929689909,7.235250669185713e-06,3.9317455291748047,3.931711912155152,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.001755927,0.0026373637,0.009641058000000001,0.0007148395500000001,,,,
|
||||
7,91.0,0.0,1422.0,1422.0,87.0,1422.0,0.9996386500000078,1.0,15.0,0.0,,,,3.931701206025623,5.099185273705093e-05,3.93173623085022,3.931553602218628,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.00282516,0.0035993564000000003,0.009418896999999999,0.00070036505,,,,
|
||||
8,159.0,0.0,1693.0,1693.0,271.0,1693.0,0.9993703600000136,5.0,55.0,0.0,,,,3.931656876606728,9.226522325134514e-05,3.931716203689575,3.9311599731445312,0.00025,0.0,0.00025,0.00025,0.0017165048,0.0027771054,0.012550428999999998,0.00063557597,,,,
|
||||
9,201.0,0.0,1861.0,1861.0,168.0,1861.0,0.9992040400000172,3.0,50.0,0.0,,,,3.93158137230646,0.00010474746316658029,3.93165135383606,3.931158781051636,0.00025,0.0,0.00025,0.00025,0.0017799592,0.002852903,0.009889938000000001,0.0006321495,,,,
|
||||
10,279.0,0.0,2172.0,2172.0,311.0,2172.0,0.998896150000024,4.0,65.0,0.0,,,,3.9314154325387416,0.00022279076273676361,3.931581258773804,3.930070638656616,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0026444625,0.004101368,0.019448647,0.00062298455,,,,
|
||||
11,407.0,0.0,2683.0,2683.0,511.0,2683.0,0.9983902600000351,9.0,320.0,0.0,,,,3.931240767240524,0.00015854553450050932,3.931373834609986,3.9305694103240967,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.0017362889000000002,0.0029191163,0.011232911000000002,0.0005518816,0.024129094928503625,0.00904320207528025,0.04169573485851341,0.012993395328522341
|
||||
12,424.0,0.0,2754.0,2754.0,71.0,2754.0,0.9983199700000364,1.0,15.0,0.0,,,,3.9310134579153617,0.000358822446065362,3.9312620162963863,3.93019700050354,0.00025,0.0,0.00025,0.00025,0.0032191304,0.0045680365999999995,0.011846525,0.0005631294,,,,
|
||||
13,457.0,0.0,2886.0,2886.0,132.0,2886.0,0.9981892900000392,2.0,25.0,0.0,,,,3.931020930409432,0.00018348520436412824,3.93116307258606,3.9301931858062735,0.00025,0.0,0.00025,0.00025,0.0016074966000000001,0.002708108,0.012189938999999999,0.00064319023,,,,
|
||||
14,504.0,0.0,3074.0,3074.0,188.0,3074.0,0.9980031700000432,3.0,35.0,0.0,,,,3.931025738301485,0.00015399033015145469,3.9311008453369136,3.9300034046173096,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0009836307000000001,0.0015528154999999999,0.011335916000000001,0.0005281837,0.021890531852842,0.014466196029404797,0.03762449622154298,-0.00010702610015811408
|
||||
15,528.0,0.0,3167.0,3167.0,93.0,3167.0,0.9979111000000452,1.0,15.0,0.0,,,,3.931034368017445,6.681329033129075e-05,3.9310910701751713,3.9308130741119385,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0016258046,0.0031157003000000004,0.011724828999999999,0.0004990724,,,,
|
||||
16,598.0,0.0,3449.0,3449.0,282.0,3449.0,0.9976319200000514,2.0,55.0,0.0,,,,3.930865437643869,0.0002831683814269127,3.9310925006866455,3.9296932220458975,0.00025,0.0,0.00025,0.00025,0.0021639192000000003,0.0036756303,0.012480825,0.00047580682,0.0305326876540985,0.00923045073371262,0.0438561670482166,0.021990178897977525
|
||||
17,668.0,0.0,3729.0,3729.0,280.0,3729.0,0.9973547200000574,4.0,45.0,0.0,,,,3.930601644515991,0.0003480949830888473,3.9308652877807617,3.9292240142822266,0.00025,0.0,0.00025,0.00025,0.0027047140000000004,0.0042121527,0.013903748,0.0006515036,0.029686454000572925,0.01902240661079521,0.058909925818443724,-0.002814809605478502
|
||||
18,738.0,0.0,4008.0,4008.0,279.0,4008.0,0.9970785100000634,3.0,45.0,0.0,,,,3.930277814183917,0.0005110864544539217,3.930636167526245,3.9281198978424072,0.00025,0.0,0.00025,0.00025,0.0036887865999999997,0.0051101656,0.02086526,0.0008114038499999999,,,,
|
||||
19,792.0,0.0,4223.0,4223.0,215.0,4223.0,0.9968656600000679,4.0,90.0,0.0,,,,3.930134093319928,0.00047399490243328624,3.930522918701172,3.9284942150115967,0.00025,0.0,0.00025,0.00025,0.0037553142999999997,0.004891396,0.0151908295,0.0010129308999999999,0.030484313207368687,0.012861465171913404,0.04339803867042122,0.011251759901643564
|
||||
20,893.0,0.0,4630.0,4630.0,407.0,4630.0,0.9964627300000768,10.0,115.0,0.0,,,,3.929736850285294,0.000766311293002325,3.930368661880493,3.926426649093628,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.004180377,0.006044741700000001,0.031209853,0.0009457401,0.0355303921426342,0.014215304187277478,0.05135452747345026,0.012931596487761264
|
||||
21,937.0,0.0,4805.0,4805.0,175.0,4805.0,0.9962894800000806,1.0,5.0,0.0,,,,3.930479177208834,0.00023689537153461093,3.930684328079224,3.929489135742188,0.00025,0.0,0.00025,0.00025,0.0021777323,0.0034656142999999998,0.014414535,0.00058991817,,,,
|
||||
22,1022.0,0.0,5146.0,5146.0,341.0,5146.0,0.995951890000088,3.0,65.0,0.0,,,,3.93046441078186,0.00035790579075833815,3.9307262897491455,3.929075956344605,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0024591651999999998,0.0041425275,0.014986968,0.00047587089999999996,,,,
|
||||
23,1120.0,0.0,5538.0,5538.0,392.0,5538.0,0.9955638100000964,6.0,80.0,0.0,,,,3.9300818811986864,0.0004955548155674863,3.930469751358032,3.928221464157105,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.0027119769,0.0042804847,0.020022545,0.00057932467,0.035476823337376714,0.014014476077534626,0.04927191920578547,0.007030519843102157
|
||||
24,1165.0,0.0,5718.0,5718.0,180.0,5718.0,0.9953856100001002,3.0,55.0,0.0,,,,3.9300585714253513,0.00053408662096811,3.9305152893066406,3.928401231765747,0.00025,0.0,0.00025,0.00025,0.0033172776,0.004863477299999999,0.016010353,0.0006072133999999999,,,,
|
||||
25,1190.0,0.0,5815.0,5815.0,97.0,5815.0,0.9952895800001024,0.0,0.0,0.0,,,,3.9299856324990587,0.0004047671393024133,3.9302456378936768,3.9285967350006095,0.00025,0.0,0.00025,0.00025,0.0030563176,0.004401815999999999,0.016188376,0.0011075826,,,,
|
||||
|
||||
|
Reference in New Issue
Block a user