mirror of
https://github.com/gryf/coach.git
synced 2026-04-15 20:13:33 +02:00
Itaicaspi/episode reset refactoring (#105)
* reordering of the episode reset operation and allowing to store episodes only when they are terminated * reordering of the episode reset operation and allowing to store episodes only when they are terminated * revert tensorflow-gpu to 1.9.0 + bug fix in should_train() * tests readme file and refactoring of policy optimization agent train function * Update README.md * Update README.md * additional policy optimization train function simplifications * Updated the traces after the reordering of the environment reset * docker and jenkins files * updated the traces to the ones from within the docker container * updated traces and added control suite to the docker * updated jenkins file with the intel proxy + updated doom basic a3c test params * updated line breaks in jenkins file * added a missing line break in jenkins file * refining trace tests ignored presets + adding a configurable beta entropy value * switch the order of trace and golden tests in jenkins + fix golden tests processes not killed issue * updated benchmarks for dueling ddqn breakout and pong * allowing dynamic updates to the loss weights + bug fix in episode.update_returns * remove docker and jenkins file
This commit is contained in:
@@ -3,29 +3,24 @@ Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,To
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,51.0,0.0,1259.0,1259.0,202.0,1259.0,0.999818200000006,3.0,35.0,0.0,,,,0.002354268465055879,0.0022267908155453207,0.008399246260523796,8.872663784131873e-06,0.00025,0.0,0.00025,0.00025,0.007744235,0.005350461,0.022665123,0.0008465818,,,,
|
||||
6,81.0,0.0,1382.0,1382.0,123.0,1382.0,0.9997075000000096,4.0,55.0,0.0,,,,0.006926822468327979,0.002244478491556321,0.0135076642036438,0.0033381427638232712,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.018759595,0.0053872466,0.032931123,0.009214188,,,,
|
||||
7,152.0,0.0,1665.0,1665.0,283.0,1665.0,0.9994528000000179,2.0,45.0,0.0,,,,0.00354002532754159,0.0019023348592878372,0.009204687550663948,0.00030229013646021485,0.00025,0.0,0.00025,0.00025,0.01304985,0.0035053138,0.024019292,0.008035132,,,,
|
||||
8,208.0,0.0,1887.0,1887.0,222.0,1887.0,0.9992530000000246,1.0,20.0,0.0,,,,0.003386984325646024,0.0014584238962574282,0.006831846199929714,0.0003159668995067477,0.00025,0.0,0.00025,0.00025,0.013196401000000002,0.0034898983,0.025287742000000002,0.008569226,,,,
|
||||
9,220.0,0.0,1938.0,1938.0,51.0,1938.0,0.999207100000026,0.0,0.0,0.0,,,,0.003167361059846977,0.0015483758671841056,0.006221367511898279,0.0007139326771721244,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.013424491,0.002968179,0.0176331,0.009279029,,,,
|
||||
10,269.0,0.0,2131.0,2131.0,193.0,2131.0,0.9990334000000318,1.0,5.0,0.0,,,,0.0032611473170061573,0.0016850956682255482,0.007028852589428425,0.00020222167950123549,0.00025,0.0,0.00025,0.00025,0.013227931,0.0036521524,0.021845128,0.007127245999999999,,,,
|
||||
11,363.0,0.0,2510.0,2510.0,379.0,2510.0,0.9986923000000429,8.0,100.0,0.0,,,,0.003091246536449886,0.001322660534422889,0.006632269825786352,0.00032261264277622104,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.013847044,0.0034531087,0.023722986,0.008786425,0.08158561,0.036171492,0.17906709,0.03910739
|
||||
12,403.0,0.0,2670.0,2670.0,160.0,2670.0,0.9985483000000478,1.0,25.0,0.0,,,,0.0033887081764987672,0.001894344488589778,0.00896457675844431,0.00035247692721895874,0.00025,0.0,0.00025,0.00025,0.014799103000000001,0.005142509,0.03727644,0.008755262,,,,
|
||||
13,566.0,0.0,3319.0,3319.0,649.0,3319.0,0.997964200000067,20.0,515.0,0.0,,,,0.0033814117187088463,0.001794335243639714,0.00981593132019043,0.00033476535463705664,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.01542785,0.0042213122,0.035808,0.008857572,,,,
|
||||
14,608.0,0.0,3490.0,3490.0,171.0,3490.0,0.997810300000072,2.0,15.0,0.0,,,,0.00307327011181596,0.0014598479376536175,0.007876500487327577,0.0004184547869954258,0.00025,0.0,0.00025,0.00025,0.015182586000000001,0.003907353,0.025957266,0.008718804,,,,
|
||||
15,661.0,0.0,3699.0,3699.0,209.0,3699.0,0.9976222000000784,3.0,30.0,0.0,,,,0.003574654932204142,0.0013611143826604485,0.006663748994469643,0.0012790606124326589,0.00025,0.0,0.00025,0.00025,0.015538703000000001,0.0037677127,0.02521416,0.009612316999999999,,,,
|
||||
16,699.0,0.0,3853.0,3853.0,154.0,3853.0,0.9974836000000828,3.0,75.0,0.0,,,,0.003063707425577664,0.0016034075091713835,0.007304192055016756,0.00034941814374178653,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.016172405,0.0048504383,0.027080176,0.008548103,,,,
|
||||
17,743.0,0.0,4030.0,4030.0,177.0,4030.0,0.997324300000088,3.0,30.0,0.0,,,,0.00310047399133592,0.0014594212466929055,0.0075475480407476425,0.0003596151655074209,0.00025,0.0,0.00025,0.00025,0.015252826,0.0038106788,0.029333811,0.009897261,0.109428376,0.08142622,0.25112388,0.031323746
|
||||
18,763.0,0.0,4107.0,4107.0,77.0,4107.0,0.9972550000000904,2.0,15.0,0.0,,,,0.00320658921264112,0.0014737941431521605,0.006449719425290823,0.0006320171523839235,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.015207966000000002,0.0041951295,0.026854733,0.009781642,,,,
|
||||
19,799.0,0.0,4254.0,4254.0,147.0,4254.0,0.9971227000000948,2.0,35.0,0.0,,,,0.003265373379690573,0.0015747774825930286,0.006731272675096989,0.0007752227247692645,0.00025,0.0,0.00025,0.00025,0.016477453,0.0043514105,0.030398313,0.009153037,,,,
|
||||
20,857.0,0.0,4485.0,4485.0,231.0,4485.0,0.9969148000001016,7.0,110.0,0.0,,,,0.0033697776560639514,0.0017829018890948177,0.009337665513157845,0.0005270092515274882,0.00025,0.0,0.00025,0.00025,0.017007816999999998,0.004538108,0.034457795,0.0102955345,0.086831845,0.028143487999999998,0.11529497,0.041701294
|
||||
21,954.0,0.0,4871.0,4871.0,386.0,4871.0,0.9965674000001129,1.0,10.0,0.0,,,,0.0032097528227748944,0.0014270266361265948,0.0072808810509741315,0.00034487116499803966,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.016735202,0.0040815175,0.029879992999999997,0.009203656999999999,0.08063345,0.06771858,0.22763099,-0.04870935
|
||||
22,987.0,0.0,5006.0,5006.0,135.0,5006.0,0.9964459000001171,1.0,15.0,0.0,,,,0.00348929021944941,0.0013416678040725266,0.006667369976639748,0.0004941442748531699,0.00025,0.0,0.00025,0.00025,0.017052516,0.0037629176,0.02555473,0.010013681,,,,
|
||||
23,1038.0,0.0,5208.0,5208.0,202.0,5208.0,0.9962641000001229,3.0,30.0,0.0,,,,0.003096698048323685,0.001467369498213491,0.006518170703202486,0.0005598508287221193,0.00025,0.0,0.00025,0.00025,0.017208265,0.004186028,0.02688086,0.009457254,,,,
|
||||
24,1054.0,0.0,5274.0,5274.0,66.0,5274.0,0.9962047000001251,2.0,15.0,0.0,,,,0.0023996760137379174,0.0011494210259765632,0.005033135414123535,0.00040235067717731,0.00025,0.0,0.00025,0.00025,0.014471052,0.0028194014,0.018233253,0.0090312585,0.09159353,0.073366776,0.19782996,-0.007508415
|
||||
25,1076.0,0.0,5359.0,5359.0,85.0,5359.0,0.9961282000001276,1.0,15.0,0.0,,,,0.0031479224470041863,0.0018338206488306352,0.008050543256103992,0.00018393099890090525,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.016573252,0.0058718068000000005,0.02915352,0.005962694,,,,
|
||||
26,1133.0,0.0,5587.0,5587.0,228.0,5587.0,0.9959230000001342,4.0,50.0,0.0,,,,0.002919742441327687,0.001194507040554492,0.006624207831919193,0.00057441764511168,0.00025,0.0,0.00025,0.00025,0.016612988000000002,0.00332599,0.026537797999999998,0.010939502,0.09447273,0.045939725,0.15817265,0.033776283
|
||||
27,1153.0,0.0,5667.0,5667.0,80.0,5667.0,0.9958510000001366,1.0,15.0,0.0,,,,0.00301869151298888,0.0013370276603479855,0.006056639365851879,0.001242607831954956,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.016518693,0.003245745,0.022646153,0.010498283999999998,,,,
|
||||
28,1173.0,0.0,5749.0,5749.0,82.0,5749.0,0.995777200000139,0.0,0.0,0.0,,,,0.0031465753330849108,0.0012105911527881745,0.0058187893591821185,0.0013689068146049974,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.018286983,0.005796103299999999,0.036277987000000005,0.011089685,,,,
|
||||
29,1218.0,0.0,5928.0,5928.0,179.0,5928.0,0.9956161000001444,1.0,5.0,0.0,,,,0.0031859539345734647,0.001230199051850356,0.005495925433933735,0.0007681638235226274,0.00025,0.0,0.00025,0.00025,0.017322628,0.004681325,0.032449782,0.008565956999999999,,,,
|
||||
30,1232.0,0.0,5983.0,5983.0,55.0,5983.0,0.9955666000001461,2.0,15.0,0.0,,,,0.0033092185206312157,0.0009492089431610681,0.0049632079899311074,0.0016535777831450105,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.016791698,0.0036438016999999997,0.024807067999999998,0.012081898999999998,,,,
|
||||
5,63.0,0.0,1310.0,1310.0,253.0,1310.0,0.9997723000000076,4.0,50.0,0.0,,,,0.003875652090250191,0.006230668056782436,0.04718368873000145,2.2094836822361685e-05,0.00025,0.0,0.00025,0.00025,0.01209846,0.018056398,0.1446681,0.0014401993,,,,
|
||||
6,191.0,0.0,1821.0,1821.0,511.0,1821.0,0.9993124000000226,12.0,185.0,0.0,,,,0.003655906816839981,0.0017923743519973538,0.008377103134989737,0.00027508928906172514,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.013568986000000002,0.0035154566,0.026353458,0.007167939,,,,
|
||||
7,296.0,0.0,2240.0,2240.0,419.0,2240.0,0.998935300000035,5.0,100.0,0.0,,,,0.003318573732810494,0.0015315255248514966,0.007952019572257996,0.00021419327822513878,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.014484913,0.003961455,0.033718556000000004,0.0059639704,0.040829557999999995,0.021066558,0.07627003,0.013901123
|
||||
8,339.0,0.0,2414.0,2414.0,174.0,2414.0,0.9987787000000402,1.0,5.0,0.0,,,,0.003183173737217954,0.0015401180638853654,0.006335136014968157,0.00038450717693194747,0.00025,0.0,0.00025,0.00025,0.015692346,0.0040802797,0.025410485,0.009213975,0.10701928,0.10879564,0.30108258,-0.011487618
|
||||
9,368.0,0.0,2529.0,2529.0,115.0,2529.0,0.9986752000000436,3.0,30.0,0.0,,,,0.003484182040015834,0.0017209235393860082,0.0067713456228375435,0.00019597783102653918,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.015461218999999998,0.0044411486,0.025622195,0.005317989699999999,,,,
|
||||
10,411.0,0.0,2702.0,2702.0,173.0,2702.0,0.9985195000000489,3.0,75.0,0.0,,,,0.003653256459497349,0.0013851372165254595,0.006258142180740832,0.0008657328435219824,0.00025,0.0,0.00025,0.00025,0.017220842,0.0031612364,0.025344394,0.009269036999999999,,,,
|
||||
11,465.0,0.0,2915.0,2915.0,213.0,2915.0,0.9983278000000549,3.0,20.0,0.0,,,,0.0032540040171951195,0.0013094868857552425,0.006947712041437626,0.0004492675070650876,0.00025,0.0,0.00025,0.00025,0.016636208,0.004167957,0.027587958,0.009301778,,,,
|
||||
12,510.0,0.0,3097.0,3097.0,182.0,3097.0,0.9981640000000604,4.0,60.0,0.0,,,,0.003109362826216966,0.0013988949206461794,0.006362042855471373,0.0003950340324081481,0.00025,0.0,0.00025,0.00025,0.016663404,0.004190624,0.027471463999999998,0.010103953,,,,
|
||||
13,550.0,0.0,3258.0,3258.0,161.0,3258.0,0.9980191000000652,3.0,75.0,0.0,,,,0.0035577299742726607,0.001388862490205299,0.008318169042468071,0.0004163705743849278,0.00025,0.0,0.00025,0.00025,0.017404305,0.0035805209999999997,0.02947828,0.012193107,,,,
|
||||
14,594.0,0.0,3433.0,3433.0,175.0,3433.0,0.9978616000000704,4.0,50.0,0.0,,,,0.003484184082142662,0.001732970471266746,0.007269437424838544,0.0006064289482310414,0.00025,0.0,0.00025,0.00025,0.019197596,0.0056097833,0.03633184,0.009341977,,,,
|
||||
15,630.0,0.0,3578.0,3578.0,145.0,3578.0,0.9977311000000748,2.0,25.0,0.0,,,,0.0037337387426911537,0.0015802323114164785,0.007099532522261144,0.0005637581925839187,0.00025,0.0,0.00025,0.00025,0.018333083,0.0047576996,0.031882799999999996,0.010614046,,,,
|
||||
16,675.0,0.0,3756.0,3756.0,178.0,3756.0,0.99757090000008,0.0,0.0,0.0,,,,0.0036686222513460298,0.0014980166633852432,0.007150433491915464,0.0005505527369678019,0.00025,0.0,0.00025,0.00025,0.018643329,0.004285918499999999,0.029188786,0.009071933,,,,
|
||||
17,779.0,0.0,4171.0,4171.0,415.0,4171.0,0.9971974000000924,6.0,80.0,0.0,,,,0.003027278060192027,0.0014114358437464045,0.007179290056228638,0.00035245553590357304,0.0002500000000000001,1.0842021724855042e-19,0.00025,0.00025,0.017073763999999998,0.004743929,0.03250031,0.0089325765,0.008589801,0.041869998,0.065109685,-0.06993793
|
||||
18,802.0,0.0,4265.0,4265.0,94.0,4265.0,0.9971128000000952,1.0,30.0,0.0,,,,0.002608991115424863,0.0016136469631561243,0.006101616192609072,0.0004670571361202746,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.016327688,0.004186721,0.02735403,0.011188851000000001,,,,
|
||||
19,859.0,0.0,4494.0,4494.0,229.0,4494.0,0.9969067000001018,5.0,100.0,0.0,,,,0.002831909199972359,0.0013861029304045335,0.006143730133771896,0.00027022871654480696,0.00025,0.0,0.00025,0.00025,0.016310083,0.0043867540000000005,0.027778333,0.007568861999999999,0.046633485999999995,0.052421506,0.14200787,-0.033771105
|
||||
20,925.0,0.0,4758.0,4758.0,264.0,4758.0,0.9966691000001096,6.0,75.0,0.0,,,,0.0030004231411462213,0.0014101580596944704,0.007745119743049146,0.000437128881458193,0.00025,0.0,0.00025,0.00025,0.018002652,0.0047670375,0.030942027999999996,0.009946148,0.056299467,0.06465223,0.2402926,-0.024710407
|
||||
21,952.0,0.0,4866.0,4866.0,108.0,4866.0,0.9965719000001128,0.0,0.0,0.0,,,,0.0030828455604093442,0.001222012049279153,0.005216440185904503,0.0004437630705069751,0.00025,0.0,0.00025,0.00025,0.01797254,0.004588888,0.029642342000000002,0.011304895,,,,
|
||||
22,989.0,0.0,5012.0,5012.0,146.0,5012.0,0.9964405000001172,2.0,45.0,0.0,,,,0.002605638285684917,0.0011707703827911154,0.005040653981268406,0.00027624226640909905,0.00025,0.0,0.00025,0.00025,0.014817067,0.0034752183,0.023371994,0.00671804,,,,
|
||||
23,1130.0,0.0,5575.0,5575.0,563.0,5575.0,0.995933800000134,9.0,305.0,0.0,,,,0.002375550828799804,0.0011445915311848994,0.005559086799621582,0.00019633854390122,0.00025,0.0,0.00025,0.00025,0.014003215,0.003680551,0.026976977000000003,0.0064814542,0.058442097,0.038910393,0.12662977,-0.038043927000000005
|
||||
24,1161.0,0.0,5702.0,5702.0,127.0,5702.0,0.9958195000001376,3.0,75.0,0.0,,,,0.002494539588599676,0.0010564055929805105,0.005466931965202093,0.0005216930294409393,0.0002500000000000001,5.421010862427521e-20,0.00025,0.00025,0.014305183,0.0035644062,0.02292288,0.008908606,,,,
|
||||
25,1228.0,0.0,5970.0,5970.0,268.0,5970.0,0.9955783000001456,0.0,0.0,0.0,,,,0.0021856559421091033,0.0011062408831445708,0.005686123855412006,0.0002359695208724588,0.00025,0.0,0.00025,0.00025,0.013199517,0.0036920388,0.024785466000000003,0.006574779300000001,,,,
|
||||
|
||||
|
Reference in New Issue
Block a user