mirror of
https://github.com/gryf/coach.git
synced 2026-04-18 05:13:32 +02:00
Itaicaspi/episode reset refactoring (#105)
* reordering of the episode reset operation and allowing to store episodes only when they are terminated * reordering of the episode reset operation and allowing to store episodes only when they are terminated * revert tensorflow-gpu to 1.9.0 + bug fix in should_train() * tests readme file and refactoring of policy optimization agent train function * Update README.md * Update README.md * additional policy optimization train function simplifications * Updated the traces after the reordering of the environment reset * docker and jenkins files * updated the traces to the ones from within the docker container * updated traces and added control suite to the docker * updated jenkins file with the intel proxy + updated doom basic a3c test params * updated line breaks in jenkins file * added a missing line break in jenkins file * refining trace tests ignored presets + adding a configurable beta entropy value * switch the order of trace and golden tests in jenkins + fix golden tests processes not killed issue * updated benchmarks for dueling ddqn breakout and pong * allowing dynamic updates to the loss weights + bug fix in episode.update_returns * remove docker and jenkins file
This commit is contained in:
@@ -3,29 +3,24 @@ Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,To
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,51.0,0.0,1259.0,1259.0,202.0,1259.0,0.9998000200000045,3.0,35.0,0.0,,,,0.0034466183491281745,0.003340898543875149,0.01218117494136095,2.661944745341316e-05,6.25e-05,0.0,6.25e-05,6.25e-05,0.011219176,0.007470515600000001,0.02738716,0.0017668923,,,,
|
||||
6,81.0,0.0,1382.0,1382.0,123.0,1382.0,0.9996782500000072,4.0,55.0,0.0,,,,0.011165372235700487,0.004458774445701718,0.021819429472088814,0.005195816047489643,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.027822528,0.007687265,0.04223389599999999,0.016463846,,,,
|
||||
7,152.0,0.0,1665.0,1665.0,283.0,1665.0,0.9993980800000132,2.0,45.0,0.0,,,,0.00623855225964856,0.0030330486680636712,0.013224589638412,0.0007156636565923692,6.25e-05,0.0,6.25e-05,6.25e-05,0.018865645,0.005285673,0.033977974,0.010334366999999999,,,,
|
||||
8,208.0,0.0,1887.0,1887.0,222.0,1887.0,0.9991783000000178,1.0,20.0,0.0,,,,0.0038385935840778975,0.0021158033238458662,0.00906903576105833,0.0003513850388117134,6.25e-05,0.0,6.25e-05,6.25e-05,0.013778427,0.0030470558,0.021373875,0.008706516,,,,
|
||||
9,220.0,0.0,1938.0,1938.0,51.0,1938.0,0.9991278100000188,0.0,0.0,0.0,,,,0.003801035270347105,0.0018785112794797772,0.006776161491870879,0.0003781157138291746,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.012194245,0.0018602667000000002,0.01696095,0.01006682,,,,
|
||||
10,269.0,0.0,2131.0,2131.0,193.0,2131.0,0.9989367400000232,1.0,5.0,0.0,,,,0.003452837460066135,0.0021161494549021354,0.010810058563947678,0.0002755867608357221,6.25e-05,0.0,6.25e-05,6.25e-05,0.012883931999999999,0.0038414826,0.026179705,0.007717976999999999,,,,
|
||||
11,363.0,0.0,2509.0,2509.0,378.0,2509.0,0.9985625200000312,8.0,105.0,0.0,,,,0.0038385342929185312,0.002197450802281801,0.013560933992266657,0.000329795788275078,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.013579085,0.0045603695000000005,0.035137113,0.0076442054,0.060884252,0.008807714,0.07398923,0.044078137999999996
|
||||
12,403.0,0.0,2667.0,2667.0,158.0,2667.0,0.9984061000000346,1.0,20.0,0.0,,,,0.0039893238288641435,0.0021892620525771848,0.009860016405582428,0.0002942612045444548,6.25e-05,0.0,6.25e-05,6.25e-05,0.013888638,0.0039621494,0.028397342000000002,0.008886355,,,,
|
||||
13,424.0,0.0,2753.0,2753.0,86.0,2753.0,0.9983209600000365,1.0,25.0,0.0,,,,0.003456612211829495,0.0020587698243105523,0.008297181688249111,0.00038015557220205675,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.012752383999999999,0.0027827478,0.020799935,0.009112617,,,,
|
||||
14,487.0,0.0,3003.0,3003.0,250.0,3003.0,0.9980734600000418,4.0,35.0,0.0,,,,0.0035351967242258117,0.0021189242929216105,0.009568667039275171,0.00023944152053445575,6.25e-05,0.0,6.25e-05,6.25e-05,0.013402411000000001,0.0034090402000000004,0.022448676,0.008539663000000001,,,,
|
||||
15,559.0,0.0,3292.0,3292.0,289.0,3292.0,0.997787350000048,3.0,45.0,0.0,,,,0.0035738618094506404,0.0020785595659065575,0.009401696734130384,0.0003029023064300418,6.25e-05,0.0,6.25e-05,6.25e-05,0.013828838999999999,0.004127528,0.024494877,0.008980279,,,,
|
||||
16,591.0,0.0,3421.0,3421.0,129.0,3421.0,0.9976596400000508,1.0,20.0,0.0,,,,0.002270541154302918,0.0013220278591834814,0.005336767993867397,0.00015750376041978598,6.25e-05,0.0,6.25e-05,6.25e-05,0.008640400999999999,0.0027808861,0.015539816000000001,0.0048837294,,,,
|
||||
17,641.0,0.0,3619.0,3619.0,198.0,3619.0,0.9974636200000552,4.0,50.0,0.0,,,,0.0023200249412911947,0.001272970510092554,0.005772919394075871,0.00016006443183869123,6.25e-05,0.0,6.25e-05,6.25e-05,0.008547546999999999,0.0024141644,0.014635223999999999,0.00513471,,,,
|
||||
18,659.0,0.0,3694.0,3694.0,75.0,3694.0,0.9973893700000568,2.0,15.0,0.0,,,,0.00222514630392349,0.0012230397213823035,0.0049801948480308065,0.00019548021373339,6.25e-05,0.0,6.25e-05,6.25e-05,0.008170923,0.0017159204,0.012074826,0.0055588847,,,,
|
||||
19,676.0,0.0,3761.0,3761.0,67.0,3761.0,0.997323040000058,0.0,0.0,0.0,,,,0.002457476888701101,0.001416694384168644,0.004826911259442568,0.00020686438074335456,6.25e-05,0.0,6.25e-05,6.25e-05,0.009877314,0.0036330753999999996,0.016690083,0.0060720159999999995,,,,
|
||||
20,760.0,0.0,4098.0,4098.0,337.0,4098.0,0.9969894100000654,5.0,75.0,0.0,,,,0.0024319054032925385,0.0013263558155535164,0.005569641478359699,0.00018588016973808408,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.009379297,0.0030807509999999996,0.019846683,0.0054414636,0.04652569,0.016040854,0.06404913,0.015960556
|
||||
21,791.0,0.0,4222.0,4222.0,124.0,4222.0,0.9968666500000679,1.0,30.0,0.0,,,,0.0021794731803839247,0.0011718290688936287,0.005569073371589185,0.0001716011029202491,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.00873512,0.0021913913,0.016666776,0.0058183987,,,,
|
||||
22,812.0,0.0,4304.0,4304.0,82.0,4304.0,0.9967854700000698,1.0,5.0,0.0,,,,0.0019065574230071867,0.0011469396393949038,0.003925406374037266,0.00020020424562972042,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.008078746500000001,0.0020175315,0.012820823,0.006058481,,,,
|
||||
23,858.0,0.0,4488.0,4488.0,184.0,4488.0,0.9966033100000736,3.0,40.0,0.0,,,,0.00237545639222093,0.0014159762842297016,0.0052749416790902615,0.00012829533079639077,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.009339779,0.0036552486,0.02111213,0.0047810297,0.058359805,0.02419141,0.09481566,0.03411417
|
||||
24,877.0,0.0,4563.0,4563.0,75.0,4563.0,0.9965290600000754,2.0,35.0,0.0,,,,0.0018037814221124313,0.000942041831796274,0.0039741676300764075,0.00020381834474392235,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.007797141600000001,0.0016731704999999998,0.012402746000000001,0.0055578630000000006,0.069268644,0.030192586,0.1046643,0.008713403
|
||||
25,903.0,0.0,4669.0,4669.0,106.0,4669.0,0.9964241200000776,0.0,0.0,0.0,,,,0.0022410110227960665,0.0010767211744821578,0.0042915213853120795,0.0001786778011592105,6.25e-05,0.0,6.25e-05,6.25e-05,0.008801429,0.0023838158,0.014880427,0.005826161,,,,
|
||||
26,949.0,0.0,4853.0,4853.0,184.0,4853.0,0.9962419600000816,0.0,0.0,0.0,,,,0.0024887697854074245,0.0014360504525598654,0.00585534330457449,0.00016110201249830425,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.009557521,0.0031522116999999996,0.01680403,0.005234984,0.053540934000000005,0.0246497,0.09204285599999999,0.013581572
|
||||
27,966.0,0.0,4920.0,4920.0,67.0,4920.0,0.996175630000083,1.0,5.0,0.0,,,,0.002170577046105309,0.0011411493600190698,0.00466995220631361,0.0002499166294001043,6.25e-05,0.0,6.25e-05,6.25e-05,0.008650793,0.0019061747,0.012208687,0.005993179,,,,
|
||||
28,1047.0,0.0,5245.0,5245.0,325.0,5245.0,0.99585388000009,4.0,40.0,0.0,,,,0.0024006758916427463,0.0012690461042417142,0.005421573296189308,0.0001969042932614684,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.009089955,0.0023783583,0.015432458000000001,0.0056008375,0.058892712,0.021359037999999997,0.10233389,0.030309968
|
||||
29,1096.0,0.0,5442.0,5442.0,197.0,5442.0,0.9956588500000942,0.0,0.0,0.0,,,,0.0019011555625035484,0.0011534560731979529,0.005133558064699173,0.00018047218327410516,6.25e-05,0.0,6.25e-05,6.25e-05,0.008425966,0.002764765,0.017151356,0.0056821685,0.06334073,0.02206539,0.102514274,0.027491631000000002
|
||||
30,1222.0,0.0,5946.0,5946.0,504.0,5946.0,0.9951598900001052,10.0,155.0,0.0,,,,0.002289209580339957,0.001271651628931315,0.006031029857695103,0.0001688292104518041,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.008890314,0.0025685276,0.01631673,0.004984512,0.04618715,0.025464163999999997,0.0957826,-0.0035402263
|
||||
5,63.0,0.0,1310.0,1310.0,253.0,1310.0,0.9997495300000054,4.0,50.0,0.0,,,,0.007803874562153987,0.008763884069155965,0.04718368873000145,2.0029816369060427e-05,6.25e-05,0.0,6.25e-05,6.25e-05,0.021732036,0.022223754,0.1446681,0.0012787414999999999,,,,
|
||||
6,191.0,0.0,1821.0,1821.0,511.0,1821.0,0.9992436400000164,12.0,185.0,0.0,,,,0.0076840334204318905,0.00407478669790096,0.020887335762381557,0.0006209309794940053,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.024990046000000002,0.007374348,0.05583174,0.01457165,,,,
|
||||
7,296.0,0.0,2240.0,2240.0,419.0,2240.0,0.9988288300000254,5.0,100.0,0.0,,,,0.006064200656865503,0.0026079780747149924,0.013106426224112509,0.0005442567635327578,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.022204678999999998,0.0051587676,0.03801172,0.01337866,0.04552897400000001,0.014450824,0.06804762,0.022983871
|
||||
8,339.0,0.0,2414.0,2414.0,174.0,2414.0,0.9986565700000292,1.0,5.0,0.0,,,,0.0056167520910263245,0.003348133333552833,0.01847168803215027,0.0006152484565973282,6.25e-05,0.0,6.25e-05,6.25e-05,0.022583058,0.006212645699999999,0.04925069,0.014691319,0.117131494,0.075825356,0.25262827,0.034186434
|
||||
9,368.0,0.0,2529.0,2529.0,115.0,2529.0,0.9985427200000316,3.0,30.0,0.0,,,,0.00567412653721736,0.0029112874704095106,0.012542505748569964,0.0006649551214650272,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.02317206,0.005647781,0.034866843,0.014415748999999999,,,,
|
||||
10,411.0,0.0,2702.0,2702.0,173.0,2702.0,0.9983714500000354,3.0,75.0,0.0,,,,0.005447928440421386,0.0027157055388668696,0.011556550860404968,0.0005230194656178355,6.25e-05,0.0,6.25e-05,6.25e-05,0.022507405,0.0063080876,0.04279238,0.014129612,,,,
|
||||
11,465.0,0.0,2915.0,2915.0,213.0,2915.0,0.99816058000004,3.0,20.0,0.0,,,,0.006813380568516704,0.002953363187898618,0.018070373684167862,0.0024055785033851858,6.25e-05,0.0,6.25e-05,6.25e-05,0.024714846000000002,0.0069003645,0.053911198,0.013334683,,,,
|
||||
12,510.0,0.0,3097.0,3097.0,182.0,3097.0,0.9979804000000438,4.0,60.0,0.0,,,,0.0057438461899033035,0.0028426672841737203,0.013382650911808014,0.0006364500150084497,6.25e-05,0.0,6.25e-05,6.25e-05,0.023799596,0.0060355333,0.047333322000000004,0.012709315,,,,
|
||||
13,550.0,0.0,3258.0,3258.0,161.0,3258.0,0.9978210100000472,3.0,75.0,0.0,,,,0.0061742550285998725,0.002734396119005929,0.011426813900470734,0.0025493670254945755,6.25e-05,0.0,6.25e-05,6.25e-05,0.024373332,0.0076977109999999994,0.054041553,0.015785009,,,,
|
||||
14,594.0,0.0,3433.0,3433.0,175.0,3433.0,0.9976477600000512,4.0,50.0,0.0,,,,0.0054328095094777285,0.0027096778707884584,0.01172078587114811,0.0007941549411043526,6.25e-05,0.0,6.25e-05,6.25e-05,0.023894975,0.0066084154,0.04917719,0.01552412,,,,
|
||||
15,630.0,0.0,3578.0,3578.0,145.0,3578.0,0.9975042100000542,2.0,25.0,0.0,,,,0.005161296885085499,0.002379623212789025,0.011234099976718426,0.000592207710724324,6.25e-05,0.0,6.25e-05,6.25e-05,0.022190819,0.0047294693,0.033406414,0.014175736999999999,,,,
|
||||
16,675.0,0.0,3756.0,3756.0,178.0,3756.0,0.997327990000058,0.0,0.0,0.0,,,,0.005717846387679772,0.002502733532058393,0.011211811564862728,0.0006601698696613313,6.25e-05,0.0,6.25e-05,6.25e-05,0.025067486,0.006331243,0.04131097,0.016266715,,,,
|
||||
17,779.0,0.0,4171.0,4171.0,415.0,4171.0,0.9969171400000668,6.0,80.0,0.0,,,,0.004081658166307114,0.0020001996419927288,0.009709015488624571,0.0003917928552255034,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.018329315,0.0046630735,0.031186484,0.008738925,0.022281086000000002,0.02669226,0.06086207,-0.0070810173999999995
|
||||
18,802.0,0.0,4265.0,4265.0,94.0,4265.0,0.9968240800000692,1.0,30.0,0.0,,,,0.003856045330631668,0.002170383825603264,0.007952725514769554,0.0005409078439697623,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.018558994,0.0060107456999999994,0.033156354,0.012791273999999998,,,,
|
||||
19,859.0,0.0,4494.0,4494.0,229.0,4494.0,0.996597370000074,5.0,100.0,0.0,,,,0.003978008200647309,0.0016841297405167286,0.008312854915857315,0.0003705012204591185,6.25e-05,0.0,6.25e-05,6.25e-05,0.018162485,0.0049022716,0.03275322,0.010325382,0.035759527,0.035056762000000005,0.08535823,-0.008915286
|
||||
20,925.0,0.0,4758.0,4758.0,264.0,4758.0,0.9963360100000797,6.0,75.0,0.0,,,,0.002300493763714957,0.0010825562309593726,0.0046387091279029855,0.0002016235230257735,6.25e-05,0.0,6.25e-05,6.25e-05,0.010100276,0.0024906192,0.01585796,0.0059240386,0.048761707,0.05004603,0.15401264,-0.0024325964
|
||||
21,952.0,0.0,4866.0,4866.0,108.0,4866.0,0.996229090000082,0.0,0.0,0.0,,,,0.002475268014957412,0.0012914969110412403,0.00562380813062191,0.0003233719035051763,6.25e-05,0.0,6.25e-05,6.25e-05,0.01129343,0.0028471393,0.01932526,0.007399376500000001,,,,
|
||||
22,989.0,0.0,5012.0,5012.0,146.0,5012.0,0.9960845500000849,2.0,45.0,0.0,,,,0.002166505141455369,0.000924038288373833,0.004925021436065435,0.00027738657081499696,6.25e-05,0.0,6.25e-05,6.25e-05,0.010186652,0.0026935977,0.019467099999999998,0.007402484,,,,
|
||||
23,1033.0,0.0,5187.0,5187.0,175.0,5187.0,0.9959113000000888,0.0,0.0,0.0,,,,0.0021631214036791453,0.0010276500026280158,0.004965011961758137,0.00023919624800328165,6.25e-05,0.0,6.25e-05,6.25e-05,0.009726720999999999,0.0021573787,0.01670704,0.006440047,0.13069957,0.037176996000000004,0.19228284,0.08094616
|
||||
24,1089.0,0.0,5412.0,5412.0,225.0,5412.0,0.9956885500000936,3.0,30.0,0.0,,,,0.002553392111232305,0.0011096866629888736,0.005850483663380146,0.0003285239799879492,6.25e-05,0.0,6.25e-05,6.25e-05,0.011104784,0.002389212,0.017829941999999998,0.00757342,0.0682852,0.061801534000000005,0.18812282,-0.006229040999999999
|
||||
25,1136.0,0.0,5602.0,5602.0,190.0,5602.0,0.9955004500000976,2.0,45.0,0.0,,,,0.001876247199648555,0.0011046318131782585,0.004761672578752041,0.00023924620472826064,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.009521739,0.002407699,0.016262773,0.005831246700000001,0.035645377,0.06185295,0.17193483,-0.037299167
|
||||
|
||||
|
Reference in New Issue
Block a user