mirror of
https://github.com/gryf/coach.git
synced 2026-04-03 10:43:33 +02:00
Itaicaspi/episode reset refactoring (#105)
* reordering of the episode reset operation and allowing to store episodes only when they are terminated * reordering of the episode reset operation and allowing to store episodes only when they are terminated * revert tensorflow-gpu to 1.9.0 + bug fix in should_train() * tests readme file and refactoring of policy optimization agent train function * Update README.md * Update README.md * additional policy optimization train function simplifications * Updated the traces after the reordering of the environment reset * docker and jenkins files * updated the traces to the ones from within the docker container * updated traces and added control suite to the docker * updated jenkins file with the intel proxy + updated doom basic a3c test params * updated line breaks in jenkins file * added a missing line break in jenkins file * refining trace tests ignored presets + adding a configurable beta entropy value * switch the order of trace and golden tests in jenkins + fix golden tests processes not killed issue * updated benchmarks for dueling ddqn breakout and pong * allowing dynamic updates to the loss weights + bug fix in episode.update_returns * remove docker and jenkins file
This commit is contained in:
@@ -3,29 +3,24 @@ Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,To
|
||||
2,0.0,1.0,573.0,573.0,87.0,573.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
3,0.0,1.0,722.0,722.0,149.0,722.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
4,0.0,1.0,1057.0,1057.0,335.0,1057.0,1.0,,,0.0,,,,,,,,,,,,,,,,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,3.0,30.0,0.0,,,,30.53859548708972,44.314682007982455,150.4903564453125,0.16912639141082764,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,6.791042,6.4495187000000005,23.662077,1.2995651000000001,,,,
|
||||
6,116.0,0.0,1519.0,1519.0,259.0,1519.0,0.99954262000001,3.0,30.0,0.0,,,,31.40286669318493,36.255547758346076,148.12547302246094,0.1828265339136124,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,8.923345,6.8456674,31.171175,1.5896469,,,,
|
||||
7,154.0,0.0,1673.0,1673.0,154.0,1673.0,0.9993901600000132,0.0,0.0,0.0,,,,22.276954246194734,26.822031462503034,98.48810577392578,0.2816051840782165,4.999999999999999e-05,1.3552527156068802e-20,5e-05,5e-05,9.235014,4.645149,21.968481,3.4494073,,,,
|
||||
8,188.0,0.0,1809.0,1809.0,136.0,1809.0,0.9992555200000162,0.0,0.0,0.0,,,,19.016328675781978,31.38710695896604,98.0995101928711,0.2720474898815155,5e-05,6.776263578034403e-21,5e-05,5e-05,8.611777,7.304164,30.532827,3.280274,,,,
|
||||
9,218.0,0.0,1927.0,1927.0,118.0,1927.0,0.9991387000000188,4.0,50.0,0.0,,,,18.11380697687467,29.29193975183291,97.48050689697266,0.2490096986293793,4.999999999999999e-05,1.3552527156068802e-20,5e-05,5e-05,9.569202,8.223543,34.718906,2.933268,,,,
|
||||
10,239.0,0.0,2013.0,2013.0,86.0,2013.0,0.9990535600000204,1.0,25.0,0.0,,,,23.42363277503423,38.412630669473316,145.73297119140625,0.36567768454551697,5e-05,6.776263578034403e-21,5e-05,5e-05,12.172969,9.590582000000001,44.762127,5.082082700000001,,,,
|
||||
11,285.0,0.0,2197.0,2197.0,184.0,2197.0,0.9988714000000244,5.0,75.0,0.0,,,,16.187956988163613,30.38507923781825,145.3076934814453,0.281042754650116,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,9.950823,8.131824,45.485153000000004,3.1171607999999997,,,,
|
||||
12,309.0,0.0,2293.0,2293.0,96.0,2293.0,0.9987763600000266,2.0,15.0,0.0,,,,16.55143442377448,26.695402296011764,95.4090576171875,0.2967992722988129,5e-05,0.0,5e-05,5e-05,9.013406,8.831133,46.1924,3.6614769,,,,
|
||||
13,353.0,0.0,2467.0,2467.0,174.0,2467.0,0.9986041000000304,2.0,35.0,0.0,,,,14.740310977467082,24.52772692149401,97.43923950195312,0.23097966611385345,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,8.150308,6.594815700000001,31.787717999999998,2.299897,,,,
|
||||
14,400.0,0.0,2658.0,2658.0,191.0,2658.0,0.9984150100000344,1.0,25.0,0.0,,,,32.32692400191693,34.86153399624781,98.53972625732422,0.29887062311172485,5.0000000000000016e-05,2.0328790734103208e-20,5e-05,5e-05,15.370679999999998,9.051497,42.453285,3.6067166,0.02061364021675521,0.0067769050257598246,0.0303798052680213,0.009173157039294895
|
||||
15,420.0,0.0,2737.0,2737.0,79.0,2737.0,0.998336800000036,3.0,30.0,0.0,,,,28.536019751429556,30.448869863836503,93.33609008789062,0.7488499283790588,5e-05,0.0,5e-05,5e-05,22.326626,14.370629999999998,68.70875,11.235919,,,,
|
||||
16,441.0,0.0,2822.0,2822.0,85.0,2822.0,0.998252650000038,1.0,20.0,0.0,,,,36.1884659301667,31.21200822910139,94.37825775146484,1.1034283638000488,5e-05,6.776263578034403e-21,5e-05,5e-05,27.31245,18.221214,95.95713,16.466019,,,,
|
||||
17,497.0,0.0,3045.0,3045.0,223.0,3045.0,0.9980318800000428,2.0,30.0,0.0,,,,26.486526499901494,34.31913812205679,133.34033203125,0.8666461110115051,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,25.985167999999998,15.976610999999998,108.36258000000001,12.003894,0.02852728419992369,0.012236517428302918,0.04643445217803673,0.006784821223118342
|
||||
18,519.0,0.0,3133.0,3133.0,88.0,3133.0,0.9979447600000446,1.0,10.0,0.0,,,,24.17923441258344,26.460502373684182,91.19527435302734,1.1007275581359863,5e-05,6.776263578034403e-21,5e-05,5e-05,25.493132,9.448856,61.914528000000004,15.315972,,,,
|
||||
19,586.0,0.0,3399.0,3399.0,266.0,3399.0,0.9976814200000504,1.0,15.0,0.0,,,,19.367093969636887,30.53654667888193,138.79338073730472,0.5301144719123839,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,21.118656,17.394904999999998,100.10899,6.504474,,,,
|
||||
20,644.0,0.0,3631.0,3631.0,232.0,3631.0,0.9974517400000552,3.0,30.0,0.0,,,,25.538421301492328,31.2238672301977,95.78995513916016,0.4987463653087616,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,22.084887,15.076464999999999,68.79476,6.562572500000001,0.011964818493931188,0.003264027026202129,0.01488947989215376,0.005563916421342583
|
||||
21,691.0,0.0,3822.0,3822.0,191.0,3822.0,0.9972626500000594,1.0,5.0,0.0,,,,20.623328632496765,33.08831889922991,171.38589477539062,0.7546992301940918,5.0000000000000016e-05,2.0328790734103208e-20,5e-05,5e-05,26.541094,28.174709999999997,178.12593,10.046588,0.016623225918119714,0.008017604386992635,0.031264341372298075,0.005206719253328628
|
||||
22,763.0,0.0,4110.0,4110.0,288.0,4110.0,0.9969775300000656,5.0,100.0,0.0,,,,20.81435759945048,30.01146336976207,135.20793151855472,0.9363594651222228,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,27.0196,18.976485999999998,94.14133000000001,12.538364,0.021093616302338584,0.008422554661489449,0.029779689924325795,0.004451211805862841
|
||||
23,809.0,0.0,4291.0,4291.0,181.0,4291.0,0.9967983400000696,2.0,15.0,0.0,,,,21.38968964504159,34.311319777525604,183.166259765625,0.9679770469665528,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,30.949451,19.032299,116.2259,11.671700999999999,,,,
|
||||
24,832.0,0.0,4384.0,4384.0,93.0,4384.0,0.9967062700000716,2.0,15.0,0.0,,,,28.32993198477704,28.347670124431954,91.72865295410156,0.9682503938674928,4.999999999999999e-05,1.3552527156068802e-20,5e-05,5e-05,30.348809999999997,16.9566,86.52797,12.740698,,,,
|
||||
25,896.0,0.0,4639.0,4639.0,255.0,4639.0,0.996453820000077,3.0,50.0,0.0,,,,18.012998558580875,24.52147417904464,87.72151947021484,0.6401084065437317,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,27.058616999999998,18.284755999999998,101.61511999999999,8.696746000000001,0.020656253984173718,0.010331667719415127,0.0396795524546178,0.01031893009421765
|
||||
26,947.0,0.0,4846.0,4846.0,207.0,4846.0,0.9962488900000814,1.0,25.0,0.0,,,,14.372732569189631,22.762665065523,95.37085723876952,0.6254499554634094,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,19.155935,11.796223,53.041355,8.059999000000001,,,,
|
||||
27,963.0,0.0,4909.0,4909.0,63.0,4909.0,0.9961865200000828,2.0,15.0,0.0,,,,28.088446207344532,33.130785671948516,85.42578887939453,0.6590879559516907,5e-05,0.0,5e-05,5e-05,33.122856,31.809953999999998,107.821754,8.504436,,,,
|
||||
28,982.0,0.0,4985.0,4985.0,76.0,4985.0,0.9961112800000844,0.0,0.0,0.0,,,,20.659159697984396,24.893216005275328,89.03260803222656,1.0471786260604858,5e-05,0.0,5e-05,5e-05,33.272964,22.24945,102.92742,13.571832,,,,
|
||||
29,1048.0,0.0,5248.0,5248.0,263.0,5248.0,0.99585091000009,3.0,30.0,0.0,,,,15.208325591954319,24.90270362840188,125.36002349853516,0.6677142381668091,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,25.047573,18.866804000000002,122.81957,7.389894,0.007710378308947837,0.0065074938611493095,0.018967705124814528,-0.0025220525433542213
|
||||
30,1117.0,0.0,5526.0,5526.0,278.0,5526.0,0.9955756900000959,3.0,75.0,0.0,,,,19.523073547992155,24.76386978059245,94.19256591796876,0.43752905726432795,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,27.299099,20.852268,93.84137,4.555567,,,,
|
||||
5,51.0,0.0,1260.0,1260.0,203.0,1260.0,0.9997990300000044,5.0,55.0,0.0,,,,36.40264579741394,49.44809691530482,198.9517517089844,0.1989624798297882,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,7.8067063999999995,7.391117599999999,36.182125,1.4651048,,,,
|
||||
6,70.0,0.0,1335.0,1335.0,75.0,1335.0,0.999724780000006,2.0,15.0,0.0,,,,39.23580433663569,41.016771031064785,99.57048797607422,0.261367529630661,5e-05,0.0,5e-05,5e-05,10.85398,7.770962700000001,26.800815999999998,2.6992220000000002,,,,
|
||||
7,91.0,0.0,1422.0,1422.0,87.0,1422.0,0.9996386500000078,1.0,15.0,0.0,,,,38.0207036946501,47.816324507097775,148.4340362548828,0.3246855139732361,5e-05,6.776263578034403e-21,5e-05,5e-05,11.630027,8.391272,40.402522999999995,4.429657499999999,,,,
|
||||
8,159.0,0.0,1693.0,1693.0,271.0,1693.0,0.9993703600000136,5.0,55.0,0.0,,,,28.948033251869145,36.08735969022815,148.06871032714844,0.3664446473121643,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,11.167119999999999,6.748284,31.783441999999997,4.7481833,,,,
|
||||
9,201.0,0.0,1861.0,1861.0,168.0,1861.0,0.9992040400000172,3.0,50.0,0.0,,,,18.986573637950986,31.753488181878904,146.00331115722656,0.3643231987953186,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,9.701611999999999,7.381705,43.52698,4.8068805,,,,
|
||||
10,279.0,0.0,2172.0,2172.0,311.0,2172.0,0.998896150000024,4.0,65.0,0.0,,,,32.03847728096522,41.925721917185676,194.55128479003903,0.2954877316951752,5.0000000000000016e-05,2.0328790734103208e-20,5e-05,5e-05,18.140017999999998,13.331147,86.43568,3.4344087,,,,
|
||||
11,440.0,0.0,2815.0,2815.0,643.0,2815.0,0.9982595800000378,10.0,335.0,0.0,,,,28.069273558832844,34.57541787899187,143.40928649902344,0.4890246391296386,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,21.02929,14.073232,105.471725,7.160336,0.016182939943779884,0.00317882025612132,0.020630363033269532,0.012337473193183542
|
||||
12,458.0,0.0,2888.0,2888.0,73.0,2888.0,0.9981873100000394,2.0,45.0,0.0,,,,30.90841283400853,36.51044361360722,138.05393981933594,1.1750518083572388,5e-05,0.0,5e-05,5e-05,34.070717,18.229351,87.29681,17.943182,,,,
|
||||
13,478.0,0.0,2969.0,2969.0,81.0,2969.0,0.9981071200000412,0.0,0.0,0.0,,,,21.819078975915904,26.667606415139126,94.14669799804688,1.2481423616409302,5e-05,0.0,5e-05,5e-05,29.088186,7.6060133,48.72128,18.927726999999997,0.017232515091842898,0.004842224507737858,0.023045246455294547,0.011178828286356295
|
||||
14,532.0,0.0,3183.0,3183.0,214.0,3183.0,0.9978952600000456,4.0,50.0,0.0,,,,22.003884507550136,31.01379918463093,93.17678833007812,0.7777568697929382,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,25.917735999999998,17.056901999999997,82.94768499999999,11.922298,,,,
|
||||
15,551.0,0.0,3262.0,3262.0,79.0,3262.0,0.9978170500000474,2.0,15.0,0.0,,,,26.501989019544503,38.53608557260633,132.7838134765625,0.7758174538612366,5e-05,0.0,5e-05,5e-05,31.654518,29.090153000000004,115.05221999999999,12.105766000000001,,,,
|
||||
16,632.0,0.0,3584.0,3584.0,322.0,3584.0,0.9974982700000544,6.0,145.0,0.0,,,,26.855747359991074,31.176486537250174,123.03897094726562,0.973316729068756,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,36.815296000000004,22.30738,154.81078,14.858197,0.015187424104939663,0.005942733756463785,0.02293543783511268,0.008310022529549316
|
||||
17,671.0,0.0,3742.0,3742.0,158.0,3742.0,0.9973418500000576,2.0,15.0,0.0,,,,28.492036423622032,32.63528454234575,93.96733856201172,0.9652070403099059,4.999999999999999e-05,1.3552527156068802e-20,5e-05,5e-05,34.653465000000004,19.933933,92.079704,14.586936999999999,0.031495462678612966,0.008552723810986405,0.04882960178918439,0.021028505007270725
|
||||
18,692.0,0.0,3823.0,3823.0,81.0,3823.0,0.9972616600000594,2.0,15.0,0.0,,,,25.052144294977193,30.43845731410265,125.72972106933594,1.7888946533203125,5e-05,0.0,5e-05,5e-05,42.09162,22.177326,135.06197,26.311890000000002,,,,
|
||||
19,724.0,0.0,3954.0,3954.0,131.0,3954.0,0.9971319700000624,3.0,60.0,0.0,,,,22.733492869883776,25.48783858900171,85.9217758178711,1.1611932516098022,5e-05,0.0,5e-05,5e-05,36.707924,17.869907,97.16350600000001,17.332857,,,,
|
||||
20,892.0,0.0,4624.0,4624.0,670.0,4624.0,0.9964686700000768,10.0,120.0,0.0,,,,26.82198785878941,32.463568352909114,173.3283233642578,0.6274673938751221,5e-05,6.776263578034403e-21,5e-05,5e-05,40.43936,25.755894,179.22295,9.756477,0.03179729131830149,0.015935985961329873,0.06086315548294807,0.005561185698170447
|
||||
21,1039.0,0.0,5212.0,5212.0,588.0,5212.0,0.9958865500000892,7.0,305.0,0.0,,,,25.642627885957967,30.19485814602498,128.482666015625,0.874378502368927,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,38.308285,20.612198,146.47842,12.9673605,0.01867095795375159,0.00486977181278684,0.025539715652921586,0.011338672893034526
|
||||
22,1062.0,0.0,5306.0,5306.0,94.0,5306.0,0.9957934900000912,1.0,30.0,0.0,,,,27.773966304633927,35.56498822181043,128.78677368164062,0.7781664133071899,4.999999999999999e-05,1.3552527156068802e-20,5e-05,5e-05,37.376076,32.84612,134.23588999999998,10.897138,,,,
|
||||
23,1121.0,0.0,5540.0,5540.0,234.0,5540.0,0.9955618300000963,5.0,65.0,0.0,,,,27.48228641214041,31.674095369737838,117.5129852294922,1.5340145826339722,5.000000000000001e-05,6.776263578034403e-21,5e-05,5e-05,47.458725,30.501372999999997,172.14487,23.663988,,,,
|
||||
24,1159.0,0.0,5692.0,5692.0,152.0,5692.0,0.9954113500000996,0.0,0.0,0.0,,,,22.548715029892172,29.715242718167897,135.16885375976562,1.177747130393982,4.999999999999999e-05,1.3552527156068802e-20,5e-05,5e-05,37.85986,22.92256,141.62851,18.90979,,,,
|
||||
25,1211.0,0.0,5901.0,5901.0,209.0,5901.0,0.995204440000104,3.0,55.0,0.0,,,,20.993866240748996,25.480314720786012,95.07637786865234,0.8926278352737427,5.0000000000000016e-05,1.3552527156068802e-20,5e-05,5e-05,28.66507,14.327967000000001,80.878,13.025402,,,,
|
||||
|
||||
|
Reference in New Issue
Block a user