1
0
mirror of https://github.com/gryf/coach.git synced 2026-01-27 02:25:45 +01:00
Files
coach/rl_coach/traces/Doom_Battle_DFP/trace.csv
Itai Caspi 72a1d9d426 Itaicaspi/episode reset refactoring (#105)
* reordering of the episode reset operation and allowing to store episodes only when they are terminated

* reordering of the episode reset operation and allowing to store episodes only when they are terminated

* revert tensorflow-gpu to 1.9.0 + bug fix in should_train()

* tests readme file and refactoring of policy optimization agent train function

* Update README.md

* Update README.md

* additional policy optimization train function simplifications

* Updated the traces after the reordering of the environment reset

* docker and jenkins files

* updated the traces to the ones from within the docker container

* updated traces and added control suite to the docker

* updated jenkins file with the intel proxy + updated doom basic a3c test params

* updated line breaks in jenkins file

* added a missing line break in jenkins file

* refining trace tests ignored presets + adding a configurable beta entropy value

* switch the order of trace and golden tests in jenkins + fix golden tests processes not killed issue

* updated benchmarks for dueling ddqn breakout and pong

* allowing dynamic updates to the loss weights + bug fix in episode.update_returns

* remove docker and jenkins file
2018-09-04 15:07:54 +03:00

10 KiB

1Episode #Training IterIn HeatupER #TransitionsER #EpisodesEpisode LengthTotal stepsEpsilonShaped Training RewardTraining RewardUpdate Target NetworkEvaluation RewardShaped Evaluation RewardSuccess RateLoss/MeanLoss/StdevLoss/MaxLoss/MinLearning Rate/MeanLearning Rate/StdevLearning Rate/MaxLearning Rate/MinGrads (unclipped)/MeanGrads (unclipped)/StdevGrads (unclipped)/MaxGrads (unclipped)/Min
210.01.072.01.072.072.01.00.0
320.01.0152.02.080.0152.01.00.0
430.01.0258.03.0106.0258.01.00.0
540.01.0395.04.0137.0395.01.00.0
650.01.0482.05.087.0482.01.00.0
760.01.0619.06.0137.0619.01.00.0
870.01.0741.07.0122.0741.01.00.0
980.01.0854.08.0113.0854.01.00.0
1090.01.0990.09.0136.0990.01.00.0
11100.01.01156.010.0166.01156.01.00.0
121111.00.01244.011.088.01244.00.99999266666666561.01.00.01362870.1704545454202633.2858045881791029.3751155478.759.999999e-057.275958000000001e-120.00010.00019181.7044671.332516804.2152813.8562
131236.00.01441.012.0197.01441.00.99997624999999680.00.00.01268819.7825170348.80948817481559968.75883666.8750.00010.00.00010.000192217.9358346.1230842.8121415.611
141359.00.01625.013.0184.01625.00.99996091666666123.03.00.01097453.4375185885.354785648321374968.875690323.56250.0001000000057.275958000000001e-120.00010.0001450407.75199749.471067648.8161257.92
151473.00.01737.014.0112.01737.00.99995158333332661.01.00.0720170.776785714382766.57804747311925555.75584423.06259.999997999999999e-051.4551915e-110.00010.0001590398.1221381.361045701.94173675.36
161580.00.01791.015.054.01791.00.9999470833333260.00.00.0793692.9196428572183183.903419608131169408.625528233.00.00010.00.00010.0001528360.7289105.41114415.6242876.17
171690.00.01871.016.080.01871.00.99994041666665841.01.00.0694066.588371.25598764779864256.125549745.56259.999999e-057.275958000000001e-120.00010.0001818027.9296357.251396105.4287447.03
1817102.00.01967.017.096.01967.00.99993241666665720.00.00.0663839.973958333564899.01893068695784205.3125579032.43759.999997999999999e-051.4551915e-110.00010.0001462420.34251265.421030484.4147935.28
1918110.00.02032.018.065.02032.00.99992699999998981.01.00.0695984.304687584768.39021610889807562.3125547180.1250.00010.00.00010.0001430391.94207812.47813183.8207811.73
2019116.00.02085.019.053.02085.00.99992258333332240.00.00.0673908.104166666577784.40400788287775135.0553173.1250.00010.00.00010.0001442691.22271139.0958457.1166330.6
2120128.00.02180.020.095.02180.00.99991466666665482.02.00.0711864.028409090961660.675056842830183.75627056.31259.999999e-057.275958000000001e-120.00010.0001329869.97199046.1782139.25134099.55
2221134.00.02225.021.045.02225.00.99991091666665420.00.00.0756522.729166666588243.27123964629866818.375639968.43750.00010.00.00010.0001325175.53284253.2944805.195649.45
2322148.00.02337.022.0112.02337.00.99990158333331961.01.00.0753146.6071428572115219.81685904574973936.4375540484.18759.999997999999999e-051.4551915e-110.00010.0001352548.53180664.31817212.75144533.8
2423170.00.02514.023.0177.02514.00.99988683333331760.00.00.0749934.375127832.689414950921075921.25560355.18750.00010.00.00010.0001439716.4199622.05805644.394781.4
2524180.00.02597.024.083.02597.00.999879916666651.01.00.0681247.534375125400.85689817193912867.6875479958.8759.999999e-057.275958000000001e-120.00010.0001449936.8239054.84869260.4148829.58
2625197.00.02730.025.0133.02730.00.9998688333333150.00.00.0754226.9609375110542.87950780631983924.6875558276.250.00010.00.00010.0001394444.8215846.53802207.5685587.93
2726215.00.02877.026.0147.02877.00.99985658333331320.00.00.0719173.9565972221144825.754697965251032319.25475236.031259.999999e-057.275958000000001e-120.00010.0001388564.3249133.19877856.56109499.53
2827222.00.02928.027.051.02928.00.99985233333331280.00.00.0731635.703125157399.60955146723985211.8125485650.281250.00010.00.00010.0001301588.473236.35434868.34221974.97
2928234.00.03024.028.096.03024.00.99984433333331160.00.00.0673434.9453125111291.97425632774879607.4375452086.281259.999997999999999e-051.4551915e-110.00010.0001440101.47281616.66983453.884773.36
3029253.00.03181.029.0157.03181.00.99983124999997641.01.00.0744315.539473684386624.83914007386875519.125577295.259.999999e-057.275958000000001e-120.00010.0001458807.78282635.441082215.9131421.58
3130267.00.03286.030.0105.03286.00.99982249999997521.01.00.0717434.2548076924115258.97615360047923873.5625543786.43759.999997999999999e-051.4551915e-110.00010.0001428558.7207691.47811162.75130643.875
3231277.00.03366.031.080.03366.00.99981583333330760.00.00.0711374.312572415.09235334143849278.8125601717.3759.999999e-057.275958000000001e-120.00010.0001378304.38286992.251077769.167283.75
3332300.00.03550.032.0184.03550.00.9998004999999720.00.00.0698363.5326086957112767.16092423502921901.75502200.00.0001000000057.275958000000001e-120.00010.0001431487.66306761.941354223.584960.38
3433308.00.03620.033.070.03620.00.9997946666666380.00.00.0663993.60937587096.32117536859766391.0625544220.250.00010.00.00010.0001375039.7253182.45942774.498368.99
3534321.00.03718.034.098.03718.00.99978649999997022.02.00.0765584.3293269231128695.471347634541029789.8125470668.531259.999997999999999e-051.4551915e-110.00010.0001441566.94373265.661470760.287515.73
3635338.00.03859.035.0141.03859.00.99977474999996840.00.00.0716884.143382353131576.04973454161011837.1875506844.593750.00010.00.00010.0001373415.72231345.11874751.0113355.9
3736355.00.03995.036.0136.03995.00.99976341666663360.00.00.0721937.2352941177103882.59283400288882992.0625531336.250.00010.00.00010.0001382764.12213119.66774643.9499552.88
3837371.00.04119.037.0124.04119.00.99975308333329882.02.00.0725186.1640625100878.22357900153903022.8125549947.18750.00010.00.00010.0001344175.0232836.81010777.394721.695
3938385.00.04235.038.0116.04235.00.99974341666663080.00.00.0719966.3928571428107142.55067114241892775.0625559991.06259.999997999999999e-051.4551915e-110.00010.0001362664.7240388.1850150.897869.42
4039393.00.04294.039.059.04294.00.99973849999996341.01.00.0666581.04687559949.999658127774763241.4375564228.3750.00010.00.00010.0001358627.62161667.34674228.06161123.34
4140406.00.04404.040.0110.04404.00.99972933333329561.01.00.0709309.3269230769102515.23694020779971747.5625537066.09.999997999999999e-051.4551915e-110.00010.0001408076.66251145.9939021.3135196.75
4241419.00.04504.041.0100.04504.00.9997209999999610.00.00.0686281.701923076990042.421657481842031.3125527866.8759.999997999999999e-051.4551915e-110.00010.0001338762.03148208.45606126.9476600.88
4342429.00.04584.042.080.04584.00.99971433333329343.03.00.0694091.75625127169.415745779891005687.0532953.93759.999999e-057.275958000000001e-120.00010.0001329838.75252700.661017597.1130741.94
4443442.00.04689.043.0105.04689.00.99970558333329221.01.00.0732414.8461538461105516.87352287804938344.8125593771.43759.999997999999999e-051.4551915e-110.00010.0001484232.2309624.441061726.0131808.27
4544447.00.04726.044.037.04726.00.99970249999995840.00.00.0621613.6437588833.6735713408766784.0523614.593759.999999e-057.275958000000001e-120.00010.0001451280.84370993.25980591.9493973.31
4645459.00.04827.045.0101.04827.00.99969408333329061.01.00.0680325.48437572351.88512190571792630.5625526941.59.999997999999999e-051.4551915e-110.00010.0001378972.03195156.19840612.44107550.62
4746469.00.04905.046.078.04905.00.99968758333328963.03.00.0744519.77599203.81398693724880234.1875557504.81259.999999e-057.275958000000001e-120.00010.0001824161.1564658.562085172.5121570.23
4847495.00.05117.047.0212.05117.00.99966991666662041.01.00.0666839.3653846154118226.9086615851998517.9375479699.18750.00010.00.00010.0001460829.7307543.21244141.6121380.04
4948512.00.05246.048.0129.05246.00.9996591666666193.03.00.0724131.26171875104821.64083994547912557.0523902.93750.00010.00.00010.0001473582.8269440.06852397.5692651.44
5049523.00.05340.049.094.05340.00.99965133333328461.01.00.0677181.9005681818113756.40176243836792532.8125446570.093759.999999e-057.275958000000001e-120.00010.0001426151.6275540.97982115.75162091.97
5150541.00.05483.050.0143.05483.00.99963941666661640.00.00.0656404.232638888989892.79274772826839570.625455081.81259.999999e-057.275958000000001e-120.00010.0001372426.47180298.83759154.75102154.5
5251566.00.05679.051.0196.05679.00.99962308333328061.01.00.0684399.352571293.6438434751844978.75550241.93750.00010.00.00010.0001377658.4249473.561174649.4101264.086
5352577.00.05770.052.091.05770.00.99961549999994640.00.00.0734663.8295454546138708.0628225473971894.75556492.81259.999999e-057.275958000000001e-120.00010.0001495256.12317518.91112388.5122531.75
5453589.00.05862.053.092.05862.00.99960783333327840.00.00.0738314.2708333335104967.43094615475975733.9375635852.59.999997999999999e-051.4551915e-110.00010.0001430747.12268599.21025506.2580480.11
5554600.00.05952.054.090.05952.00.99960033333327761.01.00.0733725.8863636364120333.56674581894946715.4375519085.59.999999e-057.275958000000001e-120.00010.0001422559.28226174.39902062.06185472.72
5655620.00.06117.055.0165.06117.00.99958658333327552.02.00.0678218.7921875109486.55792635801881090.875486249.43759.999999e-057.275958000000001e-120.00010.0001367297.9191436.94823213.5687477.06