1
0
mirror of https://github.com/gryf/coach.git synced 2026-01-29 11:35:51 +01:00
Files
coach/rl_coach/traces/CartPole_DFP/trace.csv
Itai Caspi 72a1d9d426 Itaicaspi/episode reset refactoring (#105)
* reordering of the episode reset operation and allowing to store episodes only when they are terminated

* reordering of the episode reset operation and allowing to store episodes only when they are terminated

* revert tensorflow-gpu to 1.9.0 + bug fix in should_train()

* tests readme file and refactoring of policy optimization agent train function

* Update README.md

* Update README.md

* additional policy optimization train function simplifications

* Updated the traces after the reordering of the environment reset

* docker and jenkins files

* updated the traces to the ones from within the docker container

* updated traces and added control suite to the docker

* updated jenkins file with the intel proxy + updated doom basic a3c test params

* updated line breaks in jenkins file

* added a missing line break in jenkins file

* refining trace tests ignored presets + adding a configurable beta entropy value

* switch the order of trace and golden tests in jenkins + fix golden tests processes not killed issue

* updated benchmarks for dueling ddqn breakout and pong

* allowing dynamic updates to the loss weights + bug fix in episode.update_returns

* remove docker and jenkins file
2018-09-04 15:07:54 +03:00

92 lines
13 KiB
CSV

Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min
1,0.0,1.0,13.0,1.0,13.0,13.0,0.5,,,0.0,,,,,,,,,,,,,,,
2,0.0,1.0,29.0,2.0,16.0,29.0,0.5,,,0.0,,,,,,,,,,,,,,,
3,0.0,1.0,56.0,3.0,27.0,56.0,0.5,,,0.0,,,,,,,,,,,,,,,
4,0.0,1.0,67.0,4.0,11.0,67.0,0.5,,,0.0,,,,,,,,,,,,,,,
5,0.0,1.0,77.0,5.0,10.0,77.0,0.5,,,0.0,,,,,,,,,,,,,,,
6,0.0,1.0,94.0,6.0,17.0,94.0,0.5,,,0.0,,,,,,,,,,,,,,,
7,0.0,1.0,106.0,7.0,12.0,106.0,0.5,,,0.0,,,,,,,,,,,,,,,
8,0.0,1.0,121.0,8.0,15.0,121.0,0.5,,,0.0,,,,,,,,,,,,,,,
9,0.0,1.0,138.0,9.0,17.0,138.0,0.5,,,0.0,,,,,,,,,,,,,,,
10,0.0,1.0,172.0,10.0,34.0,172.0,0.5,,,0.0,,,,,,,,,,,,,,,
11,0.0,1.0,187.0,11.0,15.0,187.0,0.5,,,0.0,,,,,,,,,,,,,,,
12,0.0,1.0,201.0,12.0,14.0,201.0,0.5,,,0.0,,,,,,,,,,,,,,,
13,0.0,1.0,218.0,13.0,17.0,218.0,0.5,,,0.0,,,,,,,,,,,,,,,
14,0.0,1.0,235.0,14.0,17.0,235.0,0.5,,,0.0,,,,,,,,,,,,,,,
15,0.0,1.0,262.0,15.0,27.0,262.0,0.5,,,0.0,,,,,,,,,,,,,,,
16,0.0,1.0,279.0,16.0,17.0,279.0,0.5,,,0.0,,,,,,,,,,,,,,,
17,0.0,1.0,330.0,17.0,51.0,330.0,0.5,,,0.0,,,,,,,,,,,,,,,
18,0.0,1.0,350.0,18.0,20.0,350.0,0.5,,,0.0,,,,,,,,,,,,,,,
19,0.0,1.0,402.0,19.0,52.0,402.0,0.5,,,0.0,,,,,,,,,,,,,,,
20,0.0,1.0,411.0,20.0,9.0,411.0,0.5,,,0.0,,,,,,,,,,,,,,,
21,0.0,1.0,448.0,21.0,37.0,448.0,0.5,,,0.0,,,,,,,,,,,,,,,
22,0.0,1.0,462.0,22.0,14.0,462.0,0.5,,,0.0,,,,,,,,,,,,,,,
23,0.0,1.0,498.0,23.0,36.0,498.0,0.5,,,0.0,,,,,,,,,,,,,,,
24,0.0,1.0,510.0,24.0,12.0,510.0,0.5,,,0.0,,,,,,,,,,,,,,,
25,0.0,1.0,529.0,25.0,19.0,529.0,0.5,,,0.0,,,,,,,,,,,,,,,
26,0.0,1.0,554.0,26.0,25.0,554.0,0.5,,,0.0,,,,,,,,,,,,,,,
27,0.0,1.0,566.0,27.0,12.0,566.0,0.5,,,0.0,,,,,,,,,,,,,,,
28,0.0,1.0,618.0,28.0,52.0,618.0,0.5,,,0.0,,,,,,,,,,,,,,,
29,0.0,1.0,644.0,29.0,26.0,644.0,0.5,,,0.0,,,,,,,,,,,,,,,
30,0.0,1.0,660.0,30.0,16.0,660.0,0.5,,,0.0,,,,,,,,,,,,,,,
31,0.0,1.0,693.0,31.0,33.0,693.0,0.5,,,0.0,,,,,,,,,,,,,,,
32,0.0,1.0,707.0,32.0,14.0,707.0,0.5,,,0.0,,,,,,,,,,,,,,,
33,0.0,1.0,723.0,33.0,16.0,723.0,0.5,,,0.0,,,,,,,,,,,,,,,
34,0.0,1.0,736.0,34.0,13.0,736.0,0.5,,,0.0,,,,,,,,,,,,,,,
35,0.0,1.0,767.0,35.0,31.0,767.0,0.5,,,0.0,,,,,,,,,,,,,,,
36,0.0,1.0,778.0,36.0,11.0,778.0,0.5,,,0.0,,,,,,,,,,,,,,,
37,0.0,1.0,800.0,37.0,22.0,800.0,0.5,,,0.0,,,,,,,,,,,,,,,
38,0.0,1.0,825.0,38.0,25.0,825.0,0.5,,,0.0,,,,,,,,,,,,,,,
39,0.0,1.0,845.0,39.0,20.0,845.0,0.5,,,0.0,,,,,,,,,,,,,,,
40,0.0,1.0,867.0,40.0,22.0,867.0,0.5,,,0.0,,,,,,,,,,,,,,,
41,0.0,1.0,916.0,41.0,49.0,916.0,0.5,,,0.0,,,,,,,,,,,,,,,
42,0.0,1.0,930.0,42.0,14.0,930.0,0.5,,,0.0,,,,,,,,,,,,,,,
43,0.0,1.0,952.0,43.0,22.0,952.0,0.5,,,0.0,,,,,,,,,,,,,,,
44,0.0,1.0,964.0,44.0,12.0,964.0,0.5,,,0.0,,,,,,,,,,,,,,,
45,0.0,1.0,984.0,45.0,20.0,984.0,0.5,,,0.0,,,,,,,,,,,,,,,
46,0.0,1.0,994.0,46.0,10.0,994.0,0.5,,,0.0,,,,,,,,,,,,,,,
47,0.0,1.0,1011.0,47.0,17.0,1011.0,0.5,,,0.0,,,,,,,,,,,,,,,
48,0.0,1.0,1043.0,48.0,32.0,1043.0,0.5,,,0.0,,,,,,,,,,,,,,,
49,11.0,0.0,1055.0,49.0,12.0,1055.0,0.4980399999999998,12.0,12.0,0.0,,,,407.00918024236506,59.043146373400866,474.9180908203125,313.1038818359375,0.0001,0.0,0.0001,0.0001,430.847,77.9088,535.00134,292.06775
50,30.0,0.0,1074.0,50.0,19.0,1074.0,0.4949366666666662,19.0,19.0,0.0,,,,361.87703959147143,57.571153220720284,461.5362243652344,265.37258911132807,0.0001,0.0,0.0001,0.0001,311.6669,95.65562,527.886,183.04402
51,39.0,0.0,1083.0,51.0,9.0,1083.0,0.4934666666666661,9.0,9.0,0.0,,,,290.5712223052978,28.592770250767426,324.0646667480469,233.8979339599609,0.0001,0.0,0.0001,0.0001,156.36475,55.23453000000001,266.02353,80.92598000000001
52,57.0,0.0,1101.0,52.0,18.0,1101.0,0.4905266666666658,18.0,18.0,0.0,,,,302.5240622127758,51.07200591011856,397.303466796875,215.7681579589844,0.0001,0.0,0.0001,0.0001,125.00426499999999,43.877303999999995,221.17862000000002,47.998363
53,85.0,0.0,1129.0,53.0,28.0,1129.0,0.485953333333332,28.0,28.0,0.0,,,,273.5767901385272,41.09384043429787,369.19329833984375,200.9740753173828,0.0001,1.3552527156068802e-20,0.0001,0.0001,148.79572,55.79693,265.22497999999996,53.90749
54,108.0,0.0,1152.0,54.0,23.0,1152.0,0.482196666666665,23.0,23.0,0.0,,,,280.498798717152,45.31952722484967,382.5701599121094,209.29335021972656,0.0001,1.3552527156068802e-20,0.0001,0.0001,137.53911000000002,55.1492,243.37091,64.81319
55,132.0,0.0,1176.0,55.0,24.0,1176.0,0.4782766666666646,24.0,24.0,0.0,,,,265.3268936820652,47.88051442596014,345.6749267578125,176.47325134277344,9.999999999999998e-05,2.7105054312137605e-20,0.0001,0.0001,127.28493999999999,43.462986,228.50647999999998,53.6738
56,171.0,0.0,1215.0,56.0,39.0,1215.0,0.471906666666664,39.0,39.0,0.0,,,,259.54985769171464,35.00860201428681,329.51629638671875,195.73670959472656,9.999999999999998e-05,2.7105054312137605e-20,0.0001,0.0001,127.83568999999999,55.49781,361.5775,62.36788000000001
57,220.0,0.0,1264.0,57.0,49.0,1264.0,0.46390333333333,49.0,49.0,0.0,,,,234.32017167409265,39.67762681655549,348.2401123046875,148.27261352539062,0.0001,0.0,0.0001,0.0001,130.76501000000002,47.790714,293.13602000000003,78.02848
58,265.0,0.0,1309.0,58.0,45.0,1309.0,0.4565533333333293,45.0,45.0,0.0,,,,217.58444560657847,28.633086540237922,284.46954345703125,156.80096435546875,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,149.51617,41.31043,302.46732000000003,93.088844
59,315.0,0.0,1359.0,59.0,50.0,1359.0,0.4483866666666618,50.0,50.0,0.0,,,,181.83118065036072,28.659748770026674,252.75552368164062,124.99088287353516,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,157.73907,43.210159999999995,277.4141,83.70544
60,381.0,0.0,1425.0,60.0,66.0,1425.0,0.4376066666666608,66.0,66.0,0.0,,,,162.66219388521634,24.674537191314286,233.25091552734372,113.67489624023438,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,148.74516,42.076153000000005,256.46862999999996,68.96061
61,421.0,0.0,1465.0,61.0,40.0,1465.0,0.4310733333333269,40.0,40.0,0.0,,,,145.79672280336035,19.751329689793014,198.1054534912109,96.39559173583984,9.999999999999998e-05,2.7105054312137605e-20,0.0001,0.0001,146.95768999999999,65.732925,313.19208,51.533184000000006
62,456.0,0.0,1500.0,62.0,35.0,1500.0,0.4253566666666597,35.0,35.0,0.0,,,,131.11055688297049,16.95306181555285,186.7664794921875,99.96429443359376,0.0001,1.3552527156068802e-20,0.0001,0.0001,132.65295,53.839237,304.48956,62.909325
63,508.0,0.0,1552.0,63.0,52.0,1552.0,0.4168633333333256,52.0,52.0,0.0,,,,126.53350216734644,15.481871151448455,164.8385467529297,91.1605224609375,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,152.10985,88.43235,385.38083,39.948209999999996
64,562.0,0.0,1606.0,64.0,54.0,1606.0,0.4080433333333247,54.0,54.0,0.0,,,,118.98314911464476,13.810711322823195,152.51815795898438,78.3194808959961,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,138.26892,67.992775,326.97302,42.56321
65,639.0,0.0,1683.0,65.0,77.0,1683.0,0.3954666666666569,77.0,77.0,0.0,,,,117.58552340457314,14.767237376582813,145.6944580078125,76.0615234375,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,139.93097,68.41799,359.26813,34.659209999999995
66,702.0,0.0,1746.0,66.0,63.0,1746.0,0.3851766666666559,63.0,63.0,0.0,,,,120.67522491947297,12.975251902989402,149.65545654296875,86.92375183105469,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,194.05127,112.72679,523.8937,45.209587
67,758.0,0.0,1802.0,67.0,56.0,1802.0,0.3760299999999884,56.0,56.0,0.0,,,,114.29240389737215,11.037394276667747,142.71560668945312,84.41421508789062,0.00010000000000000003,4.0657581468206416e-20,0.0001,0.0001,167.91013,89.38369,499.4104,45.970905
68,855.0,0.0,1899.0,68.0,97.0,1899.0,0.36018666666665355,97.0,97.0,0.0,,,,108.84930968284607,10.904272250219288,136.30058288574222,80.56739044189453,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,166.04175,85.99049000000001,520.82025,38.817432000000004
69,943.0,0.0,1987.0,69.0,88.0,1987.0,0.3458133333333189,88.0,88.0,0.0,,,,107.02519383923759,11.39347761396693,136.39886474609378,78.00271606445312,9.999999999999998e-05,2.7105054312137605e-20,0.0001,0.0001,210.01866,110.30383,567.1114,60.903659999999995
70,996.0,0.0,2040.0,70.0,53.0,2040.0,0.3371566666666514,53.0,53.0,0.0,,,,104.3046335073618,9.90557600777946,122.74562072753906,81.93575286865234,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,224.59392999999997,108.33842,487.3267,68.59164399999999
71,1066.0,0.0,2110.0,71.0,70.0,2110.0,0.325723333333317,70.0,70.0,0.0,,,,99.84021825375766,12.33210844148148,139.12625122070312,78.9608154296875,0.00010000000000000003,2.7105054312137605e-20,0.0001,0.0001,209.42502,110.90117,597.66003,73.1405
72,1153.0,0.0,2197.0,72.0,87.0,2197.0,0.3115133333333157,87.0,87.0,0.0,,,,96.65015597676121,9.84319531790892,123.95345306396484,76.58502960205078,9.999999999999998e-05,2.7105054312137605e-20,0.0001,0.0001,216.96257000000003,121.00806399999999,613.5522,59.14050699999999
73,1276.0,0.0,2320.0,73.0,123.0,2320.0,0.29142333333331377,123.0,123.0,0.0,,,,97.39662977124823,12.261304899663234,137.88682556152344,74.04705810546875,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,230.93216,129.7123,612.3107,51.633354
74,1376.0,0.0,2420.0,74.0,100.0,2420.0,0.2750899999999789,100.0,100.0,0.0,,,,100.02240552805893,12.402266865856195,129.21238708496094,76.03594207763672,0.0001,0.0,0.0001,0.0001,333.58328,215.78375,1084.7336,59.14518
75,1474.0,0.0,2518.0,75.0,98.0,2518.0,0.25908333333331074,98.0,98.0,0.0,,,,100.24637352068399,11.541501085409068,135.85459899902344,79.60064697265625,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,291.26004,180.40565,992.3476,55.43
76,1630.0,0.0,2674.0,76.0,156.0,2674.0,0.23360333333331115,156.0,156.0,0.0,,,,96.7145296650548,12.927063203207426,135.03854370117188,69.76264953613281,0.0001,0.0,0.0001,0.0001,318.5015,187.47644,1042.6508,55.259426
77,1790.0,0.0,2834.0,77.0,160.0,2834.0,0.2074699999999798,160.0,160.0,0.0,,,,97.28608170995173,14.586646821280398,148.71713256835938,63.41643524169922,9.999999999999998e-05,2.7105054312137605e-20,0.0001,0.0001,428.08205999999996,299.95953,1505.8619,53.030354
78,1985.0,0.0,3029.0,78.0,195.0,3029.0,0.17561999999998226,195.0,195.0,0.0,,,,94.23654863023266,11.872838615596594,124.63626861572266,64.61207580566406,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,388.60703,246.09604,1546.4164,70.24545
79,2064.0,0.0,3108.0,79.0,79.0,3108.0,0.16271666666664988,79.0,79.0,0.0,,,,95.20987085195688,12.796128483766026,124.25724792480469,66.86399841308594,0.00010000000000000003,4.0657581468206416e-20,0.0001,0.0001,441.08117999999996,244.4737,1173.6305,91.54683
80,2261.0,0.0,3305.0,80.0,197.0,3305.0,0.13053999999998567,197.0,197.0,0.0,,,,91.81964377967678,14.275220726968213,153.1096649169922,60.52539443969727,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,438.85402999999997,290.9626,1554.4546,72.2978
81,2459.0,0.0,3503.0,81.0,198.0,3503.0,0.09819999999998584,198.0,198.0,0.0,,,,87.43646941209202,12.729616116502946,123.30382537841795,60.958091735839844,0.0001,0.0,0.0001,0.0001,505.83002,308.85773,1414.6854,103.33906999999999
82,2654.0,0.0,3698.0,82.0,195.0,3698.0,0.06634999999998556,195.0,195.0,0.0,,,,85.7298781601424,13.978231691978335,140.09968566894528,50.90789794921875,0.00010000000000000002,1.3552527156068802e-20,0.0001,0.0001,577.7435,358.6646,2119.695,86.51878
83,2837.0,0.0,3881.0,83.0,183.0,3881.0,0.036459999999985296,183.0,183.0,0.0,,,,79.93278704632769,12.023107460619213,113.99821472167969,50.35162353515625,0.0001,0.0,0.0001,0.0001,529.7014,395.3233,2509.3198,93.23408
84,3037.0,0.0,4081.0,84.0,200.0,4081.0,0.01,200.0,200.0,0.0,,,,78.72026734855307,13.478753772504628,117.58197021484376,46.87385940551758,0.0001,0.0,0.0001,0.0001,656.9392,443.30566,2533.2942,93.711685
85,3237.0,0.0,4281.0,85.0,200.0,4281.0,0.01,200.0,200.0,0.0,,,,80.28289934858006,14.76322732790999,126.55402374267578,39.721107482910156,0.0001,0.0,0.0001,0.0001,771.22064,559.2998,3551.7788,115.3446
86,3437.0,0.0,4481.0,86.0,200.0,4481.0,0.01,200.0,200.0,0.0,,,,76.70594802933121,14.472593183429652,150.84634399414062,41.38127136230469,0.0001,0.0,0.0001,0.0001,810.4775400000001,522.2886,3221.0596,77.76926999999999
87,3637.0,0.0,4681.0,87.0,200.0,4681.0,0.01,200.0,200.0,0.0,,,,72.90871241583896,12.42715688511501,115.57746124267578,44.61211395263672,0.0001,0.0,0.0001,0.0001,690.33563,405.4728,2354.9749,139.82854
88,3837.0,0.0,4881.0,88.0,200.0,4881.0,0.01,200.0,200.0,0.0,,,,73.5151865590158,14.072884510784956,115.23548889160156,42.79571533203125,0.0001,0.0,0.0001,0.0001,742.5526,519.8441,2976.3206,78.22694
89,4037.0,0.0,5081.0,89.0,200.0,5081.0,0.01,200.0,200.0,0.0,,,,68.8914678468177,13.91539629215193,114.30947875976562,30.74076271057129,0.0001,0.0,0.0001,0.0001,778.3665,499.35315,3280.329,94.1108
90,4237.0,0.0,5281.0,90.0,200.0,5281.0,0.01,200.0,200.0,0.0,,,,69.21584799301684,14.63634195328303,129.924560546875,31.90666198730469,0.0001,0.0,0.0001,0.0001,931.8132300000001,627.2812,4543.6943,110.74506000000001