Episode #,Training Iter,In Heatup,ER #Transitions,ER #Episodes,Episode Length,Total steps,Epsilon,Shaped Training Reward,Training Reward,Update Target Network,Evaluation Reward,Shaped Evaluation Reward,Success Rate,Loss/Mean,Loss/Stdev,Loss/Max,Loss/Min,Learning Rate/Mean,Learning Rate/Stdev,Learning Rate/Max,Learning Rate/Min,Grads (unclipped)/Mean,Grads (unclipped)/Stdev,Grads (unclipped)/Max,Grads (unclipped)/Min,Discounted Return/Mean,Discounted Return/Stdev,Discounted Return/Max,Discounted Return/Min,Q/Mean,Q/Stdev,Q/Max,Q/Min 1,0.0,1.0,1117.0,1117.0,1117.0,1117.0,1.0,,,0.0,,,,,,,,,,,,,,,,-1.5180229894995567,0.6998808293377133,-0.08930329112720292,-3.148474706421977,,,, 2,197.0,0.0,1905.0,1905.0,788.0,1905.0,0.9992198800000168,-21.0,-21.0,0.0,,,,0.008022314603535016,0.0045835976267830465,0.034036897122859955,4.404132778290659e-05,6.250000000000001e-05,1.3552527156068802e-20,6.25e-05,6.25e-05,0.04622123400000001,0.03147308,0.35551727,0.0068541886,-2.4312329564518818,0.5717677860635341,-0.7105532272722921,-3.3662833646890835,,,, 3,436.0,0.0,2861.0,2861.0,956.0,2861.0,0.9982734400000376,-20.0,-20.0,0.0,,,,0.007125079098864356,0.0033463100786013263,0.02057763934135437,6.804851000197232e-05,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.028711626,0.013181531000000002,0.08534362,0.005308075,-1.9661750356661605,0.7201571479030581,-0.2377786744047345,-3.3208045867789826,-0.110634394,0.06718283,-0.021104777,-0.22330762 4,678.0,0.0,3827.0,3827.0,966.0,3827.0,0.9973171000000582,-19.0,-19.0,0.0,,,,0.005711167145360257,0.002484417648740395,0.015254315920174122,6.606345414184034e-05,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.021287484,0.012238965,0.09981554,0.007149023000000001,-1.7559525724754523,0.8941220204944008,0.35366714208714395,-3.334054446646881,,,, 5,886.0,0.0,4660.0,4660.0,833.0,4660.0,0.996492430000076,-21.0,-21.0,0.0,,,,0.005441138387071148,0.002467626446986541,0.011788716539740562,0.000472158775664866,6.250000000000003e-05,2.7105054312137605e-20,6.25e-05,6.25e-05,0.015550702,0.0050054654,0.037898443999999996,0.006809624,-2.3374918938861518,0.5767458576234249,-0.7105532272722921,-3.359993917983808,-0.009537455,0.020503985,0.035534262999999996,-0.04081138