In [69]:
import tensorflow as tf

In [70]:
from numpy.random import RandomState

In [71]:
batch_size=8

In [72]:
w1=tf.Variable(tf.random_normal([2,3],stddev=1,seed=1))
w2=tf.Variable(tf.random_normal([3,1],stddev=1,seed=1))

forward propagation


In [73]:
x=tf.placeholder(tf.float32,shape=(None,2),name='x-input')
y_=tf.placeholder(tf.float32,shape=(None,1),name='y-input')

In [74]:
a=tf.matmul(x,w1)
y=tf.matmul(a,w2)

back propagation


In [75]:
cross_entropy=-tf.reduce_mean(y_ * tf.log(tf.clip_by_value(y,1e-10,1.0)))

In [76]:
train_step=tf.train.AdamOptimizer(0.001).minimize(cross_entropy)

In [77]:
rdm=RandomState(1)

In [79]:
dataset_size=128

In [80]:
X=rdm.rand(dataset_size,2)

In [81]:
Y=[[int(x1 + x2 < 1)] for (x1,x2) in X]

In [84]:
with tf.Session() as sess:
    init_op=tf.global_variables_initializer()
    sess.run(init_op)
    print(sess.run(w1))
    print(sess.run(w2))
    
    STEPS=5000
    for i in range(STEPS):
        start=(i*batch_size) % dataset_size
        end=min(start+batch_size,dataset_size)
        sess.run(train_step,feed_dict={x:X[start:end],y_:Y[start:end]})
        #print(sess.run(w1))
        #print(sess.run(w2))
        
        total_cross_entropy=sess.run(cross_entropy,feed_dict={x:X,y_:Y})
        print("After %d training step(s),cross entropy on all data is %g" %(i,total_cross_entropy))
        
    print(sess.run(w1))
    print(sess.run(w2))


[[-0.81131822  1.48459876  0.06532937]
 [-2.44270396  0.0992484   0.59122431]]
[[-0.81131822]
 [ 1.48459876]
 [ 0.06532937]]
After 0 training step(s),cross entropy on all data is 0.0674925
After 1 training step(s),cross entropy on all data is 0.0672511
After 2 training step(s),cross entropy on all data is 0.0670647
After 3 training step(s),cross entropy on all data is 0.066914
After 4 training step(s),cross entropy on all data is 0.0667947
After 5 training step(s),cross entropy on all data is 0.0666918
After 6 training step(s),cross entropy on all data is 0.0665712
After 7 training step(s),cross entropy on all data is 0.0664202
After 8 training step(s),cross entropy on all data is 0.0662492
After 9 training step(s),cross entropy on all data is 0.066075
After 10 training step(s),cross entropy on all data is 0.0659034
After 11 training step(s),cross entropy on all data is 0.0657333
After 12 training step(s),cross entropy on all data is 0.0655595
After 13 training step(s),cross entropy on all data is 0.065385
After 14 training step(s),cross entropy on all data is 0.0652272
After 15 training step(s),cross entropy on all data is 0.0650843
After 16 training step(s),cross entropy on all data is 0.0649217
After 17 training step(s),cross entropy on all data is 0.0647457
After 18 training step(s),cross entropy on all data is 0.0645858
After 19 training step(s),cross entropy on all data is 0.0644406
After 20 training step(s),cross entropy on all data is 0.0643085
After 21 training step(s),cross entropy on all data is 0.0641883
After 22 training step(s),cross entropy on all data is 0.0640613
After 23 training step(s),cross entropy on all data is 0.0639122
After 24 training step(s),cross entropy on all data is 0.0637453
After 25 training step(s),cross entropy on all data is 0.0635762
After 26 training step(s),cross entropy on all data is 0.0634173
After 27 training step(s),cross entropy on all data is 0.0632631
After 28 training step(s),cross entropy on all data is 0.063106
After 29 training step(s),cross entropy on all data is 0.0629485
After 30 training step(s),cross entropy on all data is 0.0628051
After 31 training step(s),cross entropy on all data is 0.0626746
After 32 training step(s),cross entropy on all data is 0.0625259
After 33 training step(s),cross entropy on all data is 0.0623641
After 34 training step(s),cross entropy on all data is 0.0622169
After 35 training step(s),cross entropy on all data is 0.0620829
After 36 training step(s),cross entropy on all data is 0.061961
After 37 training step(s),cross entropy on all data is 0.0618501
After 38 training step(s),cross entropy on all data is 0.0617338
After 39 training step(s),cross entropy on all data is 0.0615971
After 40 training step(s),cross entropy on all data is 0.0614568
After 41 training step(s),cross entropy on all data is 0.0613131
After 42 training step(s),cross entropy on all data is 0.0611695
After 43 training step(s),cross entropy on all data is 0.0610255
After 44 training step(s),cross entropy on all data is 0.0608774
After 45 training step(s),cross entropy on all data is 0.0607281
After 46 training step(s),cross entropy on all data is 0.0605924
After 47 training step(s),cross entropy on all data is 0.0604691
After 48 training step(s),cross entropy on all data is 0.060326
After 49 training step(s),cross entropy on all data is 0.0601682
After 50 training step(s),cross entropy on all data is 0.0600249
After 51 training step(s),cross entropy on all data is 0.0598948
After 52 training step(s),cross entropy on all data is 0.0597766
After 53 training step(s),cross entropy on all data is 0.0596694
After 54 training step(s),cross entropy on all data is 0.0595566
After 55 training step(s),cross entropy on all data is 0.0594224
After 56 training step(s),cross entropy on all data is 0.0592843
After 57 training step(s),cross entropy on all data is 0.0591428
After 58 training step(s),cross entropy on all data is 0.059001
After 59 training step(s),cross entropy on all data is 0.0588588
After 60 training step(s),cross entropy on all data is 0.0587123
After 61 training step(s),cross entropy on all data is 0.0585645
After 62 training step(s),cross entropy on all data is 0.0584304
After 63 training step(s),cross entropy on all data is 0.0583089
After 64 training step(s),cross entropy on all data is 0.0581669
After 65 training step(s),cross entropy on all data is 0.0580096
After 66 training step(s),cross entropy on all data is 0.057867
After 67 training step(s),cross entropy on all data is 0.0577378
After 68 training step(s),cross entropy on all data is 0.0576207
After 69 training step(s),cross entropy on all data is 0.0575145
After 70 training step(s),cross entropy on all data is 0.0574029
After 71 training step(s),cross entropy on all data is 0.0572694
After 72 training step(s),cross entropy on all data is 0.0571322
After 73 training step(s),cross entropy on all data is 0.0569914
After 74 training step(s),cross entropy on all data is 0.0568505
After 75 training step(s),cross entropy on all data is 0.056709
After 76 training step(s),cross entropy on all data is 0.0565632
After 77 training step(s),cross entropy on all data is 0.0564162
After 78 training step(s),cross entropy on all data is 0.0562831
After 79 training step(s),cross entropy on all data is 0.0561626
After 80 training step(s),cross entropy on all data is 0.0560214
After 81 training step(s),cross entropy on all data is 0.0558645
After 82 training step(s),cross entropy on all data is 0.0557225
After 83 training step(s),cross entropy on all data is 0.055594
After 84 training step(s),cross entropy on all data is 0.0554777
After 85 training step(s),cross entropy on all data is 0.0553724
After 86 training step(s),cross entropy on all data is 0.0552617
After 87 training step(s),cross entropy on all data is 0.055129
After 88 training step(s),cross entropy on all data is 0.0549926
After 89 training step(s),cross entropy on all data is 0.0548574
After 90 training step(s),cross entropy on all data is 0.054727
After 91 training step(s),cross entropy on all data is 0.0546091
After 92 training step(s),cross entropy on all data is 0.0544855
After 93 training step(s),cross entropy on all data is 0.0543597
After 94 training step(s),cross entropy on all data is 0.0542459
After 95 training step(s),cross entropy on all data is 0.054143
After 96 training step(s),cross entropy on all data is 0.0540194
After 97 training step(s),cross entropy on all data is 0.0538804
After 98 training step(s),cross entropy on all data is 0.0537547
After 99 training step(s),cross entropy on all data is 0.053641
After 100 training step(s),cross entropy on all data is 0.0535382
After 101 training step(s),cross entropy on all data is 0.0534453
After 102 training step(s),cross entropy on all data is 0.053347
After 103 training step(s),cross entropy on all data is 0.0532273
After 104 training step(s),cross entropy on all data is 0.0531037
After 105 training step(s),cross entropy on all data is 0.0529766
After 106 training step(s),cross entropy on all data is 0.0528494
After 107 training step(s),cross entropy on all data is 0.0527344
After 108 training step(s),cross entropy on all data is 0.0526136
After 109 training step(s),cross entropy on all data is 0.0524904
After 110 training step(s),cross entropy on all data is 0.052379
After 111 training step(s),cross entropy on all data is 0.0522784
After 112 training step(s),cross entropy on all data is 0.0521569
After 113 training step(s),cross entropy on all data is 0.0520196
After 114 training step(s),cross entropy on all data is 0.0518957
After 115 training step(s),cross entropy on all data is 0.0517836
After 116 training step(s),cross entropy on all data is 0.0516824
After 117 training step(s),cross entropy on all data is 0.0515909
After 118 training step(s),cross entropy on all data is 0.0514939
After 119 training step(s),cross entropy on all data is 0.0513755
After 120 training step(s),cross entropy on all data is 0.0512533
After 121 training step(s),cross entropy on all data is 0.0511275
After 122 training step(s),cross entropy on all data is 0.0510015
After 123 training step(s),cross entropy on all data is 0.0508876
After 124 training step(s),cross entropy on all data is 0.050768
After 125 training step(s),cross entropy on all data is 0.0506459
After 126 training step(s),cross entropy on all data is 0.0505357
After 127 training step(s),cross entropy on all data is 0.0504361
After 128 training step(s),cross entropy on all data is 0.0503156
After 129 training step(s),cross entropy on all data is 0.0501794
After 130 training step(s),cross entropy on all data is 0.0500563
After 131 training step(s),cross entropy on all data is 0.0499452
After 132 training step(s),cross entropy on all data is 0.0498448
After 133 training step(s),cross entropy on all data is 0.0497542
After 134 training step(s),cross entropy on all data is 0.0496581
After 135 training step(s),cross entropy on all data is 0.0495406
After 136 training step(s),cross entropy on all data is 0.0494194
After 137 training step(s),cross entropy on all data is 0.0492945
After 138 training step(s),cross entropy on all data is 0.0491694
After 139 training step(s),cross entropy on all data is 0.0490648
After 140 training step(s),cross entropy on all data is 0.0489559
After 141 training step(s),cross entropy on all data is 0.0488449
After 142 training step(s),cross entropy on all data is 0.0487446
After 143 training step(s),cross entropy on all data is 0.048654
After 144 training step(s),cross entropy on all data is 0.0485445
After 145 training step(s),cross entropy on all data is 0.0484332
After 146 training step(s),cross entropy on all data is 0.0483328
After 147 training step(s),cross entropy on all data is 0.0482422
After 148 training step(s),cross entropy on all data is 0.0481603
After 149 training step(s),cross entropy on all data is 0.0480864
After 150 training step(s),cross entropy on all data is 0.0480066
After 151 training step(s),cross entropy on all data is 0.0479063
After 152 training step(s),cross entropy on all data is 0.0478018
After 153 training step(s),cross entropy on all data is 0.0476933
After 154 training step(s),cross entropy on all data is 0.0475839
After 155 training step(s),cross entropy on all data is 0.0474852
After 156 training step(s),cross entropy on all data is 0.0473809
After 157 training step(s),cross entropy on all data is 0.0472738
After 158 training step(s),cross entropy on all data is 0.0471772
After 159 training step(s),cross entropy on all data is 0.04709
After 160 training step(s),cross entropy on all data is 0.0469834
After 161 training step(s),cross entropy on all data is 0.0468749
After 162 training step(s),cross entropy on all data is 0.0467769
After 163 training step(s),cross entropy on all data is 0.0466884
After 164 training step(s),cross entropy on all data is 0.0466086
After 165 training step(s),cross entropy on all data is 0.0465366
After 166 training step(s),cross entropy on all data is 0.0464584
After 167 training step(s),cross entropy on all data is 0.0463597
After 168 training step(s),cross entropy on all data is 0.0462566
After 169 training step(s),cross entropy on all data is 0.0461494
After 170 training step(s),cross entropy on all data is 0.0460413
After 171 training step(s),cross entropy on all data is 0.0459436
After 172 training step(s),cross entropy on all data is 0.0458403
After 173 training step(s),cross entropy on all data is 0.0457342
After 174 training step(s),cross entropy on all data is 0.0456385
After 175 training step(s),cross entropy on all data is 0.0455521
After 176 training step(s),cross entropy on all data is 0.0454463
After 177 training step(s),cross entropy on all data is 0.0453384
After 178 training step(s),cross entropy on all data is 0.0452411
After 179 training step(s),cross entropy on all data is 0.0451533
After 180 training step(s),cross entropy on all data is 0.0450741
After 181 training step(s),cross entropy on all data is 0.0450026
After 182 training step(s),cross entropy on all data is 0.0449249
After 183 training step(s),cross entropy on all data is 0.0448267
After 184 training step(s),cross entropy on all data is 0.0447242
After 185 training step(s),cross entropy on all data is 0.0446176
After 186 training step(s),cross entropy on all data is 0.0445099
After 187 training step(s),cross entropy on all data is 0.0444127
After 188 training step(s),cross entropy on all data is 0.0443099
After 189 training step(s),cross entropy on all data is 0.0442043
After 190 training step(s),cross entropy on all data is 0.044109
After 191 training step(s),cross entropy on all data is 0.044023
After 192 training step(s),cross entropy on all data is 0.0439177
After 193 training step(s),cross entropy on all data is 0.0438108
After 194 training step(s),cross entropy on all data is 0.0437223
After 195 training step(s),cross entropy on all data is 0.0436425
After 196 training step(s),cross entropy on all data is 0.0435705
After 197 training step(s),cross entropy on all data is 0.0435055
After 198 training step(s),cross entropy on all data is 0.0434469
After 199 training step(s),cross entropy on all data is 0.0433681
After 200 training step(s),cross entropy on all data is 0.0432842
After 201 training step(s),cross entropy on all data is 0.0431957
After 202 training step(s),cross entropy on all data is 0.0431054
After 203 training step(s),cross entropy on all data is 0.043024
After 204 training step(s),cross entropy on all data is 0.0429366
After 205 training step(s),cross entropy on all data is 0.0428461
After 206 training step(s),cross entropy on all data is 0.0427644
After 207 training step(s),cross entropy on all data is 0.0426907
After 208 training step(s),cross entropy on all data is 0.0425988
After 209 training step(s),cross entropy on all data is 0.0425047
After 210 training step(s),cross entropy on all data is 0.0424198
After 211 training step(s),cross entropy on all data is 0.0423432
After 212 training step(s),cross entropy on all data is 0.0422741
After 213 training step(s),cross entropy on all data is 0.0422118
After 214 training step(s),cross entropy on all data is 0.0421556
After 215 training step(s),cross entropy on all data is 0.042079
After 216 training step(s),cross entropy on all data is 0.0419972
After 217 training step(s),cross entropy on all data is 0.0419106
After 218 training step(s),cross entropy on all data is 0.041822
After 219 training step(s),cross entropy on all data is 0.041742
After 220 training step(s),cross entropy on all data is 0.0416567
After 221 training step(s),cross entropy on all data is 0.0415864
After 222 training step(s),cross entropy on all data is 0.0415229
After 223 training step(s),cross entropy on all data is 0.0414657
After 224 training step(s),cross entropy on all data is 0.0413908
After 225 training step(s),cross entropy on all data is 0.0413132
After 226 training step(s),cross entropy on all data is 0.0412433
After 227 training step(s),cross entropy on all data is 0.0411802
After 228 training step(s),cross entropy on all data is 0.0411233
After 229 training step(s),cross entropy on all data is 0.041072
After 230 training step(s),cross entropy on all data is 0.0410257
After 231 training step(s),cross entropy on all data is 0.0409603
After 232 training step(s),cross entropy on all data is 0.0408898
After 233 training step(s),cross entropy on all data is 0.0408145
After 234 training step(s),cross entropy on all data is 0.0407374
After 235 training step(s),cross entropy on all data is 0.0406678
After 236 training step(s),cross entropy on all data is 0.0405923
After 237 training step(s),cross entropy on all data is 0.0405242
After 238 training step(s),cross entropy on all data is 0.0404628
After 239 training step(s),cross entropy on all data is 0.0404075
After 240 training step(s),cross entropy on all data is 0.0403343
After 241 training step(s),cross entropy on all data is 0.0402582
After 242 training step(s),cross entropy on all data is 0.0401897
After 243 training step(s),cross entropy on all data is 0.0401278
After 244 training step(s),cross entropy on all data is 0.040072
After 245 training step(s),cross entropy on all data is 0.0400217
After 246 training step(s),cross entropy on all data is 0.0399764
After 247 training step(s),cross entropy on all data is 0.0399119
After 248 training step(s),cross entropy on all data is 0.0398423
After 249 training step(s),cross entropy on all data is 0.0397678
After 250 training step(s),cross entropy on all data is 0.0396912
After 251 training step(s),cross entropy on all data is 0.0396222
After 252 training step(s),cross entropy on all data is 0.0395474
After 253 training step(s),cross entropy on all data is 0.0394799
After 254 training step(s),cross entropy on all data is 0.039419
After 255 training step(s),cross entropy on all data is 0.0393641
After 256 training step(s),cross entropy on all data is 0.0392914
After 257 training step(s),cross entropy on all data is 0.0392157
After 258 training step(s),cross entropy on all data is 0.0391475
After 259 training step(s),cross entropy on all data is 0.039086
After 260 training step(s),cross entropy on all data is 0.0390306
After 261 training step(s),cross entropy on all data is 0.0389806
After 262 training step(s),cross entropy on all data is 0.0389355
After 263 training step(s),cross entropy on all data is 0.0388713
After 264 training step(s),cross entropy on all data is 0.038802
After 265 training step(s),cross entropy on all data is 0.0387278
After 266 training step(s),cross entropy on all data is 0.0386515
After 267 training step(s),cross entropy on all data is 0.0385828
After 268 training step(s),cross entropy on all data is 0.0385082
After 269 training step(s),cross entropy on all data is 0.0384409
After 270 training step(s),cross entropy on all data is 0.0383803
After 271 training step(s),cross entropy on all data is 0.0383256
After 272 training step(s),cross entropy on all data is 0.0382532
After 273 training step(s),cross entropy on all data is 0.0381778
After 274 training step(s),cross entropy on all data is 0.0381098
After 275 training step(s),cross entropy on all data is 0.0380485
After 276 training step(s),cross entropy on all data is 0.0379933
After 277 training step(s),cross entropy on all data is 0.0379434
After 278 training step(s),cross entropy on all data is 0.0378985
After 279 training step(s),cross entropy on all data is 0.0378346
After 280 training step(s),cross entropy on all data is 0.0377655
After 281 training step(s),cross entropy on all data is 0.0376916
After 282 training step(s),cross entropy on all data is 0.0376156
After 283 training step(s),cross entropy on all data is 0.037547
After 284 training step(s),cross entropy on all data is 0.0374727
After 285 training step(s),cross entropy on all data is 0.0374057
After 286 training step(s),cross entropy on all data is 0.0373453
After 287 training step(s),cross entropy on all data is 0.0372908
After 288 training step(s),cross entropy on all data is 0.0372187
After 289 training step(s),cross entropy on all data is 0.0371435
After 290 training step(s),cross entropy on all data is 0.0370757
After 291 training step(s),cross entropy on all data is 0.0370146
After 292 training step(s),cross entropy on all data is 0.0369596
After 293 training step(s),cross entropy on all data is 0.0369099
After 294 training step(s),cross entropy on all data is 0.0368652
After 295 training step(s),cross entropy on all data is 0.0368015
After 296 training step(s),cross entropy on all data is 0.0367327
After 297 training step(s),cross entropy on all data is 0.0366591
After 298 training step(s),cross entropy on all data is 0.0365833
After 299 training step(s),cross entropy on all data is 0.0365149
After 300 training step(s),cross entropy on all data is 0.0364409
After 301 training step(s),cross entropy on all data is 0.0363741
After 302 training step(s),cross entropy on all data is 0.036314
After 303 training step(s),cross entropy on all data is 0.0362598
After 304 training step(s),cross entropy on all data is 0.0361879
After 305 training step(s),cross entropy on all data is 0.036113
After 306 training step(s),cross entropy on all data is 0.0360455
After 307 training step(s),cross entropy on all data is 0.0359846
After 308 training step(s),cross entropy on all data is 0.0359298
After 309 training step(s),cross entropy on all data is 0.0358803
After 310 training step(s),cross entropy on all data is 0.0358358
After 311 training step(s),cross entropy on all data is 0.0357724
After 312 training step(s),cross entropy on all data is 0.0357038
After 313 training step(s),cross entropy on all data is 0.0356305
After 314 training step(s),cross entropy on all data is 0.035555
After 315 training step(s),cross entropy on all data is 0.0354869
After 316 training step(s),cross entropy on all data is 0.0354132
After 317 training step(s),cross entropy on all data is 0.0353467
After 318 training step(s),cross entropy on all data is 0.0352868
After 319 training step(s),cross entropy on all data is 0.0352328
After 320 training step(s),cross entropy on all data is 0.0351613
After 321 training step(s),cross entropy on all data is 0.0350936
After 322 training step(s),cross entropy on all data is 0.0350346
After 323 training step(s),cross entropy on all data is 0.0349814
After 324 training step(s),cross entropy on all data is 0.0349335
After 325 training step(s),cross entropy on all data is 0.0348903
After 326 training step(s),cross entropy on all data is 0.0348514
After 327 training step(s),cross entropy on all data is 0.0347963
After 328 training step(s),cross entropy on all data is 0.0347368
After 329 training step(s),cross entropy on all data is 0.0346732
After 330 training step(s),cross entropy on all data is 0.034607
After 331 training step(s),cross entropy on all data is 0.0345473
After 332 training step(s),cross entropy on all data is 0.0344831
After 333 training step(s),cross entropy on all data is 0.0344253
After 334 training step(s),cross entropy on all data is 0.0343732
After 335 training step(s),cross entropy on all data is 0.0343263
After 336 training step(s),cross entropy on all data is 0.0342745
After 337 training step(s),cross entropy on all data is 0.0342186
After 338 training step(s),cross entropy on all data is 0.0341682
After 339 training step(s),cross entropy on all data is 0.0341227
After 340 training step(s),cross entropy on all data is 0.0340818
After 341 training step(s),cross entropy on all data is 0.0340449
After 342 training step(s),cross entropy on all data is 0.0340116
After 343 training step(s),cross entropy on all data is 0.0339616
After 344 training step(s),cross entropy on all data is 0.0339066
After 345 training step(s),cross entropy on all data is 0.0338471
After 346 training step(s),cross entropy on all data is 0.0337845
After 347 training step(s),cross entropy on all data is 0.0337281
After 348 training step(s),cross entropy on all data is 0.0336669
After 349 training step(s),cross entropy on all data is 0.0336117
After 350 training step(s),cross entropy on all data is 0.033562
After 351 training step(s),cross entropy on all data is 0.0335172
After 352 training step(s),cross entropy on all data is 0.0334674
After 353 training step(s),cross entropy on all data is 0.0334132
After 354 training step(s),cross entropy on all data is 0.0333644
After 355 training step(s),cross entropy on all data is 0.0333203
After 356 training step(s),cross entropy on all data is 0.0332807
After 357 training step(s),cross entropy on all data is 0.0332449
After 358 training step(s),cross entropy on all data is 0.0332127
After 359 training step(s),cross entropy on all data is 0.0331636
After 360 training step(s),cross entropy on all data is 0.0331094
After 361 training step(s),cross entropy on all data is 0.0330506
After 362 training step(s),cross entropy on all data is 0.0329886
After 363 training step(s),cross entropy on all data is 0.0329328
After 364 training step(s),cross entropy on all data is 0.0328721
After 365 training step(s),cross entropy on all data is 0.0328174
After 366 training step(s),cross entropy on all data is 0.0327682
After 367 training step(s),cross entropy on all data is 0.0327237
After 368 training step(s),cross entropy on all data is 0.0326743
After 369 training step(s),cross entropy on all data is 0.0326203
After 370 training step(s),cross entropy on all data is 0.0325718
After 371 training step(s),cross entropy on all data is 0.032528
After 372 training step(s),cross entropy on all data is 0.0324885
After 373 training step(s),cross entropy on all data is 0.032453
After 374 training step(s),cross entropy on all data is 0.0324209
After 375 training step(s),cross entropy on all data is 0.032372
After 376 training step(s),cross entropy on all data is 0.0323179
After 377 training step(s),cross entropy on all data is 0.0322592
After 378 training step(s),cross entropy on all data is 0.0321974
After 379 training step(s),cross entropy on all data is 0.0321417
After 380 training step(s),cross entropy on all data is 0.0320811
After 381 training step(s),cross entropy on all data is 0.0320265
After 382 training step(s),cross entropy on all data is 0.0319773
After 383 training step(s),cross entropy on all data is 0.0319329
After 384 training step(s),cross entropy on all data is 0.0318835
After 385 training step(s),cross entropy on all data is 0.0318297
After 386 training step(s),cross entropy on all data is 0.0317811
After 387 training step(s),cross entropy on all data is 0.0317374
After 388 training step(s),cross entropy on all data is 0.031698
After 389 training step(s),cross entropy on all data is 0.0316624
After 390 training step(s),cross entropy on all data is 0.0316304
After 391 training step(s),cross entropy on all data is 0.0315815
After 392 training step(s),cross entropy on all data is 0.0315275
After 393 training step(s),cross entropy on all data is 0.0314689
After 394 training step(s),cross entropy on all data is 0.0314071
After 395 training step(s),cross entropy on all data is 0.0313514
After 396 training step(s),cross entropy on all data is 0.0312908
After 397 training step(s),cross entropy on all data is 0.0312362
After 398 training step(s),cross entropy on all data is 0.0311871
After 399 training step(s),cross entropy on all data is 0.0311428
After 400 training step(s),cross entropy on all data is 0.0310934
After 401 training step(s),cross entropy on all data is 0.0310395
After 402 training step(s),cross entropy on all data is 0.030991
After 403 training step(s),cross entropy on all data is 0.0309473
After 404 training step(s),cross entropy on all data is 0.0309079
After 405 training step(s),cross entropy on all data is 0.0308724
After 406 training step(s),cross entropy on all data is 0.0308404
After 407 training step(s),cross entropy on all data is 0.0307915
After 408 training step(s),cross entropy on all data is 0.0307376
After 409 training step(s),cross entropy on all data is 0.030679
After 410 training step(s),cross entropy on all data is 0.0306172
After 411 training step(s),cross entropy on all data is 0.0305615
After 412 training step(s),cross entropy on all data is 0.030501
After 413 training step(s),cross entropy on all data is 0.0304494
After 414 training step(s),cross entropy on all data is 0.0304069
After 415 training step(s),cross entropy on all data is 0.0303687
After 416 training step(s),cross entropy on all data is 0.0303258
After 417 training step(s),cross entropy on all data is 0.0302788
After 418 training step(s),cross entropy on all data is 0.0302365
After 419 training step(s),cross entropy on all data is 0.0301984
After 420 training step(s),cross entropy on all data is 0.030164
After 421 training step(s),cross entropy on all data is 0.030133
After 422 training step(s),cross entropy on all data is 0.0301051
After 423 training step(s),cross entropy on all data is 0.0300714
After 424 training step(s),cross entropy on all data is 0.0300325
After 425 training step(s),cross entropy on all data is 0.0299888
After 426 training step(s),cross entropy on all data is 0.0299412
After 427 training step(s),cross entropy on all data is 0.0298983
After 428 training step(s),cross entropy on all data is 0.029851
After 429 training step(s),cross entropy on all data is 0.0298084
After 430 training step(s),cross entropy on all data is 0.02977
After 431 training step(s),cross entropy on all data is 0.0297354
After 432 training step(s),cross entropy on all data is 0.0296958
After 433 training step(s),cross entropy on all data is 0.0296517
After 434 training step(s),cross entropy on all data is 0.029612
After 435 training step(s),cross entropy on all data is 0.0295762
After 436 training step(s),cross entropy on all data is 0.0295439
After 437 training step(s),cross entropy on all data is 0.0295148
After 438 training step(s),cross entropy on all data is 0.0294887
After 439 training step(s),cross entropy on all data is 0.0294565
After 440 training step(s),cross entropy on all data is 0.0294189
After 441 training step(s),cross entropy on all data is 0.0293764
After 442 training step(s),cross entropy on all data is 0.0293299
After 443 training step(s),cross entropy on all data is 0.0292879
After 444 training step(s),cross entropy on all data is 0.0292414
After 445 training step(s),cross entropy on all data is 0.0291995
After 446 training step(s),cross entropy on all data is 0.0291617
After 447 training step(s),cross entropy on all data is 0.0291277
After 448 training step(s),cross entropy on all data is 0.0290886
After 449 training step(s),cross entropy on all data is 0.0290449
After 450 training step(s),cross entropy on all data is 0.0290056
After 451 training step(s),cross entropy on all data is 0.0289701
After 452 training step(s),cross entropy on all data is 0.0289382
After 453 training step(s),cross entropy on all data is 0.0289094
After 454 training step(s),cross entropy on all data is 0.0288835
After 455 training step(s),cross entropy on all data is 0.0288515
After 456 training step(s),cross entropy on all data is 0.0288141
After 457 training step(s),cross entropy on all data is 0.0287718
After 458 training step(s),cross entropy on all data is 0.0287253
After 459 training step(s),cross entropy on all data is 0.0286834
After 460 training step(s),cross entropy on all data is 0.0286369
After 461 training step(s),cross entropy on all data is 0.0285951
After 462 training step(s),cross entropy on all data is 0.0285573
After 463 training step(s),cross entropy on all data is 0.0285233
After 464 training step(s),cross entropy on all data is 0.0284842
After 465 training step(s),cross entropy on all data is 0.0284406
After 466 training step(s),cross entropy on all data is 0.0284012
After 467 training step(s),cross entropy on all data is 0.0283658
After 468 training step(s),cross entropy on all data is 0.0283338
After 469 training step(s),cross entropy on all data is 0.028305
After 470 training step(s),cross entropy on all data is 0.0282791
After 471 training step(s),cross entropy on all data is 0.0282471
After 472 training step(s),cross entropy on all data is 0.0282096
After 473 training step(s),cross entropy on all data is 0.0281672
After 474 training step(s),cross entropy on all data is 0.0281206
After 475 training step(s),cross entropy on all data is 0.0280787
After 476 training step(s),cross entropy on all data is 0.0280321
After 477 training step(s),cross entropy on all data is 0.0279902
After 478 training step(s),cross entropy on all data is 0.0279524
After 479 training step(s),cross entropy on all data is 0.0279183
After 480 training step(s),cross entropy on all data is 0.0278792
After 481 training step(s),cross entropy on all data is 0.0278354
After 482 training step(s),cross entropy on all data is 0.027796
After 483 training step(s),cross entropy on all data is 0.0277604
After 484 training step(s),cross entropy on all data is 0.0277284
After 485 training step(s),cross entropy on all data is 0.0276996
After 486 training step(s),cross entropy on all data is 0.0276736
After 487 training step(s),cross entropy on all data is 0.0276416
After 488 training step(s),cross entropy on all data is 0.027604
After 489 training step(s),cross entropy on all data is 0.0275615
After 490 training step(s),cross entropy on all data is 0.0275149
After 491 training step(s),cross entropy on all data is 0.0274728
After 492 training step(s),cross entropy on all data is 0.0274262
After 493 training step(s),cross entropy on all data is 0.0273841
After 494 training step(s),cross entropy on all data is 0.0273463
After 495 training step(s),cross entropy on all data is 0.0273122
After 496 training step(s),cross entropy on all data is 0.0272729
After 497 training step(s),cross entropy on all data is 0.027229
After 498 training step(s),cross entropy on all data is 0.0271895
After 499 training step(s),cross entropy on all data is 0.027154
After 500 training step(s),cross entropy on all data is 0.0271219
After 501 training step(s),cross entropy on all data is 0.027093
After 502 training step(s),cross entropy on all data is 0.027067
After 503 training step(s),cross entropy on all data is 0.0270349
After 504 training step(s),cross entropy on all data is 0.0269973
After 505 training step(s),cross entropy on all data is 0.0269547
After 506 training step(s),cross entropy on all data is 0.0269079
After 507 training step(s),cross entropy on all data is 0.0268707
After 508 training step(s),cross entropy on all data is 0.0268304
After 509 training step(s),cross entropy on all data is 0.0267942
After 510 training step(s),cross entropy on all data is 0.0267615
After 511 training step(s),cross entropy on all data is 0.0267321
After 512 training step(s),cross entropy on all data is 0.0267056
After 513 training step(s),cross entropy on all data is 0.0266745
After 514 training step(s),cross entropy on all data is 0.0266465
After 515 training step(s),cross entropy on all data is 0.0266212
After 516 training step(s),cross entropy on all data is 0.0265985
After 517 training step(s),cross entropy on all data is 0.026578
After 518 training step(s),cross entropy on all data is 0.0265596
After 519 training step(s),cross entropy on all data is 0.0265355
After 520 training step(s),cross entropy on all data is 0.0265062
After 521 training step(s),cross entropy on all data is 0.0264722
After 522 training step(s),cross entropy on all data is 0.0264346
After 523 training step(s),cross entropy on all data is 0.0264007
After 524 training step(s),cross entropy on all data is 0.0263624
After 525 training step(s),cross entropy on all data is 0.0263279
After 526 training step(s),cross entropy on all data is 0.0262968
After 527 training step(s),cross entropy on all data is 0.0262688
After 528 training step(s),cross entropy on all data is 0.0262436
After 529 training step(s),cross entropy on all data is 0.0262136
After 530 training step(s),cross entropy on all data is 0.0261866
After 531 training step(s),cross entropy on all data is 0.0261623
After 532 training step(s),cross entropy on all data is 0.0261403
After 533 training step(s),cross entropy on all data is 0.0261206
After 534 training step(s),cross entropy on all data is 0.0261028
After 535 training step(s),cross entropy on all data is 0.0260793
After 536 training step(s),cross entropy on all data is 0.0260505
After 537 training step(s),cross entropy on all data is 0.0260169
After 538 training step(s),cross entropy on all data is 0.0259797
After 539 training step(s),cross entropy on all data is 0.0259461
After 540 training step(s),cross entropy on all data is 0.0259081
After 541 training step(s),cross entropy on all data is 0.0258738
After 542 training step(s),cross entropy on all data is 0.0258429
After 543 training step(s),cross entropy on all data is 0.0258151
After 544 training step(s),cross entropy on all data is 0.02579
After 545 training step(s),cross entropy on all data is 0.0257602
After 546 training step(s),cross entropy on all data is 0.0257333
After 547 training step(s),cross entropy on all data is 0.0257091
After 548 training step(s),cross entropy on all data is 0.0256872
After 549 training step(s),cross entropy on all data is 0.0256676
After 550 training step(s),cross entropy on all data is 0.0256499
After 551 training step(s),cross entropy on all data is 0.0256264
After 552 training step(s),cross entropy on all data is 0.0255976
After 553 training step(s),cross entropy on all data is 0.0255641
After 554 training step(s),cross entropy on all data is 0.0255268
After 555 training step(s),cross entropy on all data is 0.0254932
After 556 training step(s),cross entropy on all data is 0.0254551
After 557 training step(s),cross entropy on all data is 0.0254208
After 558 training step(s),cross entropy on all data is 0.0253898
After 559 training step(s),cross entropy on all data is 0.025362
After 560 training step(s),cross entropy on all data is 0.0253369
After 561 training step(s),cross entropy on all data is 0.025307
After 562 training step(s),cross entropy on all data is 0.0252801
After 563 training step(s),cross entropy on all data is 0.0252558
After 564 training step(s),cross entropy on all data is 0.025234
After 565 training step(s),cross entropy on all data is 0.0252143
After 566 training step(s),cross entropy on all data is 0.0251966
After 567 training step(s),cross entropy on all data is 0.025173
After 568 training step(s),cross entropy on all data is 0.0251442
After 569 training step(s),cross entropy on all data is 0.0251106
After 570 training step(s),cross entropy on all data is 0.0250774
After 571 training step(s),cross entropy on all data is 0.0250494
After 572 training step(s),cross entropy on all data is 0.0250241
After 573 training step(s),cross entropy on all data is 0.0250013
After 574 training step(s),cross entropy on all data is 0.0249808
After 575 training step(s),cross entropy on all data is 0.0249624
After 576 training step(s),cross entropy on all data is 0.0249457
After 577 training step(s),cross entropy on all data is 0.0249244
After 578 training step(s),cross entropy on all data is 0.0249052
After 579 training step(s),cross entropy on all data is 0.0248879
After 580 training step(s),cross entropy on all data is 0.0248723
After 581 training step(s),cross entropy on all data is 0.0248582
After 582 training step(s),cross entropy on all data is 0.0248456
After 583 training step(s),cross entropy on all data is 0.0248279
After 584 training step(s),cross entropy on all data is 0.0248058
After 585 training step(s),cross entropy on all data is 0.0247797
After 586 training step(s),cross entropy on all data is 0.0247499
After 587 training step(s),cross entropy on all data is 0.0247229
After 588 training step(s),cross entropy on all data is 0.0246987
After 589 training step(s),cross entropy on all data is 0.0246768
After 590 training step(s),cross entropy on all data is 0.0246572
After 591 training step(s),cross entropy on all data is 0.0246394
After 592 training step(s),cross entropy on all data is 0.0246235
After 593 training step(s),cross entropy on all data is 0.0246027
After 594 training step(s),cross entropy on all data is 0.024584
After 595 training step(s),cross entropy on all data is 0.0245672
After 596 training step(s),cross entropy on all data is 0.024552
After 597 training step(s),cross entropy on all data is 0.0245384
After 598 training step(s),cross entropy on all data is 0.024526
After 599 training step(s),cross entropy on all data is 0.0245087
After 600 training step(s),cross entropy on all data is 0.0244868
After 601 training step(s),cross entropy on all data is 0.0244609
After 602 training step(s),cross entropy on all data is 0.0244311
After 603 training step(s),cross entropy on all data is 0.0244043
After 604 training step(s),cross entropy on all data is 0.0243802
After 605 training step(s),cross entropy on all data is 0.0243584
After 606 training step(s),cross entropy on all data is 0.0243388
After 607 training step(s),cross entropy on all data is 0.0243212
After 608 training step(s),cross entropy on all data is 0.0243053
After 609 training step(s),cross entropy on all data is 0.0242846
After 610 training step(s),cross entropy on all data is 0.0242659
After 611 training step(s),cross entropy on all data is 0.0242491
After 612 training step(s),cross entropy on all data is 0.024234
After 613 training step(s),cross entropy on all data is 0.0242204
After 614 training step(s),cross entropy on all data is 0.0242081
After 615 training step(s),cross entropy on all data is 0.0241907
After 616 training step(s),cross entropy on all data is 0.0241688
After 617 training step(s),cross entropy on all data is 0.0241428
After 618 training step(s),cross entropy on all data is 0.024113
After 619 training step(s),cross entropy on all data is 0.0240861
After 620 training step(s),cross entropy on all data is 0.0240619
After 621 training step(s),cross entropy on all data is 0.0240401
After 622 training step(s),cross entropy on all data is 0.0240205
After 623 training step(s),cross entropy on all data is 0.0240028
After 624 training step(s),cross entropy on all data is 0.0239869
After 625 training step(s),cross entropy on all data is 0.0239661
After 626 training step(s),cross entropy on all data is 0.0239474
After 627 training step(s),cross entropy on all data is 0.0239306
After 628 training step(s),cross entropy on all data is 0.0239154
After 629 training step(s),cross entropy on all data is 0.0239017
After 630 training step(s),cross entropy on all data is 0.0238894
After 631 training step(s),cross entropy on all data is 0.023872
After 632 training step(s),cross entropy on all data is 0.02385
After 633 training step(s),cross entropy on all data is 0.0238239
After 634 training step(s),cross entropy on all data is 0.023794
After 635 training step(s),cross entropy on all data is 0.023767
After 636 training step(s),cross entropy on all data is 0.0237427
After 637 training step(s),cross entropy on all data is 0.0237209
After 638 training step(s),cross entropy on all data is 0.0237012
After 639 training step(s),cross entropy on all data is 0.0236834
After 640 training step(s),cross entropy on all data is 0.0236674
After 641 training step(s),cross entropy on all data is 0.0236466
After 642 training step(s),cross entropy on all data is 0.0236278
After 643 training step(s),cross entropy on all data is 0.0236109
After 644 training step(s),cross entropy on all data is 0.0235957
After 645 training step(s),cross entropy on all data is 0.023582
After 646 training step(s),cross entropy on all data is 0.0235696
After 647 training step(s),cross entropy on all data is 0.0235522
After 648 training step(s),cross entropy on all data is 0.0235301
After 649 training step(s),cross entropy on all data is 0.0235039
After 650 training step(s),cross entropy on all data is 0.0234739
After 651 training step(s),cross entropy on all data is 0.0234468
After 652 training step(s),cross entropy on all data is 0.0234225
After 653 training step(s),cross entropy on all data is 0.0234005
After 654 training step(s),cross entropy on all data is 0.0233807
After 655 training step(s),cross entropy on all data is 0.0233629
After 656 training step(s),cross entropy on all data is 0.0233469
After 657 training step(s),cross entropy on all data is 0.023326
After 658 training step(s),cross entropy on all data is 0.0233072
After 659 training step(s),cross entropy on all data is 0.0232902
After 660 training step(s),cross entropy on all data is 0.0232749
After 661 training step(s),cross entropy on all data is 0.0232612
After 662 training step(s),cross entropy on all data is 0.0232488
After 663 training step(s),cross entropy on all data is 0.0232313
After 664 training step(s),cross entropy on all data is 0.0232091
After 665 training step(s),cross entropy on all data is 0.0231829
After 666 training step(s),cross entropy on all data is 0.0231527
After 667 training step(s),cross entropy on all data is 0.0231256
After 668 training step(s),cross entropy on all data is 0.0231011
After 669 training step(s),cross entropy on all data is 0.0230791
After 670 training step(s),cross entropy on all data is 0.0230593
After 671 training step(s),cross entropy on all data is 0.0230414
After 672 training step(s),cross entropy on all data is 0.0230253
After 673 training step(s),cross entropy on all data is 0.0230044
After 674 training step(s),cross entropy on all data is 0.0229855
After 675 training step(s),cross entropy on all data is 0.0229685
After 676 training step(s),cross entropy on all data is 0.0229532
After 677 training step(s),cross entropy on all data is 0.0229394
After 678 training step(s),cross entropy on all data is 0.0229269
After 679 training step(s),cross entropy on all data is 0.0229093
After 680 training step(s),cross entropy on all data is 0.0228871
After 681 training step(s),cross entropy on all data is 0.0228608
After 682 training step(s),cross entropy on all data is 0.0228306
After 683 training step(s),cross entropy on all data is 0.0228033
After 684 training step(s),cross entropy on all data is 0.0227788
After 685 training step(s),cross entropy on all data is 0.0227567
After 686 training step(s),cross entropy on all data is 0.0227368
After 687 training step(s),cross entropy on all data is 0.0227189
After 688 training step(s),cross entropy on all data is 0.0227028
After 689 training step(s),cross entropy on all data is 0.0226818
After 690 training step(s),cross entropy on all data is 0.0226628
After 691 training step(s),cross entropy on all data is 0.0226458
After 692 training step(s),cross entropy on all data is 0.0226304
After 693 training step(s),cross entropy on all data is 0.0226166
After 694 training step(s),cross entropy on all data is 0.0226041
After 695 training step(s),cross entropy on all data is 0.0225865
After 696 training step(s),cross entropy on all data is 0.0225642
After 697 training step(s),cross entropy on all data is 0.0225378
After 698 training step(s),cross entropy on all data is 0.0225075
After 699 training step(s),cross entropy on all data is 0.0224802
After 700 training step(s),cross entropy on all data is 0.0224556
After 701 training step(s),cross entropy on all data is 0.0224335
After 702 training step(s),cross entropy on all data is 0.0224135
After 703 training step(s),cross entropy on all data is 0.0223956
After 704 training step(s),cross entropy on all data is 0.0223794
After 705 training step(s),cross entropy on all data is 0.0223583
After 706 training step(s),cross entropy on all data is 0.0223393
After 707 training step(s),cross entropy on all data is 0.0223223
After 708 training step(s),cross entropy on all data is 0.0223069
After 709 training step(s),cross entropy on all data is 0.022293
After 710 training step(s),cross entropy on all data is 0.0222805
After 711 training step(s),cross entropy on all data is 0.0222628
After 712 training step(s),cross entropy on all data is 0.0222405
After 713 training step(s),cross entropy on all data is 0.022214
After 714 training step(s),cross entropy on all data is 0.0221836
After 715 training step(s),cross entropy on all data is 0.0221562
After 716 training step(s),cross entropy on all data is 0.0221316
After 717 training step(s),cross entropy on all data is 0.0221094
After 718 training step(s),cross entropy on all data is 0.0220894
After 719 training step(s),cross entropy on all data is 0.0220714
After 720 training step(s),cross entropy on all data is 0.0220552
After 721 training step(s),cross entropy on all data is 0.022034
After 722 training step(s),cross entropy on all data is 0.022015
After 723 training step(s),cross entropy on all data is 0.0219979
After 724 training step(s),cross entropy on all data is 0.0219825
After 725 training step(s),cross entropy on all data is 0.0219686
After 726 training step(s),cross entropy on all data is 0.0219561
After 727 training step(s),cross entropy on all data is 0.0219383
After 728 training step(s),cross entropy on all data is 0.0219159
After 729 training step(s),cross entropy on all data is 0.0218894
After 730 training step(s),cross entropy on all data is 0.0218589
After 731 training step(s),cross entropy on all data is 0.0218315
After 732 training step(s),cross entropy on all data is 0.0218068
After 733 training step(s),cross entropy on all data is 0.0217845
After 734 training step(s),cross entropy on all data is 0.0217645
After 735 training step(s),cross entropy on all data is 0.0217465
After 736 training step(s),cross entropy on all data is 0.0217302
After 737 training step(s),cross entropy on all data is 0.0217091
After 738 training step(s),cross entropy on all data is 0.02169
After 739 training step(s),cross entropy on all data is 0.0216728
After 740 training step(s),cross entropy on all data is 0.0216574
After 741 training step(s),cross entropy on all data is 0.0216435
After 742 training step(s),cross entropy on all data is 0.0216309
After 743 training step(s),cross entropy on all data is 0.0216131
After 744 training step(s),cross entropy on all data is 0.0215907
After 745 training step(s),cross entropy on all data is 0.0215641
After 746 training step(s),cross entropy on all data is 0.0215336
After 747 training step(s),cross entropy on all data is 0.0215061
After 748 training step(s),cross entropy on all data is 0.0214813
After 749 training step(s),cross entropy on all data is 0.021459
After 750 training step(s),cross entropy on all data is 0.021439
After 751 training step(s),cross entropy on all data is 0.0214209
After 752 training step(s),cross entropy on all data is 0.0214046
After 753 training step(s),cross entropy on all data is 0.0213834
After 754 training step(s),cross entropy on all data is 0.0213643
After 755 training step(s),cross entropy on all data is 0.0213471
After 756 training step(s),cross entropy on all data is 0.0213316
After 757 training step(s),cross entropy on all data is 0.0213177
After 758 training step(s),cross entropy on all data is 0.0213051
After 759 training step(s),cross entropy on all data is 0.0212873
After 760 training step(s),cross entropy on all data is 0.0212648
After 761 training step(s),cross entropy on all data is 0.0212381
After 762 training step(s),cross entropy on all data is 0.0212076
After 763 training step(s),cross entropy on all data is 0.02118
After 764 training step(s),cross entropy on all data is 0.0211552
After 765 training step(s),cross entropy on all data is 0.0211329
After 766 training step(s),cross entropy on all data is 0.0211128
After 767 training step(s),cross entropy on all data is 0.0210947
After 768 training step(s),cross entropy on all data is 0.0210784
After 769 training step(s),cross entropy on all data is 0.0210571
After 770 training step(s),cross entropy on all data is 0.021038
After 771 training step(s),cross entropy on all data is 0.0210208
After 772 training step(s),cross entropy on all data is 0.0210053
After 773 training step(s),cross entropy on all data is 0.0209913
After 774 training step(s),cross entropy on all data is 0.0209787
After 775 training step(s),cross entropy on all data is 0.0209609
After 776 training step(s),cross entropy on all data is 0.0209384
After 777 training step(s),cross entropy on all data is 0.0209117
After 778 training step(s),cross entropy on all data is 0.020881
After 779 training step(s),cross entropy on all data is 0.0208535
After 780 training step(s),cross entropy on all data is 0.0208286
After 781 training step(s),cross entropy on all data is 0.0208062
After 782 training step(s),cross entropy on all data is 0.0207861
After 783 training step(s),cross entropy on all data is 0.020768
After 784 training step(s),cross entropy on all data is 0.0207516
After 785 training step(s),cross entropy on all data is 0.0207304
After 786 training step(s),cross entropy on all data is 0.0207112
After 787 training step(s),cross entropy on all data is 0.020694
After 788 training step(s),cross entropy on all data is 0.0206784
After 789 training step(s),cross entropy on all data is 0.0206644
After 790 training step(s),cross entropy on all data is 0.0206518
After 791 training step(s),cross entropy on all data is 0.020634
After 792 training step(s),cross entropy on all data is 0.0206114
After 793 training step(s),cross entropy on all data is 0.0205846
After 794 training step(s),cross entropy on all data is 0.020554
After 795 training step(s),cross entropy on all data is 0.0205264
After 796 training step(s),cross entropy on all data is 0.0205015
After 797 training step(s),cross entropy on all data is 0.0204791
After 798 training step(s),cross entropy on all data is 0.0204589
After 799 training step(s),cross entropy on all data is 0.0204407
After 800 training step(s),cross entropy on all data is 0.0204244
After 801 training step(s),cross entropy on all data is 0.0204031
After 802 training step(s),cross entropy on all data is 0.0203839
After 803 training step(s),cross entropy on all data is 0.0203667
After 804 training step(s),cross entropy on all data is 0.0203511
After 805 training step(s),cross entropy on all data is 0.0203371
After 806 training step(s),cross entropy on all data is 0.0203245
After 807 training step(s),cross entropy on all data is 0.0203066
After 808 training step(s),cross entropy on all data is 0.020284
After 809 training step(s),cross entropy on all data is 0.0202572
After 810 training step(s),cross entropy on all data is 0.0202265
After 811 training step(s),cross entropy on all data is 0.0201988
After 812 training step(s),cross entropy on all data is 0.0201739
After 813 training step(s),cross entropy on all data is 0.0201515
After 814 training step(s),cross entropy on all data is 0.0201313
After 815 training step(s),cross entropy on all data is 0.0201131
After 816 training step(s),cross entropy on all data is 0.0200967
After 817 training step(s),cross entropy on all data is 0.0200754
After 818 training step(s),cross entropy on all data is 0.0200562
After 819 training step(s),cross entropy on all data is 0.020039
After 820 training step(s),cross entropy on all data is 0.0200234
After 821 training step(s),cross entropy on all data is 0.0200094
After 822 training step(s),cross entropy on all data is 0.0199967
After 823 training step(s),cross entropy on all data is 0.0199788
After 824 training step(s),cross entropy on all data is 0.0199562
After 825 training step(s),cross entropy on all data is 0.0199294
After 826 training step(s),cross entropy on all data is 0.0198986
After 827 training step(s),cross entropy on all data is 0.0198709
After 828 training step(s),cross entropy on all data is 0.019846
After 829 training step(s),cross entropy on all data is 0.0198236
After 830 training step(s),cross entropy on all data is 0.0198033
After 831 training step(s),cross entropy on all data is 0.0197851
After 832 training step(s),cross entropy on all data is 0.0197687
After 833 training step(s),cross entropy on all data is 0.0197474
After 834 training step(s),cross entropy on all data is 0.0197282
After 835 training step(s),cross entropy on all data is 0.0197109
After 836 training step(s),cross entropy on all data is 0.0196953
After 837 training step(s),cross entropy on all data is 0.0196813
After 838 training step(s),cross entropy on all data is 0.0196686
After 839 training step(s),cross entropy on all data is 0.0196507
After 840 training step(s),cross entropy on all data is 0.0196281
After 841 training step(s),cross entropy on all data is 0.0196012
After 842 training step(s),cross entropy on all data is 0.0195704
After 843 training step(s),cross entropy on all data is 0.0195427
After 844 training step(s),cross entropy on all data is 0.0195177
After 845 training step(s),cross entropy on all data is 0.0194953
After 846 training step(s),cross entropy on all data is 0.019475
After 847 training step(s),cross entropy on all data is 0.0194568
After 848 training step(s),cross entropy on all data is 0.0194404
After 849 training step(s),cross entropy on all data is 0.019419
After 850 training step(s),cross entropy on all data is 0.0193998
After 851 training step(s),cross entropy on all data is 0.0193825
After 852 training step(s),cross entropy on all data is 0.0193669
After 853 training step(s),cross entropy on all data is 0.0193529
After 854 training step(s),cross entropy on all data is 0.0193402
After 855 training step(s),cross entropy on all data is 0.0193223
After 856 training step(s),cross entropy on all data is 0.0192996
After 857 training step(s),cross entropy on all data is 0.0192727
After 858 training step(s),cross entropy on all data is 0.0192419
After 859 training step(s),cross entropy on all data is 0.0192142
After 860 training step(s),cross entropy on all data is 0.0191892
After 861 training step(s),cross entropy on all data is 0.0191667
After 862 training step(s),cross entropy on all data is 0.0191465
After 863 training step(s),cross entropy on all data is 0.0191282
After 864 training step(s),cross entropy on all data is 0.0191118
After 865 training step(s),cross entropy on all data is 0.0190905
After 866 training step(s),cross entropy on all data is 0.0190712
After 867 training step(s),cross entropy on all data is 0.0190539
After 868 training step(s),cross entropy on all data is 0.0190383
After 869 training step(s),cross entropy on all data is 0.0190242
After 870 training step(s),cross entropy on all data is 0.0190116
After 871 training step(s),cross entropy on all data is 0.0189937
After 872 training step(s),cross entropy on all data is 0.018971
After 873 training step(s),cross entropy on all data is 0.018944
After 874 training step(s),cross entropy on all data is 0.0189132
After 875 training step(s),cross entropy on all data is 0.0188855
After 876 training step(s),cross entropy on all data is 0.0188605
After 877 training step(s),cross entropy on all data is 0.018838
After 878 training step(s),cross entropy on all data is 0.0188177
After 879 training step(s),cross entropy on all data is 0.0187995
After 880 training step(s),cross entropy on all data is 0.018783
After 881 training step(s),cross entropy on all data is 0.0187617
After 882 training step(s),cross entropy on all data is 0.0187424
After 883 training step(s),cross entropy on all data is 0.0187251
After 884 training step(s),cross entropy on all data is 0.0187095
After 885 training step(s),cross entropy on all data is 0.0186954
After 886 training step(s),cross entropy on all data is 0.0186828
After 887 training step(s),cross entropy on all data is 0.0186648
After 888 training step(s),cross entropy on all data is 0.0186421
After 889 training step(s),cross entropy on all data is 0.0186152
After 890 training step(s),cross entropy on all data is 0.0185843
After 891 training step(s),cross entropy on all data is 0.0185566
After 892 training step(s),cross entropy on all data is 0.0185316
After 893 training step(s),cross entropy on all data is 0.0185091
After 894 training step(s),cross entropy on all data is 0.0184888
After 895 training step(s),cross entropy on all data is 0.0184705
After 896 training step(s),cross entropy on all data is 0.0184541
After 897 training step(s),cross entropy on all data is 0.0184327
After 898 training step(s),cross entropy on all data is 0.0184135
After 899 training step(s),cross entropy on all data is 0.0183961
After 900 training step(s),cross entropy on all data is 0.0183805
After 901 training step(s),cross entropy on all data is 0.0183664
After 902 training step(s),cross entropy on all data is 0.0183538
After 903 training step(s),cross entropy on all data is 0.0183358
After 904 training step(s),cross entropy on all data is 0.0183131
After 905 training step(s),cross entropy on all data is 0.0182861
After 906 training step(s),cross entropy on all data is 0.0182553
After 907 training step(s),cross entropy on all data is 0.0182275
After 908 training step(s),cross entropy on all data is 0.0182025
After 909 training step(s),cross entropy on all data is 0.01818
After 910 training step(s),cross entropy on all data is 0.0181597
After 911 training step(s),cross entropy on all data is 0.0181415
After 912 training step(s),cross entropy on all data is 0.018125
After 913 training step(s),cross entropy on all data is 0.0181036
After 914 training step(s),cross entropy on all data is 0.0180844
After 915 training step(s),cross entropy on all data is 0.018067
After 916 training step(s),cross entropy on all data is 0.0180514
After 917 training step(s),cross entropy on all data is 0.0180374
After 918 training step(s),cross entropy on all data is 0.0180247
After 919 training step(s),cross entropy on all data is 0.0180067
After 920 training step(s),cross entropy on all data is 0.017984
After 921 training step(s),cross entropy on all data is 0.017957
After 922 training step(s),cross entropy on all data is 0.0179262
After 923 training step(s),cross entropy on all data is 0.0178984
After 924 training step(s),cross entropy on all data is 0.0178734
After 925 training step(s),cross entropy on all data is 0.0178509
After 926 training step(s),cross entropy on all data is 0.0178306
After 927 training step(s),cross entropy on all data is 0.0178123
After 928 training step(s),cross entropy on all data is 0.0177959
After 929 training step(s),cross entropy on all data is 0.0177745
After 930 training step(s),cross entropy on all data is 0.0177552
After 931 training step(s),cross entropy on all data is 0.0177379
After 932 training step(s),cross entropy on all data is 0.0177223
After 933 training step(s),cross entropy on all data is 0.0177082
After 934 training step(s),cross entropy on all data is 0.0176956
After 935 training step(s),cross entropy on all data is 0.0176776
After 936 training step(s),cross entropy on all data is 0.0176549
After 937 training step(s),cross entropy on all data is 0.0176279
After 938 training step(s),cross entropy on all data is 0.017597
After 939 training step(s),cross entropy on all data is 0.0175692
After 940 training step(s),cross entropy on all data is 0.0175442
After 941 training step(s),cross entropy on all data is 0.0175217
After 942 training step(s),cross entropy on all data is 0.0175014
After 943 training step(s),cross entropy on all data is 0.0174831
After 944 training step(s),cross entropy on all data is 0.0174667
After 945 training step(s),cross entropy on all data is 0.0174453
After 946 training step(s),cross entropy on all data is 0.0174261
After 947 training step(s),cross entropy on all data is 0.0174087
After 948 training step(s),cross entropy on all data is 0.0173931
After 949 training step(s),cross entropy on all data is 0.017379
After 950 training step(s),cross entropy on all data is 0.0173664
After 951 training step(s),cross entropy on all data is 0.0173484
After 952 training step(s),cross entropy on all data is 0.0173257
After 953 training step(s),cross entropy on all data is 0.0172987
After 954 training step(s),cross entropy on all data is 0.0172679
After 955 training step(s),cross entropy on all data is 0.0172401
After 956 training step(s),cross entropy on all data is 0.0172151
After 957 training step(s),cross entropy on all data is 0.0171925
After 958 training step(s),cross entropy on all data is 0.0171723
After 959 training step(s),cross entropy on all data is 0.017154
After 960 training step(s),cross entropy on all data is 0.0171375
After 961 training step(s),cross entropy on all data is 0.0171162
After 962 training step(s),cross entropy on all data is 0.0170969
After 963 training step(s),cross entropy on all data is 0.0170796
After 964 training step(s),cross entropy on all data is 0.017064
After 965 training step(s),cross entropy on all data is 0.0170499
After 966 training step(s),cross entropy on all data is 0.0170372
After 967 training step(s),cross entropy on all data is 0.0170193
After 968 training step(s),cross entropy on all data is 0.0169966
After 969 training step(s),cross entropy on all data is 0.0169696
After 970 training step(s),cross entropy on all data is 0.0169387
After 971 training step(s),cross entropy on all data is 0.0169109
After 972 training step(s),cross entropy on all data is 0.0168859
After 973 training step(s),cross entropy on all data is 0.0168634
After 974 training step(s),cross entropy on all data is 0.0168431
After 975 training step(s),cross entropy on all data is 0.0168249
After 976 training step(s),cross entropy on all data is 0.0168084
After 977 training step(s),cross entropy on all data is 0.016787
After 978 training step(s),cross entropy on all data is 0.0167678
After 979 training step(s),cross entropy on all data is 0.0167505
After 980 training step(s),cross entropy on all data is 0.0167349
After 981 training step(s),cross entropy on all data is 0.0167208
After 982 training step(s),cross entropy on all data is 0.0167082
After 983 training step(s),cross entropy on all data is 0.0166902
After 984 training step(s),cross entropy on all data is 0.0166675
After 985 training step(s),cross entropy on all data is 0.0166405
After 986 training step(s),cross entropy on all data is 0.0166097
After 987 training step(s),cross entropy on all data is 0.0165819
After 988 training step(s),cross entropy on all data is 0.0165569
After 989 training step(s),cross entropy on all data is 0.0165344
After 990 training step(s),cross entropy on all data is 0.0165141
After 991 training step(s),cross entropy on all data is 0.0164958
After 992 training step(s),cross entropy on all data is 0.0164794
After 993 training step(s),cross entropy on all data is 0.016458
After 994 training step(s),cross entropy on all data is 0.0164388
After 995 training step(s),cross entropy on all data is 0.0164215
After 996 training step(s),cross entropy on all data is 0.0164059
After 997 training step(s),cross entropy on all data is 0.0163918
After 998 training step(s),cross entropy on all data is 0.0163792
After 999 training step(s),cross entropy on all data is 0.0163612
After 1000 training step(s),cross entropy on all data is 0.0163385
After 1001 training step(s),cross entropy on all data is 0.0163115
After 1002 training step(s),cross entropy on all data is 0.0162807
After 1003 training step(s),cross entropy on all data is 0.0162529
After 1004 training step(s),cross entropy on all data is 0.0162279
After 1005 training step(s),cross entropy on all data is 0.0162054
After 1006 training step(s),cross entropy on all data is 0.0161852
After 1007 training step(s),cross entropy on all data is 0.0161669
After 1008 training step(s),cross entropy on all data is 0.0161505
After 1009 training step(s),cross entropy on all data is 0.0161291
After 1010 training step(s),cross entropy on all data is 0.0161099
After 1011 training step(s),cross entropy on all data is 0.0160926
After 1012 training step(s),cross entropy on all data is 0.016077
After 1013 training step(s),cross entropy on all data is 0.016063
After 1014 training step(s),cross entropy on all data is 0.0160503
After 1015 training step(s),cross entropy on all data is 0.0160324
After 1016 training step(s),cross entropy on all data is 0.0160097
After 1017 training step(s),cross entropy on all data is 0.0159827
After 1018 training step(s),cross entropy on all data is 0.0159551
After 1019 training step(s),cross entropy on all data is 0.0159329
After 1020 training step(s),cross entropy on all data is 0.0159129
After 1021 training step(s),cross entropy on all data is 0.0158949
After 1022 training step(s),cross entropy on all data is 0.0158787
After 1023 training step(s),cross entropy on all data is 0.0158641
After 1024 training step(s),cross entropy on all data is 0.0158509
After 1025 training step(s),cross entropy on all data is 0.015834
After 1026 training step(s),cross entropy on all data is 0.0158188
After 1027 training step(s),cross entropy on all data is 0.0158051
After 1028 training step(s),cross entropy on all data is 0.0157928
After 1029 training step(s),cross entropy on all data is 0.0157816
After 1030 training step(s),cross entropy on all data is 0.0157716
After 1031 training step(s),cross entropy on all data is 0.0157573
After 1032 training step(s),cross entropy on all data is 0.0157389
After 1033 training step(s),cross entropy on all data is 0.0157169
After 1034 training step(s),cross entropy on all data is 0.0156971
After 1035 training step(s),cross entropy on all data is 0.0156793
After 1036 training step(s),cross entropy on all data is 0.0156632
After 1037 training step(s),cross entropy on all data is 0.0156488
After 1038 training step(s),cross entropy on all data is 0.0156357
After 1039 training step(s),cross entropy on all data is 0.015624
After 1040 training step(s),cross entropy on all data is 0.0156135
After 1041 training step(s),cross entropy on all data is 0.0155989
After 1042 training step(s),cross entropy on all data is 0.0155857
After 1043 training step(s),cross entropy on all data is 0.0155739
After 1044 training step(s),cross entropy on all data is 0.0155632
After 1045 training step(s),cross entropy on all data is 0.0155536
After 1046 training step(s),cross entropy on all data is 0.015545
After 1047 training step(s),cross entropy on all data is 0.0155319
After 1048 training step(s),cross entropy on all data is 0.0155146
After 1049 training step(s),cross entropy on all data is 0.0154936
After 1050 training step(s),cross entropy on all data is 0.0154747
After 1051 training step(s),cross entropy on all data is 0.0154576
After 1052 training step(s),cross entropy on all data is 0.0154423
After 1053 training step(s),cross entropy on all data is 0.0154284
After 1054 training step(s),cross entropy on all data is 0.015416
After 1055 training step(s),cross entropy on all data is 0.0154048
After 1056 training step(s),cross entropy on all data is 0.0153947
After 1057 training step(s),cross entropy on all data is 0.0153805
After 1058 training step(s),cross entropy on all data is 0.0153677
After 1059 training step(s),cross entropy on all data is 0.0153562
After 1060 training step(s),cross entropy on all data is 0.0153459
After 1061 training step(s),cross entropy on all data is 0.0153365
After 1062 training step(s),cross entropy on all data is 0.0153281
After 1063 training step(s),cross entropy on all data is 0.0153152
After 1064 training step(s),cross entropy on all data is 0.0152981
After 1065 training step(s),cross entropy on all data is 0.0152772
After 1066 training step(s),cross entropy on all data is 0.0152584
After 1067 training step(s),cross entropy on all data is 0.0152415
After 1068 training step(s),cross entropy on all data is 0.0152263
After 1069 training step(s),cross entropy on all data is 0.0152125
After 1070 training step(s),cross entropy on all data is 0.0152002
After 1071 training step(s),cross entropy on all data is 0.0151891
After 1072 training step(s),cross entropy on all data is 0.015179
After 1073 training step(s),cross entropy on all data is 0.0151649
After 1074 training step(s),cross entropy on all data is 0.0151522
After 1075 training step(s),cross entropy on all data is 0.0151407
After 1076 training step(s),cross entropy on all data is 0.0151304
After 1077 training step(s),cross entropy on all data is 0.0151211
After 1078 training step(s),cross entropy on all data is 0.0151127
After 1079 training step(s),cross entropy on all data is 0.0150998
After 1080 training step(s),cross entropy on all data is 0.0150827
After 1081 training step(s),cross entropy on all data is 0.0150619
After 1082 training step(s),cross entropy on all data is 0.0150431
After 1083 training step(s),cross entropy on all data is 0.0150261
After 1084 training step(s),cross entropy on all data is 0.0150109
After 1085 training step(s),cross entropy on all data is 0.0149972
After 1086 training step(s),cross entropy on all data is 0.0149848
After 1087 training step(s),cross entropy on all data is 0.0149737
After 1088 training step(s),cross entropy on all data is 0.0149637
After 1089 training step(s),cross entropy on all data is 0.0149495
After 1090 training step(s),cross entropy on all data is 0.0149368
After 1091 training step(s),cross entropy on all data is 0.0149253
After 1092 training step(s),cross entropy on all data is 0.014915
After 1093 training step(s),cross entropy on all data is 0.0149057
After 1094 training step(s),cross entropy on all data is 0.0148973
After 1095 training step(s),cross entropy on all data is 0.0148844
After 1096 training step(s),cross entropy on all data is 0.0148673
After 1097 training step(s),cross entropy on all data is 0.0148464
After 1098 training step(s),cross entropy on all data is 0.0148275
After 1099 training step(s),cross entropy on all data is 0.0148106
After 1100 training step(s),cross entropy on all data is 0.0147953
After 1101 training step(s),cross entropy on all data is 0.0147816
After 1102 training step(s),cross entropy on all data is 0.0147692
After 1103 training step(s),cross entropy on all data is 0.0147581
After 1104 training step(s),cross entropy on all data is 0.014748
After 1105 training step(s),cross entropy on all data is 0.0147339
After 1106 training step(s),cross entropy on all data is 0.0147211
After 1107 training step(s),cross entropy on all data is 0.0147096
After 1108 training step(s),cross entropy on all data is 0.0146993
After 1109 training step(s),cross entropy on all data is 0.01469
After 1110 training step(s),cross entropy on all data is 0.0146816
After 1111 training step(s),cross entropy on all data is 0.0146686
After 1112 training step(s),cross entropy on all data is 0.0146515
After 1113 training step(s),cross entropy on all data is 0.0146306
After 1114 training step(s),cross entropy on all data is 0.0146117
After 1115 training step(s),cross entropy on all data is 0.0145947
After 1116 training step(s),cross entropy on all data is 0.0145833
After 1117 training step(s),cross entropy on all data is 0.0145731
After 1118 training step(s),cross entropy on all data is 0.0145639
After 1119 training step(s),cross entropy on all data is 0.0145556
After 1120 training step(s),cross entropy on all data is 0.0145481
After 1121 training step(s),cross entropy on all data is 0.0145375
After 1122 training step(s),cross entropy on all data is 0.0145279
After 1123 training step(s),cross entropy on all data is 0.0145193
After 1124 training step(s),cross entropy on all data is 0.0145116
After 1125 training step(s),cross entropy on all data is 0.0145046
After 1126 training step(s),cross entropy on all data is 0.0144983
After 1127 training step(s),cross entropy on all data is 0.0144886
After 1128 training step(s),cross entropy on all data is 0.0144799
After 1129 training step(s),cross entropy on all data is 0.0144679
After 1130 training step(s),cross entropy on all data is 0.0144572
After 1131 training step(s),cross entropy on all data is 0.0144475
After 1132 training step(s),cross entropy on all data is 0.0144388
After 1133 training step(s),cross entropy on all data is 0.014431
After 1134 training step(s),cross entropy on all data is 0.0144239
After 1135 training step(s),cross entropy on all data is 0.0144175
After 1136 training step(s),cross entropy on all data is 0.0144118
After 1137 training step(s),cross entropy on all data is 0.0144027
After 1138 training step(s),cross entropy on all data is 0.0143945
After 1139 training step(s),cross entropy on all data is 0.0143872
After 1140 training step(s),cross entropy on all data is 0.0143805
After 1141 training step(s),cross entropy on all data is 0.0143746
After 1142 training step(s),cross entropy on all data is 0.0143692
After 1143 training step(s),cross entropy on all data is 0.0143603
After 1144 training step(s),cross entropy on all data is 0.0143523
After 1145 training step(s),cross entropy on all data is 0.014341
After 1146 training step(s),cross entropy on all data is 0.0143309
After 1147 training step(s),cross entropy on all data is 0.0143217
After 1148 training step(s),cross entropy on all data is 0.0143135
After 1149 training step(s),cross entropy on all data is 0.014306
After 1150 training step(s),cross entropy on all data is 0.0142993
After 1151 training step(s),cross entropy on all data is 0.0142933
After 1152 training step(s),cross entropy on all data is 0.0142879
After 1153 training step(s),cross entropy on all data is 0.0142791
After 1154 training step(s),cross entropy on all data is 0.0142711
After 1155 training step(s),cross entropy on all data is 0.014264
After 1156 training step(s),cross entropy on all data is 0.0142575
After 1157 training step(s),cross entropy on all data is 0.0142517
After 1158 training step(s),cross entropy on all data is 0.0142465
After 1159 training step(s),cross entropy on all data is 0.0142378
After 1160 training step(s),cross entropy on all data is 0.0142299
After 1161 training step(s),cross entropy on all data is 0.0142187
After 1162 training step(s),cross entropy on all data is 0.0142086
After 1163 training step(s),cross entropy on all data is 0.0141995
After 1164 training step(s),cross entropy on all data is 0.0141913
After 1165 training step(s),cross entropy on all data is 0.0141839
After 1166 training step(s),cross entropy on all data is 0.0141773
After 1167 training step(s),cross entropy on all data is 0.0141713
After 1168 training step(s),cross entropy on all data is 0.0141659
After 1169 training step(s),cross entropy on all data is 0.0141571
After 1170 training step(s),cross entropy on all data is 0.0141492
After 1171 training step(s),cross entropy on all data is 0.0141421
After 1172 training step(s),cross entropy on all data is 0.0141356
After 1173 training step(s),cross entropy on all data is 0.0141299
After 1174 training step(s),cross entropy on all data is 0.0141246
After 1175 training step(s),cross entropy on all data is 0.0141159
After 1176 training step(s),cross entropy on all data is 0.014108
After 1177 training step(s),cross entropy on all data is 0.0140968
After 1178 training step(s),cross entropy on all data is 0.0140867
After 1179 training step(s),cross entropy on all data is 0.0140776
After 1180 training step(s),cross entropy on all data is 0.0140694
After 1181 training step(s),cross entropy on all data is 0.014062
After 1182 training step(s),cross entropy on all data is 0.0140553
After 1183 training step(s),cross entropy on all data is 0.0140493
After 1184 training step(s),cross entropy on all data is 0.014044
After 1185 training step(s),cross entropy on all data is 0.0140351
After 1186 training step(s),cross entropy on all data is 0.0140272
After 1187 training step(s),cross entropy on all data is 0.01402
After 1188 training step(s),cross entropy on all data is 0.0140136
After 1189 training step(s),cross entropy on all data is 0.0140078
After 1190 training step(s),cross entropy on all data is 0.0140026
After 1191 training step(s),cross entropy on all data is 0.0139938
After 1192 training step(s),cross entropy on all data is 0.0139859
After 1193 training step(s),cross entropy on all data is 0.0139746
After 1194 training step(s),cross entropy on all data is 0.0139645
After 1195 training step(s),cross entropy on all data is 0.0139553
After 1196 training step(s),cross entropy on all data is 0.0139471
After 1197 training step(s),cross entropy on all data is 0.0139397
After 1198 training step(s),cross entropy on all data is 0.013933
After 1199 training step(s),cross entropy on all data is 0.013927
After 1200 training step(s),cross entropy on all data is 0.0139216
After 1201 training step(s),cross entropy on all data is 0.0139128
After 1202 training step(s),cross entropy on all data is 0.0139048
After 1203 training step(s),cross entropy on all data is 0.0138976
After 1204 training step(s),cross entropy on all data is 0.0138911
After 1205 training step(s),cross entropy on all data is 0.0138853
After 1206 training step(s),cross entropy on all data is 0.0138801
After 1207 training step(s),cross entropy on all data is 0.0138713
After 1208 training step(s),cross entropy on all data is 0.0138633
After 1209 training step(s),cross entropy on all data is 0.013852
After 1210 training step(s),cross entropy on all data is 0.0138418
After 1211 training step(s),cross entropy on all data is 0.0138327
After 1212 training step(s),cross entropy on all data is 0.0138244
After 1213 training step(s),cross entropy on all data is 0.013817
After 1214 training step(s),cross entropy on all data is 0.0138103
After 1215 training step(s),cross entropy on all data is 0.0138043
After 1216 training step(s),cross entropy on all data is 0.0137988
After 1217 training step(s),cross entropy on all data is 0.01379
After 1218 training step(s),cross entropy on all data is 0.013782
After 1219 training step(s),cross entropy on all data is 0.0137748
After 1220 training step(s),cross entropy on all data is 0.0137683
After 1221 training step(s),cross entropy on all data is 0.0137624
After 1222 training step(s),cross entropy on all data is 0.0137572
After 1223 training step(s),cross entropy on all data is 0.0137483
After 1224 training step(s),cross entropy on all data is 0.0137404
After 1225 training step(s),cross entropy on all data is 0.013729
After 1226 training step(s),cross entropy on all data is 0.0137188
After 1227 training step(s),cross entropy on all data is 0.0137096
After 1228 training step(s),cross entropy on all data is 0.0137013
After 1229 training step(s),cross entropy on all data is 0.0136939
After 1230 training step(s),cross entropy on all data is 0.0136872
After 1231 training step(s),cross entropy on all data is 0.0136811
After 1232 training step(s),cross entropy on all data is 0.0136757
After 1233 training step(s),cross entropy on all data is 0.0136667
After 1234 training step(s),cross entropy on all data is 0.0136587
After 1235 training step(s),cross entropy on all data is 0.0136515
After 1236 training step(s),cross entropy on all data is 0.013645
After 1237 training step(s),cross entropy on all data is 0.0136391
After 1238 training step(s),cross entropy on all data is 0.0136339
After 1239 training step(s),cross entropy on all data is 0.013625
After 1240 training step(s),cross entropy on all data is 0.013617
After 1241 training step(s),cross entropy on all data is 0.0136056
After 1242 training step(s),cross entropy on all data is 0.0135954
After 1243 training step(s),cross entropy on all data is 0.0135861
After 1244 training step(s),cross entropy on all data is 0.0135778
After 1245 training step(s),cross entropy on all data is 0.0135703
After 1246 training step(s),cross entropy on all data is 0.0135636
After 1247 training step(s),cross entropy on all data is 0.0135575
After 1248 training step(s),cross entropy on all data is 0.0135521
After 1249 training step(s),cross entropy on all data is 0.0135431
After 1250 training step(s),cross entropy on all data is 0.0135351
After 1251 training step(s),cross entropy on all data is 0.0135278
After 1252 training step(s),cross entropy on all data is 0.0135213
After 1253 training step(s),cross entropy on all data is 0.0135154
After 1254 training step(s),cross entropy on all data is 0.0135101
After 1255 training step(s),cross entropy on all data is 0.0135012
After 1256 training step(s),cross entropy on all data is 0.0134932
After 1257 training step(s),cross entropy on all data is 0.0134818
After 1258 training step(s),cross entropy on all data is 0.0134715
After 1259 training step(s),cross entropy on all data is 0.0134622
After 1260 training step(s),cross entropy on all data is 0.0134539
After 1261 training step(s),cross entropy on all data is 0.0134464
After 1262 training step(s),cross entropy on all data is 0.0134396
After 1263 training step(s),cross entropy on all data is 0.0134336
After 1264 training step(s),cross entropy on all data is 0.0134281
After 1265 training step(s),cross entropy on all data is 0.0134191
After 1266 training step(s),cross entropy on all data is 0.013411
After 1267 training step(s),cross entropy on all data is 0.0134038
After 1268 training step(s),cross entropy on all data is 0.0133972
After 1269 training step(s),cross entropy on all data is 0.0133913
After 1270 training step(s),cross entropy on all data is 0.013386
After 1271 training step(s),cross entropy on all data is 0.0133771
After 1272 training step(s),cross entropy on all data is 0.013369
After 1273 training step(s),cross entropy on all data is 0.0133576
After 1274 training step(s),cross entropy on all data is 0.0133473
After 1275 training step(s),cross entropy on all data is 0.013338
After 1276 training step(s),cross entropy on all data is 0.0133296
After 1277 training step(s),cross entropy on all data is 0.0133221
After 1278 training step(s),cross entropy on all data is 0.0133153
After 1279 training step(s),cross entropy on all data is 0.0133092
After 1280 training step(s),cross entropy on all data is 0.0133037
After 1281 training step(s),cross entropy on all data is 0.0132947
After 1282 training step(s),cross entropy on all data is 0.0132866
After 1283 training step(s),cross entropy on all data is 0.0132793
After 1284 training step(s),cross entropy on all data is 0.0132727
After 1285 training step(s),cross entropy on all data is 0.0132668
After 1286 training step(s),cross entropy on all data is 0.0132615
After 1287 training step(s),cross entropy on all data is 0.0132525
After 1288 training step(s),cross entropy on all data is 0.0132445
After 1289 training step(s),cross entropy on all data is 0.013233
After 1290 training step(s),cross entropy on all data is 0.0132226
After 1291 training step(s),cross entropy on all data is 0.0132133
After 1292 training step(s),cross entropy on all data is 0.0132049
After 1293 training step(s),cross entropy on all data is 0.0131974
After 1294 training step(s),cross entropy on all data is 0.0131906
After 1295 training step(s),cross entropy on all data is 0.0131845
After 1296 training step(s),cross entropy on all data is 0.0131789
After 1297 training step(s),cross entropy on all data is 0.0131699
After 1298 training step(s),cross entropy on all data is 0.0131618
After 1299 training step(s),cross entropy on all data is 0.0131545
After 1300 training step(s),cross entropy on all data is 0.0131479
After 1301 training step(s),cross entropy on all data is 0.013142
After 1302 training step(s),cross entropy on all data is 0.0131366
After 1303 training step(s),cross entropy on all data is 0.0131276
After 1304 training step(s),cross entropy on all data is 0.0131195
After 1305 training step(s),cross entropy on all data is 0.013108
After 1306 training step(s),cross entropy on all data is 0.0130976
After 1307 training step(s),cross entropy on all data is 0.0130883
After 1308 training step(s),cross entropy on all data is 0.0130799
After 1309 training step(s),cross entropy on all data is 0.0130723
After 1310 training step(s),cross entropy on all data is 0.0130655
After 1311 training step(s),cross entropy on all data is 0.0130594
After 1312 training step(s),cross entropy on all data is 0.0130538
After 1313 training step(s),cross entropy on all data is 0.0130448
After 1314 training step(s),cross entropy on all data is 0.0130366
After 1315 training step(s),cross entropy on all data is 0.0130293
After 1316 training step(s),cross entropy on all data is 0.0130227
After 1317 training step(s),cross entropy on all data is 0.0130167
After 1318 training step(s),cross entropy on all data is 0.0130114
After 1319 training step(s),cross entropy on all data is 0.0130024
After 1320 training step(s),cross entropy on all data is 0.0129942
After 1321 training step(s),cross entropy on all data is 0.0129827
After 1322 training step(s),cross entropy on all data is 0.0129723
After 1323 training step(s),cross entropy on all data is 0.0129629
After 1324 training step(s),cross entropy on all data is 0.0129545
After 1325 training step(s),cross entropy on all data is 0.0129469
After 1326 training step(s),cross entropy on all data is 0.0129401
After 1327 training step(s),cross entropy on all data is 0.0129339
After 1328 training step(s),cross entropy on all data is 0.0129284
After 1329 training step(s),cross entropy on all data is 0.0129193
After 1330 training step(s),cross entropy on all data is 0.0129111
After 1331 training step(s),cross entropy on all data is 0.0129038
After 1332 training step(s),cross entropy on all data is 0.0128971
After 1333 training step(s),cross entropy on all data is 0.0128912
After 1334 training step(s),cross entropy on all data is 0.0128858
After 1335 training step(s),cross entropy on all data is 0.0128768
After 1336 training step(s),cross entropy on all data is 0.0128686
After 1337 training step(s),cross entropy on all data is 0.012857
After 1338 training step(s),cross entropy on all data is 0.0128466
After 1339 training step(s),cross entropy on all data is 0.0128372
After 1340 training step(s),cross entropy on all data is 0.0128288
After 1341 training step(s),cross entropy on all data is 0.0128212
After 1342 training step(s),cross entropy on all data is 0.0128143
After 1343 training step(s),cross entropy on all data is 0.0128081
After 1344 training step(s),cross entropy on all data is 0.0128026
After 1345 training step(s),cross entropy on all data is 0.0127935
After 1346 training step(s),cross entropy on all data is 0.0127853
After 1347 training step(s),cross entropy on all data is 0.0127779
After 1348 training step(s),cross entropy on all data is 0.0127713
After 1349 training step(s),cross entropy on all data is 0.0127653
After 1350 training step(s),cross entropy on all data is 0.0127599
After 1351 training step(s),cross entropy on all data is 0.0127508
After 1352 training step(s),cross entropy on all data is 0.0127427
After 1353 training step(s),cross entropy on all data is 0.0127311
After 1354 training step(s),cross entropy on all data is 0.0127206
After 1355 training step(s),cross entropy on all data is 0.0127112
After 1356 training step(s),cross entropy on all data is 0.0127027
After 1357 training step(s),cross entropy on all data is 0.0126951
After 1358 training step(s),cross entropy on all data is 0.0126882
After 1359 training step(s),cross entropy on all data is 0.012682
After 1360 training step(s),cross entropy on all data is 0.0126764
After 1361 training step(s),cross entropy on all data is 0.0126673
After 1362 training step(s),cross entropy on all data is 0.0126591
After 1363 training step(s),cross entropy on all data is 0.0126517
After 1364 training step(s),cross entropy on all data is 0.012645
After 1365 training step(s),cross entropy on all data is 0.012639
After 1366 training step(s),cross entropy on all data is 0.0126336
After 1367 training step(s),cross entropy on all data is 0.0126246
After 1368 training step(s),cross entropy on all data is 0.0126164
After 1369 training step(s),cross entropy on all data is 0.0126047
After 1370 training step(s),cross entropy on all data is 0.0125943
After 1371 training step(s),cross entropy on all data is 0.0125848
After 1372 training step(s),cross entropy on all data is 0.0125763
After 1373 training step(s),cross entropy on all data is 0.0125687
After 1374 training step(s),cross entropy on all data is 0.0125618
After 1375 training step(s),cross entropy on all data is 0.0125556
After 1376 training step(s),cross entropy on all data is 0.01255
After 1377 training step(s),cross entropy on all data is 0.0125408
After 1378 training step(s),cross entropy on all data is 0.0125326
After 1379 training step(s),cross entropy on all data is 0.0125252
After 1380 training step(s),cross entropy on all data is 0.0125185
After 1381 training step(s),cross entropy on all data is 0.0125125
After 1382 training step(s),cross entropy on all data is 0.0125071
After 1383 training step(s),cross entropy on all data is 0.012498
After 1384 training step(s),cross entropy on all data is 0.0124898
After 1385 training step(s),cross entropy on all data is 0.0124781
After 1386 training step(s),cross entropy on all data is 0.0124676
After 1387 training step(s),cross entropy on all data is 0.0124582
After 1388 training step(s),cross entropy on all data is 0.0124496
After 1389 training step(s),cross entropy on all data is 0.012442
After 1390 training step(s),cross entropy on all data is 0.0124351
After 1391 training step(s),cross entropy on all data is 0.0124288
After 1392 training step(s),cross entropy on all data is 0.0124232
After 1393 training step(s),cross entropy on all data is 0.0124141
After 1394 training step(s),cross entropy on all data is 0.0124058
After 1395 training step(s),cross entropy on all data is 0.0123984
After 1396 training step(s),cross entropy on all data is 0.0123917
After 1397 training step(s),cross entropy on all data is 0.0123857
After 1398 training step(s),cross entropy on all data is 0.0123802
After 1399 training step(s),cross entropy on all data is 0.0123711
After 1400 training step(s),cross entropy on all data is 0.0123629
After 1401 training step(s),cross entropy on all data is 0.0123512
After 1402 training step(s),cross entropy on all data is 0.0123407
After 1403 training step(s),cross entropy on all data is 0.0123312
After 1404 training step(s),cross entropy on all data is 0.0123227
After 1405 training step(s),cross entropy on all data is 0.012315
After 1406 training step(s),cross entropy on all data is 0.012308
After 1407 training step(s),cross entropy on all data is 0.0123018
After 1408 training step(s),cross entropy on all data is 0.0122962
After 1409 training step(s),cross entropy on all data is 0.012287
After 1410 training step(s),cross entropy on all data is 0.0122787
After 1411 training step(s),cross entropy on all data is 0.0122713
After 1412 training step(s),cross entropy on all data is 0.0122646
After 1413 training step(s),cross entropy on all data is 0.0122585
After 1414 training step(s),cross entropy on all data is 0.0122531
After 1415 training step(s),cross entropy on all data is 0.0122439
After 1416 training step(s),cross entropy on all data is 0.0122357
After 1417 training step(s),cross entropy on all data is 0.012224
After 1418 training step(s),cross entropy on all data is 0.0122134
After 1419 training step(s),cross entropy on all data is 0.0122039
After 1420 training step(s),cross entropy on all data is 0.0121954
After 1421 training step(s),cross entropy on all data is 0.0121877
After 1422 training step(s),cross entropy on all data is 0.0121807
After 1423 training step(s),cross entropy on all data is 0.0121745
After 1424 training step(s),cross entropy on all data is 0.0121689
After 1425 training step(s),cross entropy on all data is 0.0121597
After 1426 training step(s),cross entropy on all data is 0.0121514
After 1427 training step(s),cross entropy on all data is 0.0121439
After 1428 training step(s),cross entropy on all data is 0.0121372
After 1429 training step(s),cross entropy on all data is 0.0121311
After 1430 training step(s),cross entropy on all data is 0.0121257
After 1431 training step(s),cross entropy on all data is 0.0121165
After 1432 training step(s),cross entropy on all data is 0.0121083
After 1433 training step(s),cross entropy on all data is 0.0120965
After 1434 training step(s),cross entropy on all data is 0.0120859
After 1435 training step(s),cross entropy on all data is 0.0120764
After 1436 training step(s),cross entropy on all data is 0.0120678
After 1437 training step(s),cross entropy on all data is 0.0120601
After 1438 training step(s),cross entropy on all data is 0.0120532
After 1439 training step(s),cross entropy on all data is 0.0120469
After 1440 training step(s),cross entropy on all data is 0.0120413
After 1441 training step(s),cross entropy on all data is 0.012032
After 1442 training step(s),cross entropy on all data is 0.0120237
After 1443 training step(s),cross entropy on all data is 0.0120163
After 1444 training step(s),cross entropy on all data is 0.0120095
After 1445 training step(s),cross entropy on all data is 0.0120034
After 1446 training step(s),cross entropy on all data is 0.011998
After 1447 training step(s),cross entropy on all data is 0.0119888
After 1448 training step(s),cross entropy on all data is 0.0119805
After 1449 training step(s),cross entropy on all data is 0.0119688
After 1450 training step(s),cross entropy on all data is 0.0119582
After 1451 training step(s),cross entropy on all data is 0.0119486
After 1452 training step(s),cross entropy on all data is 0.01194
After 1453 training step(s),cross entropy on all data is 0.0119323
After 1454 training step(s),cross entropy on all data is 0.0119253
After 1455 training step(s),cross entropy on all data is 0.0119191
After 1456 training step(s),cross entropy on all data is 0.0119134
After 1457 training step(s),cross entropy on all data is 0.0119042
After 1458 training step(s),cross entropy on all data is 0.0118958
After 1459 training step(s),cross entropy on all data is 0.0118883
After 1460 training step(s),cross entropy on all data is 0.0118816
After 1461 training step(s),cross entropy on all data is 0.0118755
After 1462 training step(s),cross entropy on all data is 0.01187
After 1463 training step(s),cross entropy on all data is 0.0118608
After 1464 training step(s),cross entropy on all data is 0.0118525
After 1465 training step(s),cross entropy on all data is 0.0118408
After 1466 training step(s),cross entropy on all data is 0.0118301
After 1467 training step(s),cross entropy on all data is 0.0118206
After 1468 training step(s),cross entropy on all data is 0.011812
After 1469 training step(s),cross entropy on all data is 0.0118042
After 1470 training step(s),cross entropy on all data is 0.0117972
After 1471 training step(s),cross entropy on all data is 0.011791
After 1472 training step(s),cross entropy on all data is 0.0117853
After 1473 training step(s),cross entropy on all data is 0.011776
After 1474 training step(s),cross entropy on all data is 0.0117677
After 1475 training step(s),cross entropy on all data is 0.0117602
After 1476 training step(s),cross entropy on all data is 0.0117534
After 1477 training step(s),cross entropy on all data is 0.0117473
After 1478 training step(s),cross entropy on all data is 0.0117418
After 1479 training step(s),cross entropy on all data is 0.0117326
After 1480 training step(s),cross entropy on all data is 0.0117243
After 1481 training step(s),cross entropy on all data is 0.0117125
After 1482 training step(s),cross entropy on all data is 0.0117019
After 1483 training step(s),cross entropy on all data is 0.0116923
After 1484 training step(s),cross entropy on all data is 0.0116837
After 1485 training step(s),cross entropy on all data is 0.0116759
After 1486 training step(s),cross entropy on all data is 0.0116689
After 1487 training step(s),cross entropy on all data is 0.0116626
After 1488 training step(s),cross entropy on all data is 0.0116569
After 1489 training step(s),cross entropy on all data is 0.0116477
After 1490 training step(s),cross entropy on all data is 0.0116393
After 1491 training step(s),cross entropy on all data is 0.0116318
After 1492 training step(s),cross entropy on all data is 0.011625
After 1493 training step(s),cross entropy on all data is 0.0116189
After 1494 training step(s),cross entropy on all data is 0.0116134
After 1495 training step(s),cross entropy on all data is 0.0116042
After 1496 training step(s),cross entropy on all data is 0.0115958
After 1497 training step(s),cross entropy on all data is 0.011584
After 1498 training step(s),cross entropy on all data is 0.0115734
After 1499 training step(s),cross entropy on all data is 0.0115638
After 1500 training step(s),cross entropy on all data is 0.0115551
After 1501 training step(s),cross entropy on all data is 0.0115473
After 1502 training step(s),cross entropy on all data is 0.0115403
After 1503 training step(s),cross entropy on all data is 0.011534
After 1504 training step(s),cross entropy on all data is 0.0115284
After 1505 training step(s),cross entropy on all data is 0.0115191
After 1506 training step(s),cross entropy on all data is 0.0115107
After 1507 training step(s),cross entropy on all data is 0.0115031
After 1508 training step(s),cross entropy on all data is 0.0114964
After 1509 training step(s),cross entropy on all data is 0.0114902
After 1510 training step(s),cross entropy on all data is 0.0114847
After 1511 training step(s),cross entropy on all data is 0.0114755
After 1512 training step(s),cross entropy on all data is 0.0114672
After 1513 training step(s),cross entropy on all data is 0.0114553
After 1514 training step(s),cross entropy on all data is 0.0114446
After 1515 training step(s),cross entropy on all data is 0.011435
After 1516 training step(s),cross entropy on all data is 0.0114264
After 1517 training step(s),cross entropy on all data is 0.0114186
After 1518 training step(s),cross entropy on all data is 0.0114116
After 1519 training step(s),cross entropy on all data is 0.0114052
After 1520 training step(s),cross entropy on all data is 0.0113996
After 1521 training step(s),cross entropy on all data is 0.0113902
After 1522 training step(s),cross entropy on all data is 0.0113819
After 1523 training step(s),cross entropy on all data is 0.0113743
After 1524 training step(s),cross entropy on all data is 0.0113675
After 1525 training step(s),cross entropy on all data is 0.0113614
After 1526 training step(s),cross entropy on all data is 0.0113559
After 1527 training step(s),cross entropy on all data is 0.0113466
After 1528 training step(s),cross entropy on all data is 0.0113382
After 1529 training step(s),cross entropy on all data is 0.0113264
After 1530 training step(s),cross entropy on all data is 0.0113157
After 1531 training step(s),cross entropy on all data is 0.0113061
After 1532 training step(s),cross entropy on all data is 0.0112974
After 1533 training step(s),cross entropy on all data is 0.0112896
After 1534 training step(s),cross entropy on all data is 0.0112826
After 1535 training step(s),cross entropy on all data is 0.0112762
After 1536 training step(s),cross entropy on all data is 0.0112705
After 1537 training step(s),cross entropy on all data is 0.0112612
After 1538 training step(s),cross entropy on all data is 0.0112528
After 1539 training step(s),cross entropy on all data is 0.0112452
After 1540 training step(s),cross entropy on all data is 0.0112384
After 1541 training step(s),cross entropy on all data is 0.0112323
After 1542 training step(s),cross entropy on all data is 0.0112268
After 1543 training step(s),cross entropy on all data is 0.0112175
After 1544 training step(s),cross entropy on all data is 0.0112091
After 1545 training step(s),cross entropy on all data is 0.0111972
After 1546 training step(s),cross entropy on all data is 0.0111865
After 1547 training step(s),cross entropy on all data is 0.0111769
After 1548 training step(s),cross entropy on all data is 0.0111682
After 1549 training step(s),cross entropy on all data is 0.0111604
After 1550 training step(s),cross entropy on all data is 0.0111534
After 1551 training step(s),cross entropy on all data is 0.011147
After 1552 training step(s),cross entropy on all data is 0.0111413
After 1553 training step(s),cross entropy on all data is 0.011132
After 1554 training step(s),cross entropy on all data is 0.0111236
After 1555 training step(s),cross entropy on all data is 0.011116
After 1556 training step(s),cross entropy on all data is 0.0111092
After 1557 training step(s),cross entropy on all data is 0.011103
After 1558 training step(s),cross entropy on all data is 0.0110975
After 1559 training step(s),cross entropy on all data is 0.0110882
After 1560 training step(s),cross entropy on all data is 0.0110798
After 1561 training step(s),cross entropy on all data is 0.0110679
After 1562 training step(s),cross entropy on all data is 0.0110572
After 1563 training step(s),cross entropy on all data is 0.0110475
After 1564 training step(s),cross entropy on all data is 0.0110388
After 1565 training step(s),cross entropy on all data is 0.011031
After 1566 training step(s),cross entropy on all data is 0.011024
After 1567 training step(s),cross entropy on all data is 0.0110176
After 1568 training step(s),cross entropy on all data is 0.0110119
After 1569 training step(s),cross entropy on all data is 0.0110025
After 1570 training step(s),cross entropy on all data is 0.0109941
After 1571 training step(s),cross entropy on all data is 0.0109865
After 1572 training step(s),cross entropy on all data is 0.0109797
After 1573 training step(s),cross entropy on all data is 0.0109735
After 1574 training step(s),cross entropy on all data is 0.010968
After 1575 training step(s),cross entropy on all data is 0.0109587
After 1576 training step(s),cross entropy on all data is 0.0109503
After 1577 training step(s),cross entropy on all data is 0.0109384
After 1578 training step(s),cross entropy on all data is 0.0109276
After 1579 training step(s),cross entropy on all data is 0.010918
After 1580 training step(s),cross entropy on all data is 0.0109093
After 1581 training step(s),cross entropy on all data is 0.0109014
After 1582 training step(s),cross entropy on all data is 0.0108944
After 1583 training step(s),cross entropy on all data is 0.010888
After 1584 training step(s),cross entropy on all data is 0.0108823
After 1585 training step(s),cross entropy on all data is 0.0108729
After 1586 training step(s),cross entropy on all data is 0.0108645
After 1587 training step(s),cross entropy on all data is 0.0108569
After 1588 training step(s),cross entropy on all data is 0.01085
After 1589 training step(s),cross entropy on all data is 0.0108439
After 1590 training step(s),cross entropy on all data is 0.0108383
After 1591 training step(s),cross entropy on all data is 0.010829
After 1592 training step(s),cross entropy on all data is 0.0108206
After 1593 training step(s),cross entropy on all data is 0.0108087
After 1594 training step(s),cross entropy on all data is 0.0107979
After 1595 training step(s),cross entropy on all data is 0.0107882
After 1596 training step(s),cross entropy on all data is 0.0107795
After 1597 training step(s),cross entropy on all data is 0.0107717
After 1598 training step(s),cross entropy on all data is 0.0107646
After 1599 training step(s),cross entropy on all data is 0.0107582
After 1600 training step(s),cross entropy on all data is 0.0107525
After 1601 training step(s),cross entropy on all data is 0.0107431
After 1602 training step(s),cross entropy on all data is 0.0107347
After 1603 training step(s),cross entropy on all data is 0.0107271
After 1604 training step(s),cross entropy on all data is 0.0107202
After 1605 training step(s),cross entropy on all data is 0.0107141
After 1606 training step(s),cross entropy on all data is 0.0107085
After 1607 training step(s),cross entropy on all data is 0.0106992
After 1608 training step(s),cross entropy on all data is 0.0106908
After 1609 training step(s),cross entropy on all data is 0.0106788
After 1610 training step(s),cross entropy on all data is 0.010668
After 1611 training step(s),cross entropy on all data is 0.0106583
After 1612 training step(s),cross entropy on all data is 0.0106496
After 1613 training step(s),cross entropy on all data is 0.0106418
After 1614 training step(s),cross entropy on all data is 0.0106347
After 1615 training step(s),cross entropy on all data is 0.0106283
After 1616 training step(s),cross entropy on all data is 0.0106226
After 1617 training step(s),cross entropy on all data is 0.0106132
After 1618 training step(s),cross entropy on all data is 0.0106047
After 1619 training step(s),cross entropy on all data is 0.0105971
After 1620 training step(s),cross entropy on all data is 0.0105902
After 1621 training step(s),cross entropy on all data is 0.0105841
After 1622 training step(s),cross entropy on all data is 0.0105785
After 1623 training step(s),cross entropy on all data is 0.0105692
After 1624 training step(s),cross entropy on all data is 0.0105607
After 1625 training step(s),cross entropy on all data is 0.0105488
After 1626 training step(s),cross entropy on all data is 0.010538
After 1627 training step(s),cross entropy on all data is 0.0105283
After 1628 training step(s),cross entropy on all data is 0.0105196
After 1629 training step(s),cross entropy on all data is 0.0105117
After 1630 training step(s),cross entropy on all data is 0.0105046
After 1631 training step(s),cross entropy on all data is 0.0104982
After 1632 training step(s),cross entropy on all data is 0.0104925
After 1633 training step(s),cross entropy on all data is 0.0104831
After 1634 training step(s),cross entropy on all data is 0.0104746
After 1635 training step(s),cross entropy on all data is 0.010467
After 1636 training step(s),cross entropy on all data is 0.0104601
After 1637 training step(s),cross entropy on all data is 0.0104539
After 1638 training step(s),cross entropy on all data is 0.0104484
After 1639 training step(s),cross entropy on all data is 0.010439
After 1640 training step(s),cross entropy on all data is 0.0104313
After 1641 training step(s),cross entropy on all data is 0.0104263
After 1642 training step(s),cross entropy on all data is 0.0104217
After 1643 training step(s),cross entropy on all data is 0.0104177
After 1644 training step(s),cross entropy on all data is 0.010414
After 1645 training step(s),cross entropy on all data is 0.0104107
After 1646 training step(s),cross entropy on all data is 0.0104077
After 1647 training step(s),cross entropy on all data is 0.010405
After 1648 training step(s),cross entropy on all data is 0.0104026
After 1649 training step(s),cross entropy on all data is 0.0103975
After 1650 training step(s),cross entropy on all data is 0.0103929
After 1651 training step(s),cross entropy on all data is 0.0103887
After 1652 training step(s),cross entropy on all data is 0.010385
After 1653 training step(s),cross entropy on all data is 0.0103817
After 1654 training step(s),cross entropy on all data is 0.0103786
After 1655 training step(s),cross entropy on all data is 0.0103731
After 1656 training step(s),cross entropy on all data is 0.010368
After 1657 training step(s),cross entropy on all data is 0.0103635
After 1658 training step(s),cross entropy on all data is 0.0103594
After 1659 training step(s),cross entropy on all data is 0.0103558
After 1660 training step(s),cross entropy on all data is 0.0103524
After 1661 training step(s),cross entropy on all data is 0.0103495
After 1662 training step(s),cross entropy on all data is 0.0103468
After 1663 training step(s),cross entropy on all data is 0.0103444
After 1664 training step(s),cross entropy on all data is 0.0103422
After 1665 training step(s),cross entropy on all data is 0.0103373
After 1666 training step(s),cross entropy on all data is 0.0103329
After 1667 training step(s),cross entropy on all data is 0.0103289
After 1668 training step(s),cross entropy on all data is 0.0103254
After 1669 training step(s),cross entropy on all data is 0.0103221
After 1670 training step(s),cross entropy on all data is 0.0103192
After 1671 training step(s),cross entropy on all data is 0.0103138
After 1672 training step(s),cross entropy on all data is 0.0103088
After 1673 training step(s),cross entropy on all data is 0.0103044
After 1674 training step(s),cross entropy on all data is 0.0103004
After 1675 training step(s),cross entropy on all data is 0.0102968
After 1676 training step(s),cross entropy on all data is 0.0102935
After 1677 training step(s),cross entropy on all data is 0.0102906
After 1678 training step(s),cross entropy on all data is 0.010288
After 1679 training step(s),cross entropy on all data is 0.0102856
After 1680 training step(s),cross entropy on all data is 0.0102835
After 1681 training step(s),cross entropy on all data is 0.0102786
After 1682 training step(s),cross entropy on all data is 0.0102742
After 1683 training step(s),cross entropy on all data is 0.0102702
After 1684 training step(s),cross entropy on all data is 0.0102667
After 1685 training step(s),cross entropy on all data is 0.0102635
After 1686 training step(s),cross entropy on all data is 0.0102606
After 1687 training step(s),cross entropy on all data is 0.0102551
After 1688 training step(s),cross entropy on all data is 0.0102502
After 1689 training step(s),cross entropy on all data is 0.0102457
After 1690 training step(s),cross entropy on all data is 0.0102417
After 1691 training step(s),cross entropy on all data is 0.0102381
After 1692 training step(s),cross entropy on all data is 0.0102349
After 1693 training step(s),cross entropy on all data is 0.010232
After 1694 training step(s),cross entropy on all data is 0.0102293
After 1695 training step(s),cross entropy on all data is 0.010227
After 1696 training step(s),cross entropy on all data is 0.0102248
After 1697 training step(s),cross entropy on all data is 0.0102199
After 1698 training step(s),cross entropy on all data is 0.0102155
After 1699 training step(s),cross entropy on all data is 0.0102116
After 1700 training step(s),cross entropy on all data is 0.010208
After 1701 training step(s),cross entropy on all data is 0.0102048
After 1702 training step(s),cross entropy on all data is 0.0102019
After 1703 training step(s),cross entropy on all data is 0.0101964
After 1704 training step(s),cross entropy on all data is 0.0101915
After 1705 training step(s),cross entropy on all data is 0.010187
After 1706 training step(s),cross entropy on all data is 0.010183
After 1707 training step(s),cross entropy on all data is 0.0101794
After 1708 training step(s),cross entropy on all data is 0.0101761
After 1709 training step(s),cross entropy on all data is 0.0101732
After 1710 training step(s),cross entropy on all data is 0.0101706
After 1711 training step(s),cross entropy on all data is 0.0101682
After 1712 training step(s),cross entropy on all data is 0.010166
After 1713 training step(s),cross entropy on all data is 0.0101612
After 1714 training step(s),cross entropy on all data is 0.0101567
After 1715 training step(s),cross entropy on all data is 0.0101528
After 1716 training step(s),cross entropy on all data is 0.0101492
After 1717 training step(s),cross entropy on all data is 0.010146
After 1718 training step(s),cross entropy on all data is 0.0101431
After 1719 training step(s),cross entropy on all data is 0.0101376
After 1720 training step(s),cross entropy on all data is 0.0101326
After 1721 training step(s),cross entropy on all data is 0.0101281
After 1722 training step(s),cross entropy on all data is 0.0101241
After 1723 training step(s),cross entropy on all data is 0.0101205
After 1724 training step(s),cross entropy on all data is 0.0101172
After 1725 training step(s),cross entropy on all data is 0.0101143
After 1726 training step(s),cross entropy on all data is 0.0101116
After 1727 training step(s),cross entropy on all data is 0.0101092
After 1728 training step(s),cross entropy on all data is 0.0101071
After 1729 training step(s),cross entropy on all data is 0.0101022
After 1730 training step(s),cross entropy on all data is 0.0100977
After 1731 training step(s),cross entropy on all data is 0.0100938
After 1732 training step(s),cross entropy on all data is 0.0100902
After 1733 training step(s),cross entropy on all data is 0.0100869
After 1734 training step(s),cross entropy on all data is 0.010084
After 1735 training step(s),cross entropy on all data is 0.0100785
After 1736 training step(s),cross entropy on all data is 0.0100735
After 1737 training step(s),cross entropy on all data is 0.010069
After 1738 training step(s),cross entropy on all data is 0.010065
After 1739 training step(s),cross entropy on all data is 0.0100613
After 1740 training step(s),cross entropy on all data is 0.0100581
After 1741 training step(s),cross entropy on all data is 0.0100551
After 1742 training step(s),cross entropy on all data is 0.0100524
After 1743 training step(s),cross entropy on all data is 0.0100501
After 1744 training step(s),cross entropy on all data is 0.0100479
After 1745 training step(s),cross entropy on all data is 0.010043
After 1746 training step(s),cross entropy on all data is 0.0100385
After 1747 training step(s),cross entropy on all data is 0.0100345
After 1748 training step(s),cross entropy on all data is 0.0100309
After 1749 training step(s),cross entropy on all data is 0.0100277
After 1750 training step(s),cross entropy on all data is 0.0100248
After 1751 training step(s),cross entropy on all data is 0.0100192
After 1752 training step(s),cross entropy on all data is 0.0100142
After 1753 training step(s),cross entropy on all data is 0.0100097
After 1754 training step(s),cross entropy on all data is 0.0100056
After 1755 training step(s),cross entropy on all data is 0.010002
After 1756 training step(s),cross entropy on all data is 0.00999871
After 1757 training step(s),cross entropy on all data is 0.00999574
After 1758 training step(s),cross entropy on all data is 0.00999308
After 1759 training step(s),cross entropy on all data is 0.00999067
After 1760 training step(s),cross entropy on all data is 0.00998851
After 1761 training step(s),cross entropy on all data is 0.00998356
After 1762 training step(s),cross entropy on all data is 0.00997911
After 1763 training step(s),cross entropy on all data is 0.0099751
After 1764 training step(s),cross entropy on all data is 0.00997149
After 1765 training step(s),cross entropy on all data is 0.00996823
After 1766 training step(s),cross entropy on all data is 0.0099653
After 1767 training step(s),cross entropy on all data is 0.00995973
After 1768 training step(s),cross entropy on all data is 0.00995471
After 1769 training step(s),cross entropy on all data is 0.00995019
After 1770 training step(s),cross entropy on all data is 0.00994612
After 1771 training step(s),cross entropy on all data is 0.00994246
After 1772 training step(s),cross entropy on all data is 0.00993916
After 1773 training step(s),cross entropy on all data is 0.00993618
After 1774 training step(s),cross entropy on all data is 0.00993351
After 1775 training step(s),cross entropy on all data is 0.0099311
After 1776 training step(s),cross entropy on all data is 0.00992893
After 1777 training step(s),cross entropy on all data is 0.00992397
After 1778 training step(s),cross entropy on all data is 0.0099195
After 1779 training step(s),cross entropy on all data is 0.00991547
After 1780 training step(s),cross entropy on all data is 0.00991185
After 1781 training step(s),cross entropy on all data is 0.00990859
After 1782 training step(s),cross entropy on all data is 0.00990565
After 1783 training step(s),cross entropy on all data is 0.00990005
After 1784 training step(s),cross entropy on all data is 0.00989502
After 1785 training step(s),cross entropy on all data is 0.00989048
After 1786 training step(s),cross entropy on all data is 0.0098864
After 1787 training step(s),cross entropy on all data is 0.00988272
After 1788 training step(s),cross entropy on all data is 0.00987941
After 1789 training step(s),cross entropy on all data is 0.00987643
After 1790 training step(s),cross entropy on all data is 0.00987375
After 1791 training step(s),cross entropy on all data is 0.00987133
After 1792 training step(s),cross entropy on all data is 0.00986915
After 1793 training step(s),cross entropy on all data is 0.00986417
After 1794 training step(s),cross entropy on all data is 0.00985969
After 1795 training step(s),cross entropy on all data is 0.00985565
After 1796 training step(s),cross entropy on all data is 0.00985202
After 1797 training step(s),cross entropy on all data is 0.00984874
After 1798 training step(s),cross entropy on all data is 0.0098458
After 1799 training step(s),cross entropy on all data is 0.00984018
After 1800 training step(s),cross entropy on all data is 0.00983513
After 1801 training step(s),cross entropy on all data is 0.00983058
After 1802 training step(s),cross entropy on all data is 0.00982649
After 1803 training step(s),cross entropy on all data is 0.00982279
After 1804 training step(s),cross entropy on all data is 0.00981947
After 1805 training step(s),cross entropy on all data is 0.00981648
After 1806 training step(s),cross entropy on all data is 0.00981379
After 1807 training step(s),cross entropy on all data is 0.00981136
After 1808 training step(s),cross entropy on all data is 0.00980918
After 1809 training step(s),cross entropy on all data is 0.00980418
After 1810 training step(s),cross entropy on all data is 0.00979969
After 1811 training step(s),cross entropy on all data is 0.00979564
After 1812 training step(s),cross entropy on all data is 0.00979199
After 1813 training step(s),cross entropy on all data is 0.00978871
After 1814 training step(s),cross entropy on all data is 0.00978575
After 1815 training step(s),cross entropy on all data is 0.00978012
After 1816 training step(s),cross entropy on all data is 0.00977505
After 1817 training step(s),cross entropy on all data is 0.00977048
After 1818 training step(s),cross entropy on all data is 0.00976638
After 1819 training step(s),cross entropy on all data is 0.00976267
After 1820 training step(s),cross entropy on all data is 0.00975934
After 1821 training step(s),cross entropy on all data is 0.00975634
After 1822 training step(s),cross entropy on all data is 0.00975364
After 1823 training step(s),cross entropy on all data is 0.00975121
After 1824 training step(s),cross entropy on all data is 0.00974902
After 1825 training step(s),cross entropy on all data is 0.009744
After 1826 training step(s),cross entropy on all data is 0.00973949
After 1827 training step(s),cross entropy on all data is 0.00973543
After 1828 training step(s),cross entropy on all data is 0.00973177
After 1829 training step(s),cross entropy on all data is 0.00972848
After 1830 training step(s),cross entropy on all data is 0.00972551
After 1831 training step(s),cross entropy on all data is 0.00971987
After 1832 training step(s),cross entropy on all data is 0.00971478
After 1833 training step(s),cross entropy on all data is 0.0097102
After 1834 training step(s),cross entropy on all data is 0.00970608
After 1835 training step(s),cross entropy on all data is 0.00970236
After 1836 training step(s),cross entropy on all data is 0.00969902
After 1837 training step(s),cross entropy on all data is 0.00969601
After 1838 training step(s),cross entropy on all data is 0.0096933
After 1839 training step(s),cross entropy on all data is 0.00969086
After 1840 training step(s),cross entropy on all data is 0.00968866
After 1841 training step(s),cross entropy on all data is 0.00968364
After 1842 training step(s),cross entropy on all data is 0.00967911
After 1843 training step(s),cross entropy on all data is 0.00967504
After 1844 training step(s),cross entropy on all data is 0.00967137
After 1845 training step(s),cross entropy on all data is 0.00966807
After 1846 training step(s),cross entropy on all data is 0.00966509
After 1847 training step(s),cross entropy on all data is 0.00965942
After 1848 training step(s),cross entropy on all data is 0.00965432
After 1849 training step(s),cross entropy on all data is 0.00964973
After 1850 training step(s),cross entropy on all data is 0.00964559
After 1851 training step(s),cross entropy on all data is 0.00964187
After 1852 training step(s),cross entropy on all data is 0.00963852
After 1853 training step(s),cross entropy on all data is 0.0096355
After 1854 training step(s),cross entropy on all data is 0.00963278
After 1855 training step(s),cross entropy on all data is 0.00963033
After 1856 training step(s),cross entropy on all data is 0.00962812
After 1857 training step(s),cross entropy on all data is 0.00962308
After 1858 training step(s),cross entropy on all data is 0.00961855
After 1859 training step(s),cross entropy on all data is 0.00961446
After 1860 training step(s),cross entropy on all data is 0.00961078
After 1861 training step(s),cross entropy on all data is 0.00960747
After 1862 training step(s),cross entropy on all data is 0.00960448
After 1863 training step(s),cross entropy on all data is 0.0095988
After 1864 training step(s),cross entropy on all data is 0.00959368
After 1865 training step(s),cross entropy on all data is 0.00958908
After 1866 training step(s),cross entropy on all data is 0.00958493
After 1867 training step(s),cross entropy on all data is 0.00958119
After 1868 training step(s),cross entropy on all data is 0.00957783
After 1869 training step(s),cross entropy on all data is 0.0095748
After 1870 training step(s),cross entropy on all data is 0.00957207
After 1871 training step(s),cross entropy on all data is 0.00956962
After 1872 training step(s),cross entropy on all data is 0.0095674
After 1873 training step(s),cross entropy on all data is 0.00956235
After 1874 training step(s),cross entropy on all data is 0.0095578
After 1875 training step(s),cross entropy on all data is 0.0095537
After 1876 training step(s),cross entropy on all data is 0.00955001
After 1877 training step(s),cross entropy on all data is 0.00954669
After 1878 training step(s),cross entropy on all data is 0.00954369
After 1879 training step(s),cross entropy on all data is 0.00953799
After 1880 training step(s),cross entropy on all data is 0.00953286
After 1881 training step(s),cross entropy on all data is 0.00952824
After 1882 training step(s),cross entropy on all data is 0.00952408
After 1883 training step(s),cross entropy on all data is 0.00952033
After 1884 training step(s),cross entropy on all data is 0.00951696
After 1885 training step(s),cross entropy on all data is 0.00951392
After 1886 training step(s),cross entropy on all data is 0.00951119
After 1887 training step(s),cross entropy on all data is 0.00950872
After 1888 training step(s),cross entropy on all data is 0.00950651
After 1889 training step(s),cross entropy on all data is 0.00950144
After 1890 training step(s),cross entropy on all data is 0.00949687
After 1891 training step(s),cross entropy on all data is 0.00949276
After 1892 training step(s),cross entropy on all data is 0.00948906
After 1893 training step(s),cross entropy on all data is 0.00948573
After 1894 training step(s),cross entropy on all data is 0.00948273
After 1895 training step(s),cross entropy on all data is 0.00947701
After 1896 training step(s),cross entropy on all data is 0.00947187
After 1897 training step(s),cross entropy on all data is 0.00946723
After 1898 training step(s),cross entropy on all data is 0.00946306
After 1899 training step(s),cross entropy on all data is 0.0094593
After 1900 training step(s),cross entropy on all data is 0.00945592
After 1901 training step(s),cross entropy on all data is 0.00945287
After 1902 training step(s),cross entropy on all data is 0.00945013
After 1903 training step(s),cross entropy on all data is 0.00944766
After 1904 training step(s),cross entropy on all data is 0.00944543
After 1905 training step(s),cross entropy on all data is 0.00944035
After 1906 training step(s),cross entropy on all data is 0.00943577
After 1907 training step(s),cross entropy on all data is 0.00943165
After 1908 training step(s),cross entropy on all data is 0.00942794
After 1909 training step(s),cross entropy on all data is 0.0094246
After 1910 training step(s),cross entropy on all data is 0.00942159
After 1911 training step(s),cross entropy on all data is 0.00941586
After 1912 training step(s),cross entropy on all data is 0.0094107
After 1913 training step(s),cross entropy on all data is 0.00940605
After 1914 training step(s),cross entropy on all data is 0.00940187
After 1915 training step(s),cross entropy on all data is 0.0093981
After 1916 training step(s),cross entropy on all data is 0.0093947
After 1917 training step(s),cross entropy on all data is 0.00939165
After 1918 training step(s),cross entropy on all data is 0.0093889
After 1919 training step(s),cross entropy on all data is 0.00938642
After 1920 training step(s),cross entropy on all data is 0.00938419
After 1921 training step(s),cross entropy on all data is 0.00937909
After 1922 training step(s),cross entropy on all data is 0.0093745
After 1923 training step(s),cross entropy on all data is 0.00937037
After 1924 training step(s),cross entropy on all data is 0.00936665
After 1925 training step(s),cross entropy on all data is 0.0093633
After 1926 training step(s),cross entropy on all data is 0.00936028
After 1927 training step(s),cross entropy on all data is 0.00935453
After 1928 training step(s),cross entropy on all data is 0.00934936
After 1929 training step(s),cross entropy on all data is 0.0093447
After 1930 training step(s),cross entropy on all data is 0.0093405
After 1931 training step(s),cross entropy on all data is 0.00933672
After 1932 training step(s),cross entropy on all data is 0.00933332
After 1933 training step(s),cross entropy on all data is 0.00933025
After 1934 training step(s),cross entropy on all data is 0.0093275
After 1935 training step(s),cross entropy on all data is 0.00932501
After 1936 training step(s),cross entropy on all data is 0.00932278
After 1937 training step(s),cross entropy on all data is 0.00931766
After 1938 training step(s),cross entropy on all data is 0.00931306
After 1939 training step(s),cross entropy on all data is 0.00930892
After 1940 training step(s),cross entropy on all data is 0.00930519
After 1941 training step(s),cross entropy on all data is 0.00930183
After 1942 training step(s),cross entropy on all data is 0.0092988
After 1943 training step(s),cross entropy on all data is 0.00929304
After 1944 training step(s),cross entropy on all data is 0.00928785
After 1945 training step(s),cross entropy on all data is 0.00928317
After 1946 training step(s),cross entropy on all data is 0.00927896
After 1947 training step(s),cross entropy on all data is 0.00927517
After 1948 training step(s),cross entropy on all data is 0.00927176
After 1949 training step(s),cross entropy on all data is 0.00926869
After 1950 training step(s),cross entropy on all data is 0.00926592
After 1951 training step(s),cross entropy on all data is 0.00926343
After 1952 training step(s),cross entropy on all data is 0.00926119
After 1953 training step(s),cross entropy on all data is 0.00925607
After 1954 training step(s),cross entropy on all data is 0.00925145
After 1955 training step(s),cross entropy on all data is 0.0092473
After 1956 training step(s),cross entropy on all data is 0.00924356
After 1957 training step(s),cross entropy on all data is 0.00924019
After 1958 training step(s),cross entropy on all data is 0.00923716
After 1959 training step(s),cross entropy on all data is 0.00923138
After 1960 training step(s),cross entropy on all data is 0.00922617
After 1961 training step(s),cross entropy on all data is 0.00922149
After 1962 training step(s),cross entropy on all data is 0.00921727
After 1963 training step(s),cross entropy on all data is 0.00921347
After 1964 training step(s),cross entropy on all data is 0.00921004
After 1965 training step(s),cross entropy on all data is 0.00920696
After 1966 training step(s),cross entropy on all data is 0.00920419
After 1967 training step(s),cross entropy on all data is 0.00920169
After 1968 training step(s),cross entropy on all data is 0.00919944
After 1969 training step(s),cross entropy on all data is 0.00919431
After 1970 training step(s),cross entropy on all data is 0.00918968
After 1971 training step(s),cross entropy on all data is 0.00918552
After 1972 training step(s),cross entropy on all data is 0.00918177
After 1973 training step(s),cross entropy on all data is 0.00917839
After 1974 training step(s),cross entropy on all data is 0.00917535
After 1975 training step(s),cross entropy on all data is 0.00916955
After 1976 training step(s),cross entropy on all data is 0.00916433
After 1977 training step(s),cross entropy on all data is 0.00915964
After 1978 training step(s),cross entropy on all data is 0.0091554
After 1979 training step(s),cross entropy on all data is 0.0091516
After 1980 training step(s),cross entropy on all data is 0.00914817
After 1981 training step(s),cross entropy on all data is 0.00914508
After 1982 training step(s),cross entropy on all data is 0.0091423
After 1983 training step(s),cross entropy on all data is 0.00913979
After 1984 training step(s),cross entropy on all data is 0.00913754
After 1985 training step(s),cross entropy on all data is 0.00913239
After 1986 training step(s),cross entropy on all data is 0.00912775
After 1987 training step(s),cross entropy on all data is 0.00912357
After 1988 training step(s),cross entropy on all data is 0.00911982
After 1989 training step(s),cross entropy on all data is 0.00911643
After 1990 training step(s),cross entropy on all data is 0.00911338
After 1991 training step(s),cross entropy on all data is 0.00910757
After 1992 training step(s),cross entropy on all data is 0.00910234
After 1993 training step(s),cross entropy on all data is 0.00909763
After 1994 training step(s),cross entropy on all data is 0.00909339
After 1995 training step(s),cross entropy on all data is 0.00908957
After 1996 training step(s),cross entropy on all data is 0.00908613
After 1997 training step(s),cross entropy on all data is 0.00908303
After 1998 training step(s),cross entropy on all data is 0.00908025
After 1999 training step(s),cross entropy on all data is 0.00907774
After 2000 training step(s),cross entropy on all data is 0.00907547
After 2001 training step(s),cross entropy on all data is 0.00907031
After 2002 training step(s),cross entropy on all data is 0.00906566
After 2003 training step(s),cross entropy on all data is 0.00906148
After 2004 training step(s),cross entropy on all data is 0.00905771
After 2005 training step(s),cross entropy on all data is 0.00905432
After 2006 training step(s),cross entropy on all data is 0.00905126
After 2007 training step(s),cross entropy on all data is 0.00904544
After 2008 training step(s),cross entropy on all data is 0.00904019
After 2009 training step(s),cross entropy on all data is 0.00903547
After 2010 training step(s),cross entropy on all data is 0.00903122
After 2011 training step(s),cross entropy on all data is 0.00902739
After 2012 training step(s),cross entropy on all data is 0.00902394
After 2013 training step(s),cross entropy on all data is 0.00902084
After 2014 training step(s),cross entropy on all data is 0.00901804
After 2015 training step(s),cross entropy on all data is 0.00901552
After 2016 training step(s),cross entropy on all data is 0.00901325
After 2017 training step(s),cross entropy on all data is 0.00900808
After 2018 training step(s),cross entropy on all data is 0.00900342
After 2019 training step(s),cross entropy on all data is 0.00899923
After 2020 training step(s),cross entropy on all data is 0.00899545
After 2021 training step(s),cross entropy on all data is 0.00899205
After 2022 training step(s),cross entropy on all data is 0.00898898
After 2023 training step(s),cross entropy on all data is 0.00898314
After 2024 training step(s),cross entropy on all data is 0.00897789
After 2025 training step(s),cross entropy on all data is 0.00897315
After 2026 training step(s),cross entropy on all data is 0.00896889
After 2027 training step(s),cross entropy on all data is 0.00896505
After 2028 training step(s),cross entropy on all data is 0.00896159
After 2029 training step(s),cross entropy on all data is 0.00895848
After 2030 training step(s),cross entropy on all data is 0.00895568
After 2031 training step(s),cross entropy on all data is 0.00895316
After 2032 training step(s),cross entropy on all data is 0.00895088
After 2033 training step(s),cross entropy on all data is 0.0089457
After 2034 training step(s),cross entropy on all data is 0.00894103
After 2035 training step(s),cross entropy on all data is 0.00893682
After 2036 training step(s),cross entropy on all data is 0.00893303
After 2037 training step(s),cross entropy on all data is 0.00892963
After 2038 training step(s),cross entropy on all data is 0.00892656
After 2039 training step(s),cross entropy on all data is 0.0089207
After 2040 training step(s),cross entropy on all data is 0.00891543
After 2041 training step(s),cross entropy on all data is 0.00891068
After 2042 training step(s),cross entropy on all data is 0.00890641
After 2043 training step(s),cross entropy on all data is 0.00890256
After 2044 training step(s),cross entropy on all data is 0.0088991
After 2045 training step(s),cross entropy on all data is 0.00889598
After 2046 training step(s),cross entropy on all data is 0.00889317
After 2047 training step(s),cross entropy on all data is 0.00889064
After 2048 training step(s),cross entropy on all data is 0.00888836
After 2049 training step(s),cross entropy on all data is 0.00888316
After 2050 training step(s),cross entropy on all data is 0.00887848
After 2051 training step(s),cross entropy on all data is 0.00887427
After 2052 training step(s),cross entropy on all data is 0.00887047
After 2053 training step(s),cross entropy on all data is 0.00886705
After 2054 training step(s),cross entropy on all data is 0.00886398
After 2055 training step(s),cross entropy on all data is 0.00885811
After 2056 training step(s),cross entropy on all data is 0.00885283
After 2057 training step(s),cross entropy on all data is 0.00884807
After 2058 training step(s),cross entropy on all data is 0.00884379
After 2059 training step(s),cross entropy on all data is 0.00883993
After 2060 training step(s),cross entropy on all data is 0.00883646
After 2061 training step(s),cross entropy on all data is 0.00883333
After 2062 training step(s),cross entropy on all data is 0.00883051
After 2063 training step(s),cross entropy on all data is 0.00882798
After 2064 training step(s),cross entropy on all data is 0.0088257
After 2065 training step(s),cross entropy on all data is 0.00882048
After 2066 training step(s),cross entropy on all data is 0.00881579
After 2067 training step(s),cross entropy on all data is 0.00881157
After 2068 training step(s),cross entropy on all data is 0.00880777
After 2069 training step(s),cross entropy on all data is 0.00880434
After 2070 training step(s),cross entropy on all data is 0.00880126
After 2071 training step(s),cross entropy on all data is 0.00879538
After 2072 training step(s),cross entropy on all data is 0.00879008
After 2073 training step(s),cross entropy on all data is 0.00878531
After 2074 training step(s),cross entropy on all data is 0.00878102
After 2075 training step(s),cross entropy on all data is 0.00877715
After 2076 training step(s),cross entropy on all data is 0.00877367
After 2077 training step(s),cross entropy on all data is 0.00877054
After 2078 training step(s),cross entropy on all data is 0.00876772
After 2079 training step(s),cross entropy on all data is 0.00876518
After 2080 training step(s),cross entropy on all data is 0.00876289
After 2081 training step(s),cross entropy on all data is 0.00875767
After 2082 training step(s),cross entropy on all data is 0.00875297
After 2083 training step(s),cross entropy on all data is 0.00874873
After 2084 training step(s),cross entropy on all data is 0.00874492
After 2085 training step(s),cross entropy on all data is 0.00874149
After 2086 training step(s),cross entropy on all data is 0.0087384
After 2087 training step(s),cross entropy on all data is 0.0087325
After 2088 training step(s),cross entropy on all data is 0.00872719
After 2089 training step(s),cross entropy on all data is 0.00872242
After 2090 training step(s),cross entropy on all data is 0.00871811
After 2091 training step(s),cross entropy on all data is 0.00871424
After 2092 training step(s),cross entropy on all data is 0.00871075
After 2093 training step(s),cross entropy on all data is 0.00870761
After 2094 training step(s),cross entropy on all data is 0.00870478
After 2095 training step(s),cross entropy on all data is 0.00870223
After 2096 training step(s),cross entropy on all data is 0.00869994
After 2097 training step(s),cross entropy on all data is 0.00869471
After 2098 training step(s),cross entropy on all data is 0.00868999
After 2099 training step(s),cross entropy on all data is 0.00868575
After 2100 training step(s),cross entropy on all data is 0.00868193
After 2101 training step(s),cross entropy on all data is 0.00867849
After 2102 training step(s),cross entropy on all data is 0.0086754
After 2103 training step(s),cross entropy on all data is 0.00866949
After 2104 training step(s),cross entropy on all data is 0.00866417
After 2105 training step(s),cross entropy on all data is 0.00865938
After 2106 training step(s),cross entropy on all data is 0.00865507
After 2107 training step(s),cross entropy on all data is 0.00865118
After 2108 training step(s),cross entropy on all data is 0.00864768
After 2109 training step(s),cross entropy on all data is 0.00864454
After 2110 training step(s),cross entropy on all data is 0.0086417
After 2111 training step(s),cross entropy on all data is 0.00863915
After 2112 training step(s),cross entropy on all data is 0.00863685
After 2113 training step(s),cross entropy on all data is 0.00863161
After 2114 training step(s),cross entropy on all data is 0.00862688
After 2115 training step(s),cross entropy on all data is 0.00862264
After 2116 training step(s),cross entropy on all data is 0.00861881
After 2117 training step(s),cross entropy on all data is 0.00861536
After 2118 training step(s),cross entropy on all data is 0.00861226
After 2119 training step(s),cross entropy on all data is 0.00860634
After 2120 training step(s),cross entropy on all data is 0.00860101
After 2121 training step(s),cross entropy on all data is 0.00859621
After 2122 training step(s),cross entropy on all data is 0.00859188
After 2123 training step(s),cross entropy on all data is 0.00858799
After 2124 training step(s),cross entropy on all data is 0.00858449
After 2125 training step(s),cross entropy on all data is 0.00858133
After 2126 training step(s),cross entropy on all data is 0.00857849
After 2127 training step(s),cross entropy on all data is 0.00857593
After 2128 training step(s),cross entropy on all data is 0.00857363
After 2129 training step(s),cross entropy on all data is 0.00856837
After 2130 training step(s),cross entropy on all data is 0.00856364
After 2131 training step(s),cross entropy on all data is 0.00855938
After 2132 training step(s),cross entropy on all data is 0.00855555
After 2133 training step(s),cross entropy on all data is 0.0085521
After 2134 training step(s),cross entropy on all data is 0.00854899
After 2135 training step(s),cross entropy on all data is 0.00854305
After 2136 training step(s),cross entropy on all data is 0.00853771
After 2137 training step(s),cross entropy on all data is 0.0085329
After 2138 training step(s),cross entropy on all data is 0.00852857
After 2139 training step(s),cross entropy on all data is 0.00852467
After 2140 training step(s),cross entropy on all data is 0.00852116
After 2141 training step(s),cross entropy on all data is 0.008518
After 2142 training step(s),cross entropy on all data is 0.00851515
After 2143 training step(s),cross entropy on all data is 0.00851258
After 2144 training step(s),cross entropy on all data is 0.00851027
After 2145 training step(s),cross entropy on all data is 0.00850501
After 2146 training step(s),cross entropy on all data is 0.00850027
After 2147 training step(s),cross entropy on all data is 0.00849601
After 2148 training step(s),cross entropy on all data is 0.00849216
After 2149 training step(s),cross entropy on all data is 0.0084887
After 2150 training step(s),cross entropy on all data is 0.00848558
After 2151 training step(s),cross entropy on all data is 0.00847964
After 2152 training step(s),cross entropy on all data is 0.00847429
After 2153 training step(s),cross entropy on all data is 0.00846947
After 2154 training step(s),cross entropy on all data is 0.00846513
After 2155 training step(s),cross entropy on all data is 0.00846122
After 2156 training step(s),cross entropy on all data is 0.0084577
After 2157 training step(s),cross entropy on all data is 0.00845453
After 2158 training step(s),cross entropy on all data is 0.00845168
After 2159 training step(s),cross entropy on all data is 0.00844911
After 2160 training step(s),cross entropy on all data is 0.0084468
After 2161 training step(s),cross entropy on all data is 0.00844152
After 2162 training step(s),cross entropy on all data is 0.00843677
After 2163 training step(s),cross entropy on all data is 0.0084325
After 2164 training step(s),cross entropy on all data is 0.00842865
After 2165 training step(s),cross entropy on all data is 0.00842518
After 2166 training step(s),cross entropy on all data is 0.00842206
After 2167 training step(s),cross entropy on all data is 0.0084161
After 2168 training step(s),cross entropy on all data is 0.00841074
After 2169 training step(s),cross entropy on all data is 0.00840591
After 2170 training step(s),cross entropy on all data is 0.00840156
After 2171 training step(s),cross entropy on all data is 0.00839764
After 2172 training step(s),cross entropy on all data is 0.00839411
After 2173 training step(s),cross entropy on all data is 0.00839094
After 2174 training step(s),cross entropy on all data is 0.00838808
After 2175 training step(s),cross entropy on all data is 0.00838551
After 2176 training step(s),cross entropy on all data is 0.00838319
After 2177 training step(s),cross entropy on all data is 0.0083779
After 2178 training step(s),cross entropy on all data is 0.00837314
After 2179 training step(s),cross entropy on all data is 0.00836886
After 2180 training step(s),cross entropy on all data is 0.008365
After 2181 training step(s),cross entropy on all data is 0.00836153
After 2182 training step(s),cross entropy on all data is 0.0083584
After 2183 training step(s),cross entropy on all data is 0.00835243
After 2184 training step(s),cross entropy on all data is 0.00834706
After 2185 training step(s),cross entropy on all data is 0.00834222
After 2186 training step(s),cross entropy on all data is 0.00833786
After 2187 training step(s),cross entropy on all data is 0.00833394
After 2188 training step(s),cross entropy on all data is 0.0083304
After 2189 training step(s),cross entropy on all data is 0.00832722
After 2190 training step(s),cross entropy on all data is 0.00832436
After 2191 training step(s),cross entropy on all data is 0.00832178
After 2192 training step(s),cross entropy on all data is 0.00831946
After 2193 training step(s),cross entropy on all data is 0.00831416
After 2194 training step(s),cross entropy on all data is 0.00830939
After 2195 training step(s),cross entropy on all data is 0.0083051
After 2196 training step(s),cross entropy on all data is 0.00830124
After 2197 training step(s),cross entropy on all data is 0.00829776
After 2198 training step(s),cross entropy on all data is 0.00829462
After 2199 training step(s),cross entropy on all data is 0.00828864
After 2200 training step(s),cross entropy on all data is 0.00828326
After 2201 training step(s),cross entropy on all data is 0.00827841
After 2202 training step(s),cross entropy on all data is 0.00827404
After 2203 training step(s),cross entropy on all data is 0.00827011
After 2204 training step(s),cross entropy on all data is 0.00826657
After 2205 training step(s),cross entropy on all data is 0.00826338
After 2206 training step(s),cross entropy on all data is 0.00826052
After 2207 training step(s),cross entropy on all data is 0.00825793
After 2208 training step(s),cross entropy on all data is 0.0082556
After 2209 training step(s),cross entropy on all data is 0.0082503
After 2210 training step(s),cross entropy on all data is 0.00824552
After 2211 training step(s),cross entropy on all data is 0.00824122
After 2212 training step(s),cross entropy on all data is 0.00823735
After 2213 training step(s),cross entropy on all data is 0.00823387
After 2214 training step(s),cross entropy on all data is 0.00823073
After 2215 training step(s),cross entropy on all data is 0.00822473
After 2216 training step(s),cross entropy on all data is 0.00821934
After 2217 training step(s),cross entropy on all data is 0.00821448
After 2218 training step(s),cross entropy on all data is 0.00821011
After 2219 training step(s),cross entropy on all data is 0.00820617
After 2220 training step(s),cross entropy on all data is 0.00820262
After 2221 training step(s),cross entropy on all data is 0.00819943
After 2222 training step(s),cross entropy on all data is 0.00819655
After 2223 training step(s),cross entropy on all data is 0.00819396
After 2224 training step(s),cross entropy on all data is 0.00819163
After 2225 training step(s),cross entropy on all data is 0.00818632
After 2226 training step(s),cross entropy on all data is 0.00818154
After 2227 training step(s),cross entropy on all data is 0.00817723
After 2228 training step(s),cross entropy on all data is 0.00817335
After 2229 training step(s),cross entropy on all data is 0.00816986
After 2230 training step(s),cross entropy on all data is 0.00816671
After 2231 training step(s),cross entropy on all data is 0.00816071
After 2232 training step(s),cross entropy on all data is 0.00815531
After 2233 training step(s),cross entropy on all data is 0.00815044
After 2234 training step(s),cross entropy on all data is 0.00814606
After 2235 training step(s),cross entropy on all data is 0.00814211
After 2236 training step(s),cross entropy on all data is 0.00813856
After 2237 training step(s),cross entropy on all data is 0.00813536
After 2238 training step(s),cross entropy on all data is 0.00813248
After 2239 training step(s),cross entropy on all data is 0.00812989
After 2240 training step(s),cross entropy on all data is 0.00812755
After 2241 training step(s),cross entropy on all data is 0.00812223
After 2242 training step(s),cross entropy on all data is 0.00811744
After 2243 training step(s),cross entropy on all data is 0.00811312
After 2244 training step(s),cross entropy on all data is 0.00810923
After 2245 training step(s),cross entropy on all data is 0.00810574
After 2246 training step(s),cross entropy on all data is 0.00810259
After 2247 training step(s),cross entropy on all data is 0.00809657
After 2248 training step(s),cross entropy on all data is 0.00809116
After 2249 training step(s),cross entropy on all data is 0.00808628
After 2250 training step(s),cross entropy on all data is 0.00808189
After 2251 training step(s),cross entropy on all data is 0.00807794
After 2252 training step(s),cross entropy on all data is 0.00807438
After 2253 training step(s),cross entropy on all data is 0.00807117
After 2254 training step(s),cross entropy on all data is 0.00806829
After 2255 training step(s),cross entropy on all data is 0.00806569
After 2256 training step(s),cross entropy on all data is 0.00806335
After 2257 training step(s),cross entropy on all data is 0.00805802
After 2258 training step(s),cross entropy on all data is 0.00805322
After 2259 training step(s),cross entropy on all data is 0.0080489
After 2260 training step(s),cross entropy on all data is 0.008045
After 2261 training step(s),cross entropy on all data is 0.0080415
After 2262 training step(s),cross entropy on all data is 0.00803834
After 2263 training step(s),cross entropy on all data is 0.00803232
After 2264 training step(s),cross entropy on all data is 0.0080269
After 2265 training step(s),cross entropy on all data is 0.00802201
After 2266 training step(s),cross entropy on all data is 0.00801761
After 2267 training step(s),cross entropy on all data is 0.00801365
After 2268 training step(s),cross entropy on all data is 0.00801009
After 2269 training step(s),cross entropy on all data is 0.00800688
After 2270 training step(s),cross entropy on all data is 0.00800399
After 2271 training step(s),cross entropy on all data is 0.00800139
After 2272 training step(s),cross entropy on all data is 0.00799904
After 2273 training step(s),cross entropy on all data is 0.0079937
After 2274 training step(s),cross entropy on all data is 0.00798889
After 2275 training step(s),cross entropy on all data is 0.00798538
After 2276 training step(s),cross entropy on all data is 0.00798348
After 2277 training step(s),cross entropy on all data is 0.00798176
After 2278 training step(s),cross entropy on all data is 0.00798022
After 2279 training step(s),cross entropy on all data is 0.00797719
After 2280 training step(s),cross entropy on all data is 0.00797446
After 2281 training step(s),cross entropy on all data is 0.007972
After 2282 training step(s),cross entropy on all data is 0.00796979
After 2283 training step(s),cross entropy on all data is 0.0079678
After 2284 training step(s),cross entropy on all data is 0.00796601
After 2285 training step(s),cross entropy on all data is 0.00796439
After 2286 training step(s),cross entropy on all data is 0.00796294
After 2287 training step(s),cross entropy on all data is 0.00796163
After 2288 training step(s),cross entropy on all data is 0.00796045
After 2289 training step(s),cross entropy on all data is 0.00795939
After 2290 training step(s),cross entropy on all data is 0.00795843
After 2291 training step(s),cross entropy on all data is 0.00795757
After 2292 training step(s),cross entropy on all data is 0.0079568
After 2293 training step(s),cross entropy on all data is 0.0079561
After 2294 training step(s),cross entropy on all data is 0.00795547
After 2295 training step(s),cross entropy on all data is 0.00795326
After 2296 training step(s),cross entropy on all data is 0.00795127
After 2297 training step(s),cross entropy on all data is 0.00794947
After 2298 training step(s),cross entropy on all data is 0.00794785
After 2299 training step(s),cross entropy on all data is 0.0079464
After 2300 training step(s),cross entropy on all data is 0.00794509
After 2301 training step(s),cross entropy on all data is 0.00794391
After 2302 training step(s),cross entropy on all data is 0.00794285
After 2303 training step(s),cross entropy on all data is 0.00794189
After 2304 training step(s),cross entropy on all data is 0.00794103
After 2305 training step(s),cross entropy on all data is 0.00794026
After 2306 training step(s),cross entropy on all data is 0.00793956
After 2307 training step(s),cross entropy on all data is 0.00793893
After 2308 training step(s),cross entropy on all data is 0.00793836
After 2309 training step(s),cross entropy on all data is 0.00793785
After 2310 training step(s),cross entropy on all data is 0.00793739
After 2311 training step(s),cross entropy on all data is 0.00793532
After 2312 training step(s),cross entropy on all data is 0.00793346
After 2313 training step(s),cross entropy on all data is 0.00793178
After 2314 training step(s),cross entropy on all data is 0.00793027
After 2315 training step(s),cross entropy on all data is 0.00792891
After 2316 training step(s),cross entropy on all data is 0.00792768
After 2317 training step(s),cross entropy on all data is 0.00792658
After 2318 training step(s),cross entropy on all data is 0.00792559
After 2319 training step(s),cross entropy on all data is 0.00792469
After 2320 training step(s),cross entropy on all data is 0.00792389
After 2321 training step(s),cross entropy on all data is 0.00792316
After 2322 training step(s),cross entropy on all data is 0.00792251
After 2323 training step(s),cross entropy on all data is 0.00792192
After 2324 training step(s),cross entropy on all data is 0.00792139
After 2325 training step(s),cross entropy on all data is 0.00792091
After 2326 training step(s),cross entropy on all data is 0.00792048
After 2327 training step(s),cross entropy on all data is 0.00791843
After 2328 training step(s),cross entropy on all data is 0.00791658
After 2329 training step(s),cross entropy on all data is 0.00791492
After 2330 training step(s),cross entropy on all data is 0.00791342
After 2331 training step(s),cross entropy on all data is 0.00791208
After 2332 training step(s),cross entropy on all data is 0.00791086
After 2333 training step(s),cross entropy on all data is 0.00790977
After 2334 training step(s),cross entropy on all data is 0.00790878
After 2335 training step(s),cross entropy on all data is 0.0079079
After 2336 training step(s),cross entropy on all data is 0.0079071
After 2337 training step(s),cross entropy on all data is 0.00790638
After 2338 training step(s),cross entropy on all data is 0.00790573
After 2339 training step(s),cross entropy on all data is 0.00790515
After 2340 training step(s),cross entropy on all data is 0.00790462
After 2341 training step(s),cross entropy on all data is 0.00790415
After 2342 training step(s),cross entropy on all data is 0.00790373
After 2343 training step(s),cross entropy on all data is 0.00790167
After 2344 training step(s),cross entropy on all data is 0.00789982
After 2345 training step(s),cross entropy on all data is 0.00789815
After 2346 training step(s),cross entropy on all data is 0.00789665
After 2347 training step(s),cross entropy on all data is 0.0078953
After 2348 training step(s),cross entropy on all data is 0.00789408
After 2349 training step(s),cross entropy on all data is 0.00789298
After 2350 training step(s),cross entropy on all data is 0.00789199
After 2351 training step(s),cross entropy on all data is 0.00789111
After 2352 training step(s),cross entropy on all data is 0.00789031
After 2353 training step(s),cross entropy on all data is 0.00788958
After 2354 training step(s),cross entropy on all data is 0.00788894
After 2355 training step(s),cross entropy on all data is 0.00788835
After 2356 training step(s),cross entropy on all data is 0.00788783
After 2357 training step(s),cross entropy on all data is 0.00788735
After 2358 training step(s),cross entropy on all data is 0.00788693
After 2359 training step(s),cross entropy on all data is 0.00788486
After 2360 training step(s),cross entropy on all data is 0.007883
After 2361 training step(s),cross entropy on all data is 0.00788132
After 2362 training step(s),cross entropy on all data is 0.00787981
After 2363 training step(s),cross entropy on all data is 0.00787846
After 2364 training step(s),cross entropy on all data is 0.00787723
After 2365 training step(s),cross entropy on all data is 0.00787613
After 2366 training step(s),cross entropy on all data is 0.00787514
After 2367 training step(s),cross entropy on all data is 0.00787425
After 2368 training step(s),cross entropy on all data is 0.00787344
After 2369 training step(s),cross entropy on all data is 0.00787272
After 2370 training step(s),cross entropy on all data is 0.00787207
After 2371 training step(s),cross entropy on all data is 0.00787148
After 2372 training step(s),cross entropy on all data is 0.00787095
After 2373 training step(s),cross entropy on all data is 0.00787047
After 2374 training step(s),cross entropy on all data is 0.00787005
After 2375 training step(s),cross entropy on all data is 0.00786797
After 2376 training step(s),cross entropy on all data is 0.0078661
After 2377 training step(s),cross entropy on all data is 0.00786442
After 2378 training step(s),cross entropy on all data is 0.0078629
After 2379 training step(s),cross entropy on all data is 0.00786154
After 2380 training step(s),cross entropy on all data is 0.00786031
After 2381 training step(s),cross entropy on all data is 0.0078592
After 2382 training step(s),cross entropy on all data is 0.0078582
After 2383 training step(s),cross entropy on all data is 0.0078573
After 2384 training step(s),cross entropy on all data is 0.0078565
After 2385 training step(s),cross entropy on all data is 0.00785577
After 2386 training step(s),cross entropy on all data is 0.00785512
After 2387 training step(s),cross entropy on all data is 0.00785452
After 2388 training step(s),cross entropy on all data is 0.00785399
After 2389 training step(s),cross entropy on all data is 0.00785351
After 2390 training step(s),cross entropy on all data is 0.00785308
After 2391 training step(s),cross entropy on all data is 0.007851
After 2392 training step(s),cross entropy on all data is 0.00784912
After 2393 training step(s),cross entropy on all data is 0.00784742
After 2394 training step(s),cross entropy on all data is 0.0078459
After 2395 training step(s),cross entropy on all data is 0.00784453
After 2396 training step(s),cross entropy on all data is 0.00784329
After 2397 training step(s),cross entropy on all data is 0.00784218
After 2398 training step(s),cross entropy on all data is 0.00784118
After 2399 training step(s),cross entropy on all data is 0.00784028
After 2400 training step(s),cross entropy on all data is 0.00783947
After 2401 training step(s),cross entropy on all data is 0.00783874
After 2402 training step(s),cross entropy on all data is 0.00783808
After 2403 training step(s),cross entropy on all data is 0.00783748
After 2404 training step(s),cross entropy on all data is 0.00783695
After 2405 training step(s),cross entropy on all data is 0.00783647
After 2406 training step(s),cross entropy on all data is 0.00783604
After 2407 training step(s),cross entropy on all data is 0.00783394
After 2408 training step(s),cross entropy on all data is 0.00783205
After 2409 training step(s),cross entropy on all data is 0.00783035
After 2410 training step(s),cross entropy on all data is 0.00782882
After 2411 training step(s),cross entropy on all data is 0.00782744
After 2412 training step(s),cross entropy on all data is 0.0078262
After 2413 training step(s),cross entropy on all data is 0.00782508
After 2414 training step(s),cross entropy on all data is 0.00782407
After 2415 training step(s),cross entropy on all data is 0.00782317
After 2416 training step(s),cross entropy on all data is 0.00782235
After 2417 training step(s),cross entropy on all data is 0.00782162
After 2418 training step(s),cross entropy on all data is 0.00782095
After 2419 training step(s),cross entropy on all data is 0.00782036
After 2420 training step(s),cross entropy on all data is 0.00781982
After 2421 training step(s),cross entropy on all data is 0.00781934
After 2422 training step(s),cross entropy on all data is 0.0078189
After 2423 training step(s),cross entropy on all data is 0.0078168
After 2424 training step(s),cross entropy on all data is 0.0078149
After 2425 training step(s),cross entropy on all data is 0.00781319
After 2426 training step(s),cross entropy on all data is 0.00781165
After 2427 training step(s),cross entropy on all data is 0.00781027
After 2428 training step(s),cross entropy on all data is 0.00780902
After 2429 training step(s),cross entropy on all data is 0.0078079
After 2430 training step(s),cross entropy on all data is 0.00780688
After 2431 training step(s),cross entropy on all data is 0.00780597
After 2432 training step(s),cross entropy on all data is 0.00780515
After 2433 training step(s),cross entropy on all data is 0.00780441
After 2434 training step(s),cross entropy on all data is 0.00780375
After 2435 training step(s),cross entropy on all data is 0.00780315
After 2436 training step(s),cross entropy on all data is 0.00780261
After 2437 training step(s),cross entropy on all data is 0.00780212
After 2438 training step(s),cross entropy on all data is 0.00780169
After 2439 training step(s),cross entropy on all data is 0.00779957
After 2440 training step(s),cross entropy on all data is 0.00779766
After 2441 training step(s),cross entropy on all data is 0.00779595
After 2442 training step(s),cross entropy on all data is 0.0077944
After 2443 training step(s),cross entropy on all data is 0.00779301
After 2444 training step(s),cross entropy on all data is 0.00779175
After 2445 training step(s),cross entropy on all data is 0.00779063
After 2446 training step(s),cross entropy on all data is 0.00778961
After 2447 training step(s),cross entropy on all data is 0.00778869
After 2448 training step(s),cross entropy on all data is 0.00778787
After 2449 training step(s),cross entropy on all data is 0.00778713
After 2450 training step(s),cross entropy on all data is 0.00778646
After 2451 training step(s),cross entropy on all data is 0.00778586
After 2452 training step(s),cross entropy on all data is 0.00778531
After 2453 training step(s),cross entropy on all data is 0.00778483
After 2454 training step(s),cross entropy on all data is 0.00778439
After 2455 training step(s),cross entropy on all data is 0.00778226
After 2456 training step(s),cross entropy on all data is 0.00778034
After 2457 training step(s),cross entropy on all data is 0.00777862
After 2458 training step(s),cross entropy on all data is 0.00777706
After 2459 training step(s),cross entropy on all data is 0.00777566
After 2460 training step(s),cross entropy on all data is 0.00777441
After 2461 training step(s),cross entropy on all data is 0.00777327
After 2462 training step(s),cross entropy on all data is 0.00777225
After 2463 training step(s),cross entropy on all data is 0.00777133
After 2464 training step(s),cross entropy on all data is 0.0077705
After 2465 training step(s),cross entropy on all data is 0.00776976
After 2466 training step(s),cross entropy on all data is 0.00776908
After 2467 training step(s),cross entropy on all data is 0.00776848
After 2468 training step(s),cross entropy on all data is 0.00776794
After 2469 training step(s),cross entropy on all data is 0.00776745
After 2470 training step(s),cross entropy on all data is 0.007767
After 2471 training step(s),cross entropy on all data is 0.00776486
After 2472 training step(s),cross entropy on all data is 0.00776294
After 2473 training step(s),cross entropy on all data is 0.00776121
After 2474 training step(s),cross entropy on all data is 0.00775964
After 2475 training step(s),cross entropy on all data is 0.00775824
After 2476 training step(s),cross entropy on all data is 0.00775697
After 2477 training step(s),cross entropy on all data is 0.00775583
After 2478 training step(s),cross entropy on all data is 0.00775481
After 2479 training step(s),cross entropy on all data is 0.00775388
After 2480 training step(s),cross entropy on all data is 0.00775305
After 2481 training step(s),cross entropy on all data is 0.0077523
After 2482 training step(s),cross entropy on all data is 0.00775163
After 2483 training step(s),cross entropy on all data is 0.00775102
After 2484 training step(s),cross entropy on all data is 0.00775047
After 2485 training step(s),cross entropy on all data is 0.00774998
After 2486 training step(s),cross entropy on all data is 0.00774954
After 2487 training step(s),cross entropy on all data is 0.00774739
After 2488 training step(s),cross entropy on all data is 0.00774545
After 2489 training step(s),cross entropy on all data is 0.00774371
After 2490 training step(s),cross entropy on all data is 0.00774214
After 2491 training step(s),cross entropy on all data is 0.00774073
After 2492 training step(s),cross entropy on all data is 0.00773946
After 2493 training step(s),cross entropy on all data is 0.00773831
After 2494 training step(s),cross entropy on all data is 0.00773728
After 2495 training step(s),cross entropy on all data is 0.00773635
After 2496 training step(s),cross entropy on all data is 0.00773552
After 2497 training step(s),cross entropy on all data is 0.00773476
After 2498 training step(s),cross entropy on all data is 0.00773409
After 2499 training step(s),cross entropy on all data is 0.00773348
After 2500 training step(s),cross entropy on all data is 0.00773293
After 2501 training step(s),cross entropy on all data is 0.00773243
After 2502 training step(s),cross entropy on all data is 0.00773199
After 2503 training step(s),cross entropy on all data is 0.00772983
After 2504 training step(s),cross entropy on all data is 0.00772788
After 2505 training step(s),cross entropy on all data is 0.00772613
After 2506 training step(s),cross entropy on all data is 0.00772456
After 2507 training step(s),cross entropy on all data is 0.00772314
After 2508 training step(s),cross entropy on all data is 0.00772186
After 2509 training step(s),cross entropy on all data is 0.00772071
After 2510 training step(s),cross entropy on all data is 0.00771967
After 2511 training step(s),cross entropy on all data is 0.00771874
After 2512 training step(s),cross entropy on all data is 0.0077179
After 2513 training step(s),cross entropy on all data is 0.00771714
After 2514 training step(s),cross entropy on all data is 0.00771646
After 2515 training step(s),cross entropy on all data is 0.00771585
After 2516 training step(s),cross entropy on all data is 0.0077153
After 2517 training step(s),cross entropy on all data is 0.0077148
After 2518 training step(s),cross entropy on all data is 0.00771435
After 2519 training step(s),cross entropy on all data is 0.00771218
After 2520 training step(s),cross entropy on all data is 0.00771023
After 2521 training step(s),cross entropy on all data is 0.00770847
After 2522 training step(s),cross entropy on all data is 0.00770689
After 2523 training step(s),cross entropy on all data is 0.00770546
After 2524 training step(s),cross entropy on all data is 0.00770418
After 2525 training step(s),cross entropy on all data is 0.00770302
After 2526 training step(s),cross entropy on all data is 0.00770198
After 2527 training step(s),cross entropy on all data is 0.00770105
After 2528 training step(s),cross entropy on all data is 0.0077002
After 2529 training step(s),cross entropy on all data is 0.00769944
After 2530 training step(s),cross entropy on all data is 0.00769876
After 2531 training step(s),cross entropy on all data is 0.00769814
After 2532 training step(s),cross entropy on all data is 0.00769759
After 2533 training step(s),cross entropy on all data is 0.00769709
After 2534 training step(s),cross entropy on all data is 0.00769664
After 2535 training step(s),cross entropy on all data is 0.00769446
After 2536 training step(s),cross entropy on all data is 0.0076925
After 2537 training step(s),cross entropy on all data is 0.00769073
After 2538 training step(s),cross entropy on all data is 0.00768914
After 2539 training step(s),cross entropy on all data is 0.00768771
After 2540 training step(s),cross entropy on all data is 0.00768642
After 2541 training step(s),cross entropy on all data is 0.00768526
After 2542 training step(s),cross entropy on all data is 0.00768421
After 2543 training step(s),cross entropy on all data is 0.00768327
After 2544 training step(s),cross entropy on all data is 0.00768242
After 2545 training step(s),cross entropy on all data is 0.00768166
After 2546 training step(s),cross entropy on all data is 0.00768097
After 2547 training step(s),cross entropy on all data is 0.00768035
After 2548 training step(s),cross entropy on all data is 0.0076798
After 2549 training step(s),cross entropy on all data is 0.00767929
After 2550 training step(s),cross entropy on all data is 0.00767884
After 2551 training step(s),cross entropy on all data is 0.00767665
After 2552 training step(s),cross entropy on all data is 0.00767468
After 2553 training step(s),cross entropy on all data is 0.00767291
After 2554 training step(s),cross entropy on all data is 0.00767131
After 2555 training step(s),cross entropy on all data is 0.00766987
After 2556 training step(s),cross entropy on all data is 0.00766858
After 2557 training step(s),cross entropy on all data is 0.00766741
After 2558 training step(s),cross entropy on all data is 0.00766636
After 2559 training step(s),cross entropy on all data is 0.00766541
After 2560 training step(s),cross entropy on all data is 0.00766456
After 2561 training step(s),cross entropy on all data is 0.00766379
After 2562 training step(s),cross entropy on all data is 0.0076631
After 2563 training step(s),cross entropy on all data is 0.00766248
After 2564 training step(s),cross entropy on all data is 0.00766192
After 2565 training step(s),cross entropy on all data is 0.00766142
After 2566 training step(s),cross entropy on all data is 0.00766096
After 2567 training step(s),cross entropy on all data is 0.00765877
After 2568 training step(s),cross entropy on all data is 0.00765679
After 2569 training step(s),cross entropy on all data is 0.007655
After 2570 training step(s),cross entropy on all data is 0.0076534
After 2571 training step(s),cross entropy on all data is 0.00765195
After 2572 training step(s),cross entropy on all data is 0.00765065
After 2573 training step(s),cross entropy on all data is 0.00764948
After 2574 training step(s),cross entropy on all data is 0.00764842
After 2575 training step(s),cross entropy on all data is 0.00764747
After 2576 training step(s),cross entropy on all data is 0.00764662
After 2577 training step(s),cross entropy on all data is 0.00764585
After 2578 training step(s),cross entropy on all data is 0.00764515
After 2579 training step(s),cross entropy on all data is 0.00764453
After 2580 training step(s),cross entropy on all data is 0.00764397
After 2581 training step(s),cross entropy on all data is 0.00764346
After 2582 training step(s),cross entropy on all data is 0.007643
After 2583 training step(s),cross entropy on all data is 0.0076408
After 2584 training step(s),cross entropy on all data is 0.00763881
After 2585 training step(s),cross entropy on all data is 0.00763702
After 2586 training step(s),cross entropy on all data is 0.0076354
After 2587 training step(s),cross entropy on all data is 0.00763395
After 2588 training step(s),cross entropy on all data is 0.00763264
After 2589 training step(s),cross entropy on all data is 0.00763147
After 2590 training step(s),cross entropy on all data is 0.00763041
After 2591 training step(s),cross entropy on all data is 0.00762945
After 2592 training step(s),cross entropy on all data is 0.0076286
After 2593 training step(s),cross entropy on all data is 0.00762782
After 2594 training step(s),cross entropy on all data is 0.00762712
After 2595 training step(s),cross entropy on all data is 0.0076265
After 2596 training step(s),cross entropy on all data is 0.00762593
After 2597 training step(s),cross entropy on all data is 0.00762542
After 2598 training step(s),cross entropy on all data is 0.00762497
After 2599 training step(s),cross entropy on all data is 0.00762275
After 2600 training step(s),cross entropy on all data is 0.00762075
After 2601 training step(s),cross entropy on all data is 0.00761895
After 2602 training step(s),cross entropy on all data is 0.00761733
After 2603 training step(s),cross entropy on all data is 0.00761587
After 2604 training step(s),cross entropy on all data is 0.00761456
After 2605 training step(s),cross entropy on all data is 0.00761338
After 2606 training step(s),cross entropy on all data is 0.00761231
After 2607 training step(s),cross entropy on all data is 0.00761136
After 2608 training step(s),cross entropy on all data is 0.00761049
After 2609 training step(s),cross entropy on all data is 0.00760971
After 2610 training step(s),cross entropy on all data is 0.00760901
After 2611 training step(s),cross entropy on all data is 0.00760838
After 2612 training step(s),cross entropy on all data is 0.00760782
After 2613 training step(s),cross entropy on all data is 0.00760731
After 2614 training step(s),cross entropy on all data is 0.00760685
After 2615 training step(s),cross entropy on all data is 0.00760462
After 2616 training step(s),cross entropy on all data is 0.00760261
After 2617 training step(s),cross entropy on all data is 0.0076008
After 2618 training step(s),cross entropy on all data is 0.00759918
After 2619 training step(s),cross entropy on all data is 0.00759771
After 2620 training step(s),cross entropy on all data is 0.00759639
After 2621 training step(s),cross entropy on all data is 0.00759521
After 2622 training step(s),cross entropy on all data is 0.00759414
After 2623 training step(s),cross entropy on all data is 0.00759317
After 2624 training step(s),cross entropy on all data is 0.00759231
After 2625 training step(s),cross entropy on all data is 0.00759153
After 2626 training step(s),cross entropy on all data is 0.00759082
After 2627 training step(s),cross entropy on all data is 0.00759019
After 2628 training step(s),cross entropy on all data is 0.00758962
After 2629 training step(s),cross entropy on all data is 0.00758911
After 2630 training step(s),cross entropy on all data is 0.00758865
After 2631 training step(s),cross entropy on all data is 0.00758641
After 2632 training step(s),cross entropy on all data is 0.00758439
After 2633 training step(s),cross entropy on all data is 0.00758258
After 2634 training step(s),cross entropy on all data is 0.00758094
After 2635 training step(s),cross entropy on all data is 0.00757947
After 2636 training step(s),cross entropy on all data is 0.00757815
After 2637 training step(s),cross entropy on all data is 0.00757696
After 2638 training step(s),cross entropy on all data is 0.00757588
After 2639 training step(s),cross entropy on all data is 0.00757491
After 2640 training step(s),cross entropy on all data is 0.00757404
After 2641 training step(s),cross entropy on all data is 0.00757326
After 2642 training step(s),cross entropy on all data is 0.00757255
After 2643 training step(s),cross entropy on all data is 0.00757192
After 2644 training step(s),cross entropy on all data is 0.00757135
After 2645 training step(s),cross entropy on all data is 0.00757083
After 2646 training step(s),cross entropy on all data is 0.00757037
After 2647 training step(s),cross entropy on all data is 0.00756812
After 2648 training step(s),cross entropy on all data is 0.00756609
After 2649 training step(s),cross entropy on all data is 0.00756427
After 2650 training step(s),cross entropy on all data is 0.00756263
After 2651 training step(s),cross entropy on all data is 0.00756115
After 2652 training step(s),cross entropy on all data is 0.00755982
After 2653 training step(s),cross entropy on all data is 0.00755862
After 2654 training step(s),cross entropy on all data is 0.00755755
After 2655 training step(s),cross entropy on all data is 0.00755658
After 2656 training step(s),cross entropy on all data is 0.0075557
After 2657 training step(s),cross entropy on all data is 0.00755491
After 2658 training step(s),cross entropy on all data is 0.0075542
After 2659 training step(s),cross entropy on all data is 0.00755357
After 2660 training step(s),cross entropy on all data is 0.00755299
After 2661 training step(s),cross entropy on all data is 0.00755247
After 2662 training step(s),cross entropy on all data is 0.00755201
After 2663 training step(s),cross entropy on all data is 0.00754975
After 2664 training step(s),cross entropy on all data is 0.00754772
After 2665 training step(s),cross entropy on all data is 0.00754589
After 2666 training step(s),cross entropy on all data is 0.00754424
After 2667 training step(s),cross entropy on all data is 0.00754276
After 2668 training step(s),cross entropy on all data is 0.00754142
After 2669 training step(s),cross entropy on all data is 0.00754022
After 2670 training step(s),cross entropy on all data is 0.00753913
After 2671 training step(s),cross entropy on all data is 0.00753816
After 2672 training step(s),cross entropy on all data is 0.00753728
After 2673 training step(s),cross entropy on all data is 0.00753649
After 2674 training step(s),cross entropy on all data is 0.00753578
After 2675 training step(s),cross entropy on all data is 0.00753514
After 2676 training step(s),cross entropy on all data is 0.00753456
After 2677 training step(s),cross entropy on all data is 0.00753404
After 2678 training step(s),cross entropy on all data is 0.00753357
After 2679 training step(s),cross entropy on all data is 0.0075313
After 2680 training step(s),cross entropy on all data is 0.00752926
After 2681 training step(s),cross entropy on all data is 0.00752742
After 2682 training step(s),cross entropy on all data is 0.00752577
After 2683 training step(s),cross entropy on all data is 0.00752428
After 2684 training step(s),cross entropy on all data is 0.00752294
After 2685 training step(s),cross entropy on all data is 0.00752173
After 2686 training step(s),cross entropy on all data is 0.00752064
After 2687 training step(s),cross entropy on all data is 0.00751966
After 2688 training step(s),cross entropy on all data is 0.00751878
After 2689 training step(s),cross entropy on all data is 0.00751799
After 2690 training step(s),cross entropy on all data is 0.00751727
After 2691 training step(s),cross entropy on all data is 0.00751663
After 2692 training step(s),cross entropy on all data is 0.00751605
After 2693 training step(s),cross entropy on all data is 0.00751552
After 2694 training step(s),cross entropy on all data is 0.00751505
After 2695 training step(s),cross entropy on all data is 0.00751278
After 2696 training step(s),cross entropy on all data is 0.00751073
After 2697 training step(s),cross entropy on all data is 0.00750888
After 2698 training step(s),cross entropy on all data is 0.00750722
After 2699 training step(s),cross entropy on all data is 0.00750572
After 2700 training step(s),cross entropy on all data is 0.00750438
After 2701 training step(s),cross entropy on all data is 0.00750316
After 2702 training step(s),cross entropy on all data is 0.00750207
After 2703 training step(s),cross entropy on all data is 0.00750109
After 2704 training step(s),cross entropy on all data is 0.0075002
After 2705 training step(s),cross entropy on all data is 0.0074994
After 2706 training step(s),cross entropy on all data is 0.00749869
After 2707 training step(s),cross entropy on all data is 0.00749804
After 2708 training step(s),cross entropy on all data is 0.00749746
After 2709 training step(s),cross entropy on all data is 0.00749693
After 2710 training step(s),cross entropy on all data is 0.00749646
After 2711 training step(s),cross entropy on all data is 0.00749417
After 2712 training step(s),cross entropy on all data is 0.00749212
After 2713 training step(s),cross entropy on all data is 0.00749026
After 2714 training step(s),cross entropy on all data is 0.00748859
After 2715 training step(s),cross entropy on all data is 0.00748709
After 2716 training step(s),cross entropy on all data is 0.00748574
After 2717 training step(s),cross entropy on all data is 0.00748452
After 2718 training step(s),cross entropy on all data is 0.00748342
After 2719 training step(s),cross entropy on all data is 0.00748244
After 2720 training step(s),cross entropy on all data is 0.00748155
After 2721 training step(s),cross entropy on all data is 0.00748075
After 2722 training step(s),cross entropy on all data is 0.00748002
After 2723 training step(s),cross entropy on all data is 0.00747938
After 2724 training step(s),cross entropy on all data is 0.00747879
After 2725 training step(s),cross entropy on all data is 0.00747827
After 2726 training step(s),cross entropy on all data is 0.00747779
After 2727 training step(s),cross entropy on all data is 0.0074755
After 2728 training step(s),cross entropy on all data is 0.00747343
After 2729 training step(s),cross entropy on all data is 0.00747157
After 2730 training step(s),cross entropy on all data is 0.00746989
After 2731 training step(s),cross entropy on all data is 0.00746838
After 2732 training step(s),cross entropy on all data is 0.00746702
After 2733 training step(s),cross entropy on all data is 0.0074658
After 2734 training step(s),cross entropy on all data is 0.0074647
After 2735 training step(s),cross entropy on all data is 0.00746371
After 2736 training step(s),cross entropy on all data is 0.00746282
After 2737 training step(s),cross entropy on all data is 0.00746201
After 2738 training step(s),cross entropy on all data is 0.00746129
After 2739 training step(s),cross entropy on all data is 0.00746064
After 2740 training step(s),cross entropy on all data is 0.00746005
After 2741 training step(s),cross entropy on all data is 0.00745952
After 2742 training step(s),cross entropy on all data is 0.00745904
After 2743 training step(s),cross entropy on all data is 0.00745674
After 2744 training step(s),cross entropy on all data is 0.00745466
After 2745 training step(s),cross entropy on all data is 0.00745279
After 2746 training step(s),cross entropy on all data is 0.00745111
After 2747 training step(s),cross entropy on all data is 0.0074496
After 2748 training step(s),cross entropy on all data is 0.00744823
After 2749 training step(s),cross entropy on all data is 0.00744701
After 2750 training step(s),cross entropy on all data is 0.0074459
After 2751 training step(s),cross entropy on all data is 0.0074449
After 2752 training step(s),cross entropy on all data is 0.00744401
After 2753 training step(s),cross entropy on all data is 0.0074432
After 2754 training step(s),cross entropy on all data is 0.00744247
After 2755 training step(s),cross entropy on all data is 0.00744182
After 2756 training step(s),cross entropy on all data is 0.00744123
After 2757 training step(s),cross entropy on all data is 0.0074407
After 2758 training step(s),cross entropy on all data is 0.00744022
After 2759 training step(s),cross entropy on all data is 0.00743791
After 2760 training step(s),cross entropy on all data is 0.00743582
After 2761 training step(s),cross entropy on all data is 0.00743395
After 2762 training step(s),cross entropy on all data is 0.00743226
After 2763 training step(s),cross entropy on all data is 0.00743074
After 2764 training step(s),cross entropy on all data is 0.00742937
After 2765 training step(s),cross entropy on all data is 0.00742813
After 2766 training step(s),cross entropy on all data is 0.00742702
After 2767 training step(s),cross entropy on all data is 0.00742602
After 2768 training step(s),cross entropy on all data is 0.00742512
After 2769 training step(s),cross entropy on all data is 0.00742431
After 2770 training step(s),cross entropy on all data is 0.00742358
After 2771 training step(s),cross entropy on all data is 0.00742292
After 2772 training step(s),cross entropy on all data is 0.00742233
After 2773 training step(s),cross entropy on all data is 0.0074218
After 2774 training step(s),cross entropy on all data is 0.00742132
After 2775 training step(s),cross entropy on all data is 0.007419
After 2776 training step(s),cross entropy on all data is 0.0074169
After 2777 training step(s),cross entropy on all data is 0.00741502
After 2778 training step(s),cross entropy on all data is 0.00741332
After 2779 training step(s),cross entropy on all data is 0.0074118
After 2780 training step(s),cross entropy on all data is 0.00741042
After 2781 training step(s),cross entropy on all data is 0.00740918
After 2782 training step(s),cross entropy on all data is 0.00740807
After 2783 training step(s),cross entropy on all data is 0.00740707
After 2784 training step(s),cross entropy on all data is 0.00740616
After 2785 training step(s),cross entropy on all data is 0.00740535
After 2786 training step(s),cross entropy on all data is 0.00740462
After 2787 training step(s),cross entropy on all data is 0.00740396
After 2788 training step(s),cross entropy on all data is 0.00740336
After 2789 training step(s),cross entropy on all data is 0.00740283
After 2790 training step(s),cross entropy on all data is 0.00740234
After 2791 training step(s),cross entropy on all data is 0.00740001
After 2792 training step(s),cross entropy on all data is 0.00739791
After 2793 training step(s),cross entropy on all data is 0.00739602
After 2794 training step(s),cross entropy on all data is 0.00739432
After 2795 training step(s),cross entropy on all data is 0.00739278
After 2796 training step(s),cross entropy on all data is 0.0073914
After 2797 training step(s),cross entropy on all data is 0.00739016
After 2798 training step(s),cross entropy on all data is 0.00738904
After 2799 training step(s),cross entropy on all data is 0.00738803
After 2800 training step(s),cross entropy on all data is 0.00738713
After 2801 training step(s),cross entropy on all data is 0.00738631
After 2802 training step(s),cross entropy on all data is 0.00738557
After 2803 training step(s),cross entropy on all data is 0.00738491
After 2804 training step(s),cross entropy on all data is 0.00738431
After 2805 training step(s),cross entropy on all data is 0.00738378
After 2806 training step(s),cross entropy on all data is 0.00738329
After 2807 training step(s),cross entropy on all data is 0.00738095
After 2808 training step(s),cross entropy on all data is 0.00737884
After 2809 training step(s),cross entropy on all data is 0.00737695
After 2810 training step(s),cross entropy on all data is 0.00737523
After 2811 training step(s),cross entropy on all data is 0.0073737
After 2812 training step(s),cross entropy on all data is 0.00737231
After 2813 training step(s),cross entropy on all data is 0.00737106
After 2814 training step(s),cross entropy on all data is 0.00736994
After 2815 training step(s),cross entropy on all data is 0.00736893
After 2816 training step(s),cross entropy on all data is 0.00736802
After 2817 training step(s),cross entropy on all data is 0.0073672
After 2818 training step(s),cross entropy on all data is 0.00736646
After 2819 training step(s),cross entropy on all data is 0.00736579
After 2820 training step(s),cross entropy on all data is 0.00736519
After 2821 training step(s),cross entropy on all data is 0.00736465
After 2822 training step(s),cross entropy on all data is 0.00736417
After 2823 training step(s),cross entropy on all data is 0.00736182
After 2824 training step(s),cross entropy on all data is 0.0073597
After 2825 training step(s),cross entropy on all data is 0.0073578
After 2826 training step(s),cross entropy on all data is 0.00735608
After 2827 training step(s),cross entropy on all data is 0.00735453
After 2828 training step(s),cross entropy on all data is 0.00735314
After 2829 training step(s),cross entropy on all data is 0.00735189
After 2830 training step(s),cross entropy on all data is 0.00735076
After 2831 training step(s),cross entropy on all data is 0.00734975
After 2832 training step(s),cross entropy on all data is 0.00734883
After 2833 training step(s),cross entropy on all data is 0.00734801
After 2834 training step(s),cross entropy on all data is 0.00734727
After 2835 training step(s),cross entropy on all data is 0.0073466
After 2836 training step(s),cross entropy on all data is 0.007346
After 2837 training step(s),cross entropy on all data is 0.00734546
After 2838 training step(s),cross entropy on all data is 0.00734497
After 2839 training step(s),cross entropy on all data is 0.00734261
After 2840 training step(s),cross entropy on all data is 0.00734048
After 2841 training step(s),cross entropy on all data is 0.00733857
After 2842 training step(s),cross entropy on all data is 0.00733685
After 2843 training step(s),cross entropy on all data is 0.0073353
After 2844 training step(s),cross entropy on all data is 0.0073339
After 2845 training step(s),cross entropy on all data is 0.00733264
After 2846 training step(s),cross entropy on all data is 0.00733151
After 2847 training step(s),cross entropy on all data is 0.00733049
After 2848 training step(s),cross entropy on all data is 0.00732957
After 2849 training step(s),cross entropy on all data is 0.00732875
After 2850 training step(s),cross entropy on all data is 0.007328
After 2851 training step(s),cross entropy on all data is 0.00732733
After 2852 training step(s),cross entropy on all data is 0.00732673
After 2853 training step(s),cross entropy on all data is 0.00732619
After 2854 training step(s),cross entropy on all data is 0.0073257
After 2855 training step(s),cross entropy on all data is 0.00732333
After 2856 training step(s),cross entropy on all data is 0.00732119
After 2857 training step(s),cross entropy on all data is 0.00731927
After 2858 training step(s),cross entropy on all data is 0.00731754
After 2859 training step(s),cross entropy on all data is 0.00731599
After 2860 training step(s),cross entropy on all data is 0.00731459
After 2861 training step(s),cross entropy on all data is 0.00731332
After 2862 training step(s),cross entropy on all data is 0.00731219
After 2863 training step(s),cross entropy on all data is 0.00731116
After 2864 training step(s),cross entropy on all data is 0.00731024
After 2865 training step(s),cross entropy on all data is 0.00730941
After 2866 training step(s),cross entropy on all data is 0.00730867
After 2867 training step(s),cross entropy on all data is 0.00730799
After 2868 training step(s),cross entropy on all data is 0.00730739
After 2869 training step(s),cross entropy on all data is 0.00730684
After 2870 training step(s),cross entropy on all data is 0.00730635
After 2871 training step(s),cross entropy on all data is 0.00730397
After 2872 training step(s),cross entropy on all data is 0.00730183
After 2873 training step(s),cross entropy on all data is 0.0072999
After 2874 training step(s),cross entropy on all data is 0.00729817
After 2875 training step(s),cross entropy on all data is 0.00729661
After 2876 training step(s),cross entropy on all data is 0.0072952
After 2877 training step(s),cross entropy on all data is 0.00729393
After 2878 training step(s),cross entropy on all data is 0.00729279
After 2879 training step(s),cross entropy on all data is 0.00729176
After 2880 training step(s),cross entropy on all data is 0.00729084
After 2881 training step(s),cross entropy on all data is 0.00729
After 2882 training step(s),cross entropy on all data is 0.00728926
After 2883 training step(s),cross entropy on all data is 0.00728858
After 2884 training step(s),cross entropy on all data is 0.00728797
After 2885 training step(s),cross entropy on all data is 0.00728742
After 2886 training step(s),cross entropy on all data is 0.00728693
After 2887 training step(s),cross entropy on all data is 0.00728454
After 2888 training step(s),cross entropy on all data is 0.00728239
After 2889 training step(s),cross entropy on all data is 0.00728046
After 2890 training step(s),cross entropy on all data is 0.00727872
After 2891 training step(s),cross entropy on all data is 0.00727715
After 2892 training step(s),cross entropy on all data is 0.00727574
After 2893 training step(s),cross entropy on all data is 0.00727447
After 2894 training step(s),cross entropy on all data is 0.00727332
After 2895 training step(s),cross entropy on all data is 0.00727229
After 2896 training step(s),cross entropy on all data is 0.00727136
After 2897 training step(s),cross entropy on all data is 0.00727053
After 2898 training step(s),cross entropy on all data is 0.00726977
After 2899 training step(s),cross entropy on all data is 0.0072691
After 2900 training step(s),cross entropy on all data is 0.00726849
After 2901 training step(s),cross entropy on all data is 0.00726794
After 2902 training step(s),cross entropy on all data is 0.00726744
After 2903 training step(s),cross entropy on all data is 0.00726505
After 2904 training step(s),cross entropy on all data is 0.00726289
After 2905 training step(s),cross entropy on all data is 0.00726095
After 2906 training step(s),cross entropy on all data is 0.0072592
After 2907 training step(s),cross entropy on all data is 0.00725762
After 2908 training step(s),cross entropy on all data is 0.00725621
After 2909 training step(s),cross entropy on all data is 0.00725493
After 2910 training step(s),cross entropy on all data is 0.00725378
After 2911 training step(s),cross entropy on all data is 0.00725275
After 2912 training step(s),cross entropy on all data is 0.00725181
After 2913 training step(s),cross entropy on all data is 0.00725097
After 2914 training step(s),cross entropy on all data is 0.00725022
After 2915 training step(s),cross entropy on all data is 0.00724954
After 2916 training step(s),cross entropy on all data is 0.00724893
After 2917 training step(s),cross entropy on all data is 0.00724838
After 2918 training step(s),cross entropy on all data is 0.00724788
After 2919 training step(s),cross entropy on all data is 0.00724548
After 2920 training step(s),cross entropy on all data is 0.00724331
After 2921 training step(s),cross entropy on all data is 0.00724136
After 2922 training step(s),cross entropy on all data is 0.00723961
After 2923 training step(s),cross entropy on all data is 0.00723803
After 2924 training step(s),cross entropy on all data is 0.0072366
After 2925 training step(s),cross entropy on all data is 0.00723532
After 2926 training step(s),cross entropy on all data is 0.00723417
After 2927 training step(s),cross entropy on all data is 0.00723313
After 2928 training step(s),cross entropy on all data is 0.0072322
After 2929 training step(s),cross entropy on all data is 0.00723135
After 2930 training step(s),cross entropy on all data is 0.0072306
After 2931 training step(s),cross entropy on all data is 0.00722991
After 2932 training step(s),cross entropy on all data is 0.0072293
After 2933 training step(s),cross entropy on all data is 0.00722874
After 2934 training step(s),cross entropy on all data is 0.00722825
After 2935 training step(s),cross entropy on all data is 0.00722583
After 2936 training step(s),cross entropy on all data is 0.00722366
After 2937 training step(s),cross entropy on all data is 0.0072217
After 2938 training step(s),cross entropy on all data is 0.00721994
After 2939 training step(s),cross entropy on all data is 0.00721836
After 2940 training step(s),cross entropy on all data is 0.00721693
After 2941 training step(s),cross entropy on all data is 0.00721564
After 2942 training step(s),cross entropy on all data is 0.00721449
After 2943 training step(s),cross entropy on all data is 0.00721344
After 2944 training step(s),cross entropy on all data is 0.0072125
After 2945 training step(s),cross entropy on all data is 0.00721166
After 2946 training step(s),cross entropy on all data is 0.0072109
After 2947 training step(s),cross entropy on all data is 0.00721021
After 2948 training step(s),cross entropy on all data is 0.0072096
After 2949 training step(s),cross entropy on all data is 0.00720904
After 2950 training step(s),cross entropy on all data is 0.00720854
After 2951 training step(s),cross entropy on all data is 0.00720612
After 2952 training step(s),cross entropy on all data is 0.00720394
After 2953 training step(s),cross entropy on all data is 0.00720198
After 2954 training step(s),cross entropy on all data is 0.00720021
After 2955 training step(s),cross entropy on all data is 0.00719862
After 2956 training step(s),cross entropy on all data is 0.00719718
After 2957 training step(s),cross entropy on all data is 0.00719589
After 2958 training step(s),cross entropy on all data is 0.00719473
After 2959 training step(s),cross entropy on all data is 0.00719369
After 2960 training step(s),cross entropy on all data is 0.00719274
After 2961 training step(s),cross entropy on all data is 0.0071919
After 2962 training step(s),cross entropy on all data is 0.00719113
After 2963 training step(s),cross entropy on all data is 0.00719045
After 2964 training step(s),cross entropy on all data is 0.00718983
After 2965 training step(s),cross entropy on all data is 0.00718927
After 2966 training step(s),cross entropy on all data is 0.00718877
After 2967 training step(s),cross entropy on all data is 0.00718634
After 2968 training step(s),cross entropy on all data is 0.00718415
After 2969 training step(s),cross entropy on all data is 0.00718218
After 2970 training step(s),cross entropy on all data is 0.00718041
After 2971 training step(s),cross entropy on all data is 0.00717881
After 2972 training step(s),cross entropy on all data is 0.00717737
After 2973 training step(s),cross entropy on all data is 0.00717608
After 2974 training step(s),cross entropy on all data is 0.00717491
After 2975 training step(s),cross entropy on all data is 0.00717386
After 2976 training step(s),cross entropy on all data is 0.00717292
After 2977 training step(s),cross entropy on all data is 0.00717206
After 2978 training step(s),cross entropy on all data is 0.0071713
After 2979 training step(s),cross entropy on all data is 0.00717061
After 2980 training step(s),cross entropy on all data is 0.00716999
After 2981 training step(s),cross entropy on all data is 0.00716943
After 2982 training step(s),cross entropy on all data is 0.00716892
After 2983 training step(s),cross entropy on all data is 0.00716649
After 2984 training step(s),cross entropy on all data is 0.00716429
After 2985 training step(s),cross entropy on all data is 0.00716231
After 2986 training step(s),cross entropy on all data is 0.00716053
After 2987 training step(s),cross entropy on all data is 0.00715893
After 2988 training step(s),cross entropy on all data is 0.00715749
After 2989 training step(s),cross entropy on all data is 0.00715619
After 2990 training step(s),cross entropy on all data is 0.00715502
After 2991 training step(s),cross entropy on all data is 0.00715397
After 2992 training step(s),cross entropy on all data is 0.00715302
After 2993 training step(s),cross entropy on all data is 0.00715216
After 2994 training step(s),cross entropy on all data is 0.00715139
After 2995 training step(s),cross entropy on all data is 0.0071507
After 2996 training step(s),cross entropy on all data is 0.00715008
After 2997 training step(s),cross entropy on all data is 0.00714952
After 2998 training step(s),cross entropy on all data is 0.00714901
After 2999 training step(s),cross entropy on all data is 0.00714656
After 3000 training step(s),cross entropy on all data is 0.00714436
After 3001 training step(s),cross entropy on all data is 0.00714238
After 3002 training step(s),cross entropy on all data is 0.00714059
After 3003 training step(s),cross entropy on all data is 0.00713898
After 3004 training step(s),cross entropy on all data is 0.00713753
After 3005 training step(s),cross entropy on all data is 0.00713623
After 3006 training step(s),cross entropy on all data is 0.00713506
After 3007 training step(s),cross entropy on all data is 0.007134
After 3008 training step(s),cross entropy on all data is 0.00713305
After 3009 training step(s),cross entropy on all data is 0.00713219
After 3010 training step(s),cross entropy on all data is 0.00713142
After 3011 training step(s),cross entropy on all data is 0.00713073
After 3012 training step(s),cross entropy on all data is 0.0071301
After 3013 training step(s),cross entropy on all data is 0.00712954
After 3014 training step(s),cross entropy on all data is 0.00712903
After 3015 training step(s),cross entropy on all data is 0.00712657
After 3016 training step(s),cross entropy on all data is 0.00712436
After 3017 training step(s),cross entropy on all data is 0.00712237
After 3018 training step(s),cross entropy on all data is 0.00712058
After 3019 training step(s),cross entropy on all data is 0.00711897
After 3020 training step(s),cross entropy on all data is 0.00711752
After 3021 training step(s),cross entropy on all data is 0.00711621
After 3022 training step(s),cross entropy on all data is 0.00711503
After 3023 training step(s),cross entropy on all data is 0.00711397
After 3024 training step(s),cross entropy on all data is 0.00711301
After 3025 training step(s),cross entropy on all data is 0.00711215
After 3026 training step(s),cross entropy on all data is 0.00711138
After 3027 training step(s),cross entropy on all data is 0.00711068
After 3028 training step(s),cross entropy on all data is 0.00711005
After 3029 training step(s),cross entropy on all data is 0.00710949
After 3030 training step(s),cross entropy on all data is 0.00710898
After 3031 training step(s),cross entropy on all data is 0.00710652
After 3032 training step(s),cross entropy on all data is 0.0071043
After 3033 training step(s),cross entropy on all data is 0.0071023
After 3034 training step(s),cross entropy on all data is 0.0071005
After 3035 training step(s),cross entropy on all data is 0.00709889
After 3036 training step(s),cross entropy on all data is 0.00709743
After 3037 training step(s),cross entropy on all data is 0.00709611
After 3038 training step(s),cross entropy on all data is 0.00709493
After 3039 training step(s),cross entropy on all data is 0.00709387
After 3040 training step(s),cross entropy on all data is 0.00709291
After 3041 training step(s),cross entropy on all data is 0.00709205
After 3042 training step(s),cross entropy on all data is 0.00709127
After 3043 training step(s),cross entropy on all data is 0.00709057
After 3044 training step(s),cross entropy on all data is 0.00708994
After 3045 training step(s),cross entropy on all data is 0.00708937
After 3046 training step(s),cross entropy on all data is 0.00708886
After 3047 training step(s),cross entropy on all data is 0.00708639
After 3048 training step(s),cross entropy on all data is 0.00708417
After 3049 training step(s),cross entropy on all data is 0.00708216
After 3050 training step(s),cross entropy on all data is 0.00708036
After 3051 training step(s),cross entropy on all data is 0.00707874
After 3052 training step(s),cross entropy on all data is 0.00707727
After 3053 training step(s),cross entropy on all data is 0.00707596
After 3054 training step(s),cross entropy on all data is 0.00707477
After 3055 training step(s),cross entropy on all data is 0.0070737
After 3056 training step(s),cross entropy on all data is 0.00707274
After 3057 training step(s),cross entropy on all data is 0.00707187
After 3058 training step(s),cross entropy on all data is 0.0070711
After 3059 training step(s),cross entropy on all data is 0.00707039
After 3060 training step(s),cross entropy on all data is 0.00706976
After 3061 training step(s),cross entropy on all data is 0.00706919
After 3062 training step(s),cross entropy on all data is 0.00706868
After 3063 training step(s),cross entropy on all data is 0.0070662
After 3064 training step(s),cross entropy on all data is 0.00706397
After 3065 training step(s),cross entropy on all data is 0.00706196
After 3066 training step(s),cross entropy on all data is 0.00706015
After 3067 training step(s),cross entropy on all data is 0.00705852
After 3068 training step(s),cross entropy on all data is 0.00705705
After 3069 training step(s),cross entropy on all data is 0.00705573
After 3070 training step(s),cross entropy on all data is 0.00705454
After 3071 training step(s),cross entropy on all data is 0.00705347
After 3072 training step(s),cross entropy on all data is 0.0070525
After 3073 training step(s),cross entropy on all data is 0.00705163
After 3074 training step(s),cross entropy on all data is 0.00705085
After 3075 training step(s),cross entropy on all data is 0.00705015
After 3076 training step(s),cross entropy on all data is 0.00704951
After 3077 training step(s),cross entropy on all data is 0.00704894
After 3078 training step(s),cross entropy on all data is 0.00704843
After 3079 training step(s),cross entropy on all data is 0.00704594
After 3080 training step(s),cross entropy on all data is 0.0070437
After 3081 training step(s),cross entropy on all data is 0.00704168
After 3082 training step(s),cross entropy on all data is 0.00703987
After 3083 training step(s),cross entropy on all data is 0.00703823
After 3084 training step(s),cross entropy on all data is 0.00703676
After 3085 training step(s),cross entropy on all data is 0.00703544
After 3086 training step(s),cross entropy on all data is 0.00703424
After 3087 training step(s),cross entropy on all data is 0.00703317
After 3088 training step(s),cross entropy on all data is 0.0070322
After 3089 training step(s),cross entropy on all data is 0.00703133
After 3090 training step(s),cross entropy on all data is 0.00703054
After 3091 training step(s),cross entropy on all data is 0.00702984
After 3092 training step(s),cross entropy on all data is 0.0070292
After 3093 training step(s),cross entropy on all data is 0.00702863
After 3094 training step(s),cross entropy on all data is 0.00702811
After 3095 training step(s),cross entropy on all data is 0.00702562
After 3096 training step(s),cross entropy on all data is 0.00702337
After 3097 training step(s),cross entropy on all data is 0.00702135
After 3098 training step(s),cross entropy on all data is 0.00701952
After 3099 training step(s),cross entropy on all data is 0.00701788
After 3100 training step(s),cross entropy on all data is 0.00701641
After 3101 training step(s),cross entropy on all data is 0.00701508
After 3102 training step(s),cross entropy on all data is 0.00701388
After 3103 training step(s),cross entropy on all data is 0.0070128
After 3104 training step(s),cross entropy on all data is 0.00701183
After 3105 training step(s),cross entropy on all data is 0.00701096
After 3106 training step(s),cross entropy on all data is 0.00701017
After 3107 training step(s),cross entropy on all data is 0.00700946
After 3108 training step(s),cross entropy on all data is 0.00700882
After 3109 training step(s),cross entropy on all data is 0.00700825
After 3110 training step(s),cross entropy on all data is 0.00700773
After 3111 training step(s),cross entropy on all data is 0.00700523
After 3112 training step(s),cross entropy on all data is 0.00700297
After 3113 training step(s),cross entropy on all data is 0.00700094
After 3114 training step(s),cross entropy on all data is 0.00699912
After 3115 training step(s),cross entropy on all data is 0.00699747
After 3116 training step(s),cross entropy on all data is 0.00699599
After 3117 training step(s),cross entropy on all data is 0.00699466
After 3118 training step(s),cross entropy on all data is 0.00699345
After 3119 training step(s),cross entropy on all data is 0.00699237
After 3120 training step(s),cross entropy on all data is 0.0069914
After 3121 training step(s),cross entropy on all data is 0.00699052
After 3122 training step(s),cross entropy on all data is 0.00698973
After 3123 training step(s),cross entropy on all data is 0.00698902
After 3124 training step(s),cross entropy on all data is 0.00698838
After 3125 training step(s),cross entropy on all data is 0.0069878
After 3126 training step(s),cross entropy on all data is 0.00698728
After 3127 training step(s),cross entropy on all data is 0.00698477
After 3128 training step(s),cross entropy on all data is 0.00698251
After 3129 training step(s),cross entropy on all data is 0.00698048
After 3130 training step(s),cross entropy on all data is 0.00697864
After 3131 training step(s),cross entropy on all data is 0.00697699
After 3132 training step(s),cross entropy on all data is 0.00697551
After 3133 training step(s),cross entropy on all data is 0.00697417
After 3134 training step(s),cross entropy on all data is 0.00697296
After 3135 training step(s),cross entropy on all data is 0.00697188
After 3136 training step(s),cross entropy on all data is 0.0069709
After 3137 training step(s),cross entropy on all data is 0.00697002
After 3138 training step(s),cross entropy on all data is 0.00696923
After 3139 training step(s),cross entropy on all data is 0.00696852
After 3140 training step(s),cross entropy on all data is 0.00696787
After 3141 training step(s),cross entropy on all data is 0.00696729
After 3142 training step(s),cross entropy on all data is 0.00696677
After 3143 training step(s),cross entropy on all data is 0.00696426
After 3144 training step(s),cross entropy on all data is 0.00696199
After 3145 training step(s),cross entropy on all data is 0.00695994
After 3146 training step(s),cross entropy on all data is 0.00695811
After 3147 training step(s),cross entropy on all data is 0.00695645
After 3148 training step(s),cross entropy on all data is 0.00695496
After 3149 training step(s),cross entropy on all data is 0.00695362
After 3150 training step(s),cross entropy on all data is 0.00695241
After 3151 training step(s),cross entropy on all data is 0.00695132
After 3152 training step(s),cross entropy on all data is 0.00695034
After 3153 training step(s),cross entropy on all data is 0.00694946
After 3154 training step(s),cross entropy on all data is 0.00694866
After 3155 training step(s),cross entropy on all data is 0.00694795
After 3156 training step(s),cross entropy on all data is 0.0069473
After 3157 training step(s),cross entropy on all data is 0.00694672
After 3158 training step(s),cross entropy on all data is 0.0069462
After 3159 training step(s),cross entropy on all data is 0.00694367
After 3160 training step(s),cross entropy on all data is 0.0069414
After 3161 training step(s),cross entropy on all data is 0.00693935
After 3162 training step(s),cross entropy on all data is 0.0069375
After 3163 training step(s),cross entropy on all data is 0.00693584
After 3164 training step(s),cross entropy on all data is 0.00693435
After 3165 training step(s),cross entropy on all data is 0.006933
After 3166 training step(s),cross entropy on all data is 0.00693179
After 3167 training step(s),cross entropy on all data is 0.0069307
After 3168 training step(s),cross entropy on all data is 0.00692971
After 3169 training step(s),cross entropy on all data is 0.00692883
After 3170 training step(s),cross entropy on all data is 0.00692803
After 3171 training step(s),cross entropy on all data is 0.00692731
After 3172 training step(s),cross entropy on all data is 0.00692667
After 3173 training step(s),cross entropy on all data is 0.00692609
After 3174 training step(s),cross entropy on all data is 0.00692556
After 3175 training step(s),cross entropy on all data is 0.00692303
After 3176 training step(s),cross entropy on all data is 0.00692075
After 3177 training step(s),cross entropy on all data is 0.00691869
After 3178 training step(s),cross entropy on all data is 0.00691684
After 3179 training step(s),cross entropy on all data is 0.00691517
After 3180 training step(s),cross entropy on all data is 0.00691368
After 3181 training step(s),cross entropy on all data is 0.00691232
After 3182 training step(s),cross entropy on all data is 0.00691111
After 3183 training step(s),cross entropy on all data is 0.00691001
After 3184 training step(s),cross entropy on all data is 0.00690903
After 3185 training step(s),cross entropy on all data is 0.00690814
After 3186 training step(s),cross entropy on all data is 0.00690734
After 3187 training step(s),cross entropy on all data is 0.00690662
After 3188 training step(s),cross entropy on all data is 0.00690597
After 3189 training step(s),cross entropy on all data is 0.00690539
After 3190 training step(s),cross entropy on all data is 0.00690486
After 3191 training step(s),cross entropy on all data is 0.00690232
After 3192 training step(s),cross entropy on all data is 0.00690003
After 3193 training step(s),cross entropy on all data is 0.00689797
After 3194 training step(s),cross entropy on all data is 0.00689611
After 3195 training step(s),cross entropy on all data is 0.00689444
After 3196 training step(s),cross entropy on all data is 0.00689294
After 3197 training step(s),cross entropy on all data is 0.00689159
After 3198 training step(s),cross entropy on all data is 0.00689036
After 3199 training step(s),cross entropy on all data is 0.00688927
After 3200 training step(s),cross entropy on all data is 0.00688828
After 3201 training step(s),cross entropy on all data is 0.00688739
After 3202 training step(s),cross entropy on all data is 0.00688659
After 3203 training step(s),cross entropy on all data is 0.00688586
After 3204 training step(s),cross entropy on all data is 0.00688521
After 3205 training step(s),cross entropy on all data is 0.00688463
After 3206 training step(s),cross entropy on all data is 0.0068841
After 3207 training step(s),cross entropy on all data is 0.00688155
After 3208 training step(s),cross entropy on all data is 0.00687926
After 3209 training step(s),cross entropy on all data is 0.00687719
After 3210 training step(s),cross entropy on all data is 0.00687533
After 3211 training step(s),cross entropy on all data is 0.00687365
After 3212 training step(s),cross entropy on all data is 0.00687214
After 3213 training step(s),cross entropy on all data is 0.00687078
After 3214 training step(s),cross entropy on all data is 0.00686956
After 3215 training step(s),cross entropy on all data is 0.00686846
After 3216 training step(s),cross entropy on all data is 0.00686747
After 3217 training step(s),cross entropy on all data is 0.00686657
After 3218 training step(s),cross entropy on all data is 0.00686577
After 3219 training step(s),cross entropy on all data is 0.00686505
After 3220 training step(s),cross entropy on all data is 0.00686439
After 3221 training step(s),cross entropy on all data is 0.00686381
After 3222 training step(s),cross entropy on all data is 0.00686328
After 3223 training step(s),cross entropy on all data is 0.00686072
After 3224 training step(s),cross entropy on all data is 0.00685842
After 3225 training step(s),cross entropy on all data is 0.00685634
After 3226 training step(s),cross entropy on all data is 0.00685448
After 3227 training step(s),cross entropy on all data is 0.0068528
After 3228 training step(s),cross entropy on all data is 0.00685128
After 3229 training step(s),cross entropy on all data is 0.00684992
After 3230 training step(s),cross entropy on all data is 0.00684869
After 3231 training step(s),cross entropy on all data is 0.00684759
After 3232 training step(s),cross entropy on all data is 0.0068466
After 3233 training step(s),cross entropy on all data is 0.0068457
After 3234 training step(s),cross entropy on all data is 0.00684489
After 3235 training step(s),cross entropy on all data is 0.00684417
After 3236 training step(s),cross entropy on all data is 0.00684351
After 3237 training step(s),cross entropy on all data is 0.00684292
After 3238 training step(s),cross entropy on all data is 0.00684239
After 3239 training step(s),cross entropy on all data is 0.00683983
After 3240 training step(s),cross entropy on all data is 0.00683752
After 3241 training step(s),cross entropy on all data is 0.00683544
After 3242 training step(s),cross entropy on all data is 0.00683357
After 3243 training step(s),cross entropy on all data is 0.00683188
After 3244 training step(s),cross entropy on all data is 0.00683036
After 3245 training step(s),cross entropy on all data is 0.006829
After 3246 training step(s),cross entropy on all data is 0.00682777
After 3247 training step(s),cross entropy on all data is 0.00682666
After 3248 training step(s),cross entropy on all data is 0.00682566
After 3249 training step(s),cross entropy on all data is 0.00682476
After 3250 training step(s),cross entropy on all data is 0.00682396
After 3251 training step(s),cross entropy on all data is 0.00682323
After 3252 training step(s),cross entropy on all data is 0.00682257
After 3253 training step(s),cross entropy on all data is 0.00682198
After 3254 training step(s),cross entropy on all data is 0.00682145
After 3255 training step(s),cross entropy on all data is 0.00681888
After 3256 training step(s),cross entropy on all data is 0.00681656
After 3257 training step(s),cross entropy on all data is 0.00681447
After 3258 training step(s),cross entropy on all data is 0.0068126
After 3259 training step(s),cross entropy on all data is 0.00681091
After 3260 training step(s),cross entropy on all data is 0.00680939
After 3261 training step(s),cross entropy on all data is 0.00680802
After 3262 training step(s),cross entropy on all data is 0.00680678
After 3263 training step(s),cross entropy on all data is 0.00680567
After 3264 training step(s),cross entropy on all data is 0.00680467
After 3265 training step(s),cross entropy on all data is 0.00680377
After 3266 training step(s),cross entropy on all data is 0.00680296
After 3267 training step(s),cross entropy on all data is 0.00680223
After 3268 training step(s),cross entropy on all data is 0.00680157
After 3269 training step(s),cross entropy on all data is 0.00680098
After 3270 training step(s),cross entropy on all data is 0.00680044
After 3271 training step(s),cross entropy on all data is 0.00679786
After 3272 training step(s),cross entropy on all data is 0.00679554
After 3273 training step(s),cross entropy on all data is 0.00679345
After 3274 training step(s),cross entropy on all data is 0.00679157
After 3275 training step(s),cross entropy on all data is 0.00678987
After 3276 training step(s),cross entropy on all data is 0.00678835
After 3277 training step(s),cross entropy on all data is 0.00678697
After 3278 training step(s),cross entropy on all data is 0.00678574
After 3279 training step(s),cross entropy on all data is 0.00678462
After 3280 training step(s),cross entropy on all data is 0.00678362
After 3281 training step(s),cross entropy on all data is 0.00678271
After 3282 training step(s),cross entropy on all data is 0.0067819
After 3283 training step(s),cross entropy on all data is 0.00678117
After 3284 training step(s),cross entropy on all data is 0.00678051
After 3285 training step(s),cross entropy on all data is 0.00677991
After 3286 training step(s),cross entropy on all data is 0.00677938
After 3287 training step(s),cross entropy on all data is 0.00677679
After 3288 training step(s),cross entropy on all data is 0.00677446
After 3289 training step(s),cross entropy on all data is 0.00677237
After 3290 training step(s),cross entropy on all data is 0.00677048
After 3291 training step(s),cross entropy on all data is 0.00676878
After 3292 training step(s),cross entropy on all data is 0.00676725
After 3293 training step(s),cross entropy on all data is 0.00676587
After 3294 training step(s),cross entropy on all data is 0.00676463
After 3295 training step(s),cross entropy on all data is 0.00676351
After 3296 training step(s),cross entropy on all data is 0.00676251
After 3297 training step(s),cross entropy on all data is 0.0067616
After 3298 training step(s),cross entropy on all data is 0.00676079
After 3299 training step(s),cross entropy on all data is 0.00676005
After 3300 training step(s),cross entropy on all data is 0.00675939
After 3301 training step(s),cross entropy on all data is 0.00675879
After 3302 training step(s),cross entropy on all data is 0.00675826
After 3303 training step(s),cross entropy on all data is 0.00675567
After 3304 training step(s),cross entropy on all data is 0.00675333
After 3305 training step(s),cross entropy on all data is 0.00675123
After 3306 training step(s),cross entropy on all data is 0.00674933
After 3307 training step(s),cross entropy on all data is 0.00674763
After 3308 training step(s),cross entropy on all data is 0.00674609
After 3309 training step(s),cross entropy on all data is 0.00674471
After 3310 training step(s),cross entropy on all data is 0.00674347
After 3311 training step(s),cross entropy on all data is 0.00674235
After 3312 training step(s),cross entropy on all data is 0.00674134
After 3313 training step(s),cross entropy on all data is 0.00674043
After 3314 training step(s),cross entropy on all data is 0.00673961
After 3315 training step(s),cross entropy on all data is 0.00673888
After 3316 training step(s),cross entropy on all data is 0.00673821
After 3317 training step(s),cross entropy on all data is 0.00673762
After 3318 training step(s),cross entropy on all data is 0.00673708
After 3319 training step(s),cross entropy on all data is 0.00673448
After 3320 training step(s),cross entropy on all data is 0.00673214
After 3321 training step(s),cross entropy on all data is 0.00673003
After 3322 training step(s),cross entropy on all data is 0.00672813
After 3323 training step(s),cross entropy on all data is 0.00672642
After 3324 training step(s),cross entropy on all data is 0.00672488
After 3325 training step(s),cross entropy on all data is 0.0067235
After 3326 training step(s),cross entropy on all data is 0.00672225
After 3327 training step(s),cross entropy on all data is 0.00672113
After 3328 training step(s),cross entropy on all data is 0.00672011
After 3329 training step(s),cross entropy on all data is 0.0067192
After 3330 training step(s),cross entropy on all data is 0.00671838
After 3331 training step(s),cross entropy on all data is 0.00671765
After 3332 training step(s),cross entropy on all data is 0.00671698
After 3333 training step(s),cross entropy on all data is 0.00671638
After 3334 training step(s),cross entropy on all data is 0.00671584
After 3335 training step(s),cross entropy on all data is 0.00671324
After 3336 training step(s),cross entropy on all data is 0.00671089
After 3337 training step(s),cross entropy on all data is 0.00670877
After 3338 training step(s),cross entropy on all data is 0.00670687
After 3339 training step(s),cross entropy on all data is 0.00670516
After 3340 training step(s),cross entropy on all data is 0.00670361
After 3341 training step(s),cross entropy on all data is 0.00670222
After 3342 training step(s),cross entropy on all data is 0.00670097
After 3343 training step(s),cross entropy on all data is 0.00669985
After 3344 training step(s),cross entropy on all data is 0.00669883
After 3345 training step(s),cross entropy on all data is 0.00669792
After 3346 training step(s),cross entropy on all data is 0.0066971
After 3347 training step(s),cross entropy on all data is 0.00669636
After 3348 training step(s),cross entropy on all data is 0.00669569
After 3349 training step(s),cross entropy on all data is 0.00669509
After 3350 training step(s),cross entropy on all data is 0.00669455
After 3351 training step(s),cross entropy on all data is 0.00669194
After 3352 training step(s),cross entropy on all data is 0.00668958
After 3353 training step(s),cross entropy on all data is 0.00668746
After 3354 training step(s),cross entropy on all data is 0.00668555
After 3355 training step(s),cross entropy on all data is 0.00668384
After 3356 training step(s),cross entropy on all data is 0.00668229
After 3357 training step(s),cross entropy on all data is 0.0066809
After 3358 training step(s),cross entropy on all data is 0.00667964
After 3359 training step(s),cross entropy on all data is 0.00667851
After 3360 training step(s),cross entropy on all data is 0.00667749
After 3361 training step(s),cross entropy on all data is 0.00667658
After 3362 training step(s),cross entropy on all data is 0.00667575
After 3363 training step(s),cross entropy on all data is 0.00667501
After 3364 training step(s),cross entropy on all data is 0.00667434
After 3365 training step(s),cross entropy on all data is 0.00667374
After 3366 training step(s),cross entropy on all data is 0.0066732
After 3367 training step(s),cross entropy on all data is 0.00667058
After 3368 training step(s),cross entropy on all data is 0.00666822
After 3369 training step(s),cross entropy on all data is 0.00666609
After 3370 training step(s),cross entropy on all data is 0.00666418
After 3371 training step(s),cross entropy on all data is 0.00666246
After 3372 training step(s),cross entropy on all data is 0.00666091
After 3373 training step(s),cross entropy on all data is 0.00665951
After 3374 training step(s),cross entropy on all data is 0.00665825
After 3375 training step(s),cross entropy on all data is 0.00665712
After 3376 training step(s),cross entropy on all data is 0.0066561
After 3377 training step(s),cross entropy on all data is 0.00665518
After 3378 training step(s),cross entropy on all data is 0.00665435
After 3379 training step(s),cross entropy on all data is 0.00665361
After 3380 training step(s),cross entropy on all data is 0.00665294
After 3381 training step(s),cross entropy on all data is 0.00665234
After 3382 training step(s),cross entropy on all data is 0.00665179
After 3383 training step(s),cross entropy on all data is 0.00664917
After 3384 training step(s),cross entropy on all data is 0.0066468
After 3385 training step(s),cross entropy on all data is 0.00664467
After 3386 training step(s),cross entropy on all data is 0.00664275
After 3387 training step(s),cross entropy on all data is 0.00664102
After 3388 training step(s),cross entropy on all data is 0.00663947
After 3389 training step(s),cross entropy on all data is 0.00663807
After 3390 training step(s),cross entropy on all data is 0.00663681
After 3391 training step(s),cross entropy on all data is 0.00663567
After 3392 training step(s),cross entropy on all data is 0.00663465
After 3393 training step(s),cross entropy on all data is 0.00663373
After 3394 training step(s),cross entropy on all data is 0.0066329
After 3395 training step(s),cross entropy on all data is 0.00663216
After 3396 training step(s),cross entropy on all data is 0.00663148
After 3397 training step(s),cross entropy on all data is 0.00663088
After 3398 training step(s),cross entropy on all data is 0.00663033
After 3399 training step(s),cross entropy on all data is 0.0066277
After 3400 training step(s),cross entropy on all data is 0.00662533
After 3401 training step(s),cross entropy on all data is 0.00662319
After 3402 training step(s),cross entropy on all data is 0.00662127
After 3403 training step(s),cross entropy on all data is 0.00661954
After 3404 training step(s),cross entropy on all data is 0.00661798
After 3405 training step(s),cross entropy on all data is 0.00661657
After 3406 training step(s),cross entropy on all data is 0.00661531
After 3407 training step(s),cross entropy on all data is 0.00661417
After 3408 training step(s),cross entropy on all data is 0.00661315
After 3409 training step(s),cross entropy on all data is 0.00661222
After 3410 training step(s),cross entropy on all data is 0.00661139
After 3411 training step(s),cross entropy on all data is 0.00661065
After 3412 training step(s),cross entropy on all data is 0.00660997
After 3413 training step(s),cross entropy on all data is 0.00660937
After 3414 training step(s),cross entropy on all data is 0.00660882
After 3415 training step(s),cross entropy on all data is 0.00660618
After 3416 training step(s),cross entropy on all data is 0.0066038
After 3417 training step(s),cross entropy on all data is 0.00660166
After 3418 training step(s),cross entropy on all data is 0.00659973
After 3419 training step(s),cross entropy on all data is 0.00659799
After 3420 training step(s),cross entropy on all data is 0.00659643
After 3421 training step(s),cross entropy on all data is 0.00659502
After 3422 training step(s),cross entropy on all data is 0.00659376
After 3423 training step(s),cross entropy on all data is 0.00659262
After 3424 training step(s),cross entropy on all data is 0.00659159
After 3425 training step(s),cross entropy on all data is 0.00659066
After 3426 training step(s),cross entropy on all data is 0.00658983
After 3427 training step(s),cross entropy on all data is 0.00658908
After 3428 training step(s),cross entropy on all data is 0.0065884
After 3429 training step(s),cross entropy on all data is 0.0065878
After 3430 training step(s),cross entropy on all data is 0.00658725
After 3431 training step(s),cross entropy on all data is 0.0065846
After 3432 training step(s),cross entropy on all data is 0.00658222
After 3433 training step(s),cross entropy on all data is 0.00658007
After 3434 training step(s),cross entropy on all data is 0.00657814
After 3435 training step(s),cross entropy on all data is 0.0065764
After 3436 training step(s),cross entropy on all data is 0.00657483
After 3437 training step(s),cross entropy on all data is 0.00657342
After 3438 training step(s),cross entropy on all data is 0.00657215
After 3439 training step(s),cross entropy on all data is 0.00657101
After 3440 training step(s),cross entropy on all data is 0.00656998
After 3441 training step(s),cross entropy on all data is 0.00656905
After 3442 training step(s),cross entropy on all data is 0.00656822
After 3443 training step(s),cross entropy on all data is 0.00656746
After 3444 training step(s),cross entropy on all data is 0.00656679
After 3445 training step(s),cross entropy on all data is 0.00656618
After 3446 training step(s),cross entropy on all data is 0.00656563
After 3447 training step(s),cross entropy on all data is 0.00656297
After 3448 training step(s),cross entropy on all data is 0.00656058
After 3449 training step(s),cross entropy on all data is 0.00655843
After 3450 training step(s),cross entropy on all data is 0.0065565
After 3451 training step(s),cross entropy on all data is 0.00655475
After 3452 training step(s),cross entropy on all data is 0.00655318
After 3453 training step(s),cross entropy on all data is 0.00655177
After 3454 training step(s),cross entropy on all data is 0.00655049
After 3455 training step(s),cross entropy on all data is 0.00654935
After 3456 training step(s),cross entropy on all data is 0.00654831
After 3457 training step(s),cross entropy on all data is 0.00654738
After 3458 training step(s),cross entropy on all data is 0.00654655
After 3459 training step(s),cross entropy on all data is 0.00654579
After 3460 training step(s),cross entropy on all data is 0.00654512
After 3461 training step(s),cross entropy on all data is 0.0065445
After 3462 training step(s),cross entropy on all data is 0.00654395
After 3463 training step(s),cross entropy on all data is 0.00654129
After 3464 training step(s),cross entropy on all data is 0.0065389
After 3465 training step(s),cross entropy on all data is 0.00653674
After 3466 training step(s),cross entropy on all data is 0.0065348
After 3467 training step(s),cross entropy on all data is 0.00653305
After 3468 training step(s),cross entropy on all data is 0.00653148
After 3469 training step(s),cross entropy on all data is 0.00653006
After 3470 training step(s),cross entropy on all data is 0.00652878
After 3471 training step(s),cross entropy on all data is 0.00652763
After 3472 training step(s),cross entropy on all data is 0.0065266
After 3473 training step(s),cross entropy on all data is 0.00652567
After 3474 training step(s),cross entropy on all data is 0.00652483
After 3475 training step(s),cross entropy on all data is 0.00652407
After 3476 training step(s),cross entropy on all data is 0.00652339
After 3477 training step(s),cross entropy on all data is 0.00652278
After 3478 training step(s),cross entropy on all data is 0.00652223
After 3479 training step(s),cross entropy on all data is 0.00651956
After 3480 training step(s),cross entropy on all data is 0.00651716
After 3481 training step(s),cross entropy on all data is 0.006515
After 3482 training step(s),cross entropy on all data is 0.00651305
After 3483 training step(s),cross entropy on all data is 0.0065113
After 3484 training step(s),cross entropy on all data is 0.00650972
After 3485 training step(s),cross entropy on all data is 0.0065083
After 3486 training step(s),cross entropy on all data is 0.00650702
After 3487 training step(s),cross entropy on all data is 0.00650587
After 3488 training step(s),cross entropy on all data is 0.00650483
After 3489 training step(s),cross entropy on all data is 0.0065039
After 3490 training step(s),cross entropy on all data is 0.00650306
After 3491 training step(s),cross entropy on all data is 0.0065023
After 3492 training step(s),cross entropy on all data is 0.00650162
After 3493 training step(s),cross entropy on all data is 0.006501
After 3494 training step(s),cross entropy on all data is 0.00650045
After 3495 training step(s),cross entropy on all data is 0.00649778
After 3496 training step(s),cross entropy on all data is 0.00649537
After 3497 training step(s),cross entropy on all data is 0.0064932
After 3498 training step(s),cross entropy on all data is 0.00649125
After 3499 training step(s),cross entropy on all data is 0.00648949
After 3500 training step(s),cross entropy on all data is 0.00648791
After 3501 training step(s),cross entropy on all data is 0.00648649
After 3502 training step(s),cross entropy on all data is 0.00648521
After 3503 training step(s),cross entropy on all data is 0.00648405
After 3504 training step(s),cross entropy on all data is 0.00648301
After 3505 training step(s),cross entropy on all data is 0.00648208
After 3506 training step(s),cross entropy on all data is 0.00648123
After 3507 training step(s),cross entropy on all data is 0.00648047
After 3508 training step(s),cross entropy on all data is 0.00647979
After 3509 training step(s),cross entropy on all data is 0.00647917
After 3510 training step(s),cross entropy on all data is 0.00647862
After 3511 training step(s),cross entropy on all data is 0.00647594
After 3512 training step(s),cross entropy on all data is 0.00647353
After 3513 training step(s),cross entropy on all data is 0.00647136
After 3514 training step(s),cross entropy on all data is 0.0064694
After 3515 training step(s),cross entropy on all data is 0.00646764
After 3516 training step(s),cross entropy on all data is 0.00646606
After 3517 training step(s),cross entropy on all data is 0.00646463
After 3518 training step(s),cross entropy on all data is 0.00646334
After 3519 training step(s),cross entropy on all data is 0.00646219
After 3520 training step(s),cross entropy on all data is 0.00646114
After 3521 training step(s),cross entropy on all data is 0.00646021
After 3522 training step(s),cross entropy on all data is 0.00645936
After 3523 training step(s),cross entropy on all data is 0.0064586
After 3524 training step(s),cross entropy on all data is 0.00645792
After 3525 training step(s),cross entropy on all data is 0.0064573
After 3526 training step(s),cross entropy on all data is 0.00645674
After 3527 training step(s),cross entropy on all data is 0.00645406
After 3528 training step(s),cross entropy on all data is 0.00645164
After 3529 training step(s),cross entropy on all data is 0.00644946
After 3530 training step(s),cross entropy on all data is 0.0064475
After 3531 training step(s),cross entropy on all data is 0.00644574
After 3532 training step(s),cross entropy on all data is 0.00644415
After 3533 training step(s),cross entropy on all data is 0.00644272
After 3534 training step(s),cross entropy on all data is 0.00644143
After 3535 training step(s),cross entropy on all data is 0.00644027
After 3536 training step(s),cross entropy on all data is 0.00643923
After 3537 training step(s),cross entropy on all data is 0.00643829
After 3538 training step(s),cross entropy on all data is 0.00643744
After 3539 training step(s),cross entropy on all data is 0.00643668
After 3540 training step(s),cross entropy on all data is 0.00643599
After 3541 training step(s),cross entropy on all data is 0.00643537
After 3542 training step(s),cross entropy on all data is 0.00643482
After 3543 training step(s),cross entropy on all data is 0.00643212
After 3544 training step(s),cross entropy on all data is 0.0064297
After 3545 training step(s),cross entropy on all data is 0.00642752
After 3546 training step(s),cross entropy on all data is 0.00642555
After 3547 training step(s),cross entropy on all data is 0.00642378
After 3548 training step(s),cross entropy on all data is 0.00642219
After 3549 training step(s),cross entropy on all data is 0.00642076
After 3550 training step(s),cross entropy on all data is 0.00641947
After 3551 training step(s),cross entropy on all data is 0.0064183
After 3552 training step(s),cross entropy on all data is 0.00641726
After 3553 training step(s),cross entropy on all data is 0.00641632
After 3554 training step(s),cross entropy on all data is 0.00641547
After 3555 training step(s),cross entropy on all data is 0.0064147
After 3556 training step(s),cross entropy on all data is 0.00641401
After 3557 training step(s),cross entropy on all data is 0.0064134
After 3558 training step(s),cross entropy on all data is 0.00641284
After 3559 training step(s),cross entropy on all data is 0.00641014
After 3560 training step(s),cross entropy on all data is 0.00640771
After 3561 training step(s),cross entropy on all data is 0.00640552
After 3562 training step(s),cross entropy on all data is 0.00640356
After 3563 training step(s),cross entropy on all data is 0.00640178
After 3564 training step(s),cross entropy on all data is 0.00640019
After 3565 training step(s),cross entropy on all data is 0.00639875
After 3566 training step(s),cross entropy on all data is 0.00639746
After 3567 training step(s),cross entropy on all data is 0.00639629
After 3568 training step(s),cross entropy on all data is 0.00639524
After 3569 training step(s),cross entropy on all data is 0.0063943
After 3570 training step(s),cross entropy on all data is 0.00639345
After 3571 training step(s),cross entropy on all data is 0.00639268
After 3572 training step(s),cross entropy on all data is 0.00639199
After 3573 training step(s),cross entropy on all data is 0.00639137
After 3574 training step(s),cross entropy on all data is 0.00639081
After 3575 training step(s),cross entropy on all data is 0.00638811
After 3576 training step(s),cross entropy on all data is 0.00638567
After 3577 training step(s),cross entropy on all data is 0.00638348
After 3578 training step(s),cross entropy on all data is 0.00638151
After 3579 training step(s),cross entropy on all data is 0.00637973
After 3580 training step(s),cross entropy on all data is 0.00637813
After 3581 training step(s),cross entropy on all data is 0.00637669
After 3582 training step(s),cross entropy on all data is 0.0063754
After 3583 training step(s),cross entropy on all data is 0.00637423
After 3584 training step(s),cross entropy on all data is 0.00637318
After 3585 training step(s),cross entropy on all data is 0.00637223
After 3586 training step(s),cross entropy on all data is 0.00637138
After 3587 training step(s),cross entropy on all data is 0.00637061
After 3588 training step(s),cross entropy on all data is 0.00636992
After 3589 training step(s),cross entropy on all data is 0.0063693
After 3590 training step(s),cross entropy on all data is 0.00636874
After 3591 training step(s),cross entropy on all data is 0.00636603
After 3592 training step(s),cross entropy on all data is 0.00636359
After 3593 training step(s),cross entropy on all data is 0.00636139
After 3594 training step(s),cross entropy on all data is 0.00635942
After 3595 training step(s),cross entropy on all data is 0.00635764
After 3596 training step(s),cross entropy on all data is 0.00635603
After 3597 training step(s),cross entropy on all data is 0.00635459
After 3598 training step(s),cross entropy on all data is 0.00635329
After 3599 training step(s),cross entropy on all data is 0.00635212
After 3600 training step(s),cross entropy on all data is 0.00635107
After 3601 training step(s),cross entropy on all data is 0.00635012
After 3602 training step(s),cross entropy on all data is 0.00634926
After 3603 training step(s),cross entropy on all data is 0.0063485
After 3604 training step(s),cross entropy on all data is 0.0063478
After 3605 training step(s),cross entropy on all data is 0.00634718
After 3606 training step(s),cross entropy on all data is 0.00634662
After 3607 training step(s),cross entropy on all data is 0.0063439
After 3608 training step(s),cross entropy on all data is 0.00634146
After 3609 training step(s),cross entropy on all data is 0.00633926
After 3610 training step(s),cross entropy on all data is 0.00633728
After 3611 training step(s),cross entropy on all data is 0.00633549
After 3612 training step(s),cross entropy on all data is 0.00633389
After 3613 training step(s),cross entropy on all data is 0.00633244
After 3614 training step(s),cross entropy on all data is 0.00633114
After 3615 training step(s),cross entropy on all data is 0.00632996
After 3616 training step(s),cross entropy on all data is 0.00632891
After 3617 training step(s),cross entropy on all data is 0.00632796
After 3618 training step(s),cross entropy on all data is 0.0063271
After 3619 training step(s),cross entropy on all data is 0.00632633
After 3620 training step(s),cross entropy on all data is 0.00632564
After 3621 training step(s),cross entropy on all data is 0.00632501
After 3622 training step(s),cross entropy on all data is 0.00632445
After 3623 training step(s),cross entropy on all data is 0.00632173
After 3624 training step(s),cross entropy on all data is 0.00631928
After 3625 training step(s),cross entropy on all data is 0.00631707
After 3626 training step(s),cross entropy on all data is 0.00631509
After 3627 training step(s),cross entropy on all data is 0.0063133
After 3628 training step(s),cross entropy on all data is 0.00631169
After 3629 training step(s),cross entropy on all data is 0.00631024
After 3630 training step(s),cross entropy on all data is 0.00630894
After 3631 training step(s),cross entropy on all data is 0.00630776
After 3632 training step(s),cross entropy on all data is 0.00630671
After 3633 training step(s),cross entropy on all data is 0.00630575
After 3634 training step(s),cross entropy on all data is 0.00630489
After 3635 training step(s),cross entropy on all data is 0.00630412
After 3636 training step(s),cross entropy on all data is 0.00630343
After 3637 training step(s),cross entropy on all data is 0.0063028
After 3638 training step(s),cross entropy on all data is 0.00630224
After 3639 training step(s),cross entropy on all data is 0.00629951
After 3640 training step(s),cross entropy on all data is 0.00629706
After 3641 training step(s),cross entropy on all data is 0.00629485
After 3642 training step(s),cross entropy on all data is 0.00629286
After 3643 training step(s),cross entropy on all data is 0.00629107
After 3644 training step(s),cross entropy on all data is 0.00628945
After 3645 training step(s),cross entropy on all data is 0.006288
After 3646 training step(s),cross entropy on all data is 0.00628669
After 3647 training step(s),cross entropy on all data is 0.00628552
After 3648 training step(s),cross entropy on all data is 0.00628446
After 3649 training step(s),cross entropy on all data is 0.0062835
After 3650 training step(s),cross entropy on all data is 0.00628264
After 3651 training step(s),cross entropy on all data is 0.00628187
After 3652 training step(s),cross entropy on all data is 0.00628117
After 3653 training step(s),cross entropy on all data is 0.00628054
After 3654 training step(s),cross entropy on all data is 0.00627998
After 3655 training step(s),cross entropy on all data is 0.00627725
After 3656 training step(s),cross entropy on all data is 0.00627479
After 3657 training step(s),cross entropy on all data is 0.00627257
After 3658 training step(s),cross entropy on all data is 0.00627058
After 3659 training step(s),cross entropy on all data is 0.00626879
After 3660 training step(s),cross entropy on all data is 0.00626717
After 3661 training step(s),cross entropy on all data is 0.00626571
After 3662 training step(s),cross entropy on all data is 0.0062644
After 3663 training step(s),cross entropy on all data is 0.00626322
After 3664 training step(s),cross entropy on all data is 0.00626216
After 3665 training step(s),cross entropy on all data is 0.00626121
After 3666 training step(s),cross entropy on all data is 0.00626034
After 3667 training step(s),cross entropy on all data is 0.00625957
After 3668 training step(s),cross entropy on all data is 0.00625887
After 3669 training step(s),cross entropy on all data is 0.00625824
After 3670 training step(s),cross entropy on all data is 0.00625768
After 3671 training step(s),cross entropy on all data is 0.00625494
After 3672 training step(s),cross entropy on all data is 0.00625248
After 3673 training step(s),cross entropy on all data is 0.00625026
After 3674 training step(s),cross entropy on all data is 0.00624826
After 3675 training step(s),cross entropy on all data is 0.00624646
After 3676 training step(s),cross entropy on all data is 0.00624484
After 3677 training step(s),cross entropy on all data is 0.00624338
After 3678 training step(s),cross entropy on all data is 0.00624207
After 3679 training step(s),cross entropy on all data is 0.00624089
After 3680 training step(s),cross entropy on all data is 0.00623982
After 3681 training step(s),cross entropy on all data is 0.00623887
After 3682 training step(s),cross entropy on all data is 0.006238
After 3683 training step(s),cross entropy on all data is 0.00623723
After 3684 training step(s),cross entropy on all data is 0.00623653
After 3685 training step(s),cross entropy on all data is 0.0062359
After 3686 training step(s),cross entropy on all data is 0.00623533
After 3687 training step(s),cross entropy on all data is 0.00623259
After 3688 training step(s),cross entropy on all data is 0.00623012
After 3689 training step(s),cross entropy on all data is 0.0062279
After 3690 training step(s),cross entropy on all data is 0.00622589
After 3691 training step(s),cross entropy on all data is 0.00622409
After 3692 training step(s),cross entropy on all data is 0.00622247
After 3693 training step(s),cross entropy on all data is 0.00622101
After 3694 training step(s),cross entropy on all data is 0.00621969
After 3695 training step(s),cross entropy on all data is 0.00621851
After 3696 training step(s),cross entropy on all data is 0.00621744
After 3697 training step(s),cross entropy on all data is 0.00621648
After 3698 training step(s),cross entropy on all data is 0.00621562
After 3699 training step(s),cross entropy on all data is 0.00621484
After 3700 training step(s),cross entropy on all data is 0.00621414
After 3701 training step(s),cross entropy on all data is 0.00621351
After 3702 training step(s),cross entropy on all data is 0.00621294
After 3703 training step(s),cross entropy on all data is 0.00621019
After 3704 training step(s),cross entropy on all data is 0.00620772
After 3705 training step(s),cross entropy on all data is 0.00620549
After 3706 training step(s),cross entropy on all data is 0.00620348
After 3707 training step(s),cross entropy on all data is 0.00620168
After 3708 training step(s),cross entropy on all data is 0.00620005
After 3709 training step(s),cross entropy on all data is 0.00619859
After 3710 training step(s),cross entropy on all data is 0.00619727
After 3711 training step(s),cross entropy on all data is 0.00619608
After 3712 training step(s),cross entropy on all data is 0.00619502
After 3713 training step(s),cross entropy on all data is 0.00619406
After 3714 training step(s),cross entropy on all data is 0.00619319
After 3715 training step(s),cross entropy on all data is 0.00619241
After 3716 training step(s),cross entropy on all data is 0.00619171
After 3717 training step(s),cross entropy on all data is 0.00619107
After 3718 training step(s),cross entropy on all data is 0.0061905
After 3719 training step(s),cross entropy on all data is 0.00618775
After 3720 training step(s),cross entropy on all data is 0.00618527
After 3721 training step(s),cross entropy on all data is 0.00618304
After 3722 training step(s),cross entropy on all data is 0.00618103
After 3723 training step(s),cross entropy on all data is 0.00617922
After 3724 training step(s),cross entropy on all data is 0.00617759
After 3725 training step(s),cross entropy on all data is 0.00617613
After 3726 training step(s),cross entropy on all data is 0.00617481
After 3727 training step(s),cross entropy on all data is 0.00617362
After 3728 training step(s),cross entropy on all data is 0.00617255
After 3729 training step(s),cross entropy on all data is 0.00617159
After 3730 training step(s),cross entropy on all data is 0.00617072
After 3731 training step(s),cross entropy on all data is 0.00616994
After 3732 training step(s),cross entropy on all data is 0.00616923
After 3733 training step(s),cross entropy on all data is 0.0061686
After 3734 training step(s),cross entropy on all data is 0.00616803
After 3735 training step(s),cross entropy on all data is 0.00616527
After 3736 training step(s),cross entropy on all data is 0.00616279
After 3737 training step(s),cross entropy on all data is 0.00616055
After 3738 training step(s),cross entropy on all data is 0.00615854
After 3739 training step(s),cross entropy on all data is 0.00615673
After 3740 training step(s),cross entropy on all data is 0.0061551
After 3741 training step(s),cross entropy on all data is 0.00615363
After 3742 training step(s),cross entropy on all data is 0.0061523
After 3743 training step(s),cross entropy on all data is 0.00615111
After 3744 training step(s),cross entropy on all data is 0.00615004
After 3745 training step(s),cross entropy on all data is 0.00614908
After 3746 training step(s),cross entropy on all data is 0.00614821
After 3747 training step(s),cross entropy on all data is 0.00614742
After 3748 training step(s),cross entropy on all data is 0.00614672
After 3749 training step(s),cross entropy on all data is 0.00614608
After 3750 training step(s),cross entropy on all data is 0.00614551
After 3751 training step(s),cross entropy on all data is 0.00614275
After 3752 training step(s),cross entropy on all data is 0.00614026
After 3753 training step(s),cross entropy on all data is 0.00613802
After 3754 training step(s),cross entropy on all data is 0.00613601
After 3755 training step(s),cross entropy on all data is 0.00613419
After 3756 training step(s),cross entropy on all data is 0.00613256
After 3757 training step(s),cross entropy on all data is 0.00613108
After 3758 training step(s),cross entropy on all data is 0.00612976
After 3759 training step(s),cross entropy on all data is 0.00612856
After 3760 training step(s),cross entropy on all data is 0.00612749
After 3761 training step(s),cross entropy on all data is 0.00612652
After 3762 training step(s),cross entropy on all data is 0.00612565
After 3763 training step(s),cross entropy on all data is 0.00612487
After 3764 training step(s),cross entropy on all data is 0.00612416
After 3765 training step(s),cross entropy on all data is 0.00612353
After 3766 training step(s),cross entropy on all data is 0.00612295
After 3767 training step(s),cross entropy on all data is 0.00612018
After 3768 training step(s),cross entropy on all data is 0.00611769
After 3769 training step(s),cross entropy on all data is 0.00611545
After 3770 training step(s),cross entropy on all data is 0.00611343
After 3771 training step(s),cross entropy on all data is 0.00611161
After 3772 training step(s),cross entropy on all data is 0.00610997
After 3773 training step(s),cross entropy on all data is 0.0061085
After 3774 training step(s),cross entropy on all data is 0.00610717
After 3775 training step(s),cross entropy on all data is 0.00610598
After 3776 training step(s),cross entropy on all data is 0.0061049
After 3777 training step(s),cross entropy on all data is 0.00610393
After 3778 training step(s),cross entropy on all data is 0.00610306
After 3779 training step(s),cross entropy on all data is 0.00610227
After 3780 training step(s),cross entropy on all data is 0.00610156
After 3781 training step(s),cross entropy on all data is 0.00610093
After 3782 training step(s),cross entropy on all data is 0.00610035
After 3783 training step(s),cross entropy on all data is 0.00609758
After 3784 training step(s),cross entropy on all data is 0.00609508
After 3785 training step(s),cross entropy on all data is 0.00609284
After 3786 training step(s),cross entropy on all data is 0.00609081
After 3787 training step(s),cross entropy on all data is 0.00608899
After 3788 training step(s),cross entropy on all data is 0.00608735
After 3789 training step(s),cross entropy on all data is 0.00608587
After 3790 training step(s),cross entropy on all data is 0.00608454
After 3791 training step(s),cross entropy on all data is 0.00608335
After 3792 training step(s),cross entropy on all data is 0.00608227
After 3793 training step(s),cross entropy on all data is 0.0060813
After 3794 training step(s),cross entropy on all data is 0.00608042
After 3795 training step(s),cross entropy on all data is 0.00607964
After 3796 training step(s),cross entropy on all data is 0.00607893
After 3797 training step(s),cross entropy on all data is 0.00607829
After 3798 training step(s),cross entropy on all data is 0.00607772
After 3799 training step(s),cross entropy on all data is 0.00607494
After 3800 training step(s),cross entropy on all data is 0.00607244
After 3801 training step(s),cross entropy on all data is 0.00607019
After 3802 training step(s),cross entropy on all data is 0.00606816
After 3803 training step(s),cross entropy on all data is 0.00606633
After 3804 training step(s),cross entropy on all data is 0.00606469
After 3805 training step(s),cross entropy on all data is 0.00606321
After 3806 training step(s),cross entropy on all data is 0.00606188
After 3807 training step(s),cross entropy on all data is 0.00606068
After 3808 training step(s),cross entropy on all data is 0.0060596
After 3809 training step(s),cross entropy on all data is 0.00605863
After 3810 training step(s),cross entropy on all data is 0.00605775
After 3811 training step(s),cross entropy on all data is 0.00605696
After 3812 training step(s),cross entropy on all data is 0.00605625
After 3813 training step(s),cross entropy on all data is 0.00605561
After 3814 training step(s),cross entropy on all data is 0.00605504
After 3815 training step(s),cross entropy on all data is 0.00605225
After 3816 training step(s),cross entropy on all data is 0.00604975
After 3817 training step(s),cross entropy on all data is 0.0060475
After 3818 training step(s),cross entropy on all data is 0.00604546
After 3819 training step(s),cross entropy on all data is 0.00604364
After 3820 training step(s),cross entropy on all data is 0.00604199
After 3821 training step(s),cross entropy on all data is 0.00604051
After 3822 training step(s),cross entropy on all data is 0.00603917
After 3823 training step(s),cross entropy on all data is 0.00603797
After 3824 training step(s),cross entropy on all data is 0.00603689
After 3825 training step(s),cross entropy on all data is 0.00603592
After 3826 training step(s),cross entropy on all data is 0.00603504
After 3827 training step(s),cross entropy on all data is 0.00603425
After 3828 training step(s),cross entropy on all data is 0.00603354
After 3829 training step(s),cross entropy on all data is 0.0060329
After 3830 training step(s),cross entropy on all data is 0.00603232
After 3831 training step(s),cross entropy on all data is 0.00602953
After 3832 training step(s),cross entropy on all data is 0.00602703
After 3833 training step(s),cross entropy on all data is 0.00602477
After 3834 training step(s),cross entropy on all data is 0.00602273
After 3835 training step(s),cross entropy on all data is 0.0060209
After 3836 training step(s),cross entropy on all data is 0.00601925
After 3837 training step(s),cross entropy on all data is 0.00601777
After 3838 training step(s),cross entropy on all data is 0.00601643
After 3839 training step(s),cross entropy on all data is 0.00601523
After 3840 training step(s),cross entropy on all data is 0.00601414
After 3841 training step(s),cross entropy on all data is 0.00601317
After 3842 training step(s),cross entropy on all data is 0.00601229
After 3843 training step(s),cross entropy on all data is 0.0060115
After 3844 training step(s),cross entropy on all data is 0.00601079
After 3845 training step(s),cross entropy on all data is 0.00601014
After 3846 training step(s),cross entropy on all data is 0.00600957
After 3847 training step(s),cross entropy on all data is 0.00600677
After 3848 training step(s),cross entropy on all data is 0.00600426
After 3849 training step(s),cross entropy on all data is 0.006002
After 3850 training step(s),cross entropy on all data is 0.00599996
After 3851 training step(s),cross entropy on all data is 0.00599813
After 3852 training step(s),cross entropy on all data is 0.00599647
After 3853 training step(s),cross entropy on all data is 0.00599499
After 3854 training step(s),cross entropy on all data is 0.00599365
After 3855 training step(s),cross entropy on all data is 0.00599244
After 3856 training step(s),cross entropy on all data is 0.00599136
After 3857 training step(s),cross entropy on all data is 0.00599038
After 3858 training step(s),cross entropy on all data is 0.0059895
After 3859 training step(s),cross entropy on all data is 0.00598871
After 3860 training step(s),cross entropy on all data is 0.005988
After 3861 training step(s),cross entropy on all data is 0.00598735
After 3862 training step(s),cross entropy on all data is 0.00598678
After 3863 training step(s),cross entropy on all data is 0.00598398
After 3864 training step(s),cross entropy on all data is 0.00598146
After 3865 training step(s),cross entropy on all data is 0.00597919
After 3866 training step(s),cross entropy on all data is 0.00597715
After 3867 training step(s),cross entropy on all data is 0.00597532
After 3868 training step(s),cross entropy on all data is 0.00597366
After 3869 training step(s),cross entropy on all data is 0.00597217
After 3870 training step(s),cross entropy on all data is 0.00597083
After 3871 training step(s),cross entropy on all data is 0.00596962
After 3872 training step(s),cross entropy on all data is 0.00596854
After 3873 training step(s),cross entropy on all data is 0.00596756
After 3874 training step(s),cross entropy on all data is 0.00596668
After 3875 training step(s),cross entropy on all data is 0.00596588
After 3876 training step(s),cross entropy on all data is 0.00596517
After 3877 training step(s),cross entropy on all data is 0.00596453
After 3878 training step(s),cross entropy on all data is 0.00596395
After 3879 training step(s),cross entropy on all data is 0.00596115
After 3880 training step(s),cross entropy on all data is 0.00595862
After 3881 training step(s),cross entropy on all data is 0.00595635
After 3882 training step(s),cross entropy on all data is 0.00595431
After 3883 training step(s),cross entropy on all data is 0.00595247
After 3884 training step(s),cross entropy on all data is 0.00595081
After 3885 training step(s),cross entropy on all data is 0.00594932
After 3886 training step(s),cross entropy on all data is 0.00594798
After 3887 training step(s),cross entropy on all data is 0.00594677
After 3888 training step(s),cross entropy on all data is 0.00594568
After 3889 training step(s),cross entropy on all data is 0.0059447
After 3890 training step(s),cross entropy on all data is 0.00594382
After 3891 training step(s),cross entropy on all data is 0.00594302
After 3892 training step(s),cross entropy on all data is 0.00594231
After 3893 training step(s),cross entropy on all data is 0.00594166
After 3894 training step(s),cross entropy on all data is 0.00594108
After 3895 training step(s),cross entropy on all data is 0.00593828
After 3896 training step(s),cross entropy on all data is 0.00593575
After 3897 training step(s),cross entropy on all data is 0.00593348
After 3898 training step(s),cross entropy on all data is 0.00593143
After 3899 training step(s),cross entropy on all data is 0.00592959
After 3900 training step(s),cross entropy on all data is 0.00592793
After 3901 training step(s),cross entropy on all data is 0.00592643
After 3902 training step(s),cross entropy on all data is 0.00592509
After 3903 training step(s),cross entropy on all data is 0.00592388
After 3904 training step(s),cross entropy on all data is 0.00592279
After 3905 training step(s),cross entropy on all data is 0.0059218
After 3906 training step(s),cross entropy on all data is 0.00592092
After 3907 training step(s),cross entropy on all data is 0.00592012
After 3908 training step(s),cross entropy on all data is 0.00591941
After 3909 training step(s),cross entropy on all data is 0.00591876
After 3910 training step(s),cross entropy on all data is 0.00591818
After 3911 training step(s),cross entropy on all data is 0.00591537
After 3912 training step(s),cross entropy on all data is 0.00591284
After 3913 training step(s),cross entropy on all data is 0.00591056
After 3914 training step(s),cross entropy on all data is 0.00590851
After 3915 training step(s),cross entropy on all data is 0.00590667
After 3916 training step(s),cross entropy on all data is 0.00590501
After 3917 training step(s),cross entropy on all data is 0.00590351
After 3918 training step(s),cross entropy on all data is 0.00590216
After 3919 training step(s),cross entropy on all data is 0.00590095
After 3920 training step(s),cross entropy on all data is 0.00589986
After 3921 training step(s),cross entropy on all data is 0.00589887
After 3922 training step(s),cross entropy on all data is 0.00589799
After 3923 training step(s),cross entropy on all data is 0.00589719
After 3924 training step(s),cross entropy on all data is 0.00589647
After 3925 training step(s),cross entropy on all data is 0.00589583
After 3926 training step(s),cross entropy on all data is 0.00589524
After 3927 training step(s),cross entropy on all data is 0.00589243
After 3928 training step(s),cross entropy on all data is 0.0058899
After 3929 training step(s),cross entropy on all data is 0.00588762
After 3930 training step(s),cross entropy on all data is 0.00588556
After 3931 training step(s),cross entropy on all data is 0.00588371
After 3932 training step(s),cross entropy on all data is 0.00588205
After 3933 training step(s),cross entropy on all data is 0.00588055
After 3934 training step(s),cross entropy on all data is 0.0058792
After 3935 training step(s),cross entropy on all data is 0.00587799
After 3936 training step(s),cross entropy on all data is 0.00587689
After 3937 training step(s),cross entropy on all data is 0.00587591
After 3938 training step(s),cross entropy on all data is 0.00587502
After 3939 training step(s),cross entropy on all data is 0.00587422
After 3940 training step(s),cross entropy on all data is 0.0058735
After 3941 training step(s),cross entropy on all data is 0.00587286
After 3942 training step(s),cross entropy on all data is 0.00587227
After 3943 training step(s),cross entropy on all data is 0.00586946
After 3944 training step(s),cross entropy on all data is 0.00586692
After 3945 training step(s),cross entropy on all data is 0.00586463
After 3946 training step(s),cross entropy on all data is 0.00586258
After 3947 training step(s),cross entropy on all data is 0.00586073
After 3948 training step(s),cross entropy on all data is 0.00585906
After 3949 training step(s),cross entropy on all data is 0.00585756
After 3950 training step(s),cross entropy on all data is 0.00585621
After 3951 training step(s),cross entropy on all data is 0.00585499
After 3952 training step(s),cross entropy on all data is 0.0058539
After 3953 training step(s),cross entropy on all data is 0.00585291
After 3954 training step(s),cross entropy on all data is 0.00585202
After 3955 training step(s),cross entropy on all data is 0.00585122
After 3956 training step(s),cross entropy on all data is 0.0058505
After 3957 training step(s),cross entropy on all data is 0.00584985
After 3958 training step(s),cross entropy on all data is 0.00584927
After 3959 training step(s),cross entropy on all data is 0.00584645
After 3960 training step(s),cross entropy on all data is 0.00584391
After 3961 training step(s),cross entropy on all data is 0.00584162
After 3962 training step(s),cross entropy on all data is 0.00583956
After 3963 training step(s),cross entropy on all data is 0.00583771
After 3964 training step(s),cross entropy on all data is 0.00583604
After 3965 training step(s),cross entropy on all data is 0.00583453
After 3966 training step(s),cross entropy on all data is 0.00583318
After 3967 training step(s),cross entropy on all data is 0.00583196
After 3968 training step(s),cross entropy on all data is 0.00583087
After 3969 training step(s),cross entropy on all data is 0.00582988
After 3970 training step(s),cross entropy on all data is 0.00582899
After 3971 training step(s),cross entropy on all data is 0.00582819
After 3972 training step(s),cross entropy on all data is 0.00582747
After 3973 training step(s),cross entropy on all data is 0.00582682
After 3974 training step(s),cross entropy on all data is 0.00582623
After 3975 training step(s),cross entropy on all data is 0.00582341
After 3976 training step(s),cross entropy on all data is 0.00582086
After 3977 training step(s),cross entropy on all data is 0.00581857
After 3978 training step(s),cross entropy on all data is 0.00581651
After 3979 training step(s),cross entropy on all data is 0.00581465
After 3980 training step(s),cross entropy on all data is 0.00581298
After 3981 training step(s),cross entropy on all data is 0.00581148
After 3982 training step(s),cross entropy on all data is 0.00581012
After 3983 training step(s),cross entropy on all data is 0.0058089
After 3984 training step(s),cross entropy on all data is 0.0058078
After 3985 training step(s),cross entropy on all data is 0.00580681
After 3986 training step(s),cross entropy on all data is 0.00580592
After 3987 training step(s),cross entropy on all data is 0.00580512
After 3988 training step(s),cross entropy on all data is 0.0058044
After 3989 training step(s),cross entropy on all data is 0.00580375
After 3990 training step(s),cross entropy on all data is 0.00580316
After 3991 training step(s),cross entropy on all data is 0.00580033
After 3992 training step(s),cross entropy on all data is 0.00579779
After 3993 training step(s),cross entropy on all data is 0.00579549
After 3994 training step(s),cross entropy on all data is 0.00579343
After 3995 training step(s),cross entropy on all data is 0.00579157
After 3996 training step(s),cross entropy on all data is 0.00578989
After 3997 training step(s),cross entropy on all data is 0.00578839
After 3998 training step(s),cross entropy on all data is 0.00578703
After 3999 training step(s),cross entropy on all data is 0.00578581
After 4000 training step(s),cross entropy on all data is 0.00578471
After 4001 training step(s),cross entropy on all data is 0.00578372
After 4002 training step(s),cross entropy on all data is 0.00578283
After 4003 training step(s),cross entropy on all data is 0.00578202
After 4004 training step(s),cross entropy on all data is 0.0057813
After 4005 training step(s),cross entropy on all data is 0.00578065
After 4006 training step(s),cross entropy on all data is 0.00578006
After 4007 training step(s),cross entropy on all data is 0.00577723
After 4008 training step(s),cross entropy on all data is 0.00577468
After 4009 training step(s),cross entropy on all data is 0.00577238
After 4010 training step(s),cross entropy on all data is 0.00577031
After 4011 training step(s),cross entropy on all data is 0.00576845
After 4012 training step(s),cross entropy on all data is 0.00576677
After 4013 training step(s),cross entropy on all data is 0.00576526
After 4014 training step(s),cross entropy on all data is 0.00576391
After 4015 training step(s),cross entropy on all data is 0.00576268
After 4016 training step(s),cross entropy on all data is 0.00576158
After 4017 training step(s),cross entropy on all data is 0.00576059
After 4018 training step(s),cross entropy on all data is 0.0057597
After 4019 training step(s),cross entropy on all data is 0.00575889
After 4020 training step(s),cross entropy on all data is 0.00575817
After 4021 training step(s),cross entropy on all data is 0.00575752
After 4022 training step(s),cross entropy on all data is 0.00575693
After 4023 training step(s),cross entropy on all data is 0.00575409
After 4024 training step(s),cross entropy on all data is 0.00575154
After 4025 training step(s),cross entropy on all data is 0.00574924
After 4026 training step(s),cross entropy on all data is 0.00574717
After 4027 training step(s),cross entropy on all data is 0.0057453
After 4028 training step(s),cross entropy on all data is 0.00574362
After 4029 training step(s),cross entropy on all data is 0.00574211
After 4030 training step(s),cross entropy on all data is 0.00574075
After 4031 training step(s),cross entropy on all data is 0.00573953
After 4032 training step(s),cross entropy on all data is 0.00573842
After 4033 training step(s),cross entropy on all data is 0.00573743
After 4034 training step(s),cross entropy on all data is 0.00573654
After 4035 training step(s),cross entropy on all data is 0.00573573
After 4036 training step(s),cross entropy on all data is 0.00573501
After 4037 training step(s),cross entropy on all data is 0.00573435
After 4038 training step(s),cross entropy on all data is 0.00573377
After 4039 training step(s),cross entropy on all data is 0.00573093
After 4040 training step(s),cross entropy on all data is 0.00572837
After 4041 training step(s),cross entropy on all data is 0.00572606
After 4042 training step(s),cross entropy on all data is 0.00572399
After 4043 training step(s),cross entropy on all data is 0.00572212
After 4044 training step(s),cross entropy on all data is 0.00572044
After 4045 training step(s),cross entropy on all data is 0.00571893
After 4046 training step(s),cross entropy on all data is 0.00571757
After 4047 training step(s),cross entropy on all data is 0.00571634
After 4048 training step(s),cross entropy on all data is 0.00571524
After 4049 training step(s),cross entropy on all data is 0.00571424
After 4050 training step(s),cross entropy on all data is 0.00571335
After 4051 training step(s),cross entropy on all data is 0.00571254
After 4052 training step(s),cross entropy on all data is 0.00571181
After 4053 training step(s),cross entropy on all data is 0.00571116
After 4054 training step(s),cross entropy on all data is 0.00571057
After 4055 training step(s),cross entropy on all data is 0.00570773
After 4056 training step(s),cross entropy on all data is 0.00570516
After 4057 training step(s),cross entropy on all data is 0.00570286
After 4058 training step(s),cross entropy on all data is 0.00570078
After 4059 training step(s),cross entropy on all data is 0.00569891
After 4060 training step(s),cross entropy on all data is 0.00569723
After 4061 training step(s),cross entropy on all data is 0.00569572
After 4062 training step(s),cross entropy on all data is 0.00569435
After 4063 training step(s),cross entropy on all data is 0.00569312
After 4064 training step(s),cross entropy on all data is 0.00569202
After 4065 training step(s),cross entropy on all data is 0.00569102
After 4066 training step(s),cross entropy on all data is 0.00569012
After 4067 training step(s),cross entropy on all data is 0.00568932
After 4068 training step(s),cross entropy on all data is 0.00568859
After 4069 training step(s),cross entropy on all data is 0.00568794
After 4070 training step(s),cross entropy on all data is 0.00568735
After 4071 training step(s),cross entropy on all data is 0.0056845
After 4072 training step(s),cross entropy on all data is 0.00568193
After 4073 training step(s),cross entropy on all data is 0.00567963
After 4074 training step(s),cross entropy on all data is 0.00567755
After 4075 training step(s),cross entropy on all data is 0.00567567
After 4076 training step(s),cross entropy on all data is 0.00567399
After 4077 training step(s),cross entropy on all data is 0.00567247
After 4078 training step(s),cross entropy on all data is 0.00567111
After 4079 training step(s),cross entropy on all data is 0.00566988
After 4080 training step(s),cross entropy on all data is 0.00566877
After 4081 training step(s),cross entropy on all data is 0.00566777
After 4082 training step(s),cross entropy on all data is 0.00566687
After 4083 training step(s),cross entropy on all data is 0.00566607
After 4084 training step(s),cross entropy on all data is 0.00566534
After 4085 training step(s),cross entropy on all data is 0.00566468
After 4086 training step(s),cross entropy on all data is 0.00566409
After 4087 training step(s),cross entropy on all data is 0.00566124
After 4088 training step(s),cross entropy on all data is 0.00565867
After 4089 training step(s),cross entropy on all data is 0.00565636
After 4090 training step(s),cross entropy on all data is 0.00565428
After 4091 training step(s),cross entropy on all data is 0.00565241
After 4092 training step(s),cross entropy on all data is 0.00565072
After 4093 training step(s),cross entropy on all data is 0.0056492
After 4094 training step(s),cross entropy on all data is 0.00564783
After 4095 training step(s),cross entropy on all data is 0.0056466
After 4096 training step(s),cross entropy on all data is 0.00564549
After 4097 training step(s),cross entropy on all data is 0.0056445
After 4098 training step(s),cross entropy on all data is 0.0056436
After 4099 training step(s),cross entropy on all data is 0.00564279
After 4100 training step(s),cross entropy on all data is 0.00564206
After 4101 training step(s),cross entropy on all data is 0.0056414
After 4102 training step(s),cross entropy on all data is 0.00564081
After 4103 training step(s),cross entropy on all data is 0.00563796
After 4104 training step(s),cross entropy on all data is 0.00563539
After 4105 training step(s),cross entropy on all data is 0.00563307
After 4106 training step(s),cross entropy on all data is 0.00563099
After 4107 training step(s),cross entropy on all data is 0.00562911
After 4108 training step(s),cross entropy on all data is 0.00562742
After 4109 training step(s),cross entropy on all data is 0.0056259
After 4110 training step(s),cross entropy on all data is 0.00562453
After 4111 training step(s),cross entropy on all data is 0.0056233
After 4112 training step(s),cross entropy on all data is 0.00562219
After 4113 training step(s),cross entropy on all data is 0.00562119
After 4114 training step(s),cross entropy on all data is 0.00562029
After 4115 training step(s),cross entropy on all data is 0.00561948
After 4116 training step(s),cross entropy on all data is 0.00561875
After 4117 training step(s),cross entropy on all data is 0.00561809
After 4118 training step(s),cross entropy on all data is 0.0056175
After 4119 training step(s),cross entropy on all data is 0.00561464
After 4120 training step(s),cross entropy on all data is 0.00561207
After 4121 training step(s),cross entropy on all data is 0.00560975
After 4122 training step(s),cross entropy on all data is 0.00560767
After 4123 training step(s),cross entropy on all data is 0.00560579
After 4124 training step(s),cross entropy on all data is 0.0056041
After 4125 training step(s),cross entropy on all data is 0.00560257
After 4126 training step(s),cross entropy on all data is 0.0056012
After 4127 training step(s),cross entropy on all data is 0.00559997
After 4128 training step(s),cross entropy on all data is 0.00559886
After 4129 training step(s),cross entropy on all data is 0.00559786
After 4130 training step(s),cross entropy on all data is 0.00559696
After 4131 training step(s),cross entropy on all data is 0.00559615
After 4132 training step(s),cross entropy on all data is 0.00559541
After 4133 training step(s),cross entropy on all data is 0.00559476
After 4134 training step(s),cross entropy on all data is 0.00559416
After 4135 training step(s),cross entropy on all data is 0.0055913
After 4136 training step(s),cross entropy on all data is 0.00558873
After 4137 training step(s),cross entropy on all data is 0.00558641
After 4138 training step(s),cross entropy on all data is 0.00558432
After 4139 training step(s),cross entropy on all data is 0.00558244
After 4140 training step(s),cross entropy on all data is 0.00558074
After 4141 training step(s),cross entropy on all data is 0.00557922
After 4142 training step(s),cross entropy on all data is 0.00557785
After 4143 training step(s),cross entropy on all data is 0.00557661
After 4144 training step(s),cross entropy on all data is 0.0055755
After 4145 training step(s),cross entropy on all data is 0.0055745
After 4146 training step(s),cross entropy on all data is 0.00557359
After 4147 training step(s),cross entropy on all data is 0.00557278
After 4148 training step(s),cross entropy on all data is 0.00557205
After 4149 training step(s),cross entropy on all data is 0.00557139
After 4150 training step(s),cross entropy on all data is 0.0055708
After 4151 training step(s),cross entropy on all data is 0.00556793
After 4152 training step(s),cross entropy on all data is 0.00556535
After 4153 training step(s),cross entropy on all data is 0.00556303
After 4154 training step(s),cross entropy on all data is 0.00556094
After 4155 training step(s),cross entropy on all data is 0.00555906
After 4156 training step(s),cross entropy on all data is 0.00555736
After 4157 training step(s),cross entropy on all data is 0.00555584
After 4158 training step(s),cross entropy on all data is 0.00555446
After 4159 training step(s),cross entropy on all data is 0.00555323
After 4160 training step(s),cross entropy on all data is 0.00555211
After 4161 training step(s),cross entropy on all data is 0.00555111
After 4162 training step(s),cross entropy on all data is 0.0055502
After 4163 training step(s),cross entropy on all data is 0.00554939
After 4164 training step(s),cross entropy on all data is 0.00554866
After 4165 training step(s),cross entropy on all data is 0.005548
After 4166 training step(s),cross entropy on all data is 0.00554741
After 4167 training step(s),cross entropy on all data is 0.00554454
After 4168 training step(s),cross entropy on all data is 0.00554196
After 4169 training step(s),cross entropy on all data is 0.00553963
After 4170 training step(s),cross entropy on all data is 0.00553754
After 4171 training step(s),cross entropy on all data is 0.00553565
After 4172 training step(s),cross entropy on all data is 0.00553396
After 4173 training step(s),cross entropy on all data is 0.00553243
After 4174 training step(s),cross entropy on all data is 0.00553105
After 4175 training step(s),cross entropy on all data is 0.00552981
After 4176 training step(s),cross entropy on all data is 0.0055287
After 4177 training step(s),cross entropy on all data is 0.0055277
After 4178 training step(s),cross entropy on all data is 0.00552679
After 4179 training step(s),cross entropy on all data is 0.00552598
After 4180 training step(s),cross entropy on all data is 0.00552524
After 4181 training step(s),cross entropy on all data is 0.00552458
After 4182 training step(s),cross entropy on all data is 0.00552399
After 4183 training step(s),cross entropy on all data is 0.00552112
After 4184 training step(s),cross entropy on all data is 0.00551853
After 4185 training step(s),cross entropy on all data is 0.00551621
After 4186 training step(s),cross entropy on all data is 0.00551411
After 4187 training step(s),cross entropy on all data is 0.00551222
After 4188 training step(s),cross entropy on all data is 0.00551052
After 4189 training step(s),cross entropy on all data is 0.005509
After 4190 training step(s),cross entropy on all data is 0.00550762
After 4191 training step(s),cross entropy on all data is 0.00550638
After 4192 training step(s),cross entropy on all data is 0.00550526
After 4193 training step(s),cross entropy on all data is 0.00550426
After 4194 training step(s),cross entropy on all data is 0.00550335
After 4195 training step(s),cross entropy on all data is 0.00550254
After 4196 training step(s),cross entropy on all data is 0.0055018
After 4197 training step(s),cross entropy on all data is 0.00550114
After 4198 training step(s),cross entropy on all data is 0.00550055
After 4199 training step(s),cross entropy on all data is 0.00549767
After 4200 training step(s),cross entropy on all data is 0.00549509
After 4201 training step(s),cross entropy on all data is 0.00549276
After 4202 training step(s),cross entropy on all data is 0.00549066
After 4203 training step(s),cross entropy on all data is 0.00548877
After 4204 training step(s),cross entropy on all data is 0.00548707
After 4205 training step(s),cross entropy on all data is 0.00548554
After 4206 training step(s),cross entropy on all data is 0.00548416
After 4207 training step(s),cross entropy on all data is 0.00548292
After 4208 training step(s),cross entropy on all data is 0.0054818
After 4209 training step(s),cross entropy on all data is 0.00548079
After 4210 training step(s),cross entropy on all data is 0.00547989
After 4211 training step(s),cross entropy on all data is 0.00547907
After 4212 training step(s),cross entropy on all data is 0.00547834
After 4213 training step(s),cross entropy on all data is 0.00547768
After 4214 training step(s),cross entropy on all data is 0.00547708
After 4215 training step(s),cross entropy on all data is 0.0054742
After 4216 training step(s),cross entropy on all data is 0.00547161
After 4217 training step(s),cross entropy on all data is 0.00546928
After 4218 training step(s),cross entropy on all data is 0.00546718
After 4219 training step(s),cross entropy on all data is 0.00546529
After 4220 training step(s),cross entropy on all data is 0.00546359
After 4221 training step(s),cross entropy on all data is 0.00546206
After 4222 training step(s),cross entropy on all data is 0.00546068
After 4223 training step(s),cross entropy on all data is 0.00545943
After 4224 training step(s),cross entropy on all data is 0.00545831
After 4225 training step(s),cross entropy on all data is 0.00545731
After 4226 training step(s),cross entropy on all data is 0.0054564
After 4227 training step(s),cross entropy on all data is 0.00545558
After 4228 training step(s),cross entropy on all data is 0.00545485
After 4229 training step(s),cross entropy on all data is 0.00545419
After 4230 training step(s),cross entropy on all data is 0.00545359
After 4231 training step(s),cross entropy on all data is 0.00545071
After 4232 training step(s),cross entropy on all data is 0.00544812
After 4233 training step(s),cross entropy on all data is 0.00544578
After 4234 training step(s),cross entropy on all data is 0.00544368
After 4235 training step(s),cross entropy on all data is 0.00544179
After 4236 training step(s),cross entropy on all data is 0.00544008
After 4237 training step(s),cross entropy on all data is 0.00543855
After 4238 training step(s),cross entropy on all data is 0.00543717
After 4239 training step(s),cross entropy on all data is 0.00543593
After 4240 training step(s),cross entropy on all data is 0.00543481
After 4241 training step(s),cross entropy on all data is 0.0054338
After 4242 training step(s),cross entropy on all data is 0.00543289
After 4243 training step(s),cross entropy on all data is 0.00543207
After 4244 training step(s),cross entropy on all data is 0.00543134
After 4245 training step(s),cross entropy on all data is 0.00543067
After 4246 training step(s),cross entropy on all data is 0.00543008
After 4247 training step(s),cross entropy on all data is 0.00542719
After 4248 training step(s),cross entropy on all data is 0.0054246
After 4249 training step(s),cross entropy on all data is 0.00542226
After 4250 training step(s),cross entropy on all data is 0.00542016
After 4251 training step(s),cross entropy on all data is 0.00541826
After 4252 training step(s),cross entropy on all data is 0.00541656
After 4253 training step(s),cross entropy on all data is 0.00541502
After 4254 training step(s),cross entropy on all data is 0.00541364
After 4255 training step(s),cross entropy on all data is 0.00541239
After 4256 training step(s),cross entropy on all data is 0.00541127
After 4257 training step(s),cross entropy on all data is 0.00541026
After 4258 training step(s),cross entropy on all data is 0.00540936
After 4259 training step(s),cross entropy on all data is 0.00540854
After 4260 training step(s),cross entropy on all data is 0.0054078
After 4261 training step(s),cross entropy on all data is 0.00540714
After 4262 training step(s),cross entropy on all data is 0.00540654
After 4263 training step(s),cross entropy on all data is 0.00540365
After 4264 training step(s),cross entropy on all data is 0.00540106
After 4265 training step(s),cross entropy on all data is 0.00539872
After 4266 training step(s),cross entropy on all data is 0.00539661
After 4267 training step(s),cross entropy on all data is 0.00539471
After 4268 training step(s),cross entropy on all data is 0.00539301
After 4269 training step(s),cross entropy on all data is 0.00539147
After 4270 training step(s),cross entropy on all data is 0.00539009
After 4271 training step(s),cross entropy on all data is 0.00538884
After 4272 training step(s),cross entropy on all data is 0.00538772
After 4273 training step(s),cross entropy on all data is 0.00538671
After 4274 training step(s),cross entropy on all data is 0.0053858
After 4275 training step(s),cross entropy on all data is 0.00538498
After 4276 training step(s),cross entropy on all data is 0.00538424
After 4277 training step(s),cross entropy on all data is 0.00538358
After 4278 training step(s),cross entropy on all data is 0.00538298
After 4279 training step(s),cross entropy on all data is 0.00538009
After 4280 training step(s),cross entropy on all data is 0.00537749
After 4281 training step(s),cross entropy on all data is 0.00537515
After 4282 training step(s),cross entropy on all data is 0.00537304
After 4283 training step(s),cross entropy on all data is 0.00537114
After 4284 training step(s),cross entropy on all data is 0.00536944
After 4285 training step(s),cross entropy on all data is 0.0053679
After 4286 training step(s),cross entropy on all data is 0.00536651
After 4287 training step(s),cross entropy on all data is 0.00536527
After 4288 training step(s),cross entropy on all data is 0.00536414
After 4289 training step(s),cross entropy on all data is 0.00536313
After 4290 training step(s),cross entropy on all data is 0.00536222
After 4291 training step(s),cross entropy on all data is 0.0053614
After 4292 training step(s),cross entropy on all data is 0.00536066
After 4293 training step(s),cross entropy on all data is 0.00536
After 4294 training step(s),cross entropy on all data is 0.0053594
After 4295 training step(s),cross entropy on all data is 0.00535651
After 4296 training step(s),cross entropy on all data is 0.00535391
After 4297 training step(s),cross entropy on all data is 0.00535156
After 4298 training step(s),cross entropy on all data is 0.00534945
After 4299 training step(s),cross entropy on all data is 0.00534755
After 4300 training step(s),cross entropy on all data is 0.00534584
After 4301 training step(s),cross entropy on all data is 0.0053443
After 4302 training step(s),cross entropy on all data is 0.00534292
After 4303 training step(s),cross entropy on all data is 0.00534167
After 4304 training step(s),cross entropy on all data is 0.00534054
After 4305 training step(s),cross entropy on all data is 0.00533953
After 4306 training step(s),cross entropy on all data is 0.00533862
After 4307 training step(s),cross entropy on all data is 0.0053378
After 4308 training step(s),cross entropy on all data is 0.00533706
After 4309 training step(s),cross entropy on all data is 0.0053364
After 4310 training step(s),cross entropy on all data is 0.0053358
After 4311 training step(s),cross entropy on all data is 0.0053329
After 4312 training step(s),cross entropy on all data is 0.0053303
After 4313 training step(s),cross entropy on all data is 0.00532795
After 4314 training step(s),cross entropy on all data is 0.00532584
After 4315 training step(s),cross entropy on all data is 0.00532394
After 4316 training step(s),cross entropy on all data is 0.00532223
After 4317 training step(s),cross entropy on all data is 0.00532069
After 4318 training step(s),cross entropy on all data is 0.0053193
After 4319 training step(s),cross entropy on all data is 0.00531805
After 4320 training step(s),cross entropy on all data is 0.00531692
After 4321 training step(s),cross entropy on all data is 0.00531591
After 4322 training step(s),cross entropy on all data is 0.005315
After 4323 training step(s),cross entropy on all data is 0.00531418
After 4324 training step(s),cross entropy on all data is 0.00531344
After 4325 training step(s),cross entropy on all data is 0.00531277
After 4326 training step(s),cross entropy on all data is 0.00531217
After 4327 training step(s),cross entropy on all data is 0.00530928
After 4328 training step(s),cross entropy on all data is 0.00530667
After 4329 training step(s),cross entropy on all data is 0.00530432
After 4330 training step(s),cross entropy on all data is 0.00530221
After 4331 training step(s),cross entropy on all data is 0.0053003
After 4332 training step(s),cross entropy on all data is 0.00529859
After 4333 training step(s),cross entropy on all data is 0.00529705
After 4334 training step(s),cross entropy on all data is 0.00529566
After 4335 training step(s),cross entropy on all data is 0.00529441
After 4336 training step(s),cross entropy on all data is 0.00529328
After 4337 training step(s),cross entropy on all data is 0.00529227
After 4338 training step(s),cross entropy on all data is 0.00529136
After 4339 training step(s),cross entropy on all data is 0.00529054
After 4340 training step(s),cross entropy on all data is 0.00528979
After 4341 training step(s),cross entropy on all data is 0.00528913
After 4342 training step(s),cross entropy on all data is 0.00528853
After 4343 training step(s),cross entropy on all data is 0.00528563
After 4344 training step(s),cross entropy on all data is 0.00528302
After 4345 training step(s),cross entropy on all data is 0.00528067
After 4346 training step(s),cross entropy on all data is 0.00527856
After 4347 training step(s),cross entropy on all data is 0.00527665
After 4348 training step(s),cross entropy on all data is 0.00527494
After 4349 training step(s),cross entropy on all data is 0.00527339
After 4350 training step(s),cross entropy on all data is 0.005272
After 4351 training step(s),cross entropy on all data is 0.00527075
After 4352 training step(s),cross entropy on all data is 0.00526962
After 4353 training step(s),cross entropy on all data is 0.00526861
After 4354 training step(s),cross entropy on all data is 0.0052677
After 4355 training step(s),cross entropy on all data is 0.00526687
After 4356 training step(s),cross entropy on all data is 0.00526613
After 4357 training step(s),cross entropy on all data is 0.00526547
After 4358 training step(s),cross entropy on all data is 0.00526486
After 4359 training step(s),cross entropy on all data is 0.00526196
After 4360 training step(s),cross entropy on all data is 0.00525935
After 4361 training step(s),cross entropy on all data is 0.005257
After 4362 training step(s),cross entropy on all data is 0.00525488
After 4363 training step(s),cross entropy on all data is 0.00525298
After 4364 training step(s),cross entropy on all data is 0.00525126
After 4365 training step(s),cross entropy on all data is 0.00524972
After 4366 training step(s),cross entropy on all data is 0.00524833
After 4367 training step(s),cross entropy on all data is 0.00524707
After 4368 training step(s),cross entropy on all data is 0.00524595
After 4369 training step(s),cross entropy on all data is 0.00524493
After 4370 training step(s),cross entropy on all data is 0.00524402
After 4371 training step(s),cross entropy on all data is 0.00524319
After 4372 training step(s),cross entropy on all data is 0.00524245
After 4373 training step(s),cross entropy on all data is 0.00524178
After 4374 training step(s),cross entropy on all data is 0.00524118
After 4375 training step(s),cross entropy on all data is 0.00523828
After 4376 training step(s),cross entropy on all data is 0.00523567
After 4377 training step(s),cross entropy on all data is 0.00523331
After 4378 training step(s),cross entropy on all data is 0.00523119
After 4379 training step(s),cross entropy on all data is 0.00522929
After 4380 training step(s),cross entropy on all data is 0.00522757
After 4381 training step(s),cross entropy on all data is 0.00522602
After 4382 training step(s),cross entropy on all data is 0.00522463
After 4383 training step(s),cross entropy on all data is 0.00522338
After 4384 training step(s),cross entropy on all data is 0.00522225
After 4385 training step(s),cross entropy on all data is 0.00522123
After 4386 training step(s),cross entropy on all data is 0.00522032
After 4387 training step(s),cross entropy on all data is 0.00521949
After 4388 training step(s),cross entropy on all data is 0.00521875
After 4389 training step(s),cross entropy on all data is 0.00521808
After 4390 training step(s),cross entropy on all data is 0.00521748
After 4391 training step(s),cross entropy on all data is 0.00521458
After 4392 training step(s),cross entropy on all data is 0.00521196
After 4393 training step(s),cross entropy on all data is 0.00520961
After 4394 training step(s),cross entropy on all data is 0.00520749
After 4395 training step(s),cross entropy on all data is 0.00520558
After 4396 training step(s),cross entropy on all data is 0.00520386
After 4397 training step(s),cross entropy on all data is 0.00520231
After 4398 training step(s),cross entropy on all data is 0.00520092
After 4399 training step(s),cross entropy on all data is 0.00519966
After 4400 training step(s),cross entropy on all data is 0.00519853
After 4401 training step(s),cross entropy on all data is 0.00519752
After 4402 training step(s),cross entropy on all data is 0.0051966
After 4403 training step(s),cross entropy on all data is 0.00519578
After 4404 training step(s),cross entropy on all data is 0.00519503
After 4405 training step(s),cross entropy on all data is 0.00519437
After 4406 training step(s),cross entropy on all data is 0.00519376
After 4407 training step(s),cross entropy on all data is 0.00519086
After 4408 training step(s),cross entropy on all data is 0.00518824
After 4409 training step(s),cross entropy on all data is 0.00518588
After 4410 training step(s),cross entropy on all data is 0.00518376
After 4411 training step(s),cross entropy on all data is 0.00518185
After 4412 training step(s),cross entropy on all data is 0.00518013
After 4413 training step(s),cross entropy on all data is 0.00517858
After 4414 training step(s),cross entropy on all data is 0.00517719
After 4415 training step(s),cross entropy on all data is 0.00517593
After 4416 training step(s),cross entropy on all data is 0.0051748
After 4417 training step(s),cross entropy on all data is 0.00517378
After 4418 training step(s),cross entropy on all data is 0.00517287
After 4419 training step(s),cross entropy on all data is 0.00517204
After 4420 training step(s),cross entropy on all data is 0.0051713
After 4421 training step(s),cross entropy on all data is 0.00517063
After 4422 training step(s),cross entropy on all data is 0.00517002
After 4423 training step(s),cross entropy on all data is 0.00516712
After 4424 training step(s),cross entropy on all data is 0.0051645
After 4425 training step(s),cross entropy on all data is 0.00516214
After 4426 training step(s),cross entropy on all data is 0.00516001
After 4427 training step(s),cross entropy on all data is 0.0051581
After 4428 training step(s),cross entropy on all data is 0.00515638
After 4429 training step(s),cross entropy on all data is 0.00515483
After 4430 training step(s),cross entropy on all data is 0.00515344
After 4431 training step(s),cross entropy on all data is 0.00515218
After 4432 training step(s),cross entropy on all data is 0.00515105
After 4433 training step(s),cross entropy on all data is 0.00515003
After 4434 training step(s),cross entropy on all data is 0.00514911
After 4435 training step(s),cross entropy on all data is 0.00514829
After 4436 training step(s),cross entropy on all data is 0.00514754
After 4437 training step(s),cross entropy on all data is 0.00514687
After 4438 training step(s),cross entropy on all data is 0.00514627
After 4439 training step(s),cross entropy on all data is 0.00514336
After 4440 training step(s),cross entropy on all data is 0.00514074
After 4441 training step(s),cross entropy on all data is 0.00513838
After 4442 training step(s),cross entropy on all data is 0.00513625
After 4443 training step(s),cross entropy on all data is 0.00513434
After 4444 training step(s),cross entropy on all data is 0.00513262
After 4445 training step(s),cross entropy on all data is 0.00513107
After 4446 training step(s),cross entropy on all data is 0.00512967
After 4447 training step(s),cross entropy on all data is 0.00512841
After 4448 training step(s),cross entropy on all data is 0.00512728
After 4449 training step(s),cross entropy on all data is 0.00512626
After 4450 training step(s),cross entropy on all data is 0.00512534
After 4451 training step(s),cross entropy on all data is 0.00512452
After 4452 training step(s),cross entropy on all data is 0.00512377
After 4453 training step(s),cross entropy on all data is 0.0051231
After 4454 training step(s),cross entropy on all data is 0.0051225
After 4455 training step(s),cross entropy on all data is 0.00511959
After 4456 training step(s),cross entropy on all data is 0.00511696
After 4457 training step(s),cross entropy on all data is 0.0051146
After 4458 training step(s),cross entropy on all data is 0.00511248
After 4459 training step(s),cross entropy on all data is 0.00511056
After 4460 training step(s),cross entropy on all data is 0.00510884
After 4461 training step(s),cross entropy on all data is 0.00510729
After 4462 training step(s),cross entropy on all data is 0.00510589
After 4463 training step(s),cross entropy on all data is 0.00510463
After 4464 training step(s),cross entropy on all data is 0.0051035
After 4465 training step(s),cross entropy on all data is 0.00510248
After 4466 training step(s),cross entropy on all data is 0.00510156
After 4467 training step(s),cross entropy on all data is 0.00510073
After 4468 training step(s),cross entropy on all data is 0.00509999
After 4469 training step(s),cross entropy on all data is 0.00509932
After 4470 training step(s),cross entropy on all data is 0.00509871
After 4471 training step(s),cross entropy on all data is 0.0050958
After 4472 training step(s),cross entropy on all data is 0.00509317
After 4473 training step(s),cross entropy on all data is 0.00509081
After 4474 training step(s),cross entropy on all data is 0.00508868
After 4475 training step(s),cross entropy on all data is 0.00508677
After 4476 training step(s),cross entropy on all data is 0.00508504
After 4477 training step(s),cross entropy on all data is 0.00508349
After 4478 training step(s),cross entropy on all data is 0.00508209
After 4479 training step(s),cross entropy on all data is 0.00508083
After 4480 training step(s),cross entropy on all data is 0.0050797
After 4481 training step(s),cross entropy on all data is 0.00507868
After 4482 training step(s),cross entropy on all data is 0.00507776
After 4483 training step(s),cross entropy on all data is 0.00507693
After 4484 training step(s),cross entropy on all data is 0.00507619
After 4485 training step(s),cross entropy on all data is 0.00507551
After 4486 training step(s),cross entropy on all data is 0.00507491
After 4487 training step(s),cross entropy on all data is 0.00507199
After 4488 training step(s),cross entropy on all data is 0.00506937
After 4489 training step(s),cross entropy on all data is 0.005067
After 4490 training step(s),cross entropy on all data is 0.00506487
After 4491 training step(s),cross entropy on all data is 0.00506295
After 4492 training step(s),cross entropy on all data is 0.00506123
After 4493 training step(s),cross entropy on all data is 0.00505968
After 4494 training step(s),cross entropy on all data is 0.00505828
After 4495 training step(s),cross entropy on all data is 0.00505702
After 4496 training step(s),cross entropy on all data is 0.00505588
After 4497 training step(s),cross entropy on all data is 0.00505486
After 4498 training step(s),cross entropy on all data is 0.00505394
After 4499 training step(s),cross entropy on all data is 0.00505311
After 4500 training step(s),cross entropy on all data is 0.00505237
After 4501 training step(s),cross entropy on all data is 0.0050517
After 4502 training step(s),cross entropy on all data is 0.00505109
After 4503 training step(s),cross entropy on all data is 0.00504817
After 4504 training step(s),cross entropy on all data is 0.00504554
After 4505 training step(s),cross entropy on all data is 0.00504318
After 4506 training step(s),cross entropy on all data is 0.00504105
After 4507 training step(s),cross entropy on all data is 0.00503913
After 4508 training step(s),cross entropy on all data is 0.0050374
After 4509 training step(s),cross entropy on all data is 0.00503585
After 4510 training step(s),cross entropy on all data is 0.00503445
After 4511 training step(s),cross entropy on all data is 0.00503319
After 4512 training step(s),cross entropy on all data is 0.00503205
After 4513 training step(s),cross entropy on all data is 0.00503103
After 4514 training step(s),cross entropy on all data is 0.00503011
After 4515 training step(s),cross entropy on all data is 0.00502928
After 4516 training step(s),cross entropy on all data is 0.00502854
After 4517 training step(s),cross entropy on all data is 0.00502787
After 4518 training step(s),cross entropy on all data is 0.00502726
After 4519 training step(s),cross entropy on all data is 0.00502434
After 4520 training step(s),cross entropy on all data is 0.00502171
After 4521 training step(s),cross entropy on all data is 0.00501934
After 4522 training step(s),cross entropy on all data is 0.00501721
After 4523 training step(s),cross entropy on all data is 0.00501529
After 4524 training step(s),cross entropy on all data is 0.00501356
After 4525 training step(s),cross entropy on all data is 0.00501201
After 4526 training step(s),cross entropy on all data is 0.00501061
After 4527 training step(s),cross entropy on all data is 0.00500935
After 4528 training step(s),cross entropy on all data is 0.00500821
After 4529 training step(s),cross entropy on all data is 0.00500719
After 4530 training step(s),cross entropy on all data is 0.00500627
After 4531 training step(s),cross entropy on all data is 0.00500544
After 4532 training step(s),cross entropy on all data is 0.00500469
After 4533 training step(s),cross entropy on all data is 0.00500402
After 4534 training step(s),cross entropy on all data is 0.00500341
After 4535 training step(s),cross entropy on all data is 0.00500049
After 4536 training step(s),cross entropy on all data is 0.00499786
After 4537 training step(s),cross entropy on all data is 0.00499549
After 4538 training step(s),cross entropy on all data is 0.00499336
After 4539 training step(s),cross entropy on all data is 0.00499144
After 4540 training step(s),cross entropy on all data is 0.00498971
After 4541 training step(s),cross entropy on all data is 0.00498815
After 4542 training step(s),cross entropy on all data is 0.00498675
After 4543 training step(s),cross entropy on all data is 0.00498549
After 4544 training step(s),cross entropy on all data is 0.00498435
After 4545 training step(s),cross entropy on all data is 0.00498333
After 4546 training step(s),cross entropy on all data is 0.00498241
After 4547 training step(s),cross entropy on all data is 0.00498158
After 4548 training step(s),cross entropy on all data is 0.00498083
After 4549 training step(s),cross entropy on all data is 0.00498016
After 4550 training step(s),cross entropy on all data is 0.00497956
After 4551 training step(s),cross entropy on all data is 0.00497663
After 4552 training step(s),cross entropy on all data is 0.004974
After 4553 training step(s),cross entropy on all data is 0.00497163
After 4554 training step(s),cross entropy on all data is 0.00496949
After 4555 training step(s),cross entropy on all data is 0.00496757
After 4556 training step(s),cross entropy on all data is 0.00496584
After 4557 training step(s),cross entropy on all data is 0.00496428
After 4558 training step(s),cross entropy on all data is 0.00496288
After 4559 training step(s),cross entropy on all data is 0.00496162
After 4560 training step(s),cross entropy on all data is 0.00496048
After 4561 training step(s),cross entropy on all data is 0.00495946
After 4562 training step(s),cross entropy on all data is 0.00495854
After 4563 training step(s),cross entropy on all data is 0.00495771
After 4564 training step(s),cross entropy on all data is 0.00495696
After 4565 training step(s),cross entropy on all data is 0.00495629
After 4566 training step(s),cross entropy on all data is 0.00495568
After 4567 training step(s),cross entropy on all data is 0.00495276
After 4568 training step(s),cross entropy on all data is 0.00495012
After 4569 training step(s),cross entropy on all data is 0.00494775
After 4570 training step(s),cross entropy on all data is 0.00494562
After 4571 training step(s),cross entropy on all data is 0.00494369
After 4572 training step(s),cross entropy on all data is 0.00494196
After 4573 training step(s),cross entropy on all data is 0.0049404
After 4574 training step(s),cross entropy on all data is 0.004939
After 4575 training step(s),cross entropy on all data is 0.00493774
After 4576 training step(s),cross entropy on all data is 0.0049366
After 4577 training step(s),cross entropy on all data is 0.00493558
After 4578 training step(s),cross entropy on all data is 0.00493465
After 4579 training step(s),cross entropy on all data is 0.00493382
After 4580 training step(s),cross entropy on all data is 0.00493308
After 4581 training step(s),cross entropy on all data is 0.0049324
After 4582 training step(s),cross entropy on all data is 0.0049318
After 4583 training step(s),cross entropy on all data is 0.00492887
After 4584 training step(s),cross entropy on all data is 0.00492623
After 4585 training step(s),cross entropy on all data is 0.00492386
After 4586 training step(s),cross entropy on all data is 0.00492172
After 4587 training step(s),cross entropy on all data is 0.0049198
After 4588 training step(s),cross entropy on all data is 0.00491807
After 4589 training step(s),cross entropy on all data is 0.00491651
After 4590 training step(s),cross entropy on all data is 0.00491511
After 4591 training step(s),cross entropy on all data is 0.00491384
After 4592 training step(s),cross entropy on all data is 0.0049127
After 4593 training step(s),cross entropy on all data is 0.00491168
After 4594 training step(s),cross entropy on all data is 0.00491076
After 4595 training step(s),cross entropy on all data is 0.00490993
After 4596 training step(s),cross entropy on all data is 0.00490918
After 4597 training step(s),cross entropy on all data is 0.00490851
After 4598 training step(s),cross entropy on all data is 0.0049079
After 4599 training step(s),cross entropy on all data is 0.00490497
After 4600 training step(s),cross entropy on all data is 0.00490233
After 4601 training step(s),cross entropy on all data is 0.00489996
After 4602 training step(s),cross entropy on all data is 0.00489782
After 4603 training step(s),cross entropy on all data is 0.0048959
After 4604 training step(s),cross entropy on all data is 0.00489416
After 4605 training step(s),cross entropy on all data is 0.0048926
After 4606 training step(s),cross entropy on all data is 0.0048912
After 4607 training step(s),cross entropy on all data is 0.00488994
After 4608 training step(s),cross entropy on all data is 0.0048888
After 4609 training step(s),cross entropy on all data is 0.00488777
After 4610 training step(s),cross entropy on all data is 0.00488685
After 4611 training step(s),cross entropy on all data is 0.00488602
After 4612 training step(s),cross entropy on all data is 0.00488527
After 4613 training step(s),cross entropy on all data is 0.0048846
After 4614 training step(s),cross entropy on all data is 0.00488399
After 4615 training step(s),cross entropy on all data is 0.00488106
After 4616 training step(s),cross entropy on all data is 0.00487842
After 4617 training step(s),cross entropy on all data is 0.00487605
After 4618 training step(s),cross entropy on all data is 0.00487391
After 4619 training step(s),cross entropy on all data is 0.00487198
After 4620 training step(s),cross entropy on all data is 0.00487025
After 4621 training step(s),cross entropy on all data is 0.00486869
After 4622 training step(s),cross entropy on all data is 0.00486728
After 4623 training step(s),cross entropy on all data is 0.00486602
After 4624 training step(s),cross entropy on all data is 0.00486488
After 4625 training step(s),cross entropy on all data is 0.00486385
After 4626 training step(s),cross entropy on all data is 0.00486293
After 4627 training step(s),cross entropy on all data is 0.0048621
After 4628 training step(s),cross entropy on all data is 0.00486135
After 4629 training step(s),cross entropy on all data is 0.00486067
After 4630 training step(s),cross entropy on all data is 0.00486007
After 4631 training step(s),cross entropy on all data is 0.00485714
After 4632 training step(s),cross entropy on all data is 0.0048545
After 4633 training step(s),cross entropy on all data is 0.00485212
After 4634 training step(s),cross entropy on all data is 0.00484998
After 4635 training step(s),cross entropy on all data is 0.00484806
After 4636 training step(s),cross entropy on all data is 0.00484632
After 4637 training step(s),cross entropy on all data is 0.00484476
After 4638 training step(s),cross entropy on all data is 0.00484335
After 4639 training step(s),cross entropy on all data is 0.00484209
After 4640 training step(s),cross entropy on all data is 0.00484095
After 4641 training step(s),cross entropy on all data is 0.00483992
After 4642 training step(s),cross entropy on all data is 0.004839
After 4643 training step(s),cross entropy on all data is 0.00483817
After 4644 training step(s),cross entropy on all data is 0.00483742
After 4645 training step(s),cross entropy on all data is 0.00483674
After 4646 training step(s),cross entropy on all data is 0.00483614
After 4647 training step(s),cross entropy on all data is 0.0048332
After 4648 training step(s),cross entropy on all data is 0.00483056
After 4649 training step(s),cross entropy on all data is 0.00482819
After 4650 training step(s),cross entropy on all data is 0.00482605
After 4651 training step(s),cross entropy on all data is 0.00482412
After 4652 training step(s),cross entropy on all data is 0.00482238
After 4653 training step(s),cross entropy on all data is 0.00482082
After 4654 training step(s),cross entropy on all data is 0.00481942
After 4655 training step(s),cross entropy on all data is 0.00481815
After 4656 training step(s),cross entropy on all data is 0.00481701
After 4657 training step(s),cross entropy on all data is 0.00481598
After 4658 training step(s),cross entropy on all data is 0.00481506
After 4659 training step(s),cross entropy on all data is 0.00481423
After 4660 training step(s),cross entropy on all data is 0.00481348
After 4661 training step(s),cross entropy on all data is 0.0048128
After 4662 training step(s),cross entropy on all data is 0.00481219
After 4663 training step(s),cross entropy on all data is 0.00480926
After 4664 training step(s),cross entropy on all data is 0.00480662
After 4665 training step(s),cross entropy on all data is 0.00480424
After 4666 training step(s),cross entropy on all data is 0.0048021
After 4667 training step(s),cross entropy on all data is 0.00480017
After 4668 training step(s),cross entropy on all data is 0.00479844
After 4669 training step(s),cross entropy on all data is 0.00479687
After 4670 training step(s),cross entropy on all data is 0.00479547
After 4671 training step(s),cross entropy on all data is 0.0047942
After 4672 training step(s),cross entropy on all data is 0.00479306
After 4673 training step(s),cross entropy on all data is 0.00479203
After 4674 training step(s),cross entropy on all data is 0.00479111
After 4675 training step(s),cross entropy on all data is 0.00479027
After 4676 training step(s),cross entropy on all data is 0.00478953
After 4677 training step(s),cross entropy on all data is 0.00478885
After 4678 training step(s),cross entropy on all data is 0.00478824
After 4679 training step(s),cross entropy on all data is 0.00478531
After 4680 training step(s),cross entropy on all data is 0.00478267
After 4681 training step(s),cross entropy on all data is 0.00478029
After 4682 training step(s),cross entropy on all data is 0.00477814
After 4683 training step(s),cross entropy on all data is 0.00477622
After 4684 training step(s),cross entropy on all data is 0.00477448
After 4685 training step(s),cross entropy on all data is 0.00477292
After 4686 training step(s),cross entropy on all data is 0.00477151
After 4687 training step(s),cross entropy on all data is 0.00477024
After 4688 training step(s),cross entropy on all data is 0.0047691
After 4689 training step(s),cross entropy on all data is 0.00476807
After 4690 training step(s),cross entropy on all data is 0.00476715
After 4691 training step(s),cross entropy on all data is 0.00476631
After 4692 training step(s),cross entropy on all data is 0.00476557
After 4693 training step(s),cross entropy on all data is 0.00476489
After 4694 training step(s),cross entropy on all data is 0.00476428
After 4695 training step(s),cross entropy on all data is 0.00476135
After 4696 training step(s),cross entropy on all data is 0.0047587
After 4697 training step(s),cross entropy on all data is 0.00475632
After 4698 training step(s),cross entropy on all data is 0.00475418
After 4699 training step(s),cross entropy on all data is 0.00475225
After 4700 training step(s),cross entropy on all data is 0.00475051
After 4701 training step(s),cross entropy on all data is 0.00474895
After 4702 training step(s),cross entropy on all data is 0.00474754
After 4703 training step(s),cross entropy on all data is 0.00474627
After 4704 training step(s),cross entropy on all data is 0.00474513
After 4705 training step(s),cross entropy on all data is 0.00474411
After 4706 training step(s),cross entropy on all data is 0.00474318
After 4707 training step(s),cross entropy on all data is 0.00474235
After 4708 training step(s),cross entropy on all data is 0.0047416
After 4709 training step(s),cross entropy on all data is 0.00474092
After 4710 training step(s),cross entropy on all data is 0.00474031
After 4711 training step(s),cross entropy on all data is 0.00473737
After 4712 training step(s),cross entropy on all data is 0.00473473
After 4713 training step(s),cross entropy on all data is 0.00473235
After 4714 training step(s),cross entropy on all data is 0.00473021
After 4715 training step(s),cross entropy on all data is 0.00472828
After 4716 training step(s),cross entropy on all data is 0.00472654
After 4717 training step(s),cross entropy on all data is 0.00472497
After 4718 training step(s),cross entropy on all data is 0.00472357
After 4719 training step(s),cross entropy on all data is 0.0047223
After 4720 training step(s),cross entropy on all data is 0.00472115
After 4721 training step(s),cross entropy on all data is 0.00472013
After 4722 training step(s),cross entropy on all data is 0.0047192
After 4723 training step(s),cross entropy on all data is 0.00471837
After 4724 training step(s),cross entropy on all data is 0.00471762
After 4725 training step(s),cross entropy on all data is 0.00471694
After 4726 training step(s),cross entropy on all data is 0.00471633
After 4727 training step(s),cross entropy on all data is 0.0047134
After 4728 training step(s),cross entropy on all data is 0.00471075
After 4729 training step(s),cross entropy on all data is 0.00470837
After 4730 training step(s),cross entropy on all data is 0.00470622
After 4731 training step(s),cross entropy on all data is 0.00470429
After 4732 training step(s),cross entropy on all data is 0.00470256
After 4733 training step(s),cross entropy on all data is 0.00470099
After 4734 training step(s),cross entropy on all data is 0.00469958
After 4735 training step(s),cross entropy on all data is 0.00469831
After 4736 training step(s),cross entropy on all data is 0.00469717
After 4737 training step(s),cross entropy on all data is 0.00469614
After 4738 training step(s),cross entropy on all data is 0.00469522
After 4739 training step(s),cross entropy on all data is 0.00469438
After 4740 training step(s),cross entropy on all data is 0.00469363
After 4741 training step(s),cross entropy on all data is 0.00469296
After 4742 training step(s),cross entropy on all data is 0.00469235
After 4743 training step(s),cross entropy on all data is 0.00468941
After 4744 training step(s),cross entropy on all data is 0.00468676
After 4745 training step(s),cross entropy on all data is 0.00468438
After 4746 training step(s),cross entropy on all data is 0.00468223
After 4747 training step(s),cross entropy on all data is 0.0046803
After 4748 training step(s),cross entropy on all data is 0.00467857
After 4749 training step(s),cross entropy on all data is 0.004677
After 4750 training step(s),cross entropy on all data is 0.00467559
After 4751 training step(s),cross entropy on all data is 0.00467432
After 4752 training step(s),cross entropy on all data is 0.00467318
After 4753 training step(s),cross entropy on all data is 0.00467215
After 4754 training step(s),cross entropy on all data is 0.00467122
After 4755 training step(s),cross entropy on all data is 0.00467039
After 4756 training step(s),cross entropy on all data is 0.00466964
After 4757 training step(s),cross entropy on all data is 0.00466896
After 4758 training step(s),cross entropy on all data is 0.00466835
After 4759 training step(s),cross entropy on all data is 0.00466541
After 4760 training step(s),cross entropy on all data is 0.00466277
After 4761 training step(s),cross entropy on all data is 0.00466038
After 4762 training step(s),cross entropy on all data is 0.00465824
After 4763 training step(s),cross entropy on all data is 0.00465631
After 4764 training step(s),cross entropy on all data is 0.00465457
After 4765 training step(s),cross entropy on all data is 0.004653
After 4766 training step(s),cross entropy on all data is 0.00465159
After 4767 training step(s),cross entropy on all data is 0.00465032
After 4768 training step(s),cross entropy on all data is 0.00464918
After 4769 training step(s),cross entropy on all data is 0.00464815
After 4770 training step(s),cross entropy on all data is 0.00464722
After 4771 training step(s),cross entropy on all data is 0.00464639
After 4772 training step(s),cross entropy on all data is 0.00464564
After 4773 training step(s),cross entropy on all data is 0.00464496
After 4774 training step(s),cross entropy on all data is 0.00464435
After 4775 training step(s),cross entropy on all data is 0.00464141
After 4776 training step(s),cross entropy on all data is 0.00463876
After 4777 training step(s),cross entropy on all data is 0.00463638
After 4778 training step(s),cross entropy on all data is 0.00463423
After 4779 training step(s),cross entropy on all data is 0.0046323
After 4780 training step(s),cross entropy on all data is 0.00463056
After 4781 training step(s),cross entropy on all data is 0.004629
After 4782 training step(s),cross entropy on all data is 0.00462759
After 4783 training step(s),cross entropy on all data is 0.00462632
After 4784 training step(s),cross entropy on all data is 0.00462517
After 4785 training step(s),cross entropy on all data is 0.00462414
After 4786 training step(s),cross entropy on all data is 0.00462322
After 4787 training step(s),cross entropy on all data is 0.00462238
After 4788 training step(s),cross entropy on all data is 0.00462163
After 4789 training step(s),cross entropy on all data is 0.00462095
After 4790 training step(s),cross entropy on all data is 0.00462034
After 4791 training step(s),cross entropy on all data is 0.0046174
After 4792 training step(s),cross entropy on all data is 0.00461475
After 4793 training step(s),cross entropy on all data is 0.00461237
After 4794 training step(s),cross entropy on all data is 0.00461022
After 4795 training step(s),cross entropy on all data is 0.00460829
After 4796 training step(s),cross entropy on all data is 0.00460655
After 4797 training step(s),cross entropy on all data is 0.00460498
After 4798 training step(s),cross entropy on all data is 0.00460357
After 4799 training step(s),cross entropy on all data is 0.0046023
After 4800 training step(s),cross entropy on all data is 0.00460116
After 4801 training step(s),cross entropy on all data is 0.00460013
After 4802 training step(s),cross entropy on all data is 0.0045992
After 4803 training step(s),cross entropy on all data is 0.00459837
After 4804 training step(s),cross entropy on all data is 0.00459762
After 4805 training step(s),cross entropy on all data is 0.00459694
After 4806 training step(s),cross entropy on all data is 0.00459633
After 4807 training step(s),cross entropy on all data is 0.00459339
After 4808 training step(s),cross entropy on all data is 0.00459074
After 4809 training step(s),cross entropy on all data is 0.00458835
After 4810 training step(s),cross entropy on all data is 0.00458621
After 4811 training step(s),cross entropy on all data is 0.00458427
After 4812 training step(s),cross entropy on all data is 0.00458253
After 4813 training step(s),cross entropy on all data is 0.00458097
After 4814 training step(s),cross entropy on all data is 0.00457956
After 4815 training step(s),cross entropy on all data is 0.00457829
After 4816 training step(s),cross entropy on all data is 0.00457714
After 4817 training step(s),cross entropy on all data is 0.00457611
After 4818 training step(s),cross entropy on all data is 0.00457518
After 4819 training step(s),cross entropy on all data is 0.00457435
After 4820 training step(s),cross entropy on all data is 0.0045736
After 4821 training step(s),cross entropy on all data is 0.00457292
After 4822 training step(s),cross entropy on all data is 0.00457231
After 4823 training step(s),cross entropy on all data is 0.00456937
After 4824 training step(s),cross entropy on all data is 0.00456672
After 4825 training step(s),cross entropy on all data is 0.00456433
After 4826 training step(s),cross entropy on all data is 0.00456218
After 4827 training step(s),cross entropy on all data is 0.00456025
After 4828 training step(s),cross entropy on all data is 0.00455851
After 4829 training step(s),cross entropy on all data is 0.00455694
After 4830 training step(s),cross entropy on all data is 0.00455553
After 4831 training step(s),cross entropy on all data is 0.00455426
After 4832 training step(s),cross entropy on all data is 0.00455312
After 4833 training step(s),cross entropy on all data is 0.00455209
After 4834 training step(s),cross entropy on all data is 0.00455116
After 4835 training step(s),cross entropy on all data is 0.00455032
After 4836 training step(s),cross entropy on all data is 0.00454957
After 4837 training step(s),cross entropy on all data is 0.00454889
After 4838 training step(s),cross entropy on all data is 0.00454828
After 4839 training step(s),cross entropy on all data is 0.00454534
After 4840 training step(s),cross entropy on all data is 0.00454269
After 4841 training step(s),cross entropy on all data is 0.0045403
After 4842 training step(s),cross entropy on all data is 0.00453816
After 4843 training step(s),cross entropy on all data is 0.00453622
After 4844 training step(s),cross entropy on all data is 0.00453448
After 4845 training step(s),cross entropy on all data is 0.00453291
After 4846 training step(s),cross entropy on all data is 0.0045315
After 4847 training step(s),cross entropy on all data is 0.00453023
After 4848 training step(s),cross entropy on all data is 0.00452909
After 4849 training step(s),cross entropy on all data is 0.00452806
After 4850 training step(s),cross entropy on all data is 0.00452713
After 4851 training step(s),cross entropy on all data is 0.00452629
After 4852 training step(s),cross entropy on all data is 0.00452554
After 4853 training step(s),cross entropy on all data is 0.00452486
After 4854 training step(s),cross entropy on all data is 0.00452425
After 4855 training step(s),cross entropy on all data is 0.00452131
After 4856 training step(s),cross entropy on all data is 0.00451866
After 4857 training step(s),cross entropy on all data is 0.00451627
After 4858 training step(s),cross entropy on all data is 0.00451412
After 4859 training step(s),cross entropy on all data is 0.00451219
After 4860 training step(s),cross entropy on all data is 0.00451045
After 4861 training step(s),cross entropy on all data is 0.00450888
After 4862 training step(s),cross entropy on all data is 0.00450747
After 4863 training step(s),cross entropy on all data is 0.0045062
After 4864 training step(s),cross entropy on all data is 0.00450505
After 4865 training step(s),cross entropy on all data is 0.00450402
After 4866 training step(s),cross entropy on all data is 0.00450309
After 4867 training step(s),cross entropy on all data is 0.00450226
After 4868 training step(s),cross entropy on all data is 0.00450151
After 4869 training step(s),cross entropy on all data is 0.00450083
After 4870 training step(s),cross entropy on all data is 0.00450022
After 4871 training step(s),cross entropy on all data is 0.00449727
After 4872 training step(s),cross entropy on all data is 0.00449462
After 4873 training step(s),cross entropy on all data is 0.00449224
After 4874 training step(s),cross entropy on all data is 0.00449009
After 4875 training step(s),cross entropy on all data is 0.00448815
After 4876 training step(s),cross entropy on all data is 0.00448641
After 4877 training step(s),cross entropy on all data is 0.00448484
After 4878 training step(s),cross entropy on all data is 0.00448343
After 4879 training step(s),cross entropy on all data is 0.00448216
After 4880 training step(s),cross entropy on all data is 0.00448101
After 4881 training step(s),cross entropy on all data is 0.00447998
After 4882 training step(s),cross entropy on all data is 0.00447905
After 4883 training step(s),cross entropy on all data is 0.00447822
After 4884 training step(s),cross entropy on all data is 0.00447747
After 4885 training step(s),cross entropy on all data is 0.00447679
After 4886 training step(s),cross entropy on all data is 0.00447618
After 4887 training step(s),cross entropy on all data is 0.00447323
After 4888 training step(s),cross entropy on all data is 0.00447058
After 4889 training step(s),cross entropy on all data is 0.0044682
After 4890 training step(s),cross entropy on all data is 0.00446605
After 4891 training step(s),cross entropy on all data is 0.00446411
After 4892 training step(s),cross entropy on all data is 0.00446237
After 4893 training step(s),cross entropy on all data is 0.0044608
After 4894 training step(s),cross entropy on all data is 0.00445939
After 4895 training step(s),cross entropy on all data is 0.00445812
After 4896 training step(s),cross entropy on all data is 0.00445697
After 4897 training step(s),cross entropy on all data is 0.00445594
After 4898 training step(s),cross entropy on all data is 0.00445501
After 4899 training step(s),cross entropy on all data is 0.00445418
After 4900 training step(s),cross entropy on all data is 0.00445342
After 4901 training step(s),cross entropy on all data is 0.00445275
After 4902 training step(s),cross entropy on all data is 0.00445214
After 4903 training step(s),cross entropy on all data is 0.00444919
After 4904 training step(s),cross entropy on all data is 0.00444654
After 4905 training step(s),cross entropy on all data is 0.00444415
After 4906 training step(s),cross entropy on all data is 0.004442
After 4907 training step(s),cross entropy on all data is 0.00444007
After 4908 training step(s),cross entropy on all data is 0.00443832
After 4909 training step(s),cross entropy on all data is 0.00443675
After 4910 training step(s),cross entropy on all data is 0.00443534
After 4911 training step(s),cross entropy on all data is 0.00443407
After 4912 training step(s),cross entropy on all data is 0.00443293
After 4913 training step(s),cross entropy on all data is 0.00443189
After 4914 training step(s),cross entropy on all data is 0.00443097
After 4915 training step(s),cross entropy on all data is 0.00443013
After 4916 training step(s),cross entropy on all data is 0.00442938
After 4917 training step(s),cross entropy on all data is 0.0044287
After 4918 training step(s),cross entropy on all data is 0.00442809
After 4919 training step(s),cross entropy on all data is 0.00442514
After 4920 training step(s),cross entropy on all data is 0.00442249
After 4921 training step(s),cross entropy on all data is 0.0044201
After 4922 training step(s),cross entropy on all data is 0.00441795
After 4923 training step(s),cross entropy on all data is 0.00441602
After 4924 training step(s),cross entropy on all data is 0.00441428
After 4925 training step(s),cross entropy on all data is 0.00441271
After 4926 training step(s),cross entropy on all data is 0.00441129
After 4927 training step(s),cross entropy on all data is 0.00441002
After 4928 training step(s),cross entropy on all data is 0.00440888
After 4929 training step(s),cross entropy on all data is 0.00440785
After 4930 training step(s),cross entropy on all data is 0.00440692
After 4931 training step(s),cross entropy on all data is 0.00440608
After 4932 training step(s),cross entropy on all data is 0.00440533
After 4933 training step(s),cross entropy on all data is 0.00440465
After 4934 training step(s),cross entropy on all data is 0.00440404
After 4935 training step(s),cross entropy on all data is 0.00440109
After 4936 training step(s),cross entropy on all data is 0.00439844
After 4937 training step(s),cross entropy on all data is 0.00439605
After 4938 training step(s),cross entropy on all data is 0.0043939
After 4939 training step(s),cross entropy on all data is 0.00439197
After 4940 training step(s),cross entropy on all data is 0.00439022
After 4941 training step(s),cross entropy on all data is 0.00438866
After 4942 training step(s),cross entropy on all data is 0.00438724
After 4943 training step(s),cross entropy on all data is 0.00438597
After 4944 training step(s),cross entropy on all data is 0.00438483
After 4945 training step(s),cross entropy on all data is 0.00438379
After 4946 training step(s),cross entropy on all data is 0.00438287
After 4947 training step(s),cross entropy on all data is 0.00438203
After 4948 training step(s),cross entropy on all data is 0.00438128
After 4949 training step(s),cross entropy on all data is 0.0043806
After 4950 training step(s),cross entropy on all data is 0.00437999
After 4951 training step(s),cross entropy on all data is 0.00437704
After 4952 training step(s),cross entropy on all data is 0.00437439
After 4953 training step(s),cross entropy on all data is 0.004372
After 4954 training step(s),cross entropy on all data is 0.00436985
After 4955 training step(s),cross entropy on all data is 0.00436791
After 4956 training step(s),cross entropy on all data is 0.00436617
After 4957 training step(s),cross entropy on all data is 0.0043646
After 4958 training step(s),cross entropy on all data is 0.00436319
After 4959 training step(s),cross entropy on all data is 0.00436192
After 4960 training step(s),cross entropy on all data is 0.00436077
After 4961 training step(s),cross entropy on all data is 0.00435974
After 4962 training step(s),cross entropy on all data is 0.00435881
After 4963 training step(s),cross entropy on all data is 0.00435797
After 4964 training step(s),cross entropy on all data is 0.00435722
After 4965 training step(s),cross entropy on all data is 0.00435654
After 4966 training step(s),cross entropy on all data is 0.00435593
After 4967 training step(s),cross entropy on all data is 0.00435299
After 4968 training step(s),cross entropy on all data is 0.00435033
After 4969 training step(s),cross entropy on all data is 0.00434795
After 4970 training step(s),cross entropy on all data is 0.0043458
After 4971 training step(s),cross entropy on all data is 0.00434386
After 4972 training step(s),cross entropy on all data is 0.00434212
After 4973 training step(s),cross entropy on all data is 0.00434055
After 4974 training step(s),cross entropy on all data is 0.00433913
After 4975 training step(s),cross entropy on all data is 0.00433786
After 4976 training step(s),cross entropy on all data is 0.00433671
After 4977 training step(s),cross entropy on all data is 0.00433568
After 4978 training step(s),cross entropy on all data is 0.00433475
After 4979 training step(s),cross entropy on all data is 0.00433392
After 4980 training step(s),cross entropy on all data is 0.00433317
After 4981 training step(s),cross entropy on all data is 0.00433249
After 4982 training step(s),cross entropy on all data is 0.00433188
After 4983 training step(s),cross entropy on all data is 0.00432893
After 4984 training step(s),cross entropy on all data is 0.00432628
After 4985 training step(s),cross entropy on all data is 0.00432389
After 4986 training step(s),cross entropy on all data is 0.00432174
After 4987 training step(s),cross entropy on all data is 0.0043198
After 4988 training step(s),cross entropy on all data is 0.00431806
After 4989 training step(s),cross entropy on all data is 0.00431649
After 4990 training step(s),cross entropy on all data is 0.00431508
After 4991 training step(s),cross entropy on all data is 0.0043138
After 4992 training step(s),cross entropy on all data is 0.00431266
After 4993 training step(s),cross entropy on all data is 0.00431163
After 4994 training step(s),cross entropy on all data is 0.0043107
After 4995 training step(s),cross entropy on all data is 0.00430986
After 4996 training step(s),cross entropy on all data is 0.00430911
After 4997 training step(s),cross entropy on all data is 0.00430843
After 4998 training step(s),cross entropy on all data is 0.00430782
After 4999 training step(s),cross entropy on all data is 0.00430487
[[-1.9618274   2.58235407  1.68203783]
 [-3.4681716   1.06982327  2.11788988]]
[[-1.8247149 ]
 [ 2.68546653]
 [ 1.41819501]]

In [ ]: