In [1]:
from sklearn.ensemble import RandomForestClassifier
from sklearn.linear_model import SGDClassifier
#from sklearn.model_selection import cross_val_score
from scipy.io import mmread
import numpy as np
In [2]:
malware_classes = ["Agent", "AutoRun", "FraudLoad", "FraudPack", "Hupigon", "Krap",
"Lipler", "Magania", "None", "Poison", "Swizzor", "Tdss",
"VB", "Virut", "Zbot"]
# a function for writing predictions in the required format
def write_predictions(predictions, ids, outfile):
"""
assumes len(predictions) == len(ids), and that predictions[i] is the
index of the predicted class with the malware_classes list above for
the executable corresponding to ids[i].
outfile will be overwritten
"""
with open(outfile,"w+") as f:
# write header
f.write("Id,Prediction\n")
for i, history_id in enumerate(ids):
f.write("%s,%d\n" % (history_id, predictions[i]))
def classes_to_Y(classes):
output = []
for cls in classes:
output.append(malware_classes.index(cls))
return np.array(output)
In [4]:
# load training classes
classes = np.load("../data/features/train_classes.npy")
# load sparse matrix of training data
sparse_mat_train_test = mmread("../data/features/naive_word_hashed_full_features.mtx")
In [4]:
# classes and load BIG tfidf feature matrix
classes = np.load("../data/features/train_classes.npy")
# load sparse matrix of training data
sparse_mat_train_test = mmread("../data/features/tfifd_4gram_hashed_full_features.mtx")
In [5]:
# convert csr to a numpy array
sparse = sparse_mat_train_test
# pull out training examples
X = sparse.tocsc()[:classes.shape[0],:]
# X_CV = X[-300:]
# X = X[:-300]
X_test = sparse.tocsc()[classes.shape[0]:,:]
print X_test.shape
Y = classes_to_Y(classes)
# Y_CV = Y[-300:]
# Y = Y[:-300]
(3724, 1048576)
In [6]:
RF = RandomForestClassifier()
RF.fit(X, Y)
Out[6]:
RandomForestClassifier(bootstrap=True, class_weight=None, criterion='gini',
max_depth=None, max_features='auto', max_leaf_nodes=None,
min_impurity_split=1e-07, min_samples_leaf=1,
min_samples_split=2, min_weight_fraction_leaf=0.0,
n_estimators=10, n_jobs=1, oob_score=False, random_state=None,
verbose=0, warm_start=False)
In [1]:
# preds = RF.predict(X_CV)
# mistakes = 0
# for i in range(len(preds)):
# if preds[i] != Y_CV[i]:
# mistakes += 1
# print malware_classes[Y_CV[i]]
# print mistakes
---------------------------------------------------------------------------
NameError Traceback (most recent call last)
<ipython-input-1-ed548c1bc0cd> in <module>()
----> 1 preds = RF.predict(X_CV)
2
3 mistakes = 0
4 for i in range(len(preds)):
5 if preds[i] != Y_CV[i]:
NameError: name 'RF' is not defined
In [ ]:
test_pred = RF.predict(X_test)
In [ ]:
print test_pred
test_ids = np.load("../data/features/test_ids.npy")
print test_ids
write_predictions(test_pred, test_ids, "../predictions/rfc_10.csv")
In [6]:
# Try an SGDClassifier learning directly from the sparse matrix
SGD = SGDClassifier(n_jobs=1, n_iter=100, verbose=1, loss="modified_huber")
SGD.fit(X,Y)
-- Epoch 1
Norm: 77.67, NNZs: 1042090, Bias: -1.302051, T: 3086, Avg. loss: 1.456797
Total training time: 0.95 seconds.
-- Epoch 2
Norm: 59.59, NNZs: 1048073, Bias: -1.360660, T: 6172, Avg. loss: 0.908354
Total training time: 1.88 seconds.
-- Epoch 3
Norm: 48.76, NNZs: 1048417, Bias: -1.596870, T: 9258, Avg. loss: 0.657365
Total training time: 2.81 seconds.
-- Epoch 4
Norm: 41.35, NNZs: 1048540, Bias: -1.502075, T: 12344, Avg. loss: 0.513506
Total training time: 3.76 seconds.
-- Epoch 5
Norm: 36.60, NNZs: 1048561, Bias: -1.494563, T: 15430, Avg. loss: 0.423420
Total training time: 4.71 seconds.
-- Epoch 6
Norm: 33.26, NNZs: 1048569, Bias: -1.469440, T: 18516, Avg. loss: 0.361178
Total training time: 5.67 seconds.
-- Epoch 7
Norm: 30.88, NNZs: 1048575, Bias: -1.445343, T: 21602, Avg. loss: 0.315927
Total training time: 6.66 seconds.
-- Epoch 8
Norm: 29.38, NNZs: 1048575, Bias: -1.422461, T: 24688, Avg. loss: 0.281520
Total training time: 7.65 seconds.
-- Epoch 9
Norm: 28.11, NNZs: 1048575, Bias: -1.409079, T: 27774, Avg. loss: 0.254595
Total training time: 8.67 seconds.
-- Epoch 10
Norm: 27.21, NNZs: 1048575, Bias: -1.393612, T: 30860, Avg. loss: 0.233107
Total training time: 9.69 seconds.
-- Epoch 11
Norm: 26.59, NNZs: 1048576, Bias: -1.375169, T: 33946, Avg. loss: 0.215281
Total training time: 10.73 seconds.
-- Epoch 12
Norm: 26.06, NNZs: 1048576, Bias: -1.357556, T: 37032, Avg. loss: 0.200374
Total training time: 11.77 seconds.
-- Epoch 13
Norm: 25.63, NNZs: 1048576, Bias: -1.343194, T: 40118, Avg. loss: 0.187738
Total training time: 12.83 seconds.
-- Epoch 14
Norm: 25.26, NNZs: 1048576, Bias: -1.328021, T: 43204, Avg. loss: 0.176998
Total training time: 13.89 seconds.
-- Epoch 15
Norm: 24.93, NNZs: 1048576, Bias: -1.318604, T: 46290, Avg. loss: 0.167585
Total training time: 14.97 seconds.
-- Epoch 16
Norm: 24.64, NNZs: 1048576, Bias: -1.317068, T: 49376, Avg. loss: 0.159323
Total training time: 16.05 seconds.
-- Epoch 17
Norm: 24.39, NNZs: 1048576, Bias: -1.305546, T: 52462, Avg. loss: 0.152026
Total training time: 17.11 seconds.
-- Epoch 18
Norm: 24.17, NNZs: 1048576, Bias: -1.301301, T: 55548, Avg. loss: 0.145469
Total training time: 18.15 seconds.
-- Epoch 19
Norm: 23.99, NNZs: 1048576, Bias: -1.291367, T: 58634, Avg. loss: 0.139672
Total training time: 19.25 seconds.
-- Epoch 20
Norm: 23.82, NNZs: 1048576, Bias: -1.287426, T: 61720, Avg. loss: 0.134393
Total training time: 20.32 seconds.
-- Epoch 21
Norm: 23.66, NNZs: 1048576, Bias: -1.284001, T: 64806, Avg. loss: 0.129594
Total training time: 21.39 seconds.
-- Epoch 22
Norm: 23.52, NNZs: 1048576, Bias: -1.281684, T: 67892, Avg. loss: 0.125268
Total training time: 22.47 seconds.
-- Epoch 23
Norm: 23.45, NNZs: 1048576, Bias: -1.267348, T: 70978, Avg. loss: 0.121304
Total training time: 23.55 seconds.
-- Epoch 24
Norm: 23.34, NNZs: 1048576, Bias: -1.264132, T: 74064, Avg. loss: 0.117654
Total training time: 24.64 seconds.
-- Epoch 25
Norm: 23.23, NNZs: 1048576, Bias: -1.262490, T: 77150, Avg. loss: 0.114283
Total training time: 25.73 seconds.
-- Epoch 26
Norm: 23.15, NNZs: 1048576, Bias: -1.259324, T: 80236, Avg. loss: 0.111164
Total training time: 26.84 seconds.
-- Epoch 27
Norm: 23.09, NNZs: 1048576, Bias: -1.248037, T: 83322, Avg. loss: 0.108293
Total training time: 27.94 seconds.
-- Epoch 28
Norm: 23.00, NNZs: 1048576, Bias: -1.250925, T: 86408, Avg. loss: 0.105602
Total training time: 29.04 seconds.
-- Epoch 29
Norm: 22.91, NNZs: 1048576, Bias: -1.253672, T: 89494, Avg. loss: 0.103110
Total training time: 30.15 seconds.
-- Epoch 30
Norm: 22.87, NNZs: 1048576, Bias: -1.240805, T: 92580, Avg. loss: 0.100778
Total training time: 31.23 seconds.
-- Epoch 31
Norm: 22.79, NNZs: 1048576, Bias: -1.244566, T: 95666, Avg. loss: 0.098577
Total training time: 32.32 seconds.
-- Epoch 32
Norm: 22.74, NNZs: 1048576, Bias: -1.240373, T: 98752, Avg. loss: 0.096533
Total training time: 33.41 seconds.
-- Epoch 33
Norm: 22.71, NNZs: 1048576, Bias: -1.232836, T: 101838, Avg. loss: 0.094608
Total training time: 34.54 seconds.
-- Epoch 34
Norm: 22.64, NNZs: 1048576, Bias: -1.233997, T: 104924, Avg. loss: 0.092796
Total training time: 35.64 seconds.
-- Epoch 35
Norm: 22.62, NNZs: 1048576, Bias: -1.225989, T: 108010, Avg. loss: 0.091089
Total training time: 36.73 seconds.
-- Epoch 36
Norm: 22.56, NNZs: 1048576, Bias: -1.227333, T: 111096, Avg. loss: 0.089480
Total training time: 37.87 seconds.
-- Epoch 37
Norm: 22.54, NNZs: 1048576, Bias: -1.221439, T: 114182, Avg. loss: 0.087938
Total training time: 39.00 seconds.
-- Epoch 38
Norm: 22.50, NNZs: 1048576, Bias: -1.221137, T: 117268, Avg. loss: 0.086465
Total training time: 40.13 seconds.
-- Epoch 39
Norm: 22.45, NNZs: 1048576, Bias: -1.221648, T: 120354, Avg. loss: 0.085084
Total training time: 41.24 seconds.
-- Epoch 40
Norm: 22.43, NNZs: 1048576, Bias: -1.217199, T: 123440, Avg. loss: 0.083770
Total training time: 42.34 seconds.
-- Epoch 41
Norm: 22.38, NNZs: 1048576, Bias: -1.218209, T: 126526, Avg. loss: 0.082521
Total training time: 43.48 seconds.
-- Epoch 42
Norm: 22.36, NNZs: 1048576, Bias: -1.213363, T: 129612, Avg. loss: 0.081323
Total training time: 44.58 seconds.
-- Epoch 43
Norm: 22.32, NNZs: 1048576, Bias: -1.212747, T: 132698, Avg. loss: 0.080179
Total training time: 45.71 seconds.
-- Epoch 44
Norm: 22.32, NNZs: 1048576, Bias: -1.205459, T: 135784, Avg. loss: 0.079096
Total training time: 46.85 seconds.
-- Epoch 45
Norm: 22.30, NNZs: 1048576, Bias: -1.204819, T: 138870, Avg. loss: 0.078058
Total training time: 47.96 seconds.
-- Epoch 46
Norm: 22.27, NNZs: 1048576, Bias: -1.205774, T: 141956, Avg. loss: 0.077068
Total training time: 49.12 seconds.
-- Epoch 47
Norm: 22.26, NNZs: 1048576, Bias: -1.201781, T: 145042, Avg. loss: 0.076120
Total training time: 50.25 seconds.
-- Epoch 48
Norm: 22.25, NNZs: 1048576, Bias: -1.196711, T: 148128, Avg. loss: 0.075210
Total training time: 51.41 seconds.
-- Epoch 49
Norm: 22.22, NNZs: 1048576, Bias: -1.197819, T: 151214, Avg. loss: 0.074329
Total training time: 52.54 seconds.
-- Epoch 50
Norm: 22.19, NNZs: 1048576, Bias: -1.198979, T: 154300, Avg. loss: 0.073485
Total training time: 53.67 seconds.
-- Epoch 51
Norm: 22.17, NNZs: 1048576, Bias: -1.196627, T: 157386, Avg. loss: 0.072673
Total training time: 54.80 seconds.
-- Epoch 52
Norm: 22.16, NNZs: 1048576, Bias: -1.191958, T: 160472, Avg. loss: 0.071895
Total training time: 55.92 seconds.
-- Epoch 53
Norm: 22.14, NNZs: 1048576, Bias: -1.194991, T: 163558, Avg. loss: 0.071137
Total training time: 57.08 seconds.
-- Epoch 54
Norm: 22.13, NNZs: 1048576, Bias: -1.187069, T: 166644, Avg. loss: 0.070408
Total training time: 58.19 seconds.
-- Epoch 55
Norm: 22.11, NNZs: 1048576, Bias: -1.188746, T: 169730, Avg. loss: 0.069708
Total training time: 59.33 seconds.
-- Epoch 56
Norm: 22.09, NNZs: 1048576, Bias: -1.189913, T: 172816, Avg. loss: 0.069034
Total training time: 60.46 seconds.
-- Epoch 57
Norm: 22.07, NNZs: 1048576, Bias: -1.187669, T: 175902, Avg. loss: 0.068387
Total training time: 61.61 seconds.
-- Epoch 58
Norm: 22.06, NNZs: 1048576, Bias: -1.186179, T: 178988, Avg. loss: 0.067761
Total training time: 62.76 seconds.
-- Epoch 59
Norm: 22.05, NNZs: 1048576, Bias: -1.183565, T: 182074, Avg. loss: 0.067155
Total training time: 63.89 seconds.
-- Epoch 60
Norm: 22.02, NNZs: 1048576, Bias: -1.183524, T: 185160, Avg. loss: 0.066566
Total training time: 65.03 seconds.
-- Epoch 61
Norm: 22.02, NNZs: 1048576, Bias: -1.179021, T: 188246, Avg. loss: 0.065997
Total training time: 66.17 seconds.
-- Epoch 62
Norm: 22.00, NNZs: 1048576, Bias: -1.180775, T: 191332, Avg. loss: 0.065453
Total training time: 67.32 seconds.
-- Epoch 63
Norm: 21.99, NNZs: 1048576, Bias: -1.180874, T: 194418, Avg. loss: 0.064920
Total training time: 68.45 seconds.
-- Epoch 64
Norm: 21.98, NNZs: 1048576, Bias: -1.177321, T: 197504, Avg. loss: 0.064407
Total training time: 69.58 seconds.
-- Epoch 65
Norm: 21.97, NNZs: 1048576, Bias: -1.177286, T: 200590, Avg. loss: 0.063905
Total training time: 70.72 seconds.
-- Epoch 66
Norm: 21.95, NNZs: 1048576, Bias: -1.179452, T: 203676, Avg. loss: 0.063414
Total training time: 71.88 seconds.
-- Epoch 67
Norm: 21.94, NNZs: 1048576, Bias: -1.177844, T: 206762, Avg. loss: 0.062946
Total training time: 73.04 seconds.
-- Epoch 68
Norm: 21.93, NNZs: 1048576, Bias: -1.177308, T: 209848, Avg. loss: 0.062490
Total training time: 74.17 seconds.
-- Epoch 69
Norm: 21.93, NNZs: 1048576, Bias: -1.171366, T: 212934, Avg. loss: 0.062047
Total training time: 75.31 seconds.
-- Epoch 70
Norm: 21.91, NNZs: 1048576, Bias: -1.170824, T: 216020, Avg. loss: 0.061619
Total training time: 76.47 seconds.
-- Epoch 71
Norm: 21.90, NNZs: 1048576, Bias: -1.171329, T: 219106, Avg. loss: 0.061197
Total training time: 77.62 seconds.
-- Epoch 72
Norm: 21.89, NNZs: 1048576, Bias: -1.170357, T: 222192, Avg. loss: 0.060791
Total training time: 78.78 seconds.
-- Epoch 73
Norm: 21.88, NNZs: 1048576, Bias: -1.169003, T: 225278, Avg. loss: 0.060394
Total training time: 79.94 seconds.
-- Epoch 74
Norm: 21.88, NNZs: 1048576, Bias: -1.166433, T: 228364, Avg. loss: 0.060003
Total training time: 81.09 seconds.
-- Epoch 75
Norm: 21.86, NNZs: 1048576, Bias: -1.168478, T: 231450, Avg. loss: 0.059626
Total training time: 82.26 seconds.
-- Epoch 76
Norm: 21.85, NNZs: 1048576, Bias: -1.168009, T: 234536, Avg. loss: 0.059260
Total training time: 83.39 seconds.
-- Epoch 77
Norm: 21.84, NNZs: 1048576, Bias: -1.166813, T: 237622, Avg. loss: 0.058897
Total training time: 84.53 seconds.
-- Epoch 78
Norm: 21.84, NNZs: 1048576, Bias: -1.165954, T: 240708, Avg. loss: 0.058549
Total training time: 85.68 seconds.
-- Epoch 79
Norm: 21.83, NNZs: 1048576, Bias: -1.164672, T: 243794, Avg. loss: 0.058208
Total training time: 86.83 seconds.
-- Epoch 80
Norm: 21.82, NNZs: 1048576, Bias: -1.164671, T: 246880, Avg. loss: 0.057877
Total training time: 87.96 seconds.
-- Epoch 81
Norm: 21.81, NNZs: 1048576, Bias: -1.163039, T: 249966, Avg. loss: 0.057553
Total training time: 89.11 seconds.
-- Epoch 82
Norm: 21.80, NNZs: 1048576, Bias: -1.162639, T: 253052, Avg. loss: 0.057236
Total training time: 90.26 seconds.
-- Epoch 83
Norm: 21.81, NNZs: 1048576, Bias: -1.160212, T: 256138, Avg. loss: 0.056926
Total training time: 91.42 seconds.
-- Epoch 84
Norm: 21.79, NNZs: 1048576, Bias: -1.161217, T: 259224, Avg. loss: 0.056628
Total training time: 92.59 seconds.
-- Epoch 85
Norm: 21.79, NNZs: 1048576, Bias: -1.159867, T: 262310, Avg. loss: 0.056336
Total training time: 93.75 seconds.
-- Epoch 86
Norm: 21.79, NNZs: 1048576, Bias: -1.157562, T: 265396, Avg. loss: 0.056050
Total training time: 94.89 seconds.
-- Epoch 87
Norm: 21.78, NNZs: 1048576, Bias: -1.158538, T: 268482, Avg. loss: 0.055770
Total training time: 96.04 seconds.
-- Epoch 88
Norm: 21.77, NNZs: 1048576, Bias: -1.158842, T: 271568, Avg. loss: 0.055492
Total training time: 97.19 seconds.
-- Epoch 89
Norm: 21.77, NNZs: 1048576, Bias: -1.155767, T: 274654, Avg. loss: 0.055223
Total training time: 98.36 seconds.
-- Epoch 90
Norm: 21.76, NNZs: 1048576, Bias: -1.155814, T: 277740, Avg. loss: 0.054962
Total training time: 99.54 seconds.
-- Epoch 91
Norm: 21.75, NNZs: 1048576, Bias: -1.154413, T: 280826, Avg. loss: 0.054706
Total training time: 100.70 seconds.
-- Epoch 92
Norm: 21.75, NNZs: 1048576, Bias: -1.154173, T: 283912, Avg. loss: 0.054454
Total training time: 101.87 seconds.
-- Epoch 93
Norm: 21.74, NNZs: 1048576, Bias: -1.154553, T: 286998, Avg. loss: 0.054209
Total training time: 103.04 seconds.
-- Epoch 94
Norm: 21.74, NNZs: 1048576, Bias: -1.152786, T: 290084, Avg. loss: 0.053967
Total training time: 104.19 seconds.
-- Epoch 95
Norm: 21.73, NNZs: 1048576, Bias: -1.152330, T: 293170, Avg. loss: 0.053734
Total training time: 105.52 seconds.
-- Epoch 96
Norm: 21.73, NNZs: 1048576, Bias: -1.149618, T: 296256, Avg. loss: 0.053503
Total training time: 106.66 seconds.
-- Epoch 97
Norm: 21.72, NNZs: 1048576, Bias: -1.151733, T: 299342, Avg. loss: 0.053276
Total training time: 107.86 seconds.
-- Epoch 98
Norm: 21.72, NNZs: 1048576, Bias: -1.150719, T: 302428, Avg. loss: 0.053054
Total training time: 108.99 seconds.
-- Epoch 99
Norm: 21.71, NNZs: 1048576, Bias: -1.150707, T: 305514, Avg. loss: 0.052835
Total training time: 110.18 seconds.
-- Epoch 100
Norm: 21.71, NNZs: 1048576, Bias: -1.149837, T: 308600, Avg. loss: 0.052620
Total training time: 111.32 seconds.
-- Epoch 1
Norm: 48.76, NNZs: 268410, Bias: -1.094205, T: 3086, Avg. loss: 0.362955
Total training time: 0.85 seconds.
-- Epoch 2
Norm: 33.05, NNZs: 660020, Bias: -1.167910, T: 6172, Avg. loss: 0.209077
Total training time: 1.69 seconds.
-- Epoch 3
Norm: 24.03, NNZs: 675065, Bias: -1.205391, T: 9258, Avg. loss: 0.146811
Total training time: 2.54 seconds.
-- Epoch 4
Norm: 19.77, NNZs: 679990, Bias: -1.204209, T: 12344, Avg. loss: 0.113609
Total training time: 3.38 seconds.
-- Epoch 5
Norm: 17.30, NNZs: 690045, Bias: -1.172828, T: 15430, Avg. loss: 0.092479
Total training time: 4.22 seconds.
-- Epoch 6
Norm: 15.84, NNZs: 761212, Bias: -1.156251, T: 18516, Avg. loss: 0.078776
Total training time: 5.07 seconds.
-- Epoch 7
Norm: 14.75, NNZs: 885135, Bias: -1.150141, T: 21602, Avg. loss: 0.068553
Total training time: 5.93 seconds.
-- Epoch 8
Norm: 13.91, NNZs: 906604, Bias: -1.151863, T: 24688, Avg. loss: 0.060850
Total training time: 6.78 seconds.
-- Epoch 9
Norm: 13.49, NNZs: 972284, Bias: -1.133839, T: 27774, Avg. loss: 0.054896
Total training time: 7.64 seconds.
-- Epoch 10
Norm: 13.16, NNZs: 975230, Bias: -1.132622, T: 30860, Avg. loss: 0.050122
Total training time: 8.51 seconds.
-- Epoch 11
Norm: 12.83, NNZs: 981227, Bias: -1.122867, T: 33946, Avg. loss: 0.046129
Total training time: 9.37 seconds.
-- Epoch 12
Norm: 12.59, NNZs: 989720, Bias: -1.118108, T: 37032, Avg. loss: 0.042729
Total training time: 10.24 seconds.
-- Epoch 13
Norm: 12.35, NNZs: 992333, Bias: -1.116211, T: 40118, Avg. loss: 0.039956
Total training time: 11.11 seconds.
-- Epoch 14
Norm: 12.09, NNZs: 1004857, Bias: -1.114919, T: 43204, Avg. loss: 0.037554
Total training time: 11.99 seconds.
-- Epoch 15
Norm: 11.98, NNZs: 1005807, Bias: -1.109148, T: 46290, Avg. loss: 0.035521
Total training time: 12.87 seconds.
-- Epoch 16
Norm: 11.84, NNZs: 1005916, Bias: -1.107373, T: 49376, Avg. loss: 0.033679
Total training time: 13.74 seconds.
-- Epoch 17
Norm: 11.84, NNZs: 1007510, Bias: -1.103772, T: 52462, Avg. loss: 0.032053
Total training time: 14.63 seconds.
-- Epoch 18
Norm: 11.74, NNZs: 1008107, Bias: -1.103243, T: 55548, Avg. loss: 0.030628
Total training time: 15.50 seconds.
-- Epoch 19
Norm: 11.66, NNZs: 1008139, Bias: -1.098769, T: 58634, Avg. loss: 0.029344
Total training time: 16.37 seconds.
-- Epoch 20
Norm: 11.56, NNZs: 1008275, Bias: -1.096136, T: 61720, Avg. loss: 0.028188
Total training time: 17.24 seconds.
-- Epoch 21
Norm: 11.54, NNZs: 1008559, Bias: -1.094597, T: 64806, Avg. loss: 0.027147
Total training time: 18.12 seconds.
-- Epoch 22
Norm: 11.46, NNZs: 1008668, Bias: -1.093778, T: 67892, Avg. loss: 0.026173
Total training time: 19.00 seconds.
-- Epoch 23
Norm: 11.45, NNZs: 1011582, Bias: -1.091468, T: 70978, Avg. loss: 0.025290
Total training time: 19.89 seconds.
-- Epoch 24
Norm: 11.43, NNZs: 1011626, Bias: -1.090222, T: 74064, Avg. loss: 0.024490
Total training time: 20.77 seconds.
-- Epoch 25
Norm: 11.36, NNZs: 1011682, Bias: -1.091281, T: 77150, Avg. loss: 0.023742
Total training time: 21.66 seconds.
-- Epoch 26
Norm: 11.38, NNZs: 1011705, Bias: -1.088688, T: 80236, Avg. loss: 0.023066
Total training time: 22.55 seconds.
-- Epoch 27
Norm: 11.35, NNZs: 1011719, Bias: -1.087146, T: 83322, Avg. loss: 0.022429
Total training time: 23.42 seconds.
-- Epoch 28
Norm: 11.30, NNZs: 1011729, Bias: -1.085678, T: 86408, Avg. loss: 0.021849
Total training time: 24.31 seconds.
-- Epoch 29
Norm: 11.27, NNZs: 1011787, Bias: -1.085264, T: 89494, Avg. loss: 0.021303
Total training time: 25.19 seconds.
-- Epoch 30
Norm: 11.22, NNZs: 1011806, Bias: -1.086529, T: 92580, Avg. loss: 0.020788
Total training time: 26.08 seconds.
-- Epoch 31
Norm: 11.23, NNZs: 1011835, Bias: -1.084689, T: 95666, Avg. loss: 0.020313
Total training time: 26.97 seconds.
-- Epoch 32
Norm: 11.20, NNZs: 1011888, Bias: -1.082472, T: 98752, Avg. loss: 0.019863
Total training time: 27.84 seconds.
-- Epoch 33
Norm: 11.18, NNZs: 1011918, Bias: -1.081300, T: 101838, Avg. loss: 0.019440
Total training time: 28.73 seconds.
-- Epoch 34
Norm: 11.20, NNZs: 1012018, Bias: -1.078283, T: 104924, Avg. loss: 0.019045
Total training time: 29.63 seconds.
-- Epoch 35
Norm: 11.14, NNZs: 1012065, Bias: -1.081106, T: 108010, Avg. loss: 0.018655
Total training time: 30.52 seconds.
-- Epoch 36
Norm: 11.16, NNZs: 1012068, Bias: -1.078816, T: 111096, Avg. loss: 0.018308
Total training time: 31.40 seconds.
-- Epoch 37
Norm: 11.17, NNZs: 1012082, Bias: -1.075873, T: 114182, Avg. loss: 0.017968
Total training time: 32.29 seconds.
-- Epoch 38
Norm: 11.13, NNZs: 1012090, Bias: -1.077820, T: 117268, Avg. loss: 0.017653
Total training time: 33.18 seconds.
-- Epoch 39
Norm: 11.15, NNZs: 1012094, Bias: -1.074639, T: 120354, Avg. loss: 0.017351
Total training time: 34.07 seconds.
-- Epoch 40
Norm: 11.13, NNZs: 1012094, Bias: -1.075721, T: 123440, Avg. loss: 0.017064
Total training time: 34.96 seconds.
-- Epoch 41
Norm: 11.09, NNZs: 1012144, Bias: -1.077111, T: 126526, Avg. loss: 0.016793
Total training time: 35.85 seconds.
-- Epoch 42
Norm: 11.08, NNZs: 1012145, Bias: -1.073466, T: 129612, Avg. loss: 0.016535
Total training time: 36.73 seconds.
-- Epoch 43
Norm: 11.07, NNZs: 1012153, Bias: -1.073860, T: 132698, Avg. loss: 0.016288
Total training time: 37.63 seconds.
-- Epoch 44
Norm: 11.05, NNZs: 1012182, Bias: -1.073622, T: 135784, Avg. loss: 0.016050
Total training time: 38.53 seconds.
-- Epoch 45
Norm: 11.06, NNZs: 1012200, Bias: -1.072512, T: 138870, Avg. loss: 0.015823
Total training time: 39.43 seconds.
-- Epoch 46
Norm: 11.07, NNZs: 1012202, Bias: -1.069087, T: 141956, Avg. loss: 0.015606
Total training time: 40.32 seconds.
-- Epoch 47
Norm: 11.02, NNZs: 1012202, Bias: -1.072562, T: 145042, Avg. loss: 0.015396
Total training time: 41.22 seconds.
-- Epoch 48
Norm: 11.05, NNZs: 1012202, Bias: -1.070236, T: 148128, Avg. loss: 0.015200
Total training time: 42.12 seconds.
-- Epoch 49
Norm: 11.02, NNZs: 1012202, Bias: -1.070622, T: 151214, Avg. loss: 0.015002
Total training time: 43.01 seconds.
-- Epoch 50
Norm: 11.02, NNZs: 1012256, Bias: -1.070181, T: 154300, Avg. loss: 0.014818
Total training time: 43.91 seconds.
-- Epoch 51
Norm: 11.02, NNZs: 1012256, Bias: -1.069047, T: 157386, Avg. loss: 0.014642
Total training time: 44.80 seconds.
-- Epoch 52
Norm: 11.02, NNZs: 1012257, Bias: -1.069103, T: 160472, Avg. loss: 0.014473
Total training time: 45.70 seconds.
-- Epoch 53
Norm: 11.00, NNZs: 1012257, Bias: -1.068669, T: 163558, Avg. loss: 0.014307
Total training time: 46.59 seconds.
-- Epoch 54
Norm: 11.02, NNZs: 1012257, Bias: -1.066491, T: 166644, Avg. loss: 0.014148
Total training time: 47.48 seconds.
-- Epoch 55
Norm: 10.99, NNZs: 1012257, Bias: -1.066976, T: 169730, Avg. loss: 0.013997
Total training time: 48.38 seconds.
-- Epoch 56
Norm: 10.99, NNZs: 1012257, Bias: -1.064913, T: 172816, Avg. loss: 0.013851
Total training time: 49.27 seconds.
-- Epoch 57
Norm: 10.98, NNZs: 1012259, Bias: -1.066820, T: 175902, Avg. loss: 0.013712
Total training time: 50.18 seconds.
-- Epoch 58
Norm: 10.99, NNZs: 1012259, Bias: -1.064707, T: 178988, Avg. loss: 0.013575
Total training time: 51.08 seconds.
-- Epoch 59
Norm: 11.02, NNZs: 1012276, Bias: -1.061418, T: 182074, Avg. loss: 0.013442
Total training time: 51.98 seconds.
-- Epoch 60
Norm: 11.01, NNZs: 1012286, Bias: -1.063053, T: 185160, Avg. loss: 0.013314
Total training time: 52.88 seconds.
-- Epoch 61
Norm: 11.00, NNZs: 1012286, Bias: -1.063182, T: 188246, Avg. loss: 0.013190
Total training time: 53.77 seconds.
-- Epoch 62
Norm: 10.98, NNZs: 1012286, Bias: -1.062385, T: 191332, Avg. loss: 0.013073
Total training time: 54.67 seconds.
-- Epoch 63
Norm: 11.00, NNZs: 1012290, Bias: -1.061551, T: 194418, Avg. loss: 0.012954
Total training time: 55.57 seconds.
-- Epoch 64
Norm: 10.97, NNZs: 1012296, Bias: -1.062428, T: 197504, Avg. loss: 0.012841
Total training time: 56.47 seconds.
-- Epoch 65
Norm: 10.98, NNZs: 1012296, Bias: -1.062294, T: 200590, Avg. loss: 0.012733
Total training time: 57.38 seconds.
-- Epoch 66
Norm: 10.99, NNZs: 1012311, Bias: -1.061549, T: 203676, Avg. loss: 0.012626
Total training time: 58.27 seconds.
-- Epoch 67
Norm: 10.97, NNZs: 1012320, Bias: -1.061085, T: 206762, Avg. loss: 0.012525
Total training time: 59.17 seconds.
-- Epoch 68
Norm: 10.97, NNZs: 1012320, Bias: -1.060694, T: 209848, Avg. loss: 0.012425
Total training time: 60.08 seconds.
-- Epoch 69
Norm: 10.98, NNZs: 1012324, Bias: -1.059666, T: 212934, Avg. loss: 0.012327
Total training time: 60.98 seconds.
-- Epoch 70
Norm: 10.97, NNZs: 1012324, Bias: -1.059192, T: 216020, Avg. loss: 0.012234
Total training time: 61.89 seconds.
-- Epoch 71
Norm: 10.96, NNZs: 1012324, Bias: -1.059816, T: 219106, Avg. loss: 0.012143
Total training time: 62.79 seconds.
-- Epoch 72
Norm: 10.96, NNZs: 1012325, Bias: -1.059340, T: 222192, Avg. loss: 0.012054
Total training time: 63.69 seconds.
-- Epoch 73
Norm: 10.96, NNZs: 1012330, Bias: -1.058963, T: 225278, Avg. loss: 0.011968
Total training time: 64.59 seconds.
-- Epoch 74
Norm: 10.97, NNZs: 1012351, Bias: -1.057695, T: 228364, Avg. loss: 0.011884
Total training time: 65.50 seconds.
-- Epoch 75
Norm: 10.96, NNZs: 1012351, Bias: -1.058323, T: 231450, Avg. loss: 0.011802
Total training time: 66.41 seconds.
-- Epoch 76
Norm: 10.95, NNZs: 1012351, Bias: -1.057632, T: 234536, Avg. loss: 0.011722
Total training time: 67.30 seconds.
-- Epoch 77
Norm: 10.94, NNZs: 1012351, Bias: -1.058062, T: 237622, Avg. loss: 0.011642
Total training time: 68.21 seconds.
-- Epoch 78
Norm: 10.95, NNZs: 1012351, Bias: -1.056597, T: 240708, Avg. loss: 0.011567
Total training time: 69.11 seconds.
-- Epoch 79
Norm: 10.93, NNZs: 1012351, Bias: -1.057815, T: 243794, Avg. loss: 0.011493
Total training time: 70.02 seconds.
-- Epoch 80
Norm: 10.95, NNZs: 1012352, Bias: -1.055877, T: 246880, Avg. loss: 0.011421
Total training time: 70.92 seconds.
-- Epoch 81
Norm: 10.93, NNZs: 1012358, Bias: -1.057903, T: 249966, Avg. loss: 0.011349
Total training time: 71.84 seconds.
-- Epoch 82
Norm: 10.96, NNZs: 1012358, Bias: -1.054306, T: 253052, Avg. loss: 0.011279
Total training time: 72.73 seconds.
-- Epoch 83
Norm: 10.93, NNZs: 1012358, Bias: -1.056532, T: 256138, Avg. loss: 0.011213
Total training time: 73.64 seconds.
-- Epoch 84
Norm: 10.94, NNZs: 1012358, Bias: -1.054781, T: 259224, Avg. loss: 0.011147
Total training time: 74.54 seconds.
-- Epoch 85
Norm: 10.93, NNZs: 1012358, Bias: -1.055801, T: 262310, Avg. loss: 0.011083
Total training time: 75.45 seconds.
-- Epoch 86
Norm: 10.93, NNZs: 1012358, Bias: -1.055910, T: 265396, Avg. loss: 0.011020
Total training time: 76.36 seconds.
-- Epoch 87
Norm: 10.93, NNZs: 1012358, Bias: -1.054639, T: 268482, Avg. loss: 0.010959
Total training time: 77.25 seconds.
-- Epoch 88
Norm: 10.93, NNZs: 1012358, Bias: -1.054624, T: 271568, Avg. loss: 0.010899
Total training time: 78.16 seconds.
-- Epoch 89
Norm: 10.93, NNZs: 1012431, Bias: -1.054827, T: 274654, Avg. loss: 0.010840
Total training time: 79.06 seconds.
-- Epoch 90
Norm: 10.92, NNZs: 1012431, Bias: -1.053167, T: 277740, Avg. loss: 0.010783
Total training time: 79.96 seconds.
-- Epoch 91
Norm: 10.92, NNZs: 1012432, Bias: -1.054808, T: 280826, Avg. loss: 0.010727
Total training time: 80.86 seconds.
-- Epoch 92
Norm: 10.92, NNZs: 1012432, Bias: -1.053843, T: 283912, Avg. loss: 0.010673
Total training time: 81.77 seconds.
-- Epoch 93
Norm: 10.90, NNZs: 1012432, Bias: -1.054278, T: 286998, Avg. loss: 0.010619
Total training time: 82.67 seconds.
-- Epoch 94
Norm: 10.92, NNZs: 1012432, Bias: -1.052728, T: 290084, Avg. loss: 0.010567
Total training time: 83.58 seconds.
-- Epoch 95
Norm: 10.92, NNZs: 1012432, Bias: -1.052724, T: 293170, Avg. loss: 0.010516
Total training time: 84.48 seconds.
-- Epoch 96
Norm: 10.92, NNZs: 1012432, Bias: -1.052559, T: 296256, Avg. loss: 0.010466
Total training time: 85.38 seconds.
-- Epoch 97
Norm: 10.91, NNZs: 1012432, Bias: -1.052324, T: 299342, Avg. loss: 0.010417
Total training time: 86.29 seconds.
-- Epoch 98
Norm: 10.91, NNZs: 1012432, Bias: -1.051564, T: 302428, Avg. loss: 0.010369
Total training time: 87.19 seconds.
-- Epoch 99
Norm: 10.92, NNZs: 1012434, Bias: -1.051132, T: 305514, Avg. loss: 0.010322
Total training time: 88.10 seconds.
-- Epoch 100
Norm: 10.92, NNZs: 1012438, Bias: -1.051177, T: 308600, Avg. loss: 0.010275
Total training time: 89.00 seconds.
-- Epoch 1
Norm: 43.84, NNZs: 919589, Bias: -1.297817, T: 3086, Avg. loss: 0.441649
Total training time: 0.88 seconds.
-- Epoch 2
Norm: 29.46, NNZs: 969207, Bias: -1.640113, T: 6172, Avg. loss: 0.296224
Total training time: 1.75 seconds.
-- Epoch 3
Norm: 24.28, NNZs: 1025457, Bias: -1.689444, T: 9258, Avg. loss: 0.220149
Total training time: 2.63 seconds.
-- Epoch 4
Norm: 20.41, NNZs: 1046898, Bias: -1.730356, T: 12344, Avg. loss: 0.175269
Total training time: 3.52 seconds.
-- Epoch 5
Norm: 18.64, NNZs: 1048046, Bias: -1.704498, T: 15430, Avg. loss: 0.145320
Total training time: 4.41 seconds.
-- Epoch 6
Norm: 16.94, NNZs: 1048096, Bias: -1.722691, T: 18516, Avg. loss: 0.124282
Total training time: 5.30 seconds.
-- Epoch 7
Norm: 16.01, NNZs: 1048454, Bias: -1.725472, T: 21602, Avg. loss: 0.109577
Total training time: 6.22 seconds.
-- Epoch 8
Norm: 15.21, NNZs: 1048496, Bias: -1.736268, T: 24688, Avg. loss: 0.098590
Total training time: 7.12 seconds.
-- Epoch 9
Norm: 14.61, NNZs: 1048546, Bias: -1.739190, T: 27774, Avg. loss: 0.089462
Total training time: 8.04 seconds.
-- Epoch 10
Norm: 14.00, NNZs: 1048554, Bias: -1.756302, T: 30860, Avg. loss: 0.082054
Total training time: 8.96 seconds.
-- Epoch 11
Norm: 13.69, NNZs: 1048556, Bias: -1.750957, T: 33946, Avg. loss: 0.075992
Total training time: 9.87 seconds.
-- Epoch 12
Norm: 13.31, NNZs: 1048559, Bias: -1.758947, T: 37032, Avg. loss: 0.070978
Total training time: 10.80 seconds.
-- Epoch 13
Norm: 13.24, NNZs: 1048562, Bias: -1.751330, T: 40118, Avg. loss: 0.066614
Total training time: 11.73 seconds.
-- Epoch 14
Norm: 12.96, NNZs: 1048564, Bias: -1.754893, T: 43204, Avg. loss: 0.062952
Total training time: 12.65 seconds.
-- Epoch 15
Norm: 12.62, NNZs: 1048568, Bias: -1.768599, T: 46290, Avg. loss: 0.059723
Total training time: 13.57 seconds.
-- Epoch 16
Norm: 12.54, NNZs: 1048568, Bias: -1.762690, T: 49376, Avg. loss: 0.056876
Total training time: 14.49 seconds.
-- Epoch 17
Norm: 12.49, NNZs: 1048571, Bias: -1.761090, T: 52462, Avg. loss: 0.054365
Total training time: 15.43 seconds.
-- Epoch 18
Norm: 12.42, NNZs: 1048571, Bias: -1.761539, T: 55548, Avg. loss: 0.052132
Total training time: 16.36 seconds.
-- Epoch 19
Norm: 12.21, NNZs: 1048571, Bias: -1.770177, T: 58634, Avg. loss: 0.050096
Total training time: 17.32 seconds.
-- Epoch 20
Norm: 12.27, NNZs: 1048573, Bias: -1.763100, T: 61720, Avg. loss: 0.048242
Total training time: 18.25 seconds.
-- Epoch 21
Norm: 12.17, NNZs: 1048574, Bias: -1.766244, T: 64806, Avg. loss: 0.046558
Total training time: 19.20 seconds.
-- Epoch 22
Norm: 12.05, NNZs: 1048574, Bias: -1.769099, T: 67892, Avg. loss: 0.045051
Total training time: 20.14 seconds.
-- Epoch 23
Norm: 12.00, NNZs: 1048574, Bias: -1.772379, T: 70978, Avg. loss: 0.043659
Total training time: 21.09 seconds.
-- Epoch 24
Norm: 11.98, NNZs: 1048574, Bias: -1.769875, T: 74064, Avg. loss: 0.042404
Total training time: 22.02 seconds.
-- Epoch 25
Norm: 11.86, NNZs: 1048575, Bias: -1.772895, T: 77150, Avg. loss: 0.041256
Total training time: 22.96 seconds.
-- Epoch 26
Norm: 11.82, NNZs: 1048575, Bias: -1.773614, T: 80236, Avg. loss: 0.040158
Total training time: 23.93 seconds.
-- Epoch 27
Norm: 11.75, NNZs: 1048575, Bias: -1.778131, T: 83322, Avg. loss: 0.039158
Total training time: 25.06 seconds.
-- Epoch 28
Norm: 11.79, NNZs: 1048575, Bias: -1.772220, T: 86408, Avg. loss: 0.038237
Total training time: 26.01 seconds.
-- Epoch 29
Norm: 11.69, NNZs: 1048575, Bias: -1.778704, T: 89494, Avg. loss: 0.037344
Total training time: 26.95 seconds.
-- Epoch 30
Norm: 11.71, NNZs: 1048575, Bias: -1.776435, T: 92580, Avg. loss: 0.036535
Total training time: 27.90 seconds.
-- Epoch 31
Norm: 11.65, NNZs: 1048575, Bias: -1.777427, T: 95666, Avg. loss: 0.035777
Total training time: 28.84 seconds.
-- Epoch 32
Norm: 11.66, NNZs: 1048576, Bias: -1.776208, T: 98752, Avg. loss: 0.035040
Total training time: 29.77 seconds.
-- Epoch 33
Norm: 11.61, NNZs: 1048576, Bias: -1.778061, T: 101838, Avg. loss: 0.034373
Total training time: 30.73 seconds.
-- Epoch 34
Norm: 11.61, NNZs: 1048576, Bias: -1.778642, T: 104924, Avg. loss: 0.033723
Total training time: 31.67 seconds.
-- Epoch 35
Norm: 11.51, NNZs: 1048576, Bias: -1.784494, T: 108010, Avg. loss: 0.033128
Total training time: 32.66 seconds.
-- Epoch 36
Norm: 11.50, NNZs: 1048576, Bias: -1.783897, T: 111096, Avg. loss: 0.032564
Total training time: 33.60 seconds.
-- Epoch 37
Norm: 11.50, NNZs: 1048576, Bias: -1.783137, T: 114182, Avg. loss: 0.032034
Total training time: 34.55 seconds.
-- Epoch 38
Norm: 11.46, NNZs: 1048576, Bias: -1.786509, T: 117268, Avg. loss: 0.031518
Total training time: 35.51 seconds.
-- Epoch 39
Norm: 11.48, NNZs: 1048576, Bias: -1.783387, T: 120354, Avg. loss: 0.031029
Total training time: 36.47 seconds.
-- Epoch 40
Norm: 11.49, NNZs: 1048576, Bias: -1.782077, T: 123440, Avg. loss: 0.030564
Total training time: 37.46 seconds.
-- Epoch 41
Norm: 11.46, NNZs: 1048576, Bias: -1.782465, T: 126526, Avg. loss: 0.030129
Total training time: 38.39 seconds.
-- Epoch 42
Norm: 11.39, NNZs: 1048576, Bias: -1.788345, T: 129612, Avg. loss: 0.029710
Total training time: 39.36 seconds.
-- Epoch 43
Norm: 11.41, NNZs: 1048576, Bias: -1.785744, T: 132698, Avg. loss: 0.029313
Total training time: 40.29 seconds.
-- Epoch 44
Norm: 11.44, NNZs: 1048576, Bias: -1.781543, T: 135784, Avg. loss: 0.028928
Total training time: 41.24 seconds.
-- Epoch 45
Norm: 11.34, NNZs: 1048576, Bias: -1.787866, T: 138870, Avg. loss: 0.028564
Total training time: 42.20 seconds.
-- Epoch 46
Norm: 11.35, NNZs: 1048576, Bias: -1.786659, T: 141956, Avg. loss: 0.028216
Total training time: 43.15 seconds.
-- Epoch 47
Norm: 11.31, NNZs: 1048576, Bias: -1.789866, T: 145042, Avg. loss: 0.027884
Total training time: 44.11 seconds.
-- Epoch 48
Norm: 11.32, NNZs: 1048576, Bias: -1.787866, T: 148128, Avg. loss: 0.027566
Total training time: 45.07 seconds.
-- Epoch 49
Norm: 11.31, NNZs: 1048576, Bias: -1.788340, T: 151214, Avg. loss: 0.027259
Total training time: 46.03 seconds.
-- Epoch 50
Norm: 11.34, NNZs: 1048576, Bias: -1.785057, T: 154300, Avg. loss: 0.026960
Total training time: 47.00 seconds.
-- Epoch 51
Norm: 11.26, NNZs: 1048576, Bias: -1.790213, T: 157386, Avg. loss: 0.026673
Total training time: 47.95 seconds.
-- Epoch 52
Norm: 11.26, NNZs: 1048576, Bias: -1.791161, T: 160472, Avg. loss: 0.026398
Total training time: 48.94 seconds.
-- Epoch 53
Norm: 11.24, NNZs: 1048576, Bias: -1.791119, T: 163558, Avg. loss: 0.026133
Total training time: 49.90 seconds.
-- Epoch 54
Norm: 11.23, NNZs: 1048576, Bias: -1.791721, T: 166644, Avg. loss: 0.025877
Total training time: 50.86 seconds.
-- Epoch 55
Norm: 11.24, NNZs: 1048576, Bias: -1.789849, T: 169730, Avg. loss: 0.025630
Total training time: 51.82 seconds.
-- Epoch 56
Norm: 11.22, NNZs: 1048576, Bias: -1.792224, T: 172816, Avg. loss: 0.025393
Total training time: 52.80 seconds.
-- Epoch 57
Norm: 11.23, NNZs: 1048576, Bias: -1.790593, T: 175902, Avg. loss: 0.025168
Total training time: 53.77 seconds.
-- Epoch 58
Norm: 11.24, NNZs: 1048576, Bias: -1.790185, T: 178988, Avg. loss: 0.024945
Total training time: 54.74 seconds.
-- Epoch 59
Norm: 11.21, NNZs: 1048576, Bias: -1.790586, T: 182074, Avg. loss: 0.024732
Total training time: 55.69 seconds.
-- Epoch 60
Norm: 11.20, NNZs: 1048576, Bias: -1.790925, T: 185160, Avg. loss: 0.024526
Total training time: 56.63 seconds.
-- Epoch 61
Norm: 11.21, NNZs: 1048576, Bias: -1.791219, T: 188246, Avg. loss: 0.024324
Total training time: 57.61 seconds.
-- Epoch 62
Norm: 11.20, NNZs: 1048576, Bias: -1.790609, T: 191332, Avg. loss: 0.024127
Total training time: 58.55 seconds.
-- Epoch 63
Norm: 11.19, NNZs: 1048576, Bias: -1.791681, T: 194418, Avg. loss: 0.023938
Total training time: 59.55 seconds.
-- Epoch 64
Norm: 11.17, NNZs: 1048576, Bias: -1.792692, T: 197504, Avg. loss: 0.023757
Total training time: 60.51 seconds.
-- Epoch 65
Norm: 11.18, NNZs: 1048576, Bias: -1.792899, T: 200590, Avg. loss: 0.023580
Total training time: 61.47 seconds.
-- Epoch 66
Norm: 11.14, NNZs: 1048576, Bias: -1.794442, T: 203676, Avg. loss: 0.023406
Total training time: 62.44 seconds.
-- Epoch 67
Norm: 11.13, NNZs: 1048576, Bias: -1.795308, T: 206762, Avg. loss: 0.023238
Total training time: 63.39 seconds.
-- Epoch 68
Norm: 11.14, NNZs: 1048576, Bias: -1.794319, T: 209848, Avg. loss: 0.023078
Total training time: 64.36 seconds.
-- Epoch 69
Norm: 11.13, NNZs: 1048576, Bias: -1.793882, T: 212934, Avg. loss: 0.022922
Total training time: 65.32 seconds.
-- Epoch 70
Norm: 11.15, NNZs: 1048576, Bias: -1.793390, T: 216020, Avg. loss: 0.022770
Total training time: 66.28 seconds.
-- Epoch 71
Norm: 11.13, NNZs: 1048576, Bias: -1.794557, T: 219106, Avg. loss: 0.022621
Total training time: 67.28 seconds.
-- Epoch 72
Norm: 11.12, NNZs: 1048576, Bias: -1.794278, T: 222192, Avg. loss: 0.022477
Total training time: 68.23 seconds.
-- Epoch 73
Norm: 11.10, NNZs: 1048576, Bias: -1.797008, T: 225278, Avg. loss: 0.022334
Total training time: 69.24 seconds.
-- Epoch 74
Norm: 11.14, NNZs: 1048576, Bias: -1.792744, T: 228364, Avg. loss: 0.022198
Total training time: 70.18 seconds.
-- Epoch 75
Norm: 11.12, NNZs: 1048576, Bias: -1.794690, T: 231450, Avg. loss: 0.022063
Total training time: 71.16 seconds.
-- Epoch 76
Norm: 11.12, NNZs: 1048576, Bias: -1.795159, T: 234536, Avg. loss: 0.021934
Total training time: 72.17 seconds.
-- Epoch 77
Norm: 11.13, NNZs: 1048576, Bias: -1.793626, T: 237622, Avg. loss: 0.021806
Total training time: 73.12 seconds.
-- Epoch 78
Norm: 11.09, NNZs: 1048576, Bias: -1.797215, T: 240708, Avg. loss: 0.021680
Total training time: 74.12 seconds.
-- Epoch 79
Norm: 11.09, NNZs: 1048576, Bias: -1.796140, T: 243794, Avg. loss: 0.021559
Total training time: 75.06 seconds.
-- Epoch 80
Norm: 11.11, NNZs: 1048576, Bias: -1.795799, T: 246880, Avg. loss: 0.021441
Total training time: 76.04 seconds.
-- Epoch 81
Norm: 11.11, NNZs: 1048576, Bias: -1.795470, T: 249966, Avg. loss: 0.021326
Total training time: 77.00 seconds.
-- Epoch 82
Norm: 11.08, NNZs: 1048576, Bias: -1.797073, T: 253052, Avg. loss: 0.021214
Total training time: 77.98 seconds.
-- Epoch 83
Norm: 11.08, NNZs: 1048576, Bias: -1.797214, T: 256138, Avg. loss: 0.021102
Total training time: 78.93 seconds.
-- Epoch 84
Norm: 11.08, NNZs: 1048576, Bias: -1.797635, T: 259224, Avg. loss: 0.020996
Total training time: 79.92 seconds.
-- Epoch 85
Norm: 11.06, NNZs: 1048576, Bias: -1.798996, T: 262310, Avg. loss: 0.020890
Total training time: 80.88 seconds.
-- Epoch 86
Norm: 11.07, NNZs: 1048576, Bias: -1.797014, T: 265396, Avg. loss: 0.020789
Total training time: 81.83 seconds.
-- Epoch 87
Norm: 11.08, NNZs: 1048576, Bias: -1.797395, T: 268482, Avg. loss: 0.020689
Total training time: 82.84 seconds.
-- Epoch 88
Norm: 11.09, NNZs: 1048576, Bias: -1.796144, T: 271568, Avg. loss: 0.020591
Total training time: 83.79 seconds.
-- Epoch 89
Norm: 11.06, NNZs: 1048576, Bias: -1.798225, T: 274654, Avg. loss: 0.020496
Total training time: 84.77 seconds.
-- Epoch 90
Norm: 11.06, NNZs: 1048576, Bias: -1.797923, T: 277740, Avg. loss: 0.020403
Total training time: 85.75 seconds.
-- Epoch 91
Norm: 11.06, NNZs: 1048576, Bias: -1.797942, T: 280826, Avg. loss: 0.020312
Total training time: 86.75 seconds.
-- Epoch 92
Norm: 11.06, NNZs: 1048576, Bias: -1.797976, T: 283912, Avg. loss: 0.020221
Total training time: 87.71 seconds.
-- Epoch 93
Norm: 11.06, NNZs: 1048576, Bias: -1.797813, T: 286998, Avg. loss: 0.020134
Total training time: 88.68 seconds.
-- Epoch 94
Norm: 11.05, NNZs: 1048576, Bias: -1.798804, T: 290084, Avg. loss: 0.020048
Total training time: 89.66 seconds.
-- Epoch 95
Norm: 11.04, NNZs: 1048576, Bias: -1.798956, T: 293170, Avg. loss: 0.019965
Total training time: 90.64 seconds.
-- Epoch 96
Norm: 11.04, NNZs: 1048576, Bias: -1.798607, T: 296256, Avg. loss: 0.019882
Total training time: 91.60 seconds.
-- Epoch 97
Norm: 11.03, NNZs: 1048576, Bias: -1.799461, T: 299342, Avg. loss: 0.019802
Total training time: 92.58 seconds.
-- Epoch 98
Norm: 11.02, NNZs: 1048576, Bias: -1.799976, T: 302428, Avg. loss: 0.019723
Total training time: 93.55 seconds.
-- Epoch 99
Norm: 11.02, NNZs: 1048576, Bias: -1.800288, T: 305514, Avg. loss: 0.019646
Total training time: 94.52 seconds.
-- Epoch 100
Norm: 11.04, NNZs: 1048576, Bias: -1.798479, T: 308600, Avg. loss: 0.019569
Total training time: 95.47 seconds.
-- Epoch 1
Norm: 42.77, NNZs: 969992, Bias: -1.237836, T: 3086, Avg. loss: 0.295260
Total training time: 0.87 seconds.
-- Epoch 2
Norm: 28.80, NNZs: 1019663, Bias: -1.193088, T: 6172, Avg. loss: 0.178148
Total training time: 1.74 seconds.
-- Epoch 3
Norm: 22.54, NNZs: 1035747, Bias: -1.152668, T: 9258, Avg. loss: 0.126980
Total training time: 2.61 seconds.
-- Epoch 4
Norm: 18.84, NNZs: 1037201, Bias: -1.116101, T: 12344, Avg. loss: 0.101564
Total training time: 3.47 seconds.
-- Epoch 5
Norm: 16.30, NNZs: 1038876, Bias: -1.107627, T: 15430, Avg. loss: 0.083704
Total training time: 4.34 seconds.
-- Epoch 6
Norm: 14.74, NNZs: 1040330, Bias: -1.065213, T: 18516, Avg. loss: 0.071320
Total training time: 5.21 seconds.
-- Epoch 7
Norm: 13.76, NNZs: 1045559, Bias: -1.046965, T: 21602, Avg. loss: 0.062910
Total training time: 6.11 seconds.
-- Epoch 8
Norm: 12.94, NNZs: 1046515, Bias: -1.041284, T: 24688, Avg. loss: 0.056206
Total training time: 7.01 seconds.
-- Epoch 9
Norm: 12.53, NNZs: 1048216, Bias: -1.031964, T: 27774, Avg. loss: 0.050895
Total training time: 7.92 seconds.
-- Epoch 10
Norm: 12.09, NNZs: 1048277, Bias: -1.017811, T: 30860, Avg. loss: 0.046488
Total training time: 8.81 seconds.
-- Epoch 11
Norm: 11.67, NNZs: 1048313, Bias: -1.026327, T: 33946, Avg. loss: 0.042953
Total training time: 9.72 seconds.
-- Epoch 12
Norm: 11.54, NNZs: 1048380, Bias: -1.012582, T: 37032, Avg. loss: 0.039995
Total training time: 10.64 seconds.
-- Epoch 13
Norm: 11.33, NNZs: 1048481, Bias: -1.009811, T: 40118, Avg. loss: 0.037462
Total training time: 11.57 seconds.
-- Epoch 14
Norm: 11.23, NNZs: 1048526, Bias: -1.005243, T: 43204, Avg. loss: 0.035319
Total training time: 12.51 seconds.
-- Epoch 15
Norm: 11.06, NNZs: 1048533, Bias: -1.000152, T: 46290, Avg. loss: 0.033379
Total training time: 13.44 seconds.
-- Epoch 16
Norm: 10.85, NNZs: 1048536, Bias: -1.009658, T: 49376, Avg. loss: 0.031639
Total training time: 14.35 seconds.
-- Epoch 17
Norm: 10.83, NNZs: 1048539, Bias: -0.997220, T: 52462, Avg. loss: 0.030165
Total training time: 15.26 seconds.
-- Epoch 18
Norm: 10.68, NNZs: 1048544, Bias: -1.000205, T: 55548, Avg. loss: 0.028870
Total training time: 16.19 seconds.
-- Epoch 19
Norm: 10.67, NNZs: 1048558, Bias: -0.991088, T: 58634, Avg. loss: 0.027706
Total training time: 17.10 seconds.
-- Epoch 20
Norm: 10.54, NNZs: 1048558, Bias: -0.990407, T: 61720, Avg. loss: 0.026670
Total training time: 18.03 seconds.
-- Epoch 21
Norm: 10.50, NNZs: 1048561, Bias: -0.984775, T: 64806, Avg. loss: 0.025717
Total training time: 18.95 seconds.
-- Epoch 22
Norm: 10.47, NNZs: 1048562, Bias: -0.982454, T: 67892, Avg. loss: 0.024852
Total training time: 19.86 seconds.
-- Epoch 23
Norm: 10.46, NNZs: 1048563, Bias: -0.977335, T: 70978, Avg. loss: 0.024057
Total training time: 20.79 seconds.
-- Epoch 24
Norm: 10.42, NNZs: 1048565, Bias: -0.973453, T: 74064, Avg. loss: 0.023336
Total training time: 21.71 seconds.
-- Epoch 25
Norm: 10.35, NNZs: 1048567, Bias: -0.972497, T: 77150, Avg. loss: 0.022666
Total training time: 22.64 seconds.
-- Epoch 26
Norm: 10.29, NNZs: 1048567, Bias: -0.972700, T: 80236, Avg. loss: 0.022043
Total training time: 23.58 seconds.
-- Epoch 27
Norm: 10.28, NNZs: 1048567, Bias: -0.969012, T: 83322, Avg. loss: 0.021476
Total training time: 24.50 seconds.
-- Epoch 28
Norm: 10.23, NNZs: 1048568, Bias: -0.969254, T: 86408, Avg. loss: 0.020950
Total training time: 25.45 seconds.
-- Epoch 29
Norm: 10.20, NNZs: 1048570, Bias: -0.968411, T: 89494, Avg. loss: 0.020451
Total training time: 26.38 seconds.
-- Epoch 30
Norm: 10.21, NNZs: 1048570, Bias: -0.964060, T: 92580, Avg. loss: 0.019988
Total training time: 27.31 seconds.
-- Epoch 31
Norm: 10.21, NNZs: 1048571, Bias: -0.963106, T: 95666, Avg. loss: 0.019540
Total training time: 28.26 seconds.
-- Epoch 32
Norm: 10.17, NNZs: 1048571, Bias: -0.959821, T: 98752, Avg. loss: 0.019138
Total training time: 29.19 seconds.
-- Epoch 33
Norm: 10.12, NNZs: 1048571, Bias: -0.961241, T: 101838, Avg. loss: 0.018750
Total training time: 30.13 seconds.
-- Epoch 34
Norm: 10.13, NNZs: 1048571, Bias: -0.953908, T: 104924, Avg. loss: 0.018388
Total training time: 31.06 seconds.
-- Epoch 35
Norm: 10.09, NNZs: 1048571, Bias: -0.956655, T: 108010, Avg. loss: 0.018038
Total training time: 32.00 seconds.
-- Epoch 36
Norm: 10.12, NNZs: 1048571, Bias: -0.951206, T: 111096, Avg. loss: 0.017702
Total training time: 32.93 seconds.
-- Epoch 37
Norm: 10.08, NNZs: 1048571, Bias: -0.952589, T: 114182, Avg. loss: 0.017395
Total training time: 33.87 seconds.
-- Epoch 38
Norm: 10.04, NNZs: 1048571, Bias: -0.951381, T: 117268, Avg. loss: 0.017108
Total training time: 34.79 seconds.
-- Epoch 39
Norm: 10.01, NNZs: 1048571, Bias: -0.953975, T: 120354, Avg. loss: 0.016828
Total training time: 35.75 seconds.
-- Epoch 40
Norm: 9.99, NNZs: 1048571, Bias: -0.950088, T: 123440, Avg. loss: 0.016572
Total training time: 36.67 seconds.
-- Epoch 41
Norm: 9.98, NNZs: 1048571, Bias: -0.954707, T: 126526, Avg. loss: 0.016308
Total training time: 37.64 seconds.
-- Epoch 42
Norm: 9.99, NNZs: 1048571, Bias: -0.947158, T: 129612, Avg. loss: 0.016079
Total training time: 38.57 seconds.
-- Epoch 43
Norm: 9.99, NNZs: 1048571, Bias: -0.946200, T: 132698, Avg. loss: 0.015852
Total training time: 39.50 seconds.
-- Epoch 44
Norm: 9.96, NNZs: 1048571, Bias: -0.947459, T: 135784, Avg. loss: 0.015636
Total training time: 40.47 seconds.
-- Epoch 45
Norm: 9.97, NNZs: 1048571, Bias: -0.943583, T: 138870, Avg. loss: 0.015429
Total training time: 41.39 seconds.
-- Epoch 46
Norm: 9.95, NNZs: 1048571, Bias: -0.943424, T: 141956, Avg. loss: 0.015231
Total training time: 42.33 seconds.
-- Epoch 47
Norm: 9.94, NNZs: 1048571, Bias: -0.942791, T: 145042, Avg. loss: 0.015039
Total training time: 43.29 seconds.
-- Epoch 48
Norm: 9.94, NNZs: 1048571, Bias: -0.940312, T: 148128, Avg. loss: 0.014859
Total training time: 44.21 seconds.
-- Epoch 49
Norm: 9.93, NNZs: 1048571, Bias: -0.940294, T: 151214, Avg. loss: 0.014687
Total training time: 45.16 seconds.
-- Epoch 50
Norm: 9.90, NNZs: 1048571, Bias: -0.940388, T: 154300, Avg. loss: 0.014519
Total training time: 46.11 seconds.
-- Epoch 51
Norm: 9.89, NNZs: 1048571, Bias: -0.939145, T: 157386, Avg. loss: 0.014359
Total training time: 47.05 seconds.
-- Epoch 52
Norm: 9.87, NNZs: 1048571, Bias: -0.940541, T: 160472, Avg. loss: 0.014200
Total training time: 48.02 seconds.
-- Epoch 53
Norm: 9.87, NNZs: 1048571, Bias: -0.937555, T: 163558, Avg. loss: 0.014050
Total training time: 49.15 seconds.
-- Epoch 54
Norm: 9.86, NNZs: 1048571, Bias: -0.936869, T: 166644, Avg. loss: 0.013904
Total training time: 50.09 seconds.
-- Epoch 55
Norm: 9.85, NNZs: 1048571, Bias: -0.936914, T: 169730, Avg. loss: 0.013764
Total training time: 51.05 seconds.
-- Epoch 56
Norm: 9.87, NNZs: 1048572, Bias: -0.933295, T: 172816, Avg. loss: 0.013629
Total training time: 51.97 seconds.
-- Epoch 57
Norm: 9.83, NNZs: 1048572, Bias: -0.934238, T: 175902, Avg. loss: 0.013502
Total training time: 52.91 seconds.
-- Epoch 58
Norm: 9.82, NNZs: 1048572, Bias: -0.933932, T: 178988, Avg. loss: 0.013373
Total training time: 53.87 seconds.
-- Epoch 59
Norm: 9.83, NNZs: 1048572, Bias: -0.933301, T: 182074, Avg. loss: 0.013252
Total training time: 54.81 seconds.
-- Epoch 60
Norm: 9.82, NNZs: 1048572, Bias: -0.931729, T: 185160, Avg. loss: 0.013137
Total training time: 55.74 seconds.
-- Epoch 61
Norm: 9.81, NNZs: 1048572, Bias: -0.932224, T: 188246, Avg. loss: 0.013024
Total training time: 56.70 seconds.
-- Epoch 62
Norm: 9.81, NNZs: 1048572, Bias: -0.930083, T: 191332, Avg. loss: 0.012916
Total training time: 57.64 seconds.
-- Epoch 63
Norm: 9.80, NNZs: 1048573, Bias: -0.932942, T: 194418, Avg. loss: 0.012802
Total training time: 58.63 seconds.
-- Epoch 64
Norm: 9.82, NNZs: 1048573, Bias: -0.927481, T: 197504, Avg. loss: 0.012702
Total training time: 59.54 seconds.
-- Epoch 65
Norm: 9.82, NNZs: 1048574, Bias: -0.926119, T: 200590, Avg. loss: 0.012601
Total training time: 60.47 seconds.
-- Epoch 66
Norm: 9.80, NNZs: 1048574, Bias: -0.928053, T: 203676, Avg. loss: 0.012504
Total training time: 61.44 seconds.
-- Epoch 67
Norm: 9.79, NNZs: 1048574, Bias: -0.928215, T: 206762, Avg. loss: 0.012407
Total training time: 62.40 seconds.
-- Epoch 68
Norm: 9.80, NNZs: 1048574, Bias: -0.923952, T: 209848, Avg. loss: 0.012317
Total training time: 63.32 seconds.
-- Epoch 69
Norm: 9.79, NNZs: 1048574, Bias: -0.925510, T: 212934, Avg. loss: 0.012229
Total training time: 64.28 seconds.
-- Epoch 70
Norm: 9.79, NNZs: 1048574, Bias: -0.922602, T: 216020, Avg. loss: 0.012143
Total training time: 65.21 seconds.
-- Epoch 71
Norm: 9.77, NNZs: 1048574, Bias: -0.924592, T: 219106, Avg. loss: 0.012060
Total training time: 66.17 seconds.
-- Epoch 72
Norm: 9.77, NNZs: 1048574, Bias: -0.923064, T: 222192, Avg. loss: 0.011977
Total training time: 67.12 seconds.
-- Epoch 73
Norm: 9.76, NNZs: 1048574, Bias: -0.922974, T: 225278, Avg. loss: 0.011900
Total training time: 68.06 seconds.
-- Epoch 74
Norm: 9.76, NNZs: 1048574, Bias: -0.920860, T: 228364, Avg. loss: 0.011824
Total training time: 69.00 seconds.
-- Epoch 75
Norm: 9.76, NNZs: 1048574, Bias: -0.921727, T: 231450, Avg. loss: 0.011749
Total training time: 69.97 seconds.
-- Epoch 76
Norm: 9.75, NNZs: 1048574, Bias: -0.921144, T: 234536, Avg. loss: 0.011677
Total training time: 70.92 seconds.
-- Epoch 77
Norm: 9.74, NNZs: 1048574, Bias: -0.920611, T: 237622, Avg. loss: 0.011605
Total training time: 71.88 seconds.
-- Epoch 78
Norm: 9.74, NNZs: 1048574, Bias: -0.919598, T: 240708, Avg. loss: 0.011537
Total training time: 72.82 seconds.
-- Epoch 79
Norm: 9.74, NNZs: 1048574, Bias: -0.918700, T: 243794, Avg. loss: 0.011470
Total training time: 73.76 seconds.
-- Epoch 80
Norm: 9.74, NNZs: 1048574, Bias: -0.918564, T: 246880, Avg. loss: 0.011405
Total training time: 74.71 seconds.
-- Epoch 81
Norm: 9.73, NNZs: 1048574, Bias: -0.918717, T: 249966, Avg. loss: 0.011340
Total training time: 75.68 seconds.
-- Epoch 82
Norm: 9.73, NNZs: 1048574, Bias: -0.917215, T: 253052, Avg. loss: 0.011278
Total training time: 76.63 seconds.
-- Epoch 83
Norm: 9.72, NNZs: 1048574, Bias: -0.918039, T: 256138, Avg. loss: 0.011214
Total training time: 77.60 seconds.
-- Epoch 84
Norm: 9.73, NNZs: 1048574, Bias: -0.916803, T: 259224, Avg. loss: 0.011155
Total training time: 78.55 seconds.
-- Epoch 85
Norm: 9.73, NNZs: 1048574, Bias: -0.915894, T: 262310, Avg. loss: 0.011097
Total training time: 79.50 seconds.
-- Epoch 86
Norm: 9.72, NNZs: 1048574, Bias: -0.916566, T: 265396, Avg. loss: 0.011039
Total training time: 80.47 seconds.
-- Epoch 87
Norm: 9.72, NNZs: 1048574, Bias: -0.915407, T: 268482, Avg. loss: 0.010984
Total training time: 81.41 seconds.
-- Epoch 88
Norm: 9.72, NNZs: 1048574, Bias: -0.914042, T: 271568, Avg. loss: 0.010929
Total training time: 82.38 seconds.
-- Epoch 89
Norm: 9.72, NNZs: 1048574, Bias: -0.912964, T: 274654, Avg. loss: 0.010877
Total training time: 83.32 seconds.
-- Epoch 90
Norm: 9.72, NNZs: 1048574, Bias: -0.913511, T: 277740, Avg. loss: 0.010824
Total training time: 84.30 seconds.
-- Epoch 91
Norm: 9.72, NNZs: 1048574, Bias: -0.912933, T: 280826, Avg. loss: 0.010773
Total training time: 85.24 seconds.
-- Epoch 92
Norm: 9.71, NNZs: 1048574, Bias: -0.913496, T: 283912, Avg. loss: 0.010722
Total training time: 86.23 seconds.
-- Epoch 93
Norm: 9.71, NNZs: 1048574, Bias: -0.912560, T: 286998, Avg. loss: 0.010674
Total training time: 87.18 seconds.
-- Epoch 94
Norm: 9.71, NNZs: 1048574, Bias: -0.910742, T: 290084, Avg. loss: 0.010626
Total training time: 88.14 seconds.
-- Epoch 95
Norm: 9.70, NNZs: 1048574, Bias: -0.913001, T: 293170, Avg. loss: 0.010578
Total training time: 89.13 seconds.
-- Epoch 96
Norm: 9.71, NNZs: 1048574, Bias: -0.910852, T: 296256, Avg. loss: 0.010533
Total training time: 90.07 seconds.
-- Epoch 97
Norm: 9.70, NNZs: 1048574, Bias: -0.910785, T: 299342, Avg. loss: 0.010487
Total training time: 91.03 seconds.
-- Epoch 98
Norm: 9.71, NNZs: 1048574, Bias: -0.908818, T: 302428, Avg. loss: 0.010443
Total training time: 91.96 seconds.
-- Epoch 99
Norm: 9.69, NNZs: 1048574, Bias: -0.911566, T: 305514, Avg. loss: 0.010395
Total training time: 92.96 seconds.
-- Epoch 100
Norm: 9.70, NNZs: 1048574, Bias: -0.908709, T: 308600, Avg. loss: 0.010353
Total training time: 93.89 seconds.
-- Epoch 1
Norm: 52.22, NNZs: 777557, Bias: -1.191743, T: 3086, Avg. loss: 0.345165
Total training time: 0.86 seconds.
-- Epoch 2
Norm: 34.55, NNZs: 788178, Bias: -1.273348, T: 6172, Avg. loss: 0.195040
Total training time: 1.70 seconds.
-- Epoch 3
Norm: 26.52, NNZs: 792338, Bias: -1.345562, T: 9258, Avg. loss: 0.137813
Total training time: 2.54 seconds.
-- Epoch 4
Norm: 21.46, NNZs: 794286, Bias: -1.329919, T: 12344, Avg. loss: 0.106099
Total training time: 3.37 seconds.
-- Epoch 5
Norm: 18.45, NNZs: 800140, Bias: -1.327466, T: 15430, Avg. loss: 0.086409
Total training time: 4.21 seconds.
-- Epoch 6
Norm: 16.66, NNZs: 809053, Bias: -1.320502, T: 18516, Avg. loss: 0.073209
Total training time: 5.06 seconds.
-- Epoch 7
Norm: 15.43, NNZs: 812181, Bias: -1.308318, T: 21602, Avg. loss: 0.063690
Total training time: 5.90 seconds.
-- Epoch 8
Norm: 14.48, NNZs: 815276, Bias: -1.301841, T: 24688, Avg. loss: 0.056529
Total training time: 6.74 seconds.
-- Epoch 9
Norm: 13.89, NNZs: 820439, Bias: -1.297429, T: 27774, Avg. loss: 0.050911
Total training time: 7.59 seconds.
-- Epoch 10
Norm: 13.52, NNZs: 823108, Bias: -1.286105, T: 30860, Avg. loss: 0.046457
Total training time: 8.43 seconds.
-- Epoch 11
Norm: 13.13, NNZs: 827149, Bias: -1.284209, T: 33946, Avg. loss: 0.042786
Total training time: 9.28 seconds.
-- Epoch 12
Norm: 12.83, NNZs: 871388, Bias: -1.281253, T: 37032, Avg. loss: 0.039715
Total training time: 10.14 seconds.
-- Epoch 13
Norm: 12.65, NNZs: 881909, Bias: -1.278617, T: 40118, Avg. loss: 0.037098
Total training time: 10.99 seconds.
-- Epoch 14
Norm: 12.47, NNZs: 883040, Bias: -1.276694, T: 43204, Avg. loss: 0.034863
Total training time: 11.84 seconds.
-- Epoch 15
Norm: 12.32, NNZs: 960053, Bias: -1.274308, T: 46290, Avg. loss: 0.032931
Total training time: 12.71 seconds.
-- Epoch 16
Norm: 12.22, NNZs: 960431, Bias: -1.276081, T: 49376, Avg. loss: 0.031229
Total training time: 13.56 seconds.
-- Epoch 17
Norm: 12.13, NNZs: 965420, Bias: -1.273172, T: 52462, Avg. loss: 0.029734
Total training time: 14.41 seconds.
-- Epoch 18
Norm: 12.08, NNZs: 968131, Bias: -1.268998, T: 55548, Avg. loss: 0.028398
Total training time: 15.27 seconds.
-- Epoch 19
Norm: 11.98, NNZs: 968999, Bias: -1.271257, T: 58634, Avg. loss: 0.027195
Total training time: 16.13 seconds.
-- Epoch 20
Norm: 11.93, NNZs: 989680, Bias: -1.268330, T: 61720, Avg. loss: 0.026111
Total training time: 17.00 seconds.
-- Epoch 21
Norm: 11.87, NNZs: 990015, Bias: -1.266936, T: 64806, Avg. loss: 0.025137
Total training time: 17.86 seconds.
-- Epoch 22
Norm: 11.84, NNZs: 990184, Bias: -1.263968, T: 67892, Avg. loss: 0.024247
Total training time: 18.72 seconds.
-- Epoch 23
Norm: 11.80, NNZs: 990734, Bias: -1.263005, T: 70978, Avg. loss: 0.023425
Total training time: 19.59 seconds.
-- Epoch 24
Norm: 11.74, NNZs: 991075, Bias: -1.264871, T: 74064, Avg. loss: 0.022673
Total training time: 20.46 seconds.
-- Epoch 25
Norm: 11.72, NNZs: 991303, Bias: -1.262589, T: 77150, Avg. loss: 0.021973
Total training time: 21.32 seconds.
-- Epoch 26
Norm: 11.69, NNZs: 991396, Bias: -1.259605, T: 80236, Avg. loss: 0.021340
Total training time: 22.19 seconds.
-- Epoch 27
Norm: 11.65, NNZs: 996256, Bias: -1.259557, T: 83322, Avg. loss: 0.020752
Total training time: 23.06 seconds.
-- Epoch 28
Norm: 11.62, NNZs: 996385, Bias: -1.260394, T: 86408, Avg. loss: 0.020204
Total training time: 23.93 seconds.
-- Epoch 29
Norm: 11.61, NNZs: 996659, Bias: -1.259086, T: 89494, Avg. loss: 0.019688
Total training time: 24.79 seconds.
-- Epoch 30
Norm: 11.59, NNZs: 996769, Bias: -1.257306, T: 92580, Avg. loss: 0.019211
Total training time: 25.66 seconds.
-- Epoch 31
Norm: 11.57, NNZs: 996879, Bias: -1.255814, T: 95666, Avg. loss: 0.018766
Total training time: 26.53 seconds.
-- Epoch 32
Norm: 11.55, NNZs: 997088, Bias: -1.255155, T: 98752, Avg. loss: 0.018346
Total training time: 27.39 seconds.
-- Epoch 33
Norm: 11.53, NNZs: 997214, Bias: -1.254989, T: 101838, Avg. loss: 0.017952
Total training time: 28.26 seconds.
-- Epoch 34
Norm: 11.52, NNZs: 997278, Bias: -1.252776, T: 104924, Avg. loss: 0.017583
Total training time: 29.13 seconds.
-- Epoch 35
Norm: 11.49, NNZs: 997473, Bias: -1.254527, T: 108010, Avg. loss: 0.017227
Total training time: 30.01 seconds.
-- Epoch 36
Norm: 11.48, NNZs: 997615, Bias: -1.252701, T: 111096, Avg. loss: 0.016895
Total training time: 30.88 seconds.
-- Epoch 37
Norm: 11.47, NNZs: 997727, Bias: -1.252116, T: 114182, Avg. loss: 0.016580
Total training time: 31.76 seconds.
-- Epoch 38
Norm: 11.44, NNZs: 997801, Bias: -1.251419, T: 117268, Avg. loss: 0.016283
Total training time: 32.63 seconds.
-- Epoch 39
Norm: 11.44, NNZs: 997920, Bias: -1.249631, T: 120354, Avg. loss: 0.016001
Total training time: 33.50 seconds.
-- Epoch 40
Norm: 11.43, NNZs: 1003043, Bias: -1.250274, T: 123440, Avg. loss: 0.015731
Total training time: 34.38 seconds.
-- Epoch 41
Norm: 11.43, NNZs: 1003067, Bias: -1.247221, T: 126526, Avg. loss: 0.015475
Total training time: 35.25 seconds.
-- Epoch 42
Norm: 11.41, NNZs: 1003126, Bias: -1.249140, T: 129612, Avg. loss: 0.015232
Total training time: 36.12 seconds.
-- Epoch 43
Norm: 11.40, NNZs: 1003200, Bias: -1.247755, T: 132698, Avg. loss: 0.014996
Total training time: 37.00 seconds.
-- Epoch 44
Norm: 11.39, NNZs: 1003226, Bias: -1.246927, T: 135784, Avg. loss: 0.014774
Total training time: 37.87 seconds.
-- Epoch 45
Norm: 11.38, NNZs: 1003283, Bias: -1.247513, T: 138870, Avg. loss: 0.014562
Total training time: 38.74 seconds.
-- Epoch 46
Norm: 11.37, NNZs: 1003329, Bias: -1.246524, T: 141956, Avg. loss: 0.014359
Total training time: 39.61 seconds.
-- Epoch 47
Norm: 11.37, NNZs: 1003351, Bias: -1.246003, T: 145042, Avg. loss: 0.014165
Total training time: 40.48 seconds.
-- Epoch 48
Norm: 11.35, NNZs: 1004595, Bias: -1.245946, T: 148128, Avg. loss: 0.013978
Total training time: 41.36 seconds.
-- Epoch 49
Norm: 11.34, NNZs: 1004641, Bias: -1.245978, T: 151214, Avg. loss: 0.013800
Total training time: 42.24 seconds.
-- Epoch 50
Norm: 11.34, NNZs: 1004690, Bias: -1.244780, T: 154300, Avg. loss: 0.013628
Total training time: 43.12 seconds.
-- Epoch 51
Norm: 11.34, NNZs: 1004740, Bias: -1.243806, T: 157386, Avg. loss: 0.013462
Total training time: 43.99 seconds.
-- Epoch 52
Norm: 11.34, NNZs: 1004779, Bias: -1.242459, T: 160472, Avg. loss: 0.013301
Total training time: 44.86 seconds.
-- Epoch 53
Norm: 11.33, NNZs: 1004822, Bias: -1.243272, T: 163558, Avg. loss: 0.013147
Total training time: 45.73 seconds.
-- Epoch 54
Norm: 11.32, NNZs: 1004851, Bias: -1.242500, T: 166644, Avg. loss: 0.012998
Total training time: 46.61 seconds.
-- Epoch 55
Norm: 11.31, NNZs: 1004886, Bias: -1.242334, T: 169730, Avg. loss: 0.012855
Total training time: 47.49 seconds.
-- Epoch 56
Norm: 11.31, NNZs: 1004893, Bias: -1.241166, T: 172816, Avg. loss: 0.012718
Total training time: 48.36 seconds.
-- Epoch 57
Norm: 11.31, NNZs: 1005074, Bias: -1.240686, T: 175902, Avg. loss: 0.012585
Total training time: 49.24 seconds.
-- Epoch 58
Norm: 11.29, NNZs: 1005148, Bias: -1.242080, T: 178988, Avg. loss: 0.012455
Total training time: 50.11 seconds.
-- Epoch 59
Norm: 11.29, NNZs: 1005172, Bias: -1.240831, T: 182074, Avg. loss: 0.012332
Total training time: 51.00 seconds.
-- Epoch 60
Norm: 11.29, NNZs: 1005222, Bias: -1.241203, T: 185160, Avg. loss: 0.012211
Total training time: 51.87 seconds.
-- Epoch 61
Norm: 11.29, NNZs: 1005232, Bias: -1.240707, T: 188246, Avg. loss: 0.012095
Total training time: 52.74 seconds.
-- Epoch 62
Norm: 11.29, NNZs: 1005233, Bias: -1.238154, T: 191332, Avg. loss: 0.011982
Total training time: 53.61 seconds.
-- Epoch 63
Norm: 11.28, NNZs: 1005270, Bias: -1.239400, T: 194418, Avg. loss: 0.011873
Total training time: 54.49 seconds.
-- Epoch 64
Norm: 11.27, NNZs: 1005332, Bias: -1.239935, T: 197504, Avg. loss: 0.011768
Total training time: 55.37 seconds.
-- Epoch 65
Norm: 11.27, NNZs: 1005336, Bias: -1.237900, T: 200590, Avg. loss: 0.011666
Total training time: 56.24 seconds.
-- Epoch 66
Norm: 11.26, NNZs: 1005352, Bias: -1.238161, T: 203676, Avg. loss: 0.011567
Total training time: 57.13 seconds.
-- Epoch 67
Norm: 11.26, NNZs: 1005359, Bias: -1.237679, T: 206762, Avg. loss: 0.011472
Total training time: 58.01 seconds.
-- Epoch 68
Norm: 11.26, NNZs: 1005381, Bias: -1.236558, T: 209848, Avg. loss: 0.011379
Total training time: 58.89 seconds.
-- Epoch 69
Norm: 11.25, NNZs: 1005413, Bias: -1.238776, T: 212934, Avg. loss: 0.011287
Total training time: 59.77 seconds.
-- Epoch 70
Norm: 11.25, NNZs: 1005416, Bias: -1.237418, T: 216020, Avg. loss: 0.011199
Total training time: 60.65 seconds.
-- Epoch 71
Norm: 11.25, NNZs: 1005478, Bias: -1.236043, T: 219106, Avg. loss: 0.011114
Total training time: 61.53 seconds.
-- Epoch 72
Norm: 11.24, NNZs: 1005480, Bias: -1.236217, T: 222192, Avg. loss: 0.011031
Total training time: 62.41 seconds.
-- Epoch 73
Norm: 11.24, NNZs: 1005513, Bias: -1.235969, T: 225278, Avg. loss: 0.010950
Total training time: 63.29 seconds.
-- Epoch 74
Norm: 11.24, NNZs: 1005520, Bias: -1.235424, T: 228364, Avg. loss: 0.010870
Total training time: 64.17 seconds.
-- Epoch 75
Norm: 11.24, NNZs: 1005535, Bias: -1.235308, T: 231450, Avg. loss: 0.010793
Total training time: 65.05 seconds.
-- Epoch 76
Norm: 11.24, NNZs: 1005540, Bias: -1.234541, T: 234536, Avg. loss: 0.010718
Total training time: 65.93 seconds.
-- Epoch 77
Norm: 11.23, NNZs: 1006172, Bias: -1.235504, T: 237622, Avg. loss: 0.010645
Total training time: 66.81 seconds.
-- Epoch 78
Norm: 11.22, NNZs: 1006182, Bias: -1.234795, T: 240708, Avg. loss: 0.010574
Total training time: 67.69 seconds.
-- Epoch 79
Norm: 11.23, NNZs: 1006197, Bias: -1.233212, T: 243794, Avg. loss: 0.010505
Total training time: 68.56 seconds.
-- Epoch 80
Norm: 11.22, NNZs: 1006219, Bias: -1.234330, T: 246880, Avg. loss: 0.010437
Total training time: 69.44 seconds.
-- Epoch 81
Norm: 11.22, NNZs: 1006219, Bias: -1.234558, T: 249966, Avg. loss: 0.010372
Total training time: 70.33 seconds.
-- Epoch 82
Norm: 11.22, NNZs: 1006251, Bias: -1.233879, T: 253052, Avg. loss: 0.010307
Total training time: 71.21 seconds.
-- Epoch 83
Norm: 11.21, NNZs: 1006267, Bias: -1.234223, T: 256138, Avg. loss: 0.010244
Total training time: 72.10 seconds.
-- Epoch 84
Norm: 11.21, NNZs: 1006267, Bias: -1.233385, T: 259224, Avg. loss: 0.010183
Total training time: 72.98 seconds.
-- Epoch 85
Norm: 11.21, NNZs: 1006272, Bias: -1.232727, T: 262310, Avg. loss: 0.010123
Total training time: 73.86 seconds.
-- Epoch 86
Norm: 11.21, NNZs: 1006318, Bias: -1.232827, T: 265396, Avg. loss: 0.010064
Total training time: 74.88 seconds.
-- Epoch 87
Norm: 11.20, NNZs: 1006325, Bias: -1.233433, T: 268482, Avg. loss: 0.010007
Total training time: 75.82 seconds.
-- Epoch 88
Norm: 11.20, NNZs: 1006325, Bias: -1.232633, T: 271568, Avg. loss: 0.009952
Total training time: 76.69 seconds.
-- Epoch 89
Norm: 11.20, NNZs: 1006339, Bias: -1.231996, T: 274654, Avg. loss: 0.009897
Total training time: 77.58 seconds.
-- Epoch 90
Norm: 11.19, NNZs: 1006347, Bias: -1.232048, T: 277740, Avg. loss: 0.009844
Total training time: 78.45 seconds.
-- Epoch 91
Norm: 11.19, NNZs: 1006347, Bias: -1.231113, T: 280826, Avg. loss: 0.009792
Total training time: 79.34 seconds.
-- Epoch 92
Norm: 11.19, NNZs: 1006357, Bias: -1.231524, T: 283912, Avg. loss: 0.009740
Total training time: 80.23 seconds.
-- Epoch 93
Norm: 11.19, NNZs: 1006361, Bias: -1.231106, T: 286998, Avg. loss: 0.009691
Total training time: 81.10 seconds.
-- Epoch 94
Norm: 11.19, NNZs: 1006380, Bias: -1.230740, T: 290084, Avg. loss: 0.009642
Total training time: 81.99 seconds.
-- Epoch 95
Norm: 11.18, NNZs: 1006391, Bias: -1.231423, T: 293170, Avg. loss: 0.009594
Total training time: 82.89 seconds.
-- Epoch 96
Norm: 11.19, NNZs: 1006391, Bias: -1.230266, T: 296256, Avg. loss: 0.009546
Total training time: 83.76 seconds.
-- Epoch 97
Norm: 11.19, NNZs: 1006398, Bias: -1.229687, T: 299342, Avg. loss: 0.009501
Total training time: 84.64 seconds.
-- Epoch 98
Norm: 11.18, NNZs: 1006404, Bias: -1.229916, T: 302428, Avg. loss: 0.009456
Total training time: 85.53 seconds.
-- Epoch 99
Norm: 11.18, NNZs: 1006404, Bias: -1.229084, T: 305514, Avg. loss: 0.009412
Total training time: 86.42 seconds.
-- Epoch 100
Norm: 11.18, NNZs: 1006404, Bias: -1.229049, T: 308600, Avg. loss: 0.009369
Total training time: 87.30 seconds.
-- Epoch 1
Norm: 43.53, NNZs: 824709, Bias: -1.131929, T: 3086, Avg. loss: 0.362345
Total training time: 0.87 seconds.
-- Epoch 2
Norm: 29.12, NNZs: 886916, Bias: -1.280635, T: 6172, Avg. loss: 0.206335
Total training time: 1.72 seconds.
-- Epoch 3
Norm: 23.00, NNZs: 992093, Bias: -1.256746, T: 9258, Avg. loss: 0.147275
Total training time: 2.57 seconds.
-- Epoch 4
Norm: 19.49, NNZs: 1023067, Bias: -1.249765, T: 12344, Avg. loss: 0.115365
Total training time: 3.44 seconds.
-- Epoch 5
Norm: 16.69, NNZs: 1038905, Bias: -1.272052, T: 15430, Avg. loss: 0.094689
Total training time: 4.29 seconds.
-- Epoch 6
Norm: 15.19, NNZs: 1047317, Bias: -1.273828, T: 18516, Avg. loss: 0.080775
Total training time: 5.17 seconds.
-- Epoch 7
Norm: 14.28, NNZs: 1047694, Bias: -1.247780, T: 21602, Avg. loss: 0.070526
Total training time: 6.04 seconds.
-- Epoch 8
Norm: 13.58, NNZs: 1047880, Bias: -1.243587, T: 24688, Avg. loss: 0.062806
Total training time: 6.92 seconds.
-- Epoch 9
Norm: 13.04, NNZs: 1048341, Bias: -1.243608, T: 27774, Avg. loss: 0.056644
Total training time: 7.81 seconds.
-- Epoch 10
Norm: 12.70, NNZs: 1048447, Bias: -1.228893, T: 30860, Avg. loss: 0.051687
Total training time: 8.70 seconds.
-- Epoch 11
Norm: 12.30, NNZs: 1048487, Bias: -1.226673, T: 33946, Avg. loss: 0.047653
Total training time: 9.60 seconds.
-- Epoch 12
Norm: 12.02, NNZs: 1048507, Bias: -1.230589, T: 37032, Avg. loss: 0.044168
Total training time: 10.50 seconds.
-- Epoch 13
Norm: 11.81, NNZs: 1048527, Bias: -1.227575, T: 40118, Avg. loss: 0.041328
Total training time: 11.39 seconds.
-- Epoch 14
Norm: 11.64, NNZs: 1048535, Bias: -1.223267, T: 43204, Avg. loss: 0.038875
Total training time: 12.29 seconds.
-- Epoch 15
Norm: 11.51, NNZs: 1048544, Bias: -1.222546, T: 46290, Avg. loss: 0.036733
Total training time: 13.19 seconds.
-- Epoch 16
Norm: 11.39, NNZs: 1048558, Bias: -1.225217, T: 49376, Avg. loss: 0.034847
Total training time: 14.09 seconds.
-- Epoch 17
Norm: 11.34, NNZs: 1048559, Bias: -1.215559, T: 52462, Avg. loss: 0.033182
Total training time: 14.99 seconds.
-- Epoch 18
Norm: 11.28, NNZs: 1048564, Bias: -1.213872, T: 55548, Avg. loss: 0.031704
Total training time: 15.90 seconds.
-- Epoch 19
Norm: 11.22, NNZs: 1048568, Bias: -1.207381, T: 58634, Avg. loss: 0.030365
Total training time: 16.83 seconds.
-- Epoch 20
Norm: 11.10, NNZs: 1048573, Bias: -1.219746, T: 61720, Avg. loss: 0.029155
Total training time: 17.76 seconds.
-- Epoch 21
Norm: 11.07, NNZs: 1048575, Bias: -1.213426, T: 64806, Avg. loss: 0.028079
Total training time: 18.69 seconds.
-- Epoch 22
Norm: 11.00, NNZs: 1048575, Bias: -1.213263, T: 67892, Avg. loss: 0.027100
Total training time: 19.59 seconds.
-- Epoch 23
Norm: 10.97, NNZs: 1048575, Bias: -1.210155, T: 70978, Avg. loss: 0.026190
Total training time: 20.50 seconds.
-- Epoch 24
Norm: 10.94, NNZs: 1048575, Bias: -1.207947, T: 74064, Avg. loss: 0.025368
Total training time: 21.40 seconds.
-- Epoch 25
Norm: 10.92, NNZs: 1048575, Bias: -1.206871, T: 77150, Avg. loss: 0.024603
Total training time: 22.35 seconds.
-- Epoch 26
Norm: 10.87, NNZs: 1048575, Bias: -1.201398, T: 80236, Avg. loss: 0.023893
Total training time: 23.24 seconds.
-- Epoch 27
Norm: 10.80, NNZs: 1048575, Bias: -1.208998, T: 83322, Avg. loss: 0.023241
Total training time: 24.16 seconds.
-- Epoch 28
Norm: 10.78, NNZs: 1048575, Bias: -1.206902, T: 86408, Avg. loss: 0.022636
Total training time: 25.11 seconds.
-- Epoch 29
Norm: 10.73, NNZs: 1048575, Bias: -1.207994, T: 89494, Avg. loss: 0.022067
Total training time: 26.02 seconds.
-- Epoch 30
Norm: 10.72, NNZs: 1048575, Bias: -1.205589, T: 92580, Avg. loss: 0.021546
Total training time: 26.95 seconds.
-- Epoch 31
Norm: 10.71, NNZs: 1048575, Bias: -1.202178, T: 95666, Avg. loss: 0.021046
Total training time: 27.85 seconds.
-- Epoch 32
Norm: 10.68, NNZs: 1048575, Bias: -1.202774, T: 98752, Avg. loss: 0.020581
Total training time: 28.77 seconds.
-- Epoch 33
Norm: 10.67, NNZs: 1048575, Bias: -1.202621, T: 101838, Avg. loss: 0.020146
Total training time: 29.72 seconds.
-- Epoch 34
Norm: 10.65, NNZs: 1048575, Bias: -1.202523, T: 104924, Avg. loss: 0.019736
Total training time: 30.64 seconds.
-- Epoch 35
Norm: 10.63, NNZs: 1048575, Bias: -1.201389, T: 108010, Avg. loss: 0.019349
Total training time: 31.57 seconds.
-- Epoch 36
Norm: 10.61, NNZs: 1048575, Bias: -1.200603, T: 111096, Avg. loss: 0.018985
Total training time: 32.48 seconds.
-- Epoch 37
Norm: 10.59, NNZs: 1048575, Bias: -1.200407, T: 114182, Avg. loss: 0.018642
Total training time: 33.43 seconds.
-- Epoch 38
Norm: 10.59, NNZs: 1048575, Bias: -1.198683, T: 117268, Avg. loss: 0.018315
Total training time: 34.35 seconds.
-- Epoch 39
Norm: 10.56, NNZs: 1048575, Bias: -1.199552, T: 120354, Avg. loss: 0.018005
Total training time: 35.28 seconds.
-- Epoch 40
Norm: 10.55, NNZs: 1048575, Bias: -1.200647, T: 123440, Avg. loss: 0.017705
Total training time: 36.23 seconds.
-- Epoch 41
Norm: 10.55, NNZs: 1048575, Bias: -1.194124, T: 126526, Avg. loss: 0.017417
Total training time: 37.12 seconds.
-- Epoch 42
Norm: 10.54, NNZs: 1048575, Bias: -1.197282, T: 129612, Avg. loss: 0.017151
Total training time: 38.09 seconds.
-- Epoch 43
Norm: 10.51, NNZs: 1048575, Bias: -1.200387, T: 132698, Avg. loss: 0.016887
Total training time: 39.04 seconds.
-- Epoch 44
Norm: 10.50, NNZs: 1048575, Bias: -1.199673, T: 135784, Avg. loss: 0.016644
Total training time: 39.97 seconds.
-- Epoch 45
Norm: 10.51, NNZs: 1048575, Bias: -1.196053, T: 138870, Avg. loss: 0.016409
Total training time: 40.88 seconds.
-- Epoch 46
Norm: 10.49, NNZs: 1048575, Bias: -1.197098, T: 141956, Avg. loss: 0.016185
Total training time: 41.82 seconds.
-- Epoch 47
Norm: 10.50, NNZs: 1048575, Bias: -1.194564, T: 145042, Avg. loss: 0.015970
Total training time: 42.75 seconds.
-- Epoch 48
Norm: 10.48, NNZs: 1048575, Bias: -1.194940, T: 148128, Avg. loss: 0.015761
Total training time: 43.68 seconds.
-- Epoch 49
Norm: 10.47, NNZs: 1048575, Bias: -1.195819, T: 151214, Avg. loss: 0.015563
Total training time: 44.61 seconds.
-- Epoch 50
Norm: 10.48, NNZs: 1048575, Bias: -1.193398, T: 154300, Avg. loss: 0.015372
Total training time: 45.53 seconds.
-- Epoch 51
Norm: 10.46, NNZs: 1048575, Bias: -1.194168, T: 157386, Avg. loss: 0.015187
Total training time: 46.46 seconds.
-- Epoch 52
Norm: 10.46, NNZs: 1048575, Bias: -1.194310, T: 160472, Avg. loss: 0.015013
Total training time: 47.39 seconds.
-- Epoch 53
Norm: 10.45, NNZs: 1048575, Bias: -1.193660, T: 163558, Avg. loss: 0.014844
Total training time: 48.35 seconds.
-- Epoch 54
Norm: 10.44, NNZs: 1048575, Bias: -1.194115, T: 166644, Avg. loss: 0.014681
Total training time: 49.29 seconds.
-- Epoch 55
Norm: 10.44, NNZs: 1048575, Bias: -1.193052, T: 169730, Avg. loss: 0.014525
Total training time: 50.21 seconds.
-- Epoch 56
Norm: 10.44, NNZs: 1048575, Bias: -1.193275, T: 172816, Avg. loss: 0.014372
Total training time: 51.17 seconds.
-- Epoch 57
Norm: 10.42, NNZs: 1048575, Bias: -1.194920, T: 175902, Avg. loss: 0.014223
Total training time: 52.13 seconds.
-- Epoch 58
Norm: 10.42, NNZs: 1048575, Bias: -1.192643, T: 178988, Avg. loss: 0.014084
Total training time: 53.04 seconds.
-- Epoch 59
Norm: 10.41, NNZs: 1048575, Bias: -1.193038, T: 182074, Avg. loss: 0.013947
Total training time: 53.99 seconds.
-- Epoch 60
Norm: 10.41, NNZs: 1048575, Bias: -1.191655, T: 185160, Avg. loss: 0.013815
Total training time: 54.90 seconds.
-- Epoch 61
Norm: 10.41, NNZs: 1048575, Bias: -1.191329, T: 188246, Avg. loss: 0.013686
Total training time: 55.84 seconds.
-- Epoch 62
Norm: 10.39, NNZs: 1048575, Bias: -1.192065, T: 191332, Avg. loss: 0.013559
Total training time: 56.80 seconds.
-- Epoch 63
Norm: 10.39, NNZs: 1048575, Bias: -1.191969, T: 194418, Avg. loss: 0.013439
Total training time: 57.72 seconds.
-- Epoch 64
Norm: 10.39, NNZs: 1048575, Bias: -1.190544, T: 197504, Avg. loss: 0.013323
Total training time: 58.67 seconds.
-- Epoch 65
Norm: 10.39, NNZs: 1048575, Bias: -1.189598, T: 200590, Avg. loss: 0.013211
Total training time: 59.62 seconds.
-- Epoch 66
Norm: 10.38, NNZs: 1048575, Bias: -1.190188, T: 203676, Avg. loss: 0.013101
Total training time: 60.58 seconds.
-- Epoch 67
Norm: 10.37, NNZs: 1048575, Bias: -1.191867, T: 206762, Avg. loss: 0.012993
Total training time: 61.53 seconds.
-- Epoch 68
Norm: 10.37, NNZs: 1048575, Bias: -1.189964, T: 209848, Avg. loss: 0.012890
Total training time: 62.46 seconds.
-- Epoch 69
Norm: 10.38, NNZs: 1048575, Bias: -1.187028, T: 212934, Avg. loss: 0.012790
Total training time: 63.40 seconds.
-- Epoch 70
Norm: 10.36, NNZs: 1048575, Bias: -1.189528, T: 216020, Avg. loss: 0.012692
Total training time: 64.34 seconds.
-- Epoch 71
Norm: 10.36, NNZs: 1048575, Bias: -1.188285, T: 219106, Avg. loss: 0.012598
Total training time: 65.29 seconds.
-- Epoch 72
Norm: 10.36, NNZs: 1048575, Bias: -1.188801, T: 222192, Avg. loss: 0.012507
Total training time: 66.24 seconds.
-- Epoch 73
Norm: 10.35, NNZs: 1048575, Bias: -1.189995, T: 225278, Avg. loss: 0.012417
Total training time: 67.20 seconds.
-- Epoch 74
Norm: 10.36, NNZs: 1048575, Bias: -1.187428, T: 228364, Avg. loss: 0.012331
Total training time: 68.14 seconds.
-- Epoch 75
Norm: 10.35, NNZs: 1048575, Bias: -1.188485, T: 231450, Avg. loss: 0.012245
Total training time: 69.09 seconds.
-- Epoch 76
Norm: 10.35, NNZs: 1048575, Bias: -1.187973, T: 234536, Avg. loss: 0.012164
Total training time: 70.05 seconds.
-- Epoch 77
Norm: 10.35, NNZs: 1048575, Bias: -1.186872, T: 237622, Avg. loss: 0.012084
Total training time: 70.99 seconds.
-- Epoch 78
Norm: 10.34, NNZs: 1048575, Bias: -1.188435, T: 240708, Avg. loss: 0.012005
Total training time: 71.95 seconds.
-- Epoch 79
Norm: 10.35, NNZs: 1048575, Bias: -1.185987, T: 243794, Avg. loss: 0.011928
Total training time: 72.88 seconds.
-- Epoch 80
Norm: 10.35, NNZs: 1048575, Bias: -1.186400, T: 246880, Avg. loss: 0.011854
Total training time: 73.83 seconds.
-- Epoch 81
Norm: 10.34, NNZs: 1048575, Bias: -1.185699, T: 249966, Avg. loss: 0.011782
Total training time: 74.78 seconds.
-- Epoch 82
Norm: 10.34, NNZs: 1048575, Bias: -1.185692, T: 253052, Avg. loss: 0.011711
Total training time: 75.76 seconds.
-- Epoch 83
Norm: 10.33, NNZs: 1048575, Bias: -1.186563, T: 256138, Avg. loss: 0.011641
Total training time: 76.70 seconds.
-- Epoch 84
Norm: 10.33, NNZs: 1048575, Bias: -1.186355, T: 259224, Avg. loss: 0.011574
Total training time: 77.65 seconds.
-- Epoch 85
Norm: 10.33, NNZs: 1048575, Bias: -1.186516, T: 262310, Avg. loss: 0.011508
Total training time: 78.60 seconds.
-- Epoch 86
Norm: 10.33, NNZs: 1048575, Bias: -1.186151, T: 265396, Avg. loss: 0.011444
Total training time: 79.56 seconds.
-- Epoch 87
Norm: 10.32, NNZs: 1048575, Bias: -1.187173, T: 268482, Avg. loss: 0.011380
Total training time: 80.54 seconds.
-- Epoch 88
Norm: 10.32, NNZs: 1048575, Bias: -1.186092, T: 271568, Avg. loss: 0.011318
Total training time: 81.49 seconds.
-- Epoch 89
Norm: 10.32, NNZs: 1048575, Bias: -1.185277, T: 274654, Avg. loss: 0.011258
Total training time: 82.43 seconds.
-- Epoch 90
Norm: 10.32, NNZs: 1048575, Bias: -1.184904, T: 277740, Avg. loss: 0.011199
Total training time: 83.37 seconds.
-- Epoch 91
Norm: 10.32, NNZs: 1048575, Bias: -1.185513, T: 280826, Avg. loss: 0.011141
Total training time: 84.34 seconds.
-- Epoch 92
Norm: 10.32, NNZs: 1048575, Bias: -1.184557, T: 283912, Avg. loss: 0.011084
Total training time: 85.26 seconds.
-- Epoch 93
Norm: 10.32, NNZs: 1048575, Bias: -1.183584, T: 286998, Avg. loss: 0.011028
Total training time: 86.21 seconds.
-- Epoch 94
Norm: 10.32, NNZs: 1048575, Bias: -1.184607, T: 290084, Avg. loss: 0.010975
Total training time: 87.18 seconds.
-- Epoch 95
Norm: 10.32, NNZs: 1048575, Bias: -1.183467, T: 293170, Avg. loss: 0.010921
Total training time: 88.11 seconds.
-- Epoch 96
Norm: 10.31, NNZs: 1048575, Bias: -1.184132, T: 296256, Avg. loss: 0.010869
Total training time: 89.09 seconds.
-- Epoch 97
Norm: 10.32, NNZs: 1048575, Bias: -1.182904, T: 299342, Avg. loss: 0.010818
Total training time: 90.05 seconds.
-- Epoch 98
Norm: 10.31, NNZs: 1048575, Bias: -1.183567, T: 302428, Avg. loss: 0.010769
Total training time: 91.01 seconds.
-- Epoch 99
Norm: 10.31, NNZs: 1048575, Bias: -1.183303, T: 305514, Avg. loss: 0.010720
Total training time: 91.95 seconds.
-- Epoch 100
Norm: 10.30, NNZs: 1048575, Bias: -1.183851, T: 308600, Avg. loss: 0.010672
Total training time: 92.91 seconds.
-- Epoch 1
Norm: 40.78, NNZs: 1048108, Bias: -2.206101, T: 3086, Avg. loss: 0.330234
Total training time: 0.93 seconds.
-- Epoch 2
Norm: 26.54, NNZs: 1048516, Bias: -2.360115, T: 6172, Avg. loss: 0.177010
Total training time: 1.83 seconds.
-- Epoch 3
Norm: 20.33, NNZs: 1048553, Bias: -2.380501, T: 9258, Avg. loss: 0.124405
Total training time: 2.75 seconds.
-- Epoch 4
Norm: 16.57, NNZs: 1048563, Bias: -2.386004, T: 12344, Avg. loss: 0.094801
Total training time: 3.65 seconds.
-- Epoch 5
Norm: 14.50, NNZs: 1048565, Bias: -2.376244, T: 15430, Avg. loss: 0.077014
Total training time: 4.57 seconds.
-- Epoch 6
Norm: 13.03, NNZs: 1048567, Bias: -2.377482, T: 18516, Avg. loss: 0.064879
Total training time: 5.49 seconds.
-- Epoch 7
Norm: 12.06, NNZs: 1048568, Bias: -2.380975, T: 21602, Avg. loss: 0.056189
Total training time: 6.43 seconds.
-- Epoch 8
Norm: 11.35, NNZs: 1048570, Bias: -2.382133, T: 24688, Avg. loss: 0.049609
Total training time: 7.35 seconds.
-- Epoch 9
Norm: 10.80, NNZs: 1048574, Bias: -2.383995, T: 27774, Avg. loss: 0.044488
Total training time: 8.31 seconds.
-- Epoch 10
Norm: 10.34, NNZs: 1048574, Bias: -2.384124, T: 30860, Avg. loss: 0.040423
Total training time: 9.27 seconds.
-- Epoch 11
Norm: 9.99, NNZs: 1048575, Bias: -2.384398, T: 33946, Avg. loss: 0.037053
Total training time: 10.23 seconds.
-- Epoch 12
Norm: 9.76, NNZs: 1048576, Bias: -2.383160, T: 37032, Avg. loss: 0.034251
Total training time: 11.20 seconds.
-- Epoch 13
Norm: 9.61, NNZs: 1048576, Bias: -2.381811, T: 40118, Avg. loss: 0.031860
Total training time: 12.18 seconds.
-- Epoch 14
Norm: 9.44, NNZs: 1048576, Bias: -2.381298, T: 43204, Avg. loss: 0.029830
Total training time: 13.17 seconds.
-- Epoch 15
Norm: 9.34, NNZs: 1048576, Bias: -2.382051, T: 46290, Avg. loss: 0.028045
Total training time: 14.17 seconds.
-- Epoch 16
Norm: 9.21, NNZs: 1048576, Bias: -2.382707, T: 49376, Avg. loss: 0.026491
Total training time: 15.37 seconds.
-- Epoch 17
Norm: 9.26, NNZs: 1048576, Bias: -2.378126, T: 52462, Avg. loss: 0.025109
Total training time: 16.35 seconds.
-- Epoch 18
Norm: 9.13, NNZs: 1048576, Bias: -2.380797, T: 55548, Avg. loss: 0.023883
Total training time: 17.35 seconds.
-- Epoch 19
Norm: 9.01, NNZs: 1048576, Bias: -2.382209, T: 58634, Avg. loss: 0.022790
Total training time: 18.33 seconds.
-- Epoch 20
Norm: 9.04, NNZs: 1048576, Bias: -2.380947, T: 61720, Avg. loss: 0.021802
Total training time: 19.33 seconds.
-- Epoch 21
Norm: 9.01, NNZs: 1048576, Bias: -2.379938, T: 64806, Avg. loss: 0.020918
Total training time: 20.33 seconds.
-- Epoch 22
Norm: 8.92, NNZs: 1048576, Bias: -2.382341, T: 67892, Avg. loss: 0.020104
Total training time: 21.33 seconds.
-- Epoch 23
Norm: 8.90, NNZs: 1048576, Bias: -2.382677, T: 70978, Avg. loss: 0.019361
Total training time: 22.33 seconds.
-- Epoch 24
Norm: 8.94, NNZs: 1048576, Bias: -2.381018, T: 74064, Avg. loss: 0.018682
Total training time: 23.35 seconds.
-- Epoch 25
Norm: 8.90, NNZs: 1048576, Bias: -2.382258, T: 77150, Avg. loss: 0.018059
Total training time: 24.36 seconds.
-- Epoch 26
Norm: 8.91, NNZs: 1048576, Bias: -2.381465, T: 80236, Avg. loss: 0.017473
Total training time: 25.37 seconds.
-- Epoch 27
Norm: 8.87, NNZs: 1048576, Bias: -2.382063, T: 83322, Avg. loss: 0.016941
Total training time: 26.38 seconds.
-- Epoch 28
Norm: 8.91, NNZs: 1048576, Bias: -2.381257, T: 86408, Avg. loss: 0.016439
Total training time: 27.40 seconds.
-- Epoch 29
Norm: 8.84, NNZs: 1048576, Bias: -2.383429, T: 89494, Avg. loss: 0.015972
Total training time: 28.41 seconds.
-- Epoch 30
Norm: 8.85, NNZs: 1048576, Bias: -2.382124, T: 92580, Avg. loss: 0.015541
Total training time: 29.41 seconds.
-- Epoch 31
Norm: 8.83, NNZs: 1048576, Bias: -2.382669, T: 95666, Avg. loss: 0.015138
Total training time: 30.41 seconds.
-- Epoch 32
Norm: 8.80, NNZs: 1048576, Bias: -2.383237, T: 98752, Avg. loss: 0.014761
Total training time: 31.42 seconds.
-- Epoch 33
Norm: 8.80, NNZs: 1048576, Bias: -2.382654, T: 101838, Avg. loss: 0.014402
Total training time: 32.43 seconds.
-- Epoch 34
Norm: 8.72, NNZs: 1048576, Bias: -2.384428, T: 104924, Avg. loss: 0.014064
Total training time: 33.45 seconds.
-- Epoch 35
Norm: 8.80, NNZs: 1048576, Bias: -2.381162, T: 108010, Avg. loss: 0.013742
Total training time: 34.45 seconds.
-- Epoch 36
Norm: 8.76, NNZs: 1048576, Bias: -2.381728, T: 111096, Avg. loss: 0.013439
Total training time: 35.47 seconds.
-- Epoch 37
Norm: 8.79, NNZs: 1048576, Bias: -2.380629, T: 114182, Avg. loss: 0.013153
Total training time: 36.49 seconds.
-- Epoch 38
Norm: 8.72, NNZs: 1048576, Bias: -2.383068, T: 117268, Avg. loss: 0.012882
Total training time: 37.50 seconds.
-- Epoch 39
Norm: 8.74, NNZs: 1048576, Bias: -2.382226, T: 120354, Avg. loss: 0.012630
Total training time: 38.51 seconds.
-- Epoch 40
Norm: 8.74, NNZs: 1048576, Bias: -2.382594, T: 123440, Avg. loss: 0.012387
Total training time: 39.54 seconds.
-- Epoch 41
Norm: 8.72, NNZs: 1048576, Bias: -2.382878, T: 126526, Avg. loss: 0.012156
Total training time: 40.55 seconds.
-- Epoch 42
Norm: 8.70, NNZs: 1048576, Bias: -2.383642, T: 129612, Avg. loss: 0.011936
Total training time: 41.56 seconds.
-- Epoch 43
Norm: 8.71, NNZs: 1048576, Bias: -2.382896, T: 132698, Avg. loss: 0.011728
Total training time: 42.57 seconds.
-- Epoch 44
Norm: 8.72, NNZs: 1048576, Bias: -2.382646, T: 135784, Avg. loss: 0.011527
Total training time: 43.59 seconds.
-- Epoch 45
Norm: 8.66, NNZs: 1048576, Bias: -2.384230, T: 138870, Avg. loss: 0.011336
Total training time: 44.59 seconds.
-- Epoch 46
Norm: 8.66, NNZs: 1048576, Bias: -2.384209, T: 141956, Avg. loss: 0.011153
Total training time: 45.60 seconds.
-- Epoch 47
Norm: 8.72, NNZs: 1048576, Bias: -2.382064, T: 145042, Avg. loss: 0.010975
Total training time: 46.62 seconds.
-- Epoch 48
Norm: 8.71, NNZs: 1048576, Bias: -2.382568, T: 148128, Avg. loss: 0.010807
Total training time: 47.64 seconds.
-- Epoch 49
Norm: 8.63, NNZs: 1048576, Bias: -2.385161, T: 151214, Avg. loss: 0.010644
Total training time: 48.65 seconds.
-- Epoch 50
Norm: 8.62, NNZs: 1048576, Bias: -2.385757, T: 154300, Avg. loss: 0.010488
Total training time: 49.68 seconds.
-- Epoch 51
Norm: 8.71, NNZs: 1048576, Bias: -2.382281, T: 157386, Avg. loss: 0.010338
Total training time: 50.71 seconds.
-- Epoch 52
Norm: 8.70, NNZs: 1048576, Bias: -2.382242, T: 160472, Avg. loss: 0.010193
Total training time: 51.73 seconds.
-- Epoch 53
Norm: 8.67, NNZs: 1048576, Bias: -2.383543, T: 163558, Avg. loss: 0.010056
Total training time: 52.77 seconds.
-- Epoch 54
Norm: 8.65, NNZs: 1048576, Bias: -2.384632, T: 166644, Avg. loss: 0.009923
Total training time: 53.80 seconds.
-- Epoch 55
Norm: 8.67, NNZs: 1048576, Bias: -2.383711, T: 169730, Avg. loss: 0.009796
Total training time: 54.82 seconds.
-- Epoch 56
Norm: 8.64, NNZs: 1048576, Bias: -2.384689, T: 172816, Avg. loss: 0.009672
Total training time: 55.85 seconds.
-- Epoch 57
Norm: 8.64, NNZs: 1048576, Bias: -2.384425, T: 175902, Avg. loss: 0.009554
Total training time: 56.88 seconds.
-- Epoch 58
Norm: 8.66, NNZs: 1048576, Bias: -2.383993, T: 178988, Avg. loss: 0.009438
Total training time: 57.90 seconds.
-- Epoch 59
Norm: 8.63, NNZs: 1048576, Bias: -2.384925, T: 182074, Avg. loss: 0.009328
Total training time: 58.93 seconds.
-- Epoch 60
Norm: 8.63, NNZs: 1048576, Bias: -2.384802, T: 185160, Avg. loss: 0.009220
Total training time: 59.96 seconds.
-- Epoch 61
Norm: 8.64, NNZs: 1048576, Bias: -2.384519, T: 188246, Avg. loss: 0.009115
Total training time: 60.97 seconds.
-- Epoch 62
Norm: 8.60, NNZs: 1048576, Bias: -2.385816, T: 191332, Avg. loss: 0.009014
Total training time: 62.01 seconds.
-- Epoch 63
Norm: 8.65, NNZs: 1048576, Bias: -2.384281, T: 194418, Avg. loss: 0.008915
Total training time: 63.03 seconds.
-- Epoch 64
Norm: 8.63, NNZs: 1048576, Bias: -2.385082, T: 197504, Avg. loss: 0.008821
Total training time: 64.07 seconds.
-- Epoch 65
Norm: 8.63, NNZs: 1048576, Bias: -2.384698, T: 200590, Avg. loss: 0.008729
Total training time: 65.10 seconds.
-- Epoch 66
Norm: 8.59, NNZs: 1048576, Bias: -2.386231, T: 203676, Avg. loss: 0.008640
Total training time: 66.13 seconds.
-- Epoch 67
Norm: 8.62, NNZs: 1048576, Bias: -2.385569, T: 206762, Avg. loss: 0.008554
Total training time: 67.16 seconds.
-- Epoch 68
Norm: 8.62, NNZs: 1048576, Bias: -2.385628, T: 209848, Avg. loss: 0.008470
Total training time: 68.18 seconds.
-- Epoch 69
Norm: 8.62, NNZs: 1048576, Bias: -2.385312, T: 212934, Avg. loss: 0.008389
Total training time: 69.21 seconds.
-- Epoch 70
Norm: 8.65, NNZs: 1048576, Bias: -2.384366, T: 216020, Avg. loss: 0.008309
Total training time: 70.23 seconds.
-- Epoch 71
Norm: 8.58, NNZs: 1048576, Bias: -2.387040, T: 219106, Avg. loss: 0.008231
Total training time: 71.26 seconds.
-- Epoch 72
Norm: 8.61, NNZs: 1048576, Bias: -2.385715, T: 222192, Avg. loss: 0.008157
Total training time: 72.29 seconds.
-- Epoch 73
Norm: 8.62, NNZs: 1048576, Bias: -2.385872, T: 225278, Avg. loss: 0.008083
Total training time: 73.32 seconds.
-- Epoch 74
Norm: 8.61, NNZs: 1048576, Bias: -2.385979, T: 228364, Avg. loss: 0.008013
Total training time: 74.35 seconds.
-- Epoch 75
Norm: 8.61, NNZs: 1048576, Bias: -2.385847, T: 231450, Avg. loss: 0.007945
Total training time: 75.38 seconds.
-- Epoch 76
Norm: 8.60, NNZs: 1048576, Bias: -2.386059, T: 234536, Avg. loss: 0.007878
Total training time: 76.41 seconds.
-- Epoch 77
Norm: 8.56, NNZs: 1048576, Bias: -2.387525, T: 237622, Avg. loss: 0.007811
Total training time: 77.45 seconds.
-- Epoch 78
Norm: 8.59, NNZs: 1048576, Bias: -2.386445, T: 240708, Avg. loss: 0.007749
Total training time: 78.47 seconds.
-- Epoch 79
Norm: 8.59, NNZs: 1048576, Bias: -2.386271, T: 243794, Avg. loss: 0.007687
Total training time: 79.50 seconds.
-- Epoch 80
Norm: 8.59, NNZs: 1048576, Bias: -2.386524, T: 246880, Avg. loss: 0.007626
Total training time: 80.54 seconds.
-- Epoch 81
Norm: 8.59, NNZs: 1048576, Bias: -2.386246, T: 249966, Avg. loss: 0.007567
Total training time: 81.55 seconds.
-- Epoch 82
Norm: 8.59, NNZs: 1048576, Bias: -2.386657, T: 253052, Avg. loss: 0.007509
Total training time: 82.59 seconds.
-- Epoch 83
Norm: 8.58, NNZs: 1048576, Bias: -2.386992, T: 256138, Avg. loss: 0.007452
Total training time: 83.63 seconds.
-- Epoch 84
Norm: 8.60, NNZs: 1048576, Bias: -2.386511, T: 259224, Avg. loss: 0.007397
Total training time: 84.67 seconds.
-- Epoch 85
Norm: 8.60, NNZs: 1048576, Bias: -2.386426, T: 262310, Avg. loss: 0.007344
Total training time: 85.70 seconds.
-- Epoch 86
Norm: 8.58, NNZs: 1048576, Bias: -2.387260, T: 265396, Avg. loss: 0.007292
Total training time: 86.74 seconds.
-- Epoch 87
Norm: 8.58, NNZs: 1048576, Bias: -2.387303, T: 268482, Avg. loss: 0.007241
Total training time: 87.77 seconds.
-- Epoch 88
Norm: 8.58, NNZs: 1048576, Bias: -2.387221, T: 271568, Avg. loss: 0.007191
Total training time: 88.81 seconds.
-- Epoch 89
Norm: 8.60, NNZs: 1048576, Bias: -2.386639, T: 274654, Avg. loss: 0.007142
Total training time: 89.84 seconds.
-- Epoch 90
Norm: 8.58, NNZs: 1048576, Bias: -2.387152, T: 277740, Avg. loss: 0.007095
Total training time: 90.87 seconds.
-- Epoch 91
Norm: 8.59, NNZs: 1048576, Bias: -2.386903, T: 280826, Avg. loss: 0.007047
Total training time: 91.91 seconds.
-- Epoch 92
Norm: 8.58, NNZs: 1048576, Bias: -2.387195, T: 283912, Avg. loss: 0.007002
Total training time: 92.95 seconds.
-- Epoch 93
Norm: 8.57, NNZs: 1048576, Bias: -2.387936, T: 286998, Avg. loss: 0.006956
Total training time: 93.99 seconds.
-- Epoch 94
Norm: 8.57, NNZs: 1048576, Bias: -2.387712, T: 290084, Avg. loss: 0.006913
Total training time: 95.03 seconds.
-- Epoch 95
Norm: 8.59, NNZs: 1048576, Bias: -2.387103, T: 293170, Avg. loss: 0.006869
Total training time: 96.06 seconds.
-- Epoch 96
Norm: 8.60, NNZs: 1048576, Bias: -2.386830, T: 296256, Avg. loss: 0.006827
Total training time: 97.09 seconds.
-- Epoch 97
Norm: 8.57, NNZs: 1048576, Bias: -2.388183, T: 299342, Avg. loss: 0.006785
Total training time: 98.14 seconds.
-- Epoch 98
Norm: 8.56, NNZs: 1048576, Bias: -2.388442, T: 302428, Avg. loss: 0.006745
Total training time: 99.17 seconds.
-- Epoch 99
Norm: 8.57, NNZs: 1048576, Bias: -2.387878, T: 305514, Avg. loss: 0.006705
Total training time: 100.20 seconds.
-- Epoch 100
Norm: 8.57, NNZs: 1048576, Bias: -2.387840, T: 308600, Avg. loss: 0.006667
Total training time: 101.24 seconds.
-- Epoch 1
Norm: 39.75, NNZs: 520039, Bias: -1.172487, T: 3086, Avg. loss: 0.328657
Total training time: 0.84 seconds.
-- Epoch 2
Norm: 29.59, NNZs: 593331, Bias: -1.334361, T: 6172, Avg. loss: 0.203309
Total training time: 1.68 seconds.
-- Epoch 3
Norm: 23.76, NNZs: 598940, Bias: -1.350860, T: 9258, Avg. loss: 0.144297
Total training time: 2.53 seconds.
-- Epoch 4
Norm: 20.10, NNZs: 605169, Bias: -1.370536, T: 12344, Avg. loss: 0.111457
Total training time: 3.37 seconds.
-- Epoch 5
Norm: 17.52, NNZs: 609251, Bias: -1.363389, T: 15430, Avg. loss: 0.090362
Total training time: 4.21 seconds.
-- Epoch 6
Norm: 15.84, NNZs: 614894, Bias: -1.375155, T: 18516, Avg. loss: 0.076133
Total training time: 5.06 seconds.
-- Epoch 7
Norm: 14.63, NNZs: 617538, Bias: -1.381805, T: 21602, Avg. loss: 0.065980
Total training time: 5.90 seconds.
-- Epoch 8
Norm: 13.91, NNZs: 623704, Bias: -1.387283, T: 24688, Avg. loss: 0.058441
Total training time: 6.75 seconds.
-- Epoch 9
Norm: 13.36, NNZs: 626048, Bias: -1.391225, T: 27774, Avg. loss: 0.052534
Total training time: 7.59 seconds.
-- Epoch 10
Norm: 12.94, NNZs: 636746, Bias: -1.391878, T: 30860, Avg. loss: 0.047819
Total training time: 8.44 seconds.
-- Epoch 11
Norm: 12.57, NNZs: 639575, Bias: -1.398309, T: 33946, Avg. loss: 0.043952
Total training time: 9.29 seconds.
-- Epoch 12
Norm: 12.37, NNZs: 642117, Bias: -1.397697, T: 37032, Avg. loss: 0.040731
Total training time: 10.14 seconds.
-- Epoch 13
Norm: 12.07, NNZs: 647809, Bias: -1.397327, T: 40118, Avg. loss: 0.037977
Total training time: 10.98 seconds.
-- Epoch 14
Norm: 11.91, NNZs: 648614, Bias: -1.395024, T: 43204, Avg. loss: 0.035643
Total training time: 11.83 seconds.
-- Epoch 15
Norm: 11.69, NNZs: 653727, Bias: -1.401937, T: 46290, Avg. loss: 0.033626
Total training time: 12.68 seconds.
-- Epoch 16
Norm: 11.65, NNZs: 654393, Bias: -1.402239, T: 49376, Avg. loss: 0.031869
Total training time: 13.53 seconds.
-- Epoch 17
Norm: 11.54, NNZs: 654935, Bias: -1.406454, T: 52462, Avg. loss: 0.030316
Total training time: 14.38 seconds.
-- Epoch 18
Norm: 11.52, NNZs: 655136, Bias: -1.403302, T: 55548, Avg. loss: 0.028936
Total training time: 15.23 seconds.
-- Epoch 19
Norm: 11.40, NNZs: 655392, Bias: -1.408476, T: 58634, Avg. loss: 0.027697
Total training time: 16.08 seconds.
-- Epoch 20
Norm: 11.34, NNZs: 655782, Bias: -1.411190, T: 61720, Avg. loss: 0.026582
Total training time: 16.93 seconds.
-- Epoch 21
Norm: 11.31, NNZs: 656496, Bias: -1.413075, T: 64806, Avg. loss: 0.025567
Total training time: 17.79 seconds.
-- Epoch 22
Norm: 11.25, NNZs: 658144, Bias: -1.414211, T: 67892, Avg. loss: 0.024639
Total training time: 18.64 seconds.
-- Epoch 23
Norm: 11.18, NNZs: 658189, Bias: -1.416606, T: 70978, Avg. loss: 0.023788
Total training time: 19.49 seconds.
-- Epoch 24
Norm: 11.14, NNZs: 658349, Bias: -1.416274, T: 74064, Avg. loss: 0.023012
Total training time: 20.34 seconds.
-- Epoch 25
Norm: 11.12, NNZs: 659026, Bias: -1.418407, T: 77150, Avg. loss: 0.022296
Total training time: 21.19 seconds.
-- Epoch 26
Norm: 11.05, NNZs: 659305, Bias: -1.419376, T: 80236, Avg. loss: 0.021645
Total training time: 22.04 seconds.
-- Epoch 27
Norm: 11.08, NNZs: 659482, Bias: -1.418643, T: 83322, Avg. loss: 0.021040
Total training time: 22.90 seconds.
-- Epoch 28
Norm: 11.01, NNZs: 660501, Bias: -1.423481, T: 86408, Avg. loss: 0.020472
Total training time: 23.75 seconds.
-- Epoch 29
Norm: 10.99, NNZs: 660567, Bias: -1.423640, T: 89494, Avg. loss: 0.019948
Total training time: 24.60 seconds.
-- Epoch 30
Norm: 10.97, NNZs: 664392, Bias: -1.425656, T: 92580, Avg. loss: 0.019455
Total training time: 25.45 seconds.
-- Epoch 31
Norm: 10.92, NNZs: 673356, Bias: -1.427894, T: 95666, Avg. loss: 0.018992
Total training time: 26.31 seconds.
-- Epoch 32
Norm: 10.94, NNZs: 673765, Bias: -1.427269, T: 98752, Avg. loss: 0.018561
Total training time: 27.16 seconds.
-- Epoch 33
Norm: 10.90, NNZs: 673912, Bias: -1.429475, T: 101838, Avg. loss: 0.018154
Total training time: 28.01 seconds.
-- Epoch 34
Norm: 10.90, NNZs: 674667, Bias: -1.426645, T: 104924, Avg. loss: 0.017765
Total training time: 28.86 seconds.
-- Epoch 35
Norm: 10.87, NNZs: 675178, Bias: -1.428691, T: 108010, Avg. loss: 0.017406
Total training time: 29.71 seconds.
-- Epoch 36
Norm: 10.86, NNZs: 675178, Bias: -1.430834, T: 111096, Avg. loss: 0.017066
Total training time: 30.57 seconds.
-- Epoch 37
Norm: 10.85, NNZs: 676183, Bias: -1.430985, T: 114182, Avg. loss: 0.016745
Total training time: 31.42 seconds.
-- Epoch 38
Norm: 10.85, NNZs: 676183, Bias: -1.430287, T: 117268, Avg. loss: 0.016440
Total training time: 32.27 seconds.
-- Epoch 39
Norm: 10.82, NNZs: 676183, Bias: -1.432379, T: 120354, Avg. loss: 0.016147
Total training time: 33.26 seconds.
-- Epoch 40
Norm: 10.80, NNZs: 676450, Bias: -1.435225, T: 123440, Avg. loss: 0.015871
Total training time: 34.18 seconds.
-- Epoch 41
Norm: 10.80, NNZs: 676450, Bias: -1.435742, T: 126526, Avg. loss: 0.015610
Total training time: 35.04 seconds.
-- Epoch 42
Norm: 10.78, NNZs: 676478, Bias: -1.436499, T: 129612, Avg. loss: 0.015362
Total training time: 35.89 seconds.
-- Epoch 43
Norm: 10.75, NNZs: 676478, Bias: -1.438975, T: 132698, Avg. loss: 0.015119
Total training time: 36.74 seconds.
-- Epoch 44
Norm: 10.76, NNZs: 676731, Bias: -1.438136, T: 135784, Avg. loss: 0.014891
Total training time: 37.59 seconds.
-- Epoch 45
Norm: 10.75, NNZs: 676731, Bias: -1.437092, T: 138870, Avg. loss: 0.014673
Total training time: 38.44 seconds.
-- Epoch 46
Norm: 10.75, NNZs: 676731, Bias: -1.438113, T: 141956, Avg. loss: 0.014466
Total training time: 39.30 seconds.
-- Epoch 47
Norm: 10.73, NNZs: 676731, Bias: -1.440802, T: 145042, Avg. loss: 0.014268
Total training time: 40.15 seconds.
-- Epoch 48
Norm: 10.74, NNZs: 676731, Bias: -1.441051, T: 148128, Avg. loss: 0.014077
Total training time: 41.01 seconds.
-- Epoch 49
Norm: 10.75, NNZs: 676731, Bias: -1.440810, T: 151214, Avg. loss: 0.013893
Total training time: 41.86 seconds.
-- Epoch 50
Norm: 10.72, NNZs: 676731, Bias: -1.442397, T: 154300, Avg. loss: 0.013717
Total training time: 42.71 seconds.
-- Epoch 51
Norm: 10.72, NNZs: 676731, Bias: -1.442145, T: 157386, Avg. loss: 0.013550
Total training time: 43.56 seconds.
-- Epoch 52
Norm: 10.70, NNZs: 676731, Bias: -1.444459, T: 160472, Avg. loss: 0.013386
Total training time: 44.42 seconds.
-- Epoch 53
Norm: 10.70, NNZs: 676930, Bias: -1.444148, T: 163558, Avg. loss: 0.013231
Total training time: 45.27 seconds.
-- Epoch 54
Norm: 10.69, NNZs: 676930, Bias: -1.445122, T: 166644, Avg. loss: 0.013080
Total training time: 46.12 seconds.
-- Epoch 55
Norm: 10.68, NNZs: 676930, Bias: -1.446134, T: 169730, Avg. loss: 0.012933
Total training time: 46.98 seconds.
-- Epoch 56
Norm: 10.69, NNZs: 676930, Bias: -1.444745, T: 172816, Avg. loss: 0.012793
Total training time: 47.83 seconds.
-- Epoch 57
Norm: 10.68, NNZs: 677996, Bias: -1.446578, T: 175902, Avg. loss: 0.012658
Total training time: 48.68 seconds.
-- Epoch 58
Norm: 10.68, NNZs: 677996, Bias: -1.446980, T: 178988, Avg. loss: 0.012527
Total training time: 49.54 seconds.
-- Epoch 59
Norm: 10.67, NNZs: 678041, Bias: -1.448586, T: 182074, Avg. loss: 0.012400
Total training time: 50.39 seconds.
-- Epoch 60
Norm: 10.67, NNZs: 678041, Bias: -1.448428, T: 185160, Avg. loss: 0.012278
Total training time: 51.25 seconds.
-- Epoch 61
Norm: 10.66, NNZs: 678041, Bias: -1.449285, T: 188246, Avg. loss: 0.012158
Total training time: 52.10 seconds.
-- Epoch 62
Norm: 10.67, NNZs: 678041, Bias: -1.448317, T: 191332, Avg. loss: 0.012044
Total training time: 52.95 seconds.
-- Epoch 63
Norm: 10.65, NNZs: 678072, Bias: -1.450770, T: 194418, Avg. loss: 0.011933
Total training time: 53.81 seconds.
-- Epoch 64
Norm: 10.67, NNZs: 678072, Bias: -1.449019, T: 197504, Avg. loss: 0.011824
Total training time: 54.66 seconds.
-- Epoch 65
Norm: 10.64, NNZs: 678072, Bias: -1.451512, T: 200590, Avg. loss: 0.011719
Total training time: 55.51 seconds.
-- Epoch 66
Norm: 10.64, NNZs: 678072, Bias: -1.452137, T: 203676, Avg. loss: 0.011618
Total training time: 56.37 seconds.
-- Epoch 67
Norm: 10.64, NNZs: 678072, Bias: -1.452552, T: 206762, Avg. loss: 0.011520
Total training time: 57.22 seconds.
-- Epoch 68
Norm: 10.63, NNZs: 678327, Bias: -1.452885, T: 209848, Avg. loss: 0.011423
Total training time: 58.07 seconds.
-- Epoch 69
Norm: 10.61, NNZs: 678327, Bias: -1.455266, T: 212934, Avg. loss: 0.011330
Total training time: 58.93 seconds.
-- Epoch 70
Norm: 10.62, NNZs: 678327, Bias: -1.455033, T: 216020, Avg. loss: 0.011241
Total training time: 59.78 seconds.
-- Epoch 71
Norm: 10.63, NNZs: 678327, Bias: -1.453629, T: 219106, Avg. loss: 0.011154
Total training time: 60.64 seconds.
-- Epoch 72
Norm: 10.62, NNZs: 705449, Bias: -1.454862, T: 222192, Avg. loss: 0.011069
Total training time: 61.50 seconds.
-- Epoch 73
Norm: 10.62, NNZs: 705449, Bias: -1.455562, T: 225278, Avg. loss: 0.010986
Total training time: 62.35 seconds.
-- Epoch 74
Norm: 10.62, NNZs: 705449, Bias: -1.455251, T: 228364, Avg. loss: 0.010906
Total training time: 63.20 seconds.
-- Epoch 75
Norm: 10.63, NNZs: 705449, Bias: -1.455490, T: 231450, Avg. loss: 0.010827
Total training time: 64.06 seconds.
-- Epoch 76
Norm: 10.62, NNZs: 705449, Bias: -1.456308, T: 234536, Avg. loss: 0.010751
Total training time: 64.91 seconds.
-- Epoch 77
Norm: 10.64, NNZs: 705449, Bias: -1.454973, T: 237622, Avg. loss: 0.010675
Total training time: 65.76 seconds.
-- Epoch 78
Norm: 10.62, NNZs: 705449, Bias: -1.456650, T: 240708, Avg. loss: 0.010602
Total training time: 66.62 seconds.
-- Epoch 79
Norm: 10.60, NNZs: 705449, Bias: -1.458473, T: 243794, Avg. loss: 0.010531
Total training time: 67.47 seconds.
-- Epoch 80
Norm: 10.62, NNZs: 705476, Bias: -1.457318, T: 246880, Avg. loss: 0.010462
Total training time: 68.32 seconds.
-- Epoch 81
Norm: 10.61, NNZs: 705476, Bias: -1.458412, T: 249966, Avg. loss: 0.010395
Total training time: 69.18 seconds.
-- Epoch 82
Norm: 10.60, NNZs: 705476, Bias: -1.459469, T: 253052, Avg. loss: 0.010329
Total training time: 70.03 seconds.
-- Epoch 83
Norm: 10.60, NNZs: 705476, Bias: -1.458628, T: 256138, Avg. loss: 0.010265
Total training time: 70.88 seconds.
-- Epoch 84
Norm: 10.61, NNZs: 705476, Bias: -1.459007, T: 259224, Avg. loss: 0.010202
Total training time: 71.74 seconds.
-- Epoch 85
Norm: 10.60, NNZs: 705476, Bias: -1.459641, T: 262310, Avg. loss: 0.010141
Total training time: 72.59 seconds.
-- Epoch 86
Norm: 10.61, NNZs: 705476, Bias: -1.458760, T: 265396, Avg. loss: 0.010080
Total training time: 73.45 seconds.
-- Epoch 87
Norm: 10.60, NNZs: 705476, Bias: -1.460177, T: 268482, Avg. loss: 0.010021
Total training time: 74.30 seconds.
-- Epoch 88
Norm: 10.59, NNZs: 705476, Bias: -1.461403, T: 271568, Avg. loss: 0.009963
Total training time: 75.16 seconds.
-- Epoch 89
Norm: 10.60, NNZs: 705476, Bias: -1.460308, T: 274654, Avg. loss: 0.009906
Total training time: 76.01 seconds.
-- Epoch 90
Norm: 10.58, NNZs: 705476, Bias: -1.462142, T: 277740, Avg. loss: 0.009852
Total training time: 76.87 seconds.
-- Epoch 91
Norm: 10.59, NNZs: 705476, Bias: -1.461373, T: 280826, Avg. loss: 0.009799
Total training time: 77.72 seconds.
-- Epoch 92
Norm: 10.58, NNZs: 705476, Bias: -1.462605, T: 283912, Avg. loss: 0.009747
Total training time: 78.58 seconds.
-- Epoch 93
Norm: 10.58, NNZs: 705476, Bias: -1.462501, T: 286998, Avg. loss: 0.009696
Total training time: 79.43 seconds.
-- Epoch 94
Norm: 10.59, NNZs: 705476, Bias: -1.461625, T: 290084, Avg. loss: 0.009645
Total training time: 80.28 seconds.
-- Epoch 95
Norm: 10.57, NNZs: 705491, Bias: -1.463846, T: 293170, Avg. loss: 0.009596
Total training time: 81.14 seconds.
-- Epoch 96
Norm: 10.57, NNZs: 705491, Bias: -1.463994, T: 296256, Avg. loss: 0.009549
Total training time: 81.99 seconds.
-- Epoch 97
Norm: 10.58, NNZs: 705491, Bias: -1.463350, T: 299342, Avg. loss: 0.009501
Total training time: 82.85 seconds.
-- Epoch 98
Norm: 10.56, NNZs: 705491, Bias: -1.465282, T: 302428, Avg. loss: 0.009454
Total training time: 83.70 seconds.
-- Epoch 99
Norm: 10.58, NNZs: 705491, Bias: -1.463383, T: 305514, Avg. loss: 0.009409
Total training time: 84.55 seconds.
-- Epoch 100
Norm: 10.56, NNZs: 705655, Bias: -1.466201, T: 308600, Avg. loss: 0.009364
Total training time: 85.41 seconds.
-- Epoch 1
Norm: 126.99, NNZs: 1047643, Bias: 0.467605, T: 3086, Avg. loss: 3.077330
Total training time: 0.95 seconds.
-- Epoch 2
Norm: 89.68, NNZs: 1048532, Bias: 0.551026, T: 6172, Avg. loss: 1.896222
Total training time: 1.90 seconds.
-- Epoch 3
Norm: 71.54, NNZs: 1048570, Bias: 0.468141, T: 9258, Avg. loss: 1.377010
Total training time: 2.88 seconds.
-- Epoch 4
Norm: 60.25, NNZs: 1048574, Bias: 0.529939, T: 12344, Avg. loss: 1.077210
Total training time: 3.86 seconds.
-- Epoch 5
Norm: 52.84, NNZs: 1048576, Bias: 0.502964, T: 15430, Avg. loss: 0.884142
Total training time: 4.86 seconds.
-- Epoch 6
Norm: 47.90, NNZs: 1048576, Bias: 0.513831, T: 18516, Avg. loss: 0.754105
Total training time: 5.90 seconds.
-- Epoch 7
Norm: 44.17, NNZs: 1048576, Bias: 0.491099, T: 21602, Avg. loss: 0.658543
Total training time: 6.96 seconds.
-- Epoch 8
Norm: 41.84, NNZs: 1048576, Bias: 0.451884, T: 24688, Avg. loss: 0.585925
Total training time: 8.02 seconds.
-- Epoch 9
Norm: 40.13, NNZs: 1048576, Bias: 0.465085, T: 27774, Avg. loss: 0.529078
Total training time: 9.14 seconds.
-- Epoch 10
Norm: 38.87, NNZs: 1048576, Bias: 0.455133, T: 30860, Avg. loss: 0.483626
Total training time: 10.27 seconds.
-- Epoch 11
Norm: 37.87, NNZs: 1048576, Bias: 0.435238, T: 33946, Avg. loss: 0.446203
Total training time: 11.37 seconds.
-- Epoch 12
Norm: 37.02, NNZs: 1048576, Bias: 0.437174, T: 37032, Avg. loss: 0.414929
Total training time: 12.51 seconds.
-- Epoch 13
Norm: 36.41, NNZs: 1048576, Bias: 0.419509, T: 40118, Avg. loss: 0.388305
Total training time: 13.66 seconds.
-- Epoch 14
Norm: 35.88, NNZs: 1048576, Bias: 0.440014, T: 43204, Avg. loss: 0.365426
Total training time: 14.80 seconds.
-- Epoch 15
Norm: 35.54, NNZs: 1048576, Bias: 0.434295, T: 46290, Avg. loss: 0.345675
Total training time: 15.97 seconds.
-- Epoch 16
Norm: 35.25, NNZs: 1048576, Bias: 0.422166, T: 49376, Avg. loss: 0.328319
Total training time: 17.16 seconds.
-- Epoch 17
Norm: 35.03, NNZs: 1048576, Bias: 0.415247, T: 52462, Avg. loss: 0.313027
Total training time: 18.35 seconds.
-- Epoch 18
Norm: 34.76, NNZs: 1048576, Bias: 0.418613, T: 55548, Avg. loss: 0.299290
Total training time: 19.54 seconds.
-- Epoch 19
Norm: 34.57, NNZs: 1048576, Bias: 0.400862, T: 58634, Avg. loss: 0.286963
Total training time: 20.73 seconds.
-- Epoch 20
Norm: 34.40, NNZs: 1048576, Bias: 0.402182, T: 61720, Avg. loss: 0.275959
Total training time: 21.93 seconds.
-- Epoch 21
Norm: 34.24, NNZs: 1048576, Bias: 0.402108, T: 64806, Avg. loss: 0.265984
Total training time: 23.14 seconds.
-- Epoch 22
Norm: 34.08, NNZs: 1048576, Bias: 0.397133, T: 67892, Avg. loss: 0.256906
Total training time: 24.33 seconds.
-- Epoch 23
Norm: 33.96, NNZs: 1048576, Bias: 0.403552, T: 70978, Avg. loss: 0.248616
Total training time: 25.54 seconds.
-- Epoch 24
Norm: 33.84, NNZs: 1048576, Bias: 0.397291, T: 74064, Avg. loss: 0.240940
Total training time: 26.74 seconds.
-- Epoch 25
Norm: 33.72, NNZs: 1048576, Bias: 0.396498, T: 77150, Avg. loss: 0.233951
Total training time: 27.97 seconds.
-- Epoch 26
Norm: 33.65, NNZs: 1048576, Bias: 0.386990, T: 80236, Avg. loss: 0.227456
Total training time: 29.23 seconds.
-- Epoch 27
Norm: 33.58, NNZs: 1048576, Bias: 0.391163, T: 83322, Avg. loss: 0.221425
Total training time: 30.46 seconds.
-- Epoch 28
Norm: 33.49, NNZs: 1048576, Bias: 0.395420, T: 86408, Avg. loss: 0.215814
Total training time: 31.68 seconds.
-- Epoch 29
Norm: 33.44, NNZs: 1048576, Bias: 0.386859, T: 89494, Avg. loss: 0.210560
Total training time: 32.97 seconds.
-- Epoch 30
Norm: 33.39, NNZs: 1048576, Bias: 0.387481, T: 92580, Avg. loss: 0.205681
Total training time: 34.23 seconds.
-- Epoch 31
Norm: 33.32, NNZs: 1048576, Bias: 0.387182, T: 95666, Avg. loss: 0.201111
Total training time: 35.47 seconds.
-- Epoch 32
Norm: 33.28, NNZs: 1048576, Bias: 0.384413, T: 98752, Avg. loss: 0.196835
Total training time: 36.71 seconds.
-- Epoch 33
Norm: 33.21, NNZs: 1048576, Bias: 0.381962, T: 101838, Avg. loss: 0.192791
Total training time: 37.98 seconds.
-- Epoch 34
Norm: 33.15, NNZs: 1048576, Bias: 0.384489, T: 104924, Avg. loss: 0.188977
Total training time: 39.26 seconds.
-- Epoch 35
Norm: 33.13, NNZs: 1048576, Bias: 0.384823, T: 108010, Avg. loss: 0.185418
Total training time: 40.52 seconds.
-- Epoch 36
Norm: 33.09, NNZs: 1048576, Bias: 0.380463, T: 111096, Avg. loss: 0.182032
Total training time: 41.78 seconds.
-- Epoch 37
Norm: 33.04, NNZs: 1048576, Bias: 0.381027, T: 114182, Avg. loss: 0.178816
Total training time: 43.05 seconds.
-- Epoch 38
Norm: 33.01, NNZs: 1048576, Bias: 0.376214, T: 117268, Avg. loss: 0.175771
Total training time: 44.32 seconds.
-- Epoch 39
Norm: 32.97, NNZs: 1048576, Bias: 0.376310, T: 120354, Avg. loss: 0.172881
Total training time: 45.57 seconds.
-- Epoch 40
Norm: 32.93, NNZs: 1048576, Bias: 0.378163, T: 123440, Avg. loss: 0.170134
Total training time: 46.85 seconds.
-- Epoch 41
Norm: 32.90, NNZs: 1048576, Bias: 0.375240, T: 126526, Avg. loss: 0.167507
Total training time: 48.13 seconds.
-- Epoch 42
Norm: 32.88, NNZs: 1048576, Bias: 0.372173, T: 129612, Avg. loss: 0.165020
Total training time: 49.42 seconds.
-- Epoch 43
Norm: 32.85, NNZs: 1048576, Bias: 0.370888, T: 132698, Avg. loss: 0.162626
Total training time: 50.70 seconds.
-- Epoch 44
Norm: 32.82, NNZs: 1048576, Bias: 0.372830, T: 135784, Avg. loss: 0.160361
Total training time: 51.97 seconds.
-- Epoch 45
Norm: 32.80, NNZs: 1048576, Bias: 0.370261, T: 138870, Avg. loss: 0.158200
Total training time: 53.25 seconds.
-- Epoch 46
Norm: 32.77, NNZs: 1048576, Bias: 0.373206, T: 141956, Avg. loss: 0.156128
Total training time: 54.50 seconds.
-- Epoch 47
Norm: 32.74, NNZs: 1048576, Bias: 0.373751, T: 145042, Avg. loss: 0.154128
Total training time: 55.76 seconds.
-- Epoch 48
Norm: 32.74, NNZs: 1048576, Bias: 0.368557, T: 148128, Avg. loss: 0.152219
Total training time: 57.04 seconds.
-- Epoch 49
Norm: 32.71, NNZs: 1048576, Bias: 0.368791, T: 151214, Avg. loss: 0.150368
Total training time: 58.33 seconds.
-- Epoch 50
Norm: 32.69, NNZs: 1048576, Bias: 0.366586, T: 154300, Avg. loss: 0.148609
Total training time: 59.58 seconds.
-- Epoch 51
Norm: 32.67, NNZs: 1048576, Bias: 0.364009, T: 157386, Avg. loss: 0.146904
Total training time: 60.85 seconds.
-- Epoch 52
Norm: 32.64, NNZs: 1048576, Bias: 0.368638, T: 160472, Avg. loss: 0.145248
Total training time: 62.13 seconds.
-- Epoch 53
Norm: 32.64, NNZs: 1048576, Bias: 0.366758, T: 163558, Avg. loss: 0.143679
Total training time: 63.41 seconds.
-- Epoch 54
Norm: 32.62, NNZs: 1048576, Bias: 0.362123, T: 166644, Avg. loss: 0.142163
Total training time: 64.66 seconds.
-- Epoch 55
Norm: 32.60, NNZs: 1048576, Bias: 0.365537, T: 169730, Avg. loss: 0.140701
Total training time: 65.93 seconds.
-- Epoch 56
Norm: 32.58, NNZs: 1048576, Bias: 0.363543, T: 172816, Avg. loss: 0.139298
Total training time: 67.20 seconds.
-- Epoch 57
Norm: 32.57, NNZs: 1048576, Bias: 0.360071, T: 175902, Avg. loss: 0.137943
Total training time: 68.72 seconds.
-- Epoch 58
Norm: 32.55, NNZs: 1048576, Bias: 0.361456, T: 178988, Avg. loss: 0.136640
Total training time: 70.02 seconds.
-- Epoch 59
Norm: 32.54, NNZs: 1048576, Bias: 0.363521, T: 182074, Avg. loss: 0.135373
Total training time: 71.34 seconds.
-- Epoch 60
Norm: 32.54, NNZs: 1048576, Bias: 0.362528, T: 185160, Avg. loss: 0.134142
Total training time: 72.67 seconds.
-- Epoch 61
Norm: 32.52, NNZs: 1048576, Bias: 0.360267, T: 188246, Avg. loss: 0.132948
Total training time: 73.96 seconds.
-- Epoch 62
Norm: 32.50, NNZs: 1048576, Bias: 0.361567, T: 191332, Avg. loss: 0.131803
Total training time: 75.25 seconds.
-- Epoch 63
Norm: 32.50, NNZs: 1048576, Bias: 0.356758, T: 194418, Avg. loss: 0.130691
Total training time: 76.56 seconds.
-- Epoch 64
Norm: 32.48, NNZs: 1048576, Bias: 0.359106, T: 197504, Avg. loss: 0.129605
Total training time: 77.85 seconds.
-- Epoch 65
Norm: 32.48, NNZs: 1048576, Bias: 0.356143, T: 200590, Avg. loss: 0.128561
Total training time: 79.18 seconds.
-- Epoch 66
Norm: 32.45, NNZs: 1048576, Bias: 0.358177, T: 203676, Avg. loss: 0.127550
Total training time: 80.48 seconds.
-- Epoch 67
Norm: 32.45, NNZs: 1048576, Bias: 0.358556, T: 206762, Avg. loss: 0.126567
Total training time: 81.82 seconds.
-- Epoch 68
Norm: 32.44, NNZs: 1048576, Bias: 0.357500, T: 209848, Avg. loss: 0.125604
Total training time: 83.13 seconds.
-- Epoch 69
Norm: 32.43, NNZs: 1048576, Bias: 0.354133, T: 212934, Avg. loss: 0.124675
Total training time: 84.44 seconds.
-- Epoch 70
Norm: 32.42, NNZs: 1048576, Bias: 0.355801, T: 216020, Avg. loss: 0.123774
Total training time: 85.70 seconds.
-- Epoch 71
Norm: 32.40, NNZs: 1048576, Bias: 0.354090, T: 219106, Avg. loss: 0.122899
Total training time: 87.05 seconds.
-- Epoch 72
Norm: 32.39, NNZs: 1048576, Bias: 0.355480, T: 222192, Avg. loss: 0.122044
Total training time: 88.32 seconds.
-- Epoch 73
Norm: 32.39, NNZs: 1048576, Bias: 0.355981, T: 225278, Avg. loss: 0.121215
Total training time: 89.65 seconds.
-- Epoch 74
Norm: 32.38, NNZs: 1048576, Bias: 0.353984, T: 228364, Avg. loss: 0.120409
Total training time: 90.97 seconds.
-- Epoch 75
Norm: 32.37, NNZs: 1048576, Bias: 0.354412, T: 231450, Avg. loss: 0.119620
Total training time: 92.29 seconds.
-- Epoch 76
Norm: 32.36, NNZs: 1048576, Bias: 0.355660, T: 234536, Avg. loss: 0.118855
Total training time: 93.59 seconds.
-- Epoch 77
Norm: 32.35, NNZs: 1048576, Bias: 0.356777, T: 237622, Avg. loss: 0.118108
Total training time: 94.84 seconds.
-- Epoch 78
Norm: 32.35, NNZs: 1048576, Bias: 0.351818, T: 240708, Avg. loss: 0.117379
Total training time: 96.20 seconds.
-- Epoch 79
Norm: 32.34, NNZs: 1048576, Bias: 0.353002, T: 243794, Avg. loss: 0.116673
Total training time: 97.50 seconds.
-- Epoch 80
Norm: 32.33, NNZs: 1048576, Bias: 0.354604, T: 246880, Avg. loss: 0.115981
Total training time: 98.81 seconds.
-- Epoch 81
Norm: 32.33, NNZs: 1048576, Bias: 0.350320, T: 249966, Avg. loss: 0.115304
Total training time: 100.14 seconds.
-- Epoch 82
Norm: 32.32, NNZs: 1048576, Bias: 0.351505, T: 253052, Avg. loss: 0.114643
Total training time: 101.46 seconds.
-- Epoch 83
Norm: 32.32, NNZs: 1048576, Bias: 0.352578, T: 256138, Avg. loss: 0.113996
Total training time: 102.76 seconds.
-- Epoch 84
Norm: 32.31, NNZs: 1048576, Bias: 0.351172, T: 259224, Avg. loss: 0.113367
Total training time: 104.10 seconds.
-- Epoch 85
Norm: 32.30, NNZs: 1048576, Bias: 0.349552, T: 262310, Avg. loss: 0.112754
Total training time: 105.39 seconds.
-- Epoch 86
Norm: 32.30, NNZs: 1048576, Bias: 0.351072, T: 265396, Avg. loss: 0.112151
Total training time: 106.70 seconds.
-- Epoch 87
Norm: 32.30, NNZs: 1048576, Bias: 0.349928, T: 268482, Avg. loss: 0.111561
Total training time: 108.04 seconds.
-- Epoch 88
Norm: 32.30, NNZs: 1048576, Bias: 0.347433, T: 271568, Avg. loss: 0.110988
Total training time: 109.37 seconds.
-- Epoch 89
Norm: 32.28, NNZs: 1048576, Bias: 0.348634, T: 274654, Avg. loss: 0.110427
Total training time: 110.68 seconds.
-- Epoch 90
Norm: 32.27, NNZs: 1048576, Bias: 0.347943, T: 277740, Avg. loss: 0.109881
Total training time: 111.97 seconds.
-- Epoch 91
Norm: 32.27, NNZs: 1048576, Bias: 0.350040, T: 280826, Avg. loss: 0.109342
Total training time: 113.33 seconds.
-- Epoch 92
Norm: 32.27, NNZs: 1048576, Bias: 0.347406, T: 283912, Avg. loss: 0.108817
Total training time: 114.63 seconds.
-- Epoch 93
Norm: 32.26, NNZs: 1048576, Bias: 0.347929, T: 286998, Avg. loss: 0.108305
Total training time: 115.98 seconds.
-- Epoch 94
Norm: 32.26, NNZs: 1048576, Bias: 0.346743, T: 290084, Avg. loss: 0.107803
Total training time: 117.32 seconds.
-- Epoch 95
Norm: 32.25, NNZs: 1048576, Bias: 0.349089, T: 293170, Avg. loss: 0.107312
Total training time: 118.59 seconds.
-- Epoch 96
Norm: 32.24, NNZs: 1048576, Bias: 0.348864, T: 296256, Avg. loss: 0.106828
Total training time: 119.91 seconds.
-- Epoch 97
Norm: 32.24, NNZs: 1048576, Bias: 0.347671, T: 299342, Avg. loss: 0.106353
Total training time: 121.27 seconds.
-- Epoch 98
Norm: 32.24, NNZs: 1048576, Bias: 0.346834, T: 302428, Avg. loss: 0.105894
Total training time: 122.60 seconds.
-- Epoch 99
Norm: 32.23, NNZs: 1048576, Bias: 0.346883, T: 305514, Avg. loss: 0.105441
Total training time: 123.91 seconds.
-- Epoch 100
Norm: 32.23, NNZs: 1048576, Bias: 0.345527, T: 308600, Avg. loss: 0.104994
Total training time: 125.23 seconds.
-- Epoch 1
Norm: 38.64, NNZs: 171107, Bias: -1.125340, T: 3086, Avg. loss: 0.255091
Total training time: 0.93 seconds.
-- Epoch 2
Norm: 27.14, NNZs: 207000, Bias: -1.151550, T: 6172, Avg. loss: 0.155965
Total training time: 1.86 seconds.
-- Epoch 3
Norm: 21.02, NNZs: 212553, Bias: -1.163631, T: 9258, Avg. loss: 0.112561
Total training time: 2.79 seconds.
-- Epoch 4
Norm: 17.46, NNZs: 242267, Bias: -1.152765, T: 12344, Avg. loss: 0.088504
Total training time: 3.73 seconds.
-- Epoch 5
Norm: 15.21, NNZs: 253820, Bias: -1.152612, T: 15430, Avg. loss: 0.073092
Total training time: 4.66 seconds.
-- Epoch 6
Norm: 13.80, NNZs: 258362, Bias: -1.155061, T: 18516, Avg. loss: 0.062182
Total training time: 5.59 seconds.
-- Epoch 7
Norm: 12.89, NNZs: 265437, Bias: -1.149186, T: 21602, Avg. loss: 0.054244
Total training time: 6.53 seconds.
-- Epoch 8
Norm: 12.01, NNZs: 268279, Bias: -1.154386, T: 24688, Avg. loss: 0.048230
Total training time: 7.46 seconds.
-- Epoch 9
Norm: 11.61, NNZs: 274381, Bias: -1.136866, T: 27774, Avg. loss: 0.043513
Total training time: 8.39 seconds.
-- Epoch 10
Norm: 11.06, NNZs: 278602, Bias: -1.152600, T: 30860, Avg. loss: 0.039800
Total training time: 9.33 seconds.
-- Epoch 11
Norm: 10.86, NNZs: 282663, Bias: -1.143829, T: 33946, Avg. loss: 0.036708
Total training time: 10.26 seconds.
-- Epoch 12
Norm: 10.64, NNZs: 289278, Bias: -1.142647, T: 37032, Avg. loss: 0.034123
Total training time: 11.19 seconds.
-- Epoch 13
Norm: 10.43, NNZs: 299123, Bias: -1.146345, T: 40118, Avg. loss: 0.031888
Total training time: 12.13 seconds.
-- Epoch 14
Norm: 10.31, NNZs: 300855, Bias: -1.141650, T: 43204, Avg. loss: 0.030010
Total training time: 13.06 seconds.
-- Epoch 15
Norm: 10.15, NNZs: 301732, Bias: -1.139459, T: 46290, Avg. loss: 0.028381
Total training time: 14.00 seconds.
-- Epoch 16
Norm: 10.03, NNZs: 308244, Bias: -1.143770, T: 49376, Avg. loss: 0.026956
Total training time: 14.94 seconds.
-- Epoch 17
Norm: 9.95, NNZs: 308782, Bias: -1.141516, T: 52462, Avg. loss: 0.025690
Total training time: 15.88 seconds.
-- Epoch 18
Norm: 9.89, NNZs: 309215, Bias: -1.140929, T: 55548, Avg. loss: 0.024552
Total training time: 16.81 seconds.
-- Epoch 19
Norm: 9.80, NNZs: 312688, Bias: -1.138807, T: 58634, Avg. loss: 0.023525
Total training time: 17.74 seconds.
-- Epoch 20
Norm: 9.79, NNZs: 313460, Bias: -1.134348, T: 61720, Avg. loss: 0.022617
Total training time: 18.68 seconds.
-- Epoch 21
Norm: 9.69, NNZs: 317380, Bias: -1.137670, T: 64806, Avg. loss: 0.021782
Total training time: 19.62 seconds.
-- Epoch 22
Norm: 9.67, NNZs: 319885, Bias: -1.134539, T: 67892, Avg. loss: 0.021034
Total training time: 20.56 seconds.
-- Epoch 23
Norm: 9.60, NNZs: 319959, Bias: -1.136131, T: 70978, Avg. loss: 0.020345
Total training time: 21.50 seconds.
-- Epoch 24
Norm: 9.58, NNZs: 322104, Bias: -1.135319, T: 74064, Avg. loss: 0.019702
Total training time: 22.43 seconds.
-- Epoch 25
Norm: 9.52, NNZs: 324360, Bias: -1.135620, T: 77150, Avg. loss: 0.019114
Total training time: 23.37 seconds.
-- Epoch 26
Norm: 9.51, NNZs: 367464, Bias: -1.134623, T: 80236, Avg. loss: 0.018574
Total training time: 24.32 seconds.
-- Epoch 27
Norm: 9.46, NNZs: 367508, Bias: -1.136472, T: 83322, Avg. loss: 0.018076
Total training time: 25.26 seconds.
-- Epoch 28
Norm: 9.45, NNZs: 385261, Bias: -1.133429, T: 86408, Avg. loss: 0.017616
Total training time: 26.20 seconds.
-- Epoch 29
Norm: 9.41, NNZs: 385918, Bias: -1.131980, T: 89494, Avg. loss: 0.017180
Total training time: 27.14 seconds.
-- Epoch 30
Norm: 9.38, NNZs: 389346, Bias: -1.135097, T: 92580, Avg. loss: 0.016776
Total training time: 28.08 seconds.
-- Epoch 31
Norm: 9.38, NNZs: 389533, Bias: -1.131403, T: 95666, Avg. loss: 0.016395
Total training time: 29.02 seconds.
-- Epoch 32
Norm: 9.37, NNZs: 389765, Bias: -1.129158, T: 98752, Avg. loss: 0.016040
Total training time: 29.96 seconds.
-- Epoch 33
Norm: 9.36, NNZs: 390347, Bias: -1.127257, T: 101838, Avg. loss: 0.015699
Total training time: 30.91 seconds.
-- Epoch 34
Norm: 9.33, NNZs: 390460, Bias: -1.130627, T: 104924, Avg. loss: 0.015389
Total training time: 31.85 seconds.
-- Epoch 35
Norm: 9.32, NNZs: 391349, Bias: -1.131145, T: 108010, Avg. loss: 0.015088
Total training time: 32.79 seconds.
-- Epoch 36
Norm: 9.31, NNZs: 391693, Bias: -1.129680, T: 111096, Avg. loss: 0.014804
Total training time: 33.73 seconds.
-- Epoch 37
Norm: 9.29, NNZs: 392455, Bias: -1.130995, T: 114182, Avg. loss: 0.014537
Total training time: 34.67 seconds.
-- Epoch 38
Norm: 9.26, NNZs: 392568, Bias: -1.132187, T: 117268, Avg. loss: 0.014284
Total training time: 35.61 seconds.
-- Epoch 39
Norm: 9.26, NNZs: 392650, Bias: -1.129262, T: 120354, Avg. loss: 0.014044
Total training time: 36.56 seconds.
-- Epoch 40
Norm: 9.25, NNZs: 393460, Bias: -1.128238, T: 123440, Avg. loss: 0.013818
Total training time: 37.50 seconds.
-- Epoch 41
Norm: 9.24, NNZs: 395464, Bias: -1.128871, T: 126526, Avg. loss: 0.013598
Total training time: 38.44 seconds.
-- Epoch 42
Norm: 9.22, NNZs: 395464, Bias: -1.129720, T: 129612, Avg. loss: 0.013392
Total training time: 39.39 seconds.
-- Epoch 43
Norm: 9.21, NNZs: 395464, Bias: -1.130041, T: 132698, Avg. loss: 0.013194
Total training time: 40.33 seconds.
-- Epoch 44
Norm: 9.21, NNZs: 395464, Bias: -1.127638, T: 135784, Avg. loss: 0.013004
Total training time: 41.27 seconds.
-- Epoch 45
Norm: 9.19, NNZs: 395835, Bias: -1.129452, T: 138870, Avg. loss: 0.012826
Total training time: 42.21 seconds.
-- Epoch 46
Norm: 9.18, NNZs: 395835, Bias: -1.128230, T: 141956, Avg. loss: 0.012655
Total training time: 43.16 seconds.
-- Epoch 47
Norm: 9.18, NNZs: 396013, Bias: -1.126852, T: 145042, Avg. loss: 0.012489
Total training time: 44.10 seconds.
-- Epoch 48
Norm: 9.17, NNZs: 396013, Bias: -1.128285, T: 148128, Avg. loss: 0.012332
Total training time: 45.05 seconds.
-- Epoch 49
Norm: 9.16, NNZs: 396013, Bias: -1.129238, T: 151214, Avg. loss: 0.012179
Total training time: 45.99 seconds.
-- Epoch 50
Norm: 9.15, NNZs: 397215, Bias: -1.128900, T: 154300, Avg. loss: 0.012033
Total training time: 46.94 seconds.
-- Epoch 51
Norm: 9.16, NNZs: 397215, Bias: -1.125386, T: 157386, Avg. loss: 0.011892
Total training time: 47.88 seconds.
-- Epoch 52
Norm: 9.14, NNZs: 397736, Bias: -1.126951, T: 160472, Avg. loss: 0.011758
Total training time: 48.82 seconds.
-- Epoch 53
Norm: 9.13, NNZs: 397778, Bias: -1.128593, T: 163558, Avg. loss: 0.011628
Total training time: 49.77 seconds.
-- Epoch 54
Norm: 9.13, NNZs: 397778, Bias: -1.127484, T: 166644, Avg. loss: 0.011503
Total training time: 50.71 seconds.
-- Epoch 55
Norm: 9.12, NNZs: 398086, Bias: -1.127722, T: 169730, Avg. loss: 0.011384
Total training time: 51.66 seconds.
-- Epoch 56
Norm: 9.11, NNZs: 399519, Bias: -1.127595, T: 172816, Avg. loss: 0.011267
Total training time: 52.60 seconds.
-- Epoch 57
Norm: 9.11, NNZs: 399519, Bias: -1.127328, T: 175902, Avg. loss: 0.011155
Total training time: 53.55 seconds.
-- Epoch 58
Norm: 9.11, NNZs: 399519, Bias: -1.127209, T: 178988, Avg. loss: 0.011046
Total training time: 54.49 seconds.
-- Epoch 59
Norm: 9.11, NNZs: 399519, Bias: -1.126522, T: 182074, Avg. loss: 0.010940
Total training time: 55.43 seconds.
-- Epoch 60
Norm: 9.11, NNZs: 399519, Bias: -1.125748, T: 185160, Avg. loss: 0.010838
Total training time: 56.38 seconds.
-- Epoch 61
Norm: 9.10, NNZs: 399624, Bias: -1.125800, T: 188246, Avg. loss: 0.010740
Total training time: 57.32 seconds.
-- Epoch 62
Norm: 9.10, NNZs: 399624, Bias: -1.125930, T: 191332, Avg. loss: 0.010645
Total training time: 58.27 seconds.
-- Epoch 63
Norm: 9.10, NNZs: 400376, Bias: -1.124605, T: 194418, Avg. loss: 0.010553
Total training time: 59.21 seconds.
-- Epoch 64
Norm: 9.09, NNZs: 400376, Bias: -1.125412, T: 197504, Avg. loss: 0.010464
Total training time: 60.15 seconds.
-- Epoch 65
Norm: 9.09, NNZs: 400376, Bias: -1.125249, T: 200590, Avg. loss: 0.010377
Total training time: 61.10 seconds.
-- Epoch 66
Norm: 9.08, NNZs: 400376, Bias: -1.125447, T: 203676, Avg. loss: 0.010294
Total training time: 62.04 seconds.
-- Epoch 67
Norm: 9.08, NNZs: 400376, Bias: -1.124316, T: 206762, Avg. loss: 0.010212
Total training time: 63.21 seconds.
-- Epoch 68
Norm: 9.08, NNZs: 400376, Bias: -1.124775, T: 209848, Avg. loss: 0.010132
Total training time: 64.17 seconds.
-- Epoch 69
Norm: 9.07, NNZs: 400821, Bias: -1.123608, T: 212934, Avg. loss: 0.010054
Total training time: 65.13 seconds.
-- Epoch 70
Norm: 9.07, NNZs: 401190, Bias: -1.125078, T: 216020, Avg. loss: 0.009980
Total training time: 66.07 seconds.
-- Epoch 71
Norm: 9.07, NNZs: 401655, Bias: -1.124593, T: 219106, Avg. loss: 0.009907
Total training time: 67.02 seconds.
-- Epoch 72
Norm: 9.06, NNZs: 401866, Bias: -1.125388, T: 222192, Avg. loss: 0.009835
Total training time: 67.96 seconds.
-- Epoch 73
Norm: 9.06, NNZs: 403115, Bias: -1.124614, T: 225278, Avg. loss: 0.009766
Total training time: 68.91 seconds.
-- Epoch 74
Norm: 9.06, NNZs: 403115, Bias: -1.125422, T: 228364, Avg. loss: 0.009699
Total training time: 69.86 seconds.
-- Epoch 75
Norm: 9.05, NNZs: 403925, Bias: -1.124429, T: 231450, Avg. loss: 0.009633
Total training time: 70.80 seconds.
-- Epoch 76
Norm: 9.05, NNZs: 403925, Bias: -1.124638, T: 234536, Avg. loss: 0.009569
Total training time: 71.75 seconds.
-- Epoch 77
Norm: 9.05, NNZs: 403925, Bias: -1.122617, T: 237622, Avg. loss: 0.009506
Total training time: 72.70 seconds.
-- Epoch 78
Norm: 9.04, NNZs: 404121, Bias: -1.124590, T: 240708, Avg. loss: 0.009445
Total training time: 73.65 seconds.
-- Epoch 79
Norm: 9.04, NNZs: 404121, Bias: -1.123481, T: 243794, Avg. loss: 0.009386
Total training time: 74.59 seconds.
-- Epoch 80
Norm: 9.04, NNZs: 404121, Bias: -1.122425, T: 246880, Avg. loss: 0.009328
Total training time: 75.53 seconds.
-- Epoch 81
Norm: 9.03, NNZs: 404121, Bias: -1.123135, T: 249966, Avg. loss: 0.009272
Total training time: 76.48 seconds.
-- Epoch 82
Norm: 9.03, NNZs: 404121, Bias: -1.123792, T: 253052, Avg. loss: 0.009218
Total training time: 77.42 seconds.
-- Epoch 83
Norm: 9.03, NNZs: 404582, Bias: -1.124112, T: 256138, Avg. loss: 0.009164
Total training time: 78.37 seconds.
-- Epoch 84
Norm: 9.03, NNZs: 404582, Bias: -1.123004, T: 259224, Avg. loss: 0.009112
Total training time: 79.31 seconds.
-- Epoch 85
Norm: 9.02, NNZs: 404582, Bias: -1.124078, T: 262310, Avg. loss: 0.009061
Total training time: 80.26 seconds.
-- Epoch 86
Norm: 9.03, NNZs: 404582, Bias: -1.122079, T: 265396, Avg. loss: 0.009012
Total training time: 81.20 seconds.
-- Epoch 87
Norm: 9.02, NNZs: 404722, Bias: -1.123623, T: 268482, Avg. loss: 0.008963
Total training time: 82.14 seconds.
-- Epoch 88
Norm: 9.02, NNZs: 404722, Bias: -1.122475, T: 271568, Avg. loss: 0.008915
Total training time: 83.09 seconds.
-- Epoch 89
Norm: 9.02, NNZs: 404722, Bias: -1.122931, T: 274654, Avg. loss: 0.008869
Total training time: 84.03 seconds.
-- Epoch 90
Norm: 9.02, NNZs: 404722, Bias: -1.122195, T: 277740, Avg. loss: 0.008824
Total training time: 84.98 seconds.
-- Epoch 91
Norm: 9.01, NNZs: 404974, Bias: -1.123732, T: 280826, Avg. loss: 0.008779
Total training time: 85.92 seconds.
-- Epoch 92
Norm: 9.01, NNZs: 405294, Bias: -1.122023, T: 283912, Avg. loss: 0.008736
Total training time: 86.87 seconds.
-- Epoch 93
Norm: 9.01, NNZs: 405294, Bias: -1.122691, T: 286998, Avg. loss: 0.008693
Total training time: 87.82 seconds.
-- Epoch 94
Norm: 9.01, NNZs: 405294, Bias: -1.122490, T: 290084, Avg. loss: 0.008651
Total training time: 88.76 seconds.
-- Epoch 95
Norm: 9.01, NNZs: 405294, Bias: -1.121485, T: 293170, Avg. loss: 0.008610
Total training time: 89.71 seconds.
-- Epoch 96
Norm: 9.01, NNZs: 405294, Bias: -1.120901, T: 296256, Avg. loss: 0.008570
Total training time: 90.65 seconds.
-- Epoch 97
Norm: 9.00, NNZs: 405294, Bias: -1.122810, T: 299342, Avg. loss: 0.008531
Total training time: 91.59 seconds.
-- Epoch 98
Norm: 9.00, NNZs: 405294, Bias: -1.122031, T: 302428, Avg. loss: 0.008493
Total training time: 92.54 seconds.
-- Epoch 99
Norm: 9.00, NNZs: 405294, Bias: -1.122510, T: 305514, Avg. loss: 0.008456
Total training time: 93.49 seconds.
-- Epoch 100
Norm: 9.00, NNZs: 405294, Bias: -1.121242, T: 308600, Avg. loss: 0.008419
Total training time: 94.43 seconds.
-- Epoch 1
Norm: 61.97, NNZs: 1045108, Bias: -1.679258, T: 3086, Avg. loss: 0.429146
Total training time: 0.91 seconds.
-- Epoch 2
Norm: 38.35, NNZs: 1046633, Bias: -1.702397, T: 6172, Avg. loss: 0.232606
Total training time: 1.76 seconds.
-- Epoch 3
Norm: 28.38, NNZs: 1047423, Bias: -1.683216, T: 9258, Avg. loss: 0.160219
Total training time: 2.62 seconds.
-- Epoch 4
Norm: 22.38, NNZs: 1048054, Bias: -1.692567, T: 12344, Avg. loss: 0.122710
Total training time: 3.47 seconds.
-- Epoch 5
Norm: 18.97, NNZs: 1048321, Bias: -1.684963, T: 15430, Avg. loss: 0.099518
Total training time: 4.34 seconds.
-- Epoch 6
Norm: 16.92, NNZs: 1048426, Bias: -1.681285, T: 18516, Avg. loss: 0.083886
Total training time: 5.24 seconds.
-- Epoch 7
Norm: 15.66, NNZs: 1048558, Bias: -1.683730, T: 21602, Avg. loss: 0.072674
Total training time: 6.17 seconds.
-- Epoch 8
Norm: 14.94, NNZs: 1048564, Bias: -1.675541, T: 24688, Avg. loss: 0.064232
Total training time: 7.12 seconds.
-- Epoch 9
Norm: 14.46, NNZs: 1048570, Bias: -1.670708, T: 27774, Avg. loss: 0.057669
Total training time: 8.08 seconds.
-- Epoch 10
Norm: 14.03, NNZs: 1048574, Bias: -1.674903, T: 30860, Avg. loss: 0.052396
Total training time: 9.06 seconds.
-- Epoch 11
Norm: 13.72, NNZs: 1048574, Bias: -1.672643, T: 33946, Avg. loss: 0.048094
Total training time: 10.04 seconds.
-- Epoch 12
Norm: 13.47, NNZs: 1048575, Bias: -1.673717, T: 37032, Avg. loss: 0.044506
Total training time: 11.02 seconds.
-- Epoch 13
Norm: 13.30, NNZs: 1048575, Bias: -1.673466, T: 40118, Avg. loss: 0.041457
Total training time: 12.03 seconds.
-- Epoch 14
Norm: 13.21, NNZs: 1048575, Bias: -1.671800, T: 43204, Avg. loss: 0.038851
Total training time: 13.04 seconds.
-- Epoch 15
Norm: 13.11, NNZs: 1048575, Bias: -1.673019, T: 46290, Avg. loss: 0.036587
Total training time: 14.03 seconds.
-- Epoch 16
Norm: 13.04, NNZs: 1048575, Bias: -1.672121, T: 49376, Avg. loss: 0.034597
Total training time: 15.06 seconds.
-- Epoch 17
Norm: 12.93, NNZs: 1048576, Bias: -1.673831, T: 52462, Avg. loss: 0.032838
Total training time: 16.07 seconds.
-- Epoch 18
Norm: 12.95, NNZs: 1048576, Bias: -1.669699, T: 55548, Avg. loss: 0.031284
Total training time: 17.09 seconds.
-- Epoch 19
Norm: 12.93, NNZs: 1048576, Bias: -1.670421, T: 58634, Avg. loss: 0.029876
Total training time: 18.11 seconds.
-- Epoch 20
Norm: 12.85, NNZs: 1048576, Bias: -1.669585, T: 61720, Avg. loss: 0.028607
Total training time: 19.13 seconds.
-- Epoch 21
Norm: 12.83, NNZs: 1048576, Bias: -1.669603, T: 64806, Avg. loss: 0.027466
Total training time: 20.17 seconds.
-- Epoch 22
Norm: 12.69, NNZs: 1048576, Bias: -1.674426, T: 67892, Avg. loss: 0.026422
Total training time: 21.19 seconds.
-- Epoch 23
Norm: 12.76, NNZs: 1048576, Bias: -1.669324, T: 70978, Avg. loss: 0.025478
Total training time: 22.24 seconds.
-- Epoch 24
Norm: 12.72, NNZs: 1048576, Bias: -1.668524, T: 74064, Avg. loss: 0.024604
Total training time: 23.26 seconds.
-- Epoch 25
Norm: 12.68, NNZs: 1048576, Bias: -1.670331, T: 77150, Avg. loss: 0.023800
Total training time: 24.29 seconds.
-- Epoch 26
Norm: 12.68, NNZs: 1048576, Bias: -1.669312, T: 80236, Avg. loss: 0.023051
Total training time: 25.34 seconds.
-- Epoch 27
Norm: 12.68, NNZs: 1048576, Bias: -1.668877, T: 83322, Avg. loss: 0.022366
Total training time: 26.38 seconds.
-- Epoch 28
Norm: 12.65, NNZs: 1048576, Bias: -1.668932, T: 86408, Avg. loss: 0.021729
Total training time: 27.41 seconds.
-- Epoch 29
Norm: 12.64, NNZs: 1048576, Bias: -1.669328, T: 89494, Avg. loss: 0.021135
Total training time: 28.46 seconds.
-- Epoch 30
Norm: 12.61, NNZs: 1048576, Bias: -1.669441, T: 92580, Avg. loss: 0.020579
Total training time: 29.50 seconds.
-- Epoch 31
Norm: 12.62, NNZs: 1048576, Bias: -1.668822, T: 95666, Avg. loss: 0.020054
Total training time: 30.57 seconds.
-- Epoch 32
Norm: 12.61, NNZs: 1048576, Bias: -1.667725, T: 98752, Avg. loss: 0.019567
Total training time: 31.60 seconds.
-- Epoch 33
Norm: 12.58, NNZs: 1048576, Bias: -1.668828, T: 101838, Avg. loss: 0.019110
Total training time: 32.64 seconds.
-- Epoch 34
Norm: 12.57, NNZs: 1048576, Bias: -1.669251, T: 104924, Avg. loss: 0.018676
Total training time: 33.70 seconds.
-- Epoch 35
Norm: 12.50, NNZs: 1048576, Bias: -1.671891, T: 108010, Avg. loss: 0.018264
Total training time: 34.72 seconds.
-- Epoch 36
Norm: 12.55, NNZs: 1048576, Bias: -1.669180, T: 111096, Avg. loss: 0.017877
Total training time: 35.82 seconds.
-- Epoch 37
Norm: 12.52, NNZs: 1048576, Bias: -1.670062, T: 114182, Avg. loss: 0.017514
Total training time: 36.86 seconds.
-- Epoch 38
Norm: 12.53, NNZs: 1048576, Bias: -1.668951, T: 117268, Avg. loss: 0.017168
Total training time: 37.93 seconds.
-- Epoch 39
Norm: 12.53, NNZs: 1048576, Bias: -1.668993, T: 120354, Avg. loss: 0.016840
Total training time: 39.00 seconds.
-- Epoch 40
Norm: 12.50, NNZs: 1048576, Bias: -1.669260, T: 123440, Avg. loss: 0.016528
Total training time: 40.02 seconds.
-- Epoch 41
Norm: 12.50, NNZs: 1048576, Bias: -1.669031, T: 126526, Avg. loss: 0.016230
Total training time: 41.10 seconds.
-- Epoch 42
Norm: 12.51, NNZs: 1048576, Bias: -1.668637, T: 129612, Avg. loss: 0.015947
Total training time: 42.17 seconds.
-- Epoch 43
Norm: 12.50, NNZs: 1048576, Bias: -1.668649, T: 132698, Avg. loss: 0.015678
Total training time: 43.22 seconds.
-- Epoch 44
Norm: 12.51, NNZs: 1048576, Bias: -1.668124, T: 135784, Avg. loss: 0.015419
Total training time: 44.29 seconds.
-- Epoch 45
Norm: 12.48, NNZs: 1048576, Bias: -1.668849, T: 138870, Avg. loss: 0.015173
Total training time: 45.33 seconds.
-- Epoch 46
Norm: 12.49, NNZs: 1048576, Bias: -1.668406, T: 141956, Avg. loss: 0.014938
Total training time: 46.40 seconds.
-- Epoch 47
Norm: 12.51, NNZs: 1048576, Bias: -1.666936, T: 145042, Avg. loss: 0.014711
Total training time: 47.49 seconds.
-- Epoch 48
Norm: 12.49, NNZs: 1048576, Bias: -1.668309, T: 148128, Avg. loss: 0.014494
Total training time: 48.53 seconds.
-- Epoch 49
Norm: 12.48, NNZs: 1048576, Bias: -1.667916, T: 151214, Avg. loss: 0.014287
Total training time: 49.59 seconds.
-- Epoch 50
Norm: 12.49, NNZs: 1048576, Bias: -1.667196, T: 154300, Avg. loss: 0.014087
Total training time: 50.65 seconds.
-- Epoch 51
Norm: 12.47, NNZs: 1048576, Bias: -1.667807, T: 157386, Avg. loss: 0.013897
Total training time: 51.69 seconds.
-- Epoch 52
Norm: 12.46, NNZs: 1048576, Bias: -1.669025, T: 160472, Avg. loss: 0.013711
Total training time: 52.76 seconds.
-- Epoch 53
Norm: 12.42, NNZs: 1048576, Bias: -1.670262, T: 163558, Avg. loss: 0.013533
Total training time: 53.80 seconds.
-- Epoch 54
Norm: 12.47, NNZs: 1048576, Bias: -1.667477, T: 166644, Avg. loss: 0.013362
Total training time: 54.89 seconds.
-- Epoch 55
Norm: 12.44, NNZs: 1048576, Bias: -1.668789, T: 169730, Avg. loss: 0.013197
Total training time: 55.94 seconds.
-- Epoch 56
Norm: 12.46, NNZs: 1048576, Bias: -1.667966, T: 172816, Avg. loss: 0.013038
Total training time: 57.01 seconds.
-- Epoch 57
Norm: 12.42, NNZs: 1048576, Bias: -1.669870, T: 175902, Avg. loss: 0.012884
Total training time: 58.07 seconds.
-- Epoch 58
Norm: 12.44, NNZs: 1048576, Bias: -1.667599, T: 178988, Avg. loss: 0.012736
Total training time: 59.12 seconds.
-- Epoch 59
Norm: 12.41, NNZs: 1048576, Bias: -1.669798, T: 182074, Avg. loss: 0.012592
Total training time: 60.16 seconds.
-- Epoch 60
Norm: 12.44, NNZs: 1048576, Bias: -1.668270, T: 185160, Avg. loss: 0.012452
Total training time: 61.24 seconds.
-- Epoch 61
Norm: 12.42, NNZs: 1048576, Bias: -1.668760, T: 188246, Avg. loss: 0.012318
Total training time: 62.30 seconds.
-- Epoch 62
Norm: 12.44, NNZs: 1048576, Bias: -1.667909, T: 191332, Avg. loss: 0.012188
Total training time: 63.37 seconds.
-- Epoch 63
Norm: 12.45, NNZs: 1048576, Bias: -1.666873, T: 194418, Avg. loss: 0.012062
Total training time: 64.45 seconds.
-- Epoch 64
Norm: 12.44, NNZs: 1048576, Bias: -1.667096, T: 197504, Avg. loss: 0.011941
Total training time: 65.51 seconds.
-- Epoch 65
Norm: 12.42, NNZs: 1048576, Bias: -1.668210, T: 200590, Avg. loss: 0.011823
Total training time: 66.56 seconds.
-- Epoch 66
Norm: 12.43, NNZs: 1048576, Bias: -1.667807, T: 203676, Avg. loss: 0.011709
Total training time: 67.63 seconds.
-- Epoch 67
Norm: 12.41, NNZs: 1048576, Bias: -1.668795, T: 206762, Avg. loss: 0.011597
Total training time: 68.67 seconds.
-- Epoch 68
Norm: 12.40, NNZs: 1048576, Bias: -1.668699, T: 209848, Avg. loss: 0.011488
Total training time: 69.73 seconds.
-- Epoch 69
Norm: 12.41, NNZs: 1048576, Bias: -1.667906, T: 212934, Avg. loss: 0.011384
Total training time: 70.81 seconds.
-- Epoch 70
Norm: 12.42, NNZs: 1048576, Bias: -1.667455, T: 216020, Avg. loss: 0.011282
Total training time: 71.89 seconds.
-- Epoch 71
Norm: 12.39, NNZs: 1048576, Bias: -1.668953, T: 219106, Avg. loss: 0.011182
Total training time: 72.91 seconds.
-- Epoch 72
Norm: 12.42, NNZs: 1048576, Bias: -1.667301, T: 222192, Avg. loss: 0.011085
Total training time: 74.02 seconds.
-- Epoch 73
Norm: 12.40, NNZs: 1048576, Bias: -1.668165, T: 225278, Avg. loss: 0.010992
Total training time: 75.05 seconds.
-- Epoch 74
Norm: 12.41, NNZs: 1048576, Bias: -1.667858, T: 228364, Avg. loss: 0.010901
Total training time: 76.13 seconds.
-- Epoch 75
Norm: 12.42, NNZs: 1048576, Bias: -1.667317, T: 231450, Avg. loss: 0.010812
Total training time: 77.19 seconds.
-- Epoch 76
Norm: 12.40, NNZs: 1048576, Bias: -1.668041, T: 234536, Avg. loss: 0.010725
Total training time: 78.25 seconds.
-- Epoch 77
Norm: 12.41, NNZs: 1048576, Bias: -1.667578, T: 237622, Avg. loss: 0.010640
Total training time: 79.31 seconds.
-- Epoch 78
Norm: 12.40, NNZs: 1048576, Bias: -1.668240, T: 240708, Avg. loss: 0.010558
Total training time: 80.39 seconds.
-- Epoch 79
Norm: 12.40, NNZs: 1048576, Bias: -1.667466, T: 243794, Avg. loss: 0.010477
Total training time: 81.44 seconds.
-- Epoch 80
Norm: 12.41, NNZs: 1048576, Bias: -1.667157, T: 246880, Avg. loss: 0.010399
Total training time: 82.53 seconds.
-- Epoch 81
Norm: 12.38, NNZs: 1048576, Bias: -1.668924, T: 249966, Avg. loss: 0.010322
Total training time: 83.57 seconds.
-- Epoch 82
Norm: 12.42, NNZs: 1048576, Bias: -1.666863, T: 253052, Avg. loss: 0.010247
Total training time: 84.68 seconds.
-- Epoch 83
Norm: 12.40, NNZs: 1048576, Bias: -1.667700, T: 256138, Avg. loss: 0.010175
Total training time: 85.74 seconds.
-- Epoch 84
Norm: 12.38, NNZs: 1048576, Bias: -1.668405, T: 259224, Avg. loss: 0.010104
Total training time: 86.79 seconds.
-- Epoch 85
Norm: 12.37, NNZs: 1048576, Bias: -1.669065, T: 262310, Avg. loss: 0.010034
Total training time: 87.88 seconds.
-- Epoch 86
Norm: 12.40, NNZs: 1048576, Bias: -1.667607, T: 265396, Avg. loss: 0.009967
Total training time: 89.16 seconds.
-- Epoch 87
Norm: 12.41, NNZs: 1048576, Bias: -1.666997, T: 268482, Avg. loss: 0.009901
Total training time: 90.24 seconds.
-- Epoch 88
Norm: 12.40, NNZs: 1048576, Bias: -1.667326, T: 271568, Avg. loss: 0.009837
Total training time: 91.29 seconds.
-- Epoch 89
Norm: 12.41, NNZs: 1048576, Bias: -1.666658, T: 274654, Avg. loss: 0.009773
Total training time: 92.37 seconds.
-- Epoch 90
Norm: 12.39, NNZs: 1048576, Bias: -1.667756, T: 277740, Avg. loss: 0.009712
Total training time: 93.43 seconds.
-- Epoch 91
Norm: 12.39, NNZs: 1048576, Bias: -1.667346, T: 280826, Avg. loss: 0.009651
Total training time: 94.48 seconds.
-- Epoch 92
Norm: 12.39, NNZs: 1048576, Bias: -1.667532, T: 283912, Avg. loss: 0.009593
Total training time: 95.55 seconds.
-- Epoch 93
Norm: 12.39, NNZs: 1048576, Bias: -1.666863, T: 286998, Avg. loss: 0.009535
Total training time: 96.62 seconds.
-- Epoch 94
Norm: 12.38, NNZs: 1048576, Bias: -1.667477, T: 290084, Avg. loss: 0.009478
Total training time: 97.68 seconds.
-- Epoch 95
Norm: 12.39, NNZs: 1048576, Bias: -1.666723, T: 293170, Avg. loss: 0.009422
Total training time: 98.77 seconds.
-- Epoch 96
Norm: 12.39, NNZs: 1048576, Bias: -1.666633, T: 296256, Avg. loss: 0.009368
Total training time: 99.82 seconds.
-- Epoch 97
Norm: 12.38, NNZs: 1048576, Bias: -1.667059, T: 299342, Avg. loss: 0.009315
Total training time: 100.90 seconds.
-- Epoch 98
Norm: 12.37, NNZs: 1048576, Bias: -1.667658, T: 302428, Avg. loss: 0.009263
Total training time: 101.95 seconds.
-- Epoch 99
Norm: 12.38, NNZs: 1048576, Bias: -1.667028, T: 305514, Avg. loss: 0.009212
Total training time: 103.04 seconds.
-- Epoch 100
Norm: 12.37, NNZs: 1048576, Bias: -1.667665, T: 308600, Avg. loss: 0.009161
Total training time: 104.11 seconds.
-- Epoch 1
Norm: 44.08, NNZs: 639227, Bias: -1.365984, T: 3086, Avg. loss: 0.305213
Total training time: 0.86 seconds.
-- Epoch 2
Norm: 29.88, NNZs: 964240, Bias: -1.380770, T: 6172, Avg. loss: 0.184517
Total training time: 1.71 seconds.
-- Epoch 3
Norm: 23.32, NNZs: 1005257, Bias: -1.417820, T: 9258, Avg. loss: 0.133109
Total training time: 2.55 seconds.
-- Epoch 4
Norm: 19.21, NNZs: 1036041, Bias: -1.441796, T: 12344, Avg. loss: 0.103885
Total training time: 3.41 seconds.
-- Epoch 5
Norm: 17.02, NNZs: 1042693, Bias: -1.409172, T: 15430, Avg. loss: 0.085543
Total training time: 4.26 seconds.
-- Epoch 6
Norm: 15.41, NNZs: 1047629, Bias: -1.415142, T: 18516, Avg. loss: 0.072828
Total training time: 5.13 seconds.
-- Epoch 7
Norm: 14.24, NNZs: 1047984, Bias: -1.413177, T: 21602, Avg. loss: 0.063406
Total training time: 6.00 seconds.
-- Epoch 8
Norm: 13.47, NNZs: 1048277, Bias: -1.408829, T: 24688, Avg. loss: 0.056401
Total training time: 6.88 seconds.
-- Epoch 9
Norm: 12.85, NNZs: 1048313, Bias: -1.416355, T: 27774, Avg. loss: 0.050887
Total training time: 7.75 seconds.
-- Epoch 10
Norm: 12.57, NNZs: 1048456, Bias: -1.409159, T: 30860, Avg. loss: 0.046511
Total training time: 8.63 seconds.
-- Epoch 11
Norm: 12.23, NNZs: 1048493, Bias: -1.408113, T: 33946, Avg. loss: 0.042907
Total training time: 9.53 seconds.
-- Epoch 12
Norm: 11.98, NNZs: 1048513, Bias: -1.409290, T: 37032, Avg. loss: 0.039875
Total training time: 10.41 seconds.
-- Epoch 13
Norm: 11.82, NNZs: 1048518, Bias: -1.411048, T: 40118, Avg. loss: 0.037310
Total training time: 11.30 seconds.
-- Epoch 14
Norm: 11.70, NNZs: 1048529, Bias: -1.409885, T: 43204, Avg. loss: 0.035096
Total training time: 12.18 seconds.
-- Epoch 15
Norm: 11.61, NNZs: 1048535, Bias: -1.408248, T: 46290, Avg. loss: 0.033166
Total training time: 13.07 seconds.
-- Epoch 16
Norm: 11.48, NNZs: 1048543, Bias: -1.409240, T: 49376, Avg. loss: 0.031463
Total training time: 13.98 seconds.
-- Epoch 17
Norm: 11.39, NNZs: 1048556, Bias: -1.410181, T: 52462, Avg. loss: 0.029979
Total training time: 14.89 seconds.
-- Epoch 18
Norm: 11.30, NNZs: 1048557, Bias: -1.410177, T: 55548, Avg. loss: 0.028664
Total training time: 15.78 seconds.
-- Epoch 19
Norm: 11.23, NNZs: 1048560, Bias: -1.410130, T: 58634, Avg. loss: 0.027475
Total training time: 16.67 seconds.
-- Epoch 20
Norm: 11.18, NNZs: 1048563, Bias: -1.406741, T: 61720, Avg. loss: 0.026395
Total training time: 17.57 seconds.
-- Epoch 21
Norm: 11.13, NNZs: 1048567, Bias: -1.411218, T: 64806, Avg. loss: 0.025435
Total training time: 18.50 seconds.
-- Epoch 22
Norm: 11.08, NNZs: 1048571, Bias: -1.410641, T: 67892, Avg. loss: 0.024549
Total training time: 19.39 seconds.
-- Epoch 23
Norm: 11.02, NNZs: 1048571, Bias: -1.412824, T: 70978, Avg. loss: 0.023723
Total training time: 20.30 seconds.
-- Epoch 24
Norm: 10.98, NNZs: 1048572, Bias: -1.413107, T: 74064, Avg. loss: 0.022981
Total training time: 21.23 seconds.
-- Epoch 25
Norm: 10.97, NNZs: 1048572, Bias: -1.411672, T: 77150, Avg. loss: 0.022303
Total training time: 22.13 seconds.
-- Epoch 26
Norm: 10.94, NNZs: 1048573, Bias: -1.413230, T: 80236, Avg. loss: 0.021659
Total training time: 23.07 seconds.
-- Epoch 27
Norm: 10.93, NNZs: 1048573, Bias: -1.412257, T: 83322, Avg. loss: 0.021076
Total training time: 23.99 seconds.
-- Epoch 28
Norm: 10.92, NNZs: 1048573, Bias: -1.410361, T: 86408, Avg. loss: 0.020530
Total training time: 24.91 seconds.
-- Epoch 29
Norm: 10.88, NNZs: 1048573, Bias: -1.411003, T: 89494, Avg. loss: 0.020019
Total training time: 25.82 seconds.
-- Epoch 30
Norm: 10.85, NNZs: 1048573, Bias: -1.411581, T: 92580, Avg. loss: 0.019539
Total training time: 26.73 seconds.
-- Epoch 31
Norm: 10.85, NNZs: 1048573, Bias: -1.410680, T: 95666, Avg. loss: 0.019096
Total training time: 27.65 seconds.
-- Epoch 32
Norm: 10.83, NNZs: 1048573, Bias: -1.410644, T: 98752, Avg. loss: 0.018668
Total training time: 28.57 seconds.
-- Epoch 33
Norm: 10.82, NNZs: 1048574, Bias: -1.410491, T: 101838, Avg. loss: 0.018273
Total training time: 29.50 seconds.
-- Epoch 34
Norm: 10.77, NNZs: 1048575, Bias: -1.413558, T: 104924, Avg. loss: 0.017906
Total training time: 30.44 seconds.
-- Epoch 35
Norm: 10.80, NNZs: 1048575, Bias: -1.408885, T: 108010, Avg. loss: 0.017557
Total training time: 31.35 seconds.
-- Epoch 36
Norm: 10.74, NNZs: 1048576, Bias: -1.414119, T: 111096, Avg. loss: 0.017228
Total training time: 32.27 seconds.
-- Epoch 37
Norm: 10.75, NNZs: 1048576, Bias: -1.412098, T: 114182, Avg. loss: 0.016913
Total training time: 33.19 seconds.
-- Epoch 38
Norm: 10.73, NNZs: 1048576, Bias: -1.411228, T: 117268, Avg. loss: 0.016616
Total training time: 34.08 seconds.
-- Epoch 39
Norm: 10.73, NNZs: 1048576, Bias: -1.410648, T: 120354, Avg. loss: 0.016341
Total training time: 35.02 seconds.
-- Epoch 40
Norm: 10.71, NNZs: 1048576, Bias: -1.411497, T: 123440, Avg. loss: 0.016074
Total training time: 35.93 seconds.
-- Epoch 41
Norm: 10.70, NNZs: 1048576, Bias: -1.410790, T: 126526, Avg. loss: 0.015821
Total training time: 36.87 seconds.
-- Epoch 42
Norm: 10.71, NNZs: 1048576, Bias: -1.408888, T: 129612, Avg. loss: 0.015579
Total training time: 37.79 seconds.
-- Epoch 43
Norm: 10.69, NNZs: 1048576, Bias: -1.411479, T: 132698, Avg. loss: 0.015349
Total training time: 38.72 seconds.
-- Epoch 44
Norm: 10.69, NNZs: 1048576, Bias: -1.409842, T: 135784, Avg. loss: 0.015130
Total training time: 39.65 seconds.
-- Epoch 45
Norm: 10.68, NNZs: 1048576, Bias: -1.410782, T: 138870, Avg. loss: 0.014920
Total training time: 40.58 seconds.
-- Epoch 46
Norm: 10.66, NNZs: 1048576, Bias: -1.411550, T: 141956, Avg. loss: 0.014719
Total training time: 41.52 seconds.
-- Epoch 47
Norm: 10.65, NNZs: 1048576, Bias: -1.412997, T: 145042, Avg. loss: 0.014525
Total training time: 42.44 seconds.
-- Epoch 48
Norm: 10.65, NNZs: 1048576, Bias: -1.411801, T: 148128, Avg. loss: 0.014338
Total training time: 43.37 seconds.
-- Epoch 49
Norm: 10.66, NNZs: 1048576, Bias: -1.409439, T: 151214, Avg. loss: 0.014158
Total training time: 44.31 seconds.
-- Epoch 50
Norm: 10.63, NNZs: 1048576, Bias: -1.413028, T: 154300, Avg. loss: 0.013988
Total training time: 45.25 seconds.
-- Epoch 51
Norm: 10.64, NNZs: 1048576, Bias: -1.411857, T: 157386, Avg. loss: 0.013823
Total training time: 46.18 seconds.
-- Epoch 52
Norm: 10.62, NNZs: 1048576, Bias: -1.413654, T: 160472, Avg. loss: 0.013661
Total training time: 47.12 seconds.
-- Epoch 53
Norm: 10.63, NNZs: 1048576, Bias: -1.412381, T: 163558, Avg. loss: 0.013508
Total training time: 48.04 seconds.
-- Epoch 54
Norm: 10.61, NNZs: 1048576, Bias: -1.413892, T: 166644, Avg. loss: 0.013360
Total training time: 48.99 seconds.
-- Epoch 55
Norm: 10.62, NNZs: 1048576, Bias: -1.411867, T: 169730, Avg. loss: 0.013218
Total training time: 49.89 seconds.
-- Epoch 56
Norm: 10.61, NNZs: 1048576, Bias: -1.412045, T: 172816, Avg. loss: 0.013082
Total training time: 50.83 seconds.
-- Epoch 57
Norm: 10.59, NNZs: 1048576, Bias: -1.415366, T: 175902, Avg. loss: 0.012949
Total training time: 51.80 seconds.
-- Epoch 58
Norm: 10.61, NNZs: 1048576, Bias: -1.410465, T: 178988, Avg. loss: 0.012821
Total training time: 52.70 seconds.
-- Epoch 59
Norm: 10.60, NNZs: 1048576, Bias: -1.412818, T: 182074, Avg. loss: 0.012700
Total training time: 53.67 seconds.
-- Epoch 60
Norm: 10.59, NNZs: 1048576, Bias: -1.413175, T: 185160, Avg. loss: 0.012581
Total training time: 54.59 seconds.
-- Epoch 61
Norm: 10.58, NNZs: 1048576, Bias: -1.414188, T: 188246, Avg. loss: 0.012467
Total training time: 55.54 seconds.
-- Epoch 62
Norm: 10.59, NNZs: 1048576, Bias: -1.412889, T: 191332, Avg. loss: 0.012355
Total training time: 56.47 seconds.
-- Epoch 63
Norm: 10.57, NNZs: 1048576, Bias: -1.414065, T: 194418, Avg. loss: 0.012248
Total training time: 57.42 seconds.
-- Epoch 64
Norm: 10.57, NNZs: 1048576, Bias: -1.414523, T: 197504, Avg. loss: 0.012143
Total training time: 58.34 seconds.
-- Epoch 65
Norm: 10.57, NNZs: 1048576, Bias: -1.413630, T: 200590, Avg. loss: 0.012042
Total training time: 59.31 seconds.
-- Epoch 66
Norm: 10.56, NNZs: 1048576, Bias: -1.414746, T: 203676, Avg. loss: 0.011944
Total training time: 60.25 seconds.
-- Epoch 67
Norm: 10.57, NNZs: 1048576, Bias: -1.413022, T: 206762, Avg. loss: 0.011849
Total training time: 61.20 seconds.
-- Epoch 68
Norm: 10.57, NNZs: 1048576, Bias: -1.411876, T: 209848, Avg. loss: 0.011756
Total training time: 62.14 seconds.
-- Epoch 69
Norm: 10.56, NNZs: 1048576, Bias: -1.412941, T: 212934, Avg. loss: 0.011667
Total training time: 63.08 seconds.
-- Epoch 70
Norm: 10.56, NNZs: 1048576, Bias: -1.412479, T: 216020, Avg. loss: 0.011579
Total training time: 64.04 seconds.
-- Epoch 71
Norm: 10.56, NNZs: 1048576, Bias: -1.412452, T: 219106, Avg. loss: 0.011495
Total training time: 64.99 seconds.
-- Epoch 72
Norm: 10.54, NNZs: 1048576, Bias: -1.414202, T: 222192, Avg. loss: 0.011411
Total training time: 65.93 seconds.
-- Epoch 73
Norm: 10.55, NNZs: 1048576, Bias: -1.413034, T: 225278, Avg. loss: 0.011330
Total training time: 66.89 seconds.
-- Epoch 74
Norm: 10.55, NNZs: 1048576, Bias: -1.411996, T: 228364, Avg. loss: 0.011251
Total training time: 67.86 seconds.
-- Epoch 75
Norm: 10.54, NNZs: 1048576, Bias: -1.412888, T: 231450, Avg. loss: 0.011175
Total training time: 68.82 seconds.
-- Epoch 76
Norm: 10.53, NNZs: 1048576, Bias: -1.414063, T: 234536, Avg. loss: 0.011101
Total training time: 69.76 seconds.
-- Epoch 77
Norm: 10.54, NNZs: 1048576, Bias: -1.412448, T: 237622, Avg. loss: 0.011028
Total training time: 70.73 seconds.
-- Epoch 78
Norm: 10.53, NNZs: 1048576, Bias: -1.414316, T: 240708, Avg. loss: 0.010957
Total training time: 71.68 seconds.
-- Epoch 79
Norm: 10.53, NNZs: 1048576, Bias: -1.413542, T: 243794, Avg. loss: 0.010889
Total training time: 72.61 seconds.
-- Epoch 80
Norm: 10.52, NNZs: 1048576, Bias: -1.414051, T: 246880, Avg. loss: 0.010822
Total training time: 73.55 seconds.
-- Epoch 81
Norm: 10.53, NNZs: 1048576, Bias: -1.413453, T: 249966, Avg. loss: 0.010756
Total training time: 74.51 seconds.
-- Epoch 82
Norm: 10.52, NNZs: 1048576, Bias: -1.414522, T: 253052, Avg. loss: 0.010692
Total training time: 75.43 seconds.
-- Epoch 83
Norm: 10.52, NNZs: 1048576, Bias: -1.413285, T: 256138, Avg. loss: 0.010630
Total training time: 76.40 seconds.
-- Epoch 84
Norm: 10.51, NNZs: 1048576, Bias: -1.414640, T: 259224, Avg. loss: 0.010569
Total training time: 77.35 seconds.
-- Epoch 85
Norm: 10.51, NNZs: 1048576, Bias: -1.414794, T: 262310, Avg. loss: 0.010510
Total training time: 78.30 seconds.
-- Epoch 86
Norm: 10.51, NNZs: 1048576, Bias: -1.414295, T: 265396, Avg. loss: 0.010452
Total training time: 79.24 seconds.
-- Epoch 87
Norm: 10.51, NNZs: 1048576, Bias: -1.413308, T: 268482, Avg. loss: 0.010396
Total training time: 80.16 seconds.
-- Epoch 88
Norm: 10.51, NNZs: 1048576, Bias: -1.413087, T: 271568, Avg. loss: 0.010340
Total training time: 81.11 seconds.
-- Epoch 89
Norm: 10.50, NNZs: 1048576, Bias: -1.414496, T: 274654, Avg. loss: 0.010285
Total training time: 82.09 seconds.
-- Epoch 90
Norm: 10.50, NNZs: 1048576, Bias: -1.414267, T: 277740, Avg. loss: 0.010232
Total training time: 83.03 seconds.
-- Epoch 91
Norm: 10.50, NNZs: 1048576, Bias: -1.414941, T: 280826, Avg. loss: 0.010180
Total training time: 83.97 seconds.
-- Epoch 92
Norm: 10.51, NNZs: 1048576, Bias: -1.412614, T: 283912, Avg. loss: 0.010128
Total training time: 84.92 seconds.
-- Epoch 93
Norm: 10.50, NNZs: 1048576, Bias: -1.413815, T: 286998, Avg. loss: 0.010079
Total training time: 85.89 seconds.
-- Epoch 94
Norm: 10.49, NNZs: 1048576, Bias: -1.415025, T: 290084, Avg. loss: 0.010029
Total training time: 86.81 seconds.
-- Epoch 95
Norm: 10.50, NNZs: 1048576, Bias: -1.414457, T: 293170, Avg. loss: 0.009981
Total training time: 87.77 seconds.
-- Epoch 96
Norm: 10.49, NNZs: 1048576, Bias: -1.415301, T: 296256, Avg. loss: 0.009933
Total training time: 88.75 seconds.
-- Epoch 97
Norm: 10.50, NNZs: 1048576, Bias: -1.413412, T: 299342, Avg. loss: 0.009887
Total training time: 89.66 seconds.
-- Epoch 98
Norm: 10.49, NNZs: 1048576, Bias: -1.414696, T: 302428, Avg. loss: 0.009842
Total training time: 90.62 seconds.
-- Epoch 99
Norm: 10.49, NNZs: 1048576, Bias: -1.413966, T: 305514, Avg. loss: 0.009799
Total training time: 91.56 seconds.
-- Epoch 100
Norm: 10.49, NNZs: 1048576, Bias: -1.414600, T: 308600, Avg. loss: 0.009756
Total training time: 92.54 seconds.
-- Epoch 1
Norm: 78.13, NNZs: 613708, Bias: -2.315019, T: 3086, Avg. loss: 1.099688
Total training time: 0.88 seconds.
-- Epoch 2
Norm: 54.46, NNZs: 702767, Bias: -2.320828, T: 6172, Avg. loss: 0.645699
Total training time: 1.73 seconds.
-- Epoch 3
Norm: 42.44, NNZs: 841390, Bias: -2.304876, T: 9258, Avg. loss: 0.463739
Total training time: 2.59 seconds.
-- Epoch 4
Norm: 35.83, NNZs: 867036, Bias: -2.210931, T: 12344, Avg. loss: 0.362179
Total training time: 3.45 seconds.
-- Epoch 5
Norm: 31.16, NNZs: 877850, Bias: -2.158198, T: 15430, Avg. loss: 0.297284
Total training time: 4.31 seconds.
-- Epoch 6
Norm: 27.92, NNZs: 935577, Bias: -2.127622, T: 18516, Avg. loss: 0.252614
Total training time: 5.17 seconds.
-- Epoch 7
Norm: 25.88, NNZs: 950971, Bias: -2.080989, T: 21602, Avg. loss: 0.220578
Total training time: 6.03 seconds.
-- Epoch 8
Norm: 24.49, NNZs: 973070, Bias: -2.034443, T: 24688, Avg. loss: 0.196121
Total training time: 6.91 seconds.
-- Epoch 9
Norm: 23.48, NNZs: 991633, Bias: -1.992127, T: 27774, Avg. loss: 0.177157
Total training time: 7.80 seconds.
-- Epoch 10
Norm: 22.61, NNZs: 993941, Bias: -1.978776, T: 30860, Avg. loss: 0.161962
Total training time: 8.67 seconds.
-- Epoch 11
Norm: 22.07, NNZs: 1005559, Bias: -1.948164, T: 33946, Avg. loss: 0.149420
Total training time: 9.57 seconds.
-- Epoch 12
Norm: 21.55, NNZs: 1005820, Bias: -1.925280, T: 37032, Avg. loss: 0.138871
Total training time: 10.45 seconds.
-- Epoch 13
Norm: 21.20, NNZs: 1014599, Bias: -1.905124, T: 40118, Avg. loss: 0.129986
Total training time: 11.49 seconds.
-- Epoch 14
Norm: 20.87, NNZs: 1020978, Bias: -1.886442, T: 43204, Avg. loss: 0.122413
Total training time: 12.48 seconds.
-- Epoch 15
Norm: 20.55, NNZs: 1021335, Bias: -1.872827, T: 46290, Avg. loss: 0.115737
Total training time: 13.37 seconds.
-- Epoch 16
Norm: 20.33, NNZs: 1024905, Bias: -1.851326, T: 49376, Avg. loss: 0.109970
Total training time: 14.28 seconds.
-- Epoch 17
Norm: 20.13, NNZs: 1025764, Bias: -1.837556, T: 52462, Avg. loss: 0.104832
Total training time: 15.17 seconds.
-- Epoch 18
Norm: 19.94, NNZs: 1028686, Bias: -1.824226, T: 55548, Avg. loss: 0.100260
Total training time: 16.08 seconds.
-- Epoch 19
Norm: 19.85, NNZs: 1031281, Bias: -1.809478, T: 58634, Avg. loss: 0.096161
Total training time: 16.98 seconds.
-- Epoch 20
Norm: 19.71, NNZs: 1032249, Bias: -1.797133, T: 61720, Avg. loss: 0.092462
Total training time: 17.88 seconds.
-- Epoch 21
Norm: 19.61, NNZs: 1033559, Bias: -1.786545, T: 64806, Avg. loss: 0.089116
Total training time: 18.80 seconds.
-- Epoch 22
Norm: 19.51, NNZs: 1033639, Bias: -1.772482, T: 67892, Avg. loss: 0.086059
Total training time: 19.70 seconds.
-- Epoch 23
Norm: 19.39, NNZs: 1035427, Bias: -1.765420, T: 70978, Avg. loss: 0.083244
Total training time: 20.62 seconds.
-- Epoch 24
Norm: 19.33, NNZs: 1035557, Bias: -1.754205, T: 74064, Avg. loss: 0.080657
Total training time: 21.52 seconds.
-- Epoch 25
Norm: 19.26, NNZs: 1037305, Bias: -1.747249, T: 77150, Avg. loss: 0.078313
Total training time: 22.45 seconds.
-- Epoch 26
Norm: 19.19, NNZs: 1039572, Bias: -1.737716, T: 80236, Avg. loss: 0.076123
Total training time: 23.38 seconds.
-- Epoch 27
Norm: 19.08, NNZs: 1039621, Bias: -1.732640, T: 83322, Avg. loss: 0.074074
Total training time: 24.28 seconds.
-- Epoch 28
Norm: 19.05, NNZs: 1039976, Bias: -1.716959, T: 86408, Avg. loss: 0.072209
Total training time: 25.20 seconds.
-- Epoch 29
Norm: 18.99, NNZs: 1040706, Bias: -1.712625, T: 89494, Avg. loss: 0.070468
Total training time: 26.12 seconds.
-- Epoch 30
Norm: 18.85, NNZs: 1041381, Bias: -1.710878, T: 92580, Avg. loss: 0.068826
Total training time: 27.04 seconds.
-- Epoch 31
Norm: 18.87, NNZs: 1041389, Bias: -1.697501, T: 95666, Avg. loss: 0.067292
Total training time: 27.94 seconds.
-- Epoch 32
Norm: 18.83, NNZs: 1042401, Bias: -1.691523, T: 98752, Avg. loss: 0.065855
Total training time: 28.88 seconds.
-- Epoch 33
Norm: 18.76, NNZs: 1042428, Bias: -1.686029, T: 101838, Avg. loss: 0.064515
Total training time: 29.81 seconds.
-- Epoch 34
Norm: 18.74, NNZs: 1042428, Bias: -1.676337, T: 104924, Avg. loss: 0.063249
Total training time: 30.73 seconds.
-- Epoch 35
Norm: 18.66, NNZs: 1042443, Bias: -1.673713, T: 108010, Avg. loss: 0.062057
Total training time: 31.64 seconds.
-- Epoch 36
Norm: 18.66, NNZs: 1042717, Bias: -1.666177, T: 111096, Avg. loss: 0.060925
Total training time: 32.57 seconds.
-- Epoch 37
Norm: 18.65, NNZs: 1042908, Bias: -1.658844, T: 114182, Avg. loss: 0.059861
Total training time: 33.50 seconds.
-- Epoch 38
Norm: 18.61, NNZs: 1042911, Bias: -1.655881, T: 117268, Avg. loss: 0.058838
Total training time: 34.42 seconds.
-- Epoch 39
Norm: 18.61, NNZs: 1042921, Bias: -1.649657, T: 120354, Avg. loss: 0.057850
Total training time: 35.34 seconds.
-- Epoch 40
Norm: 18.57, NNZs: 1042925, Bias: -1.644094, T: 123440, Avg. loss: 0.056928
Total training time: 36.27 seconds.
-- Epoch 41
Norm: 18.54, NNZs: 1042930, Bias: -1.638912, T: 126526, Avg. loss: 0.056048
Total training time: 37.18 seconds.
-- Epoch 42
Norm: 18.51, NNZs: 1043291, Bias: -1.634332, T: 129612, Avg. loss: 0.055213
Total training time: 38.09 seconds.
-- Epoch 43
Norm: 18.50, NNZs: 1043572, Bias: -1.629894, T: 132698, Avg. loss: 0.054415
Total training time: 39.04 seconds.
-- Epoch 44
Norm: 18.47, NNZs: 1043572, Bias: -1.623556, T: 135784, Avg. loss: 0.053646
Total training time: 39.94 seconds.
-- Epoch 45
Norm: 18.48, NNZs: 1043878, Bias: -1.616780, T: 138870, Avg. loss: 0.052920
Total training time: 40.88 seconds.
-- Epoch 46
Norm: 18.44, NNZs: 1043885, Bias: -1.613374, T: 141956, Avg. loss: 0.052221
Total training time: 41.84 seconds.
-- Epoch 47
Norm: 18.42, NNZs: 1043889, Bias: -1.609046, T: 145042, Avg. loss: 0.051559
Total training time: 42.76 seconds.
-- Epoch 48
Norm: 18.39, NNZs: 1043889, Bias: -1.606558, T: 148128, Avg. loss: 0.050925
Total training time: 43.69 seconds.
-- Epoch 49
Norm: 18.39, NNZs: 1043890, Bias: -1.601563, T: 151214, Avg. loss: 0.050309
Total training time: 44.62 seconds.
-- Epoch 50
Norm: 18.35, NNZs: 1043892, Bias: -1.600511, T: 154300, Avg. loss: 0.049719
Total training time: 45.54 seconds.
-- Epoch 51
Norm: 18.37, NNZs: 1043892, Bias: -1.592085, T: 157386, Avg. loss: 0.049155
Total training time: 46.46 seconds.
-- Epoch 52
Norm: 18.33, NNZs: 1043892, Bias: -1.590524, T: 160472, Avg. loss: 0.048605
Total training time: 47.40 seconds.
-- Epoch 53
Norm: 18.31, NNZs: 1043892, Bias: -1.587625, T: 163558, Avg. loss: 0.048081
Total training time: 48.33 seconds.
-- Epoch 54
Norm: 18.31, NNZs: 1043900, Bias: -1.583158, T: 166644, Avg. loss: 0.047571
Total training time: 49.27 seconds.
-- Epoch 55
Norm: 18.30, NNZs: 1043900, Bias: -1.577855, T: 169730, Avg. loss: 0.047088
Total training time: 50.21 seconds.
-- Epoch 56
Norm: 18.28, NNZs: 1043900, Bias: -1.576267, T: 172816, Avg. loss: 0.046615
Total training time: 51.15 seconds.
-- Epoch 57
Norm: 18.27, NNZs: 1043900, Bias: -1.572263, T: 175902, Avg. loss: 0.046161
Total training time: 52.08 seconds.
-- Epoch 58
Norm: 18.24, NNZs: 1043900, Bias: -1.568974, T: 178988, Avg. loss: 0.045725
Total training time: 53.01 seconds.
-- Epoch 59
Norm: 18.23, NNZs: 1043900, Bias: -1.565315, T: 182074, Avg. loss: 0.045301
Total training time: 53.94 seconds.
-- Epoch 60
Norm: 18.21, NNZs: 1043900, Bias: -1.563851, T: 185160, Avg. loss: 0.044893
Total training time: 54.90 seconds.
-- Epoch 61
Norm: 18.21, NNZs: 1043900, Bias: -1.558607, T: 188246, Avg. loss: 0.044499
Total training time: 55.81 seconds.
-- Epoch 62
Norm: 18.20, NNZs: 1043901, Bias: -1.556321, T: 191332, Avg. loss: 0.044118
Total training time: 56.75 seconds.
-- Epoch 63
Norm: 18.18, NNZs: 1044129, Bias: -1.554002, T: 194418, Avg. loss: 0.043747
Total training time: 57.70 seconds.
-- Epoch 64
Norm: 18.18, NNZs: 1044131, Bias: -1.550122, T: 197504, Avg. loss: 0.043383
Total training time: 58.62 seconds.
-- Epoch 65
Norm: 18.18, NNZs: 1044158, Bias: -1.546870, T: 200590, Avg. loss: 0.043031
Total training time: 59.56 seconds.
-- Epoch 66
Norm: 18.17, NNZs: 1044163, Bias: -1.543917, T: 203676, Avg. loss: 0.042690
Total training time: 60.50 seconds.
-- Epoch 67
Norm: 18.15, NNZs: 1044340, Bias: -1.543646, T: 206762, Avg. loss: 0.042355
Total training time: 61.45 seconds.
-- Epoch 68
Norm: 18.14, NNZs: 1044342, Bias: -1.539852, T: 209848, Avg. loss: 0.042036
Total training time: 62.38 seconds.
-- Epoch 69
Norm: 18.12, NNZs: 1044342, Bias: -1.537510, T: 212934, Avg. loss: 0.041722
Total training time: 63.32 seconds.
-- Epoch 70
Norm: 18.12, NNZs: 1044345, Bias: -1.533514, T: 216020, Avg. loss: 0.041416
Total training time: 64.25 seconds.
-- Epoch 71
Norm: 18.10, NNZs: 1044345, Bias: -1.533967, T: 219106, Avg. loss: 0.041121
Total training time: 65.21 seconds.
-- Epoch 72
Norm: 18.13, NNZs: 1044345, Bias: -1.527220, T: 222192, Avg. loss: 0.040833
Total training time: 66.13 seconds.
-- Epoch 73
Norm: 18.09, NNZs: 1044731, Bias: -1.526411, T: 225278, Avg. loss: 0.040552
Total training time: 67.09 seconds.
-- Epoch 74
Norm: 18.11, NNZs: 1044731, Bias: -1.522046, T: 228364, Avg. loss: 0.040282
Total training time: 68.01 seconds.
-- Epoch 75
Norm: 18.09, NNZs: 1044732, Bias: -1.521896, T: 231450, Avg. loss: 0.040016
Total training time: 68.97 seconds.
-- Epoch 76
Norm: 18.08, NNZs: 1044732, Bias: -1.519394, T: 234536, Avg. loss: 0.039758
Total training time: 69.90 seconds.
-- Epoch 77
Norm: 18.07, NNZs: 1044736, Bias: -1.518561, T: 237622, Avg. loss: 0.039504
Total training time: 70.84 seconds.
-- Epoch 78
Norm: 18.07, NNZs: 1044736, Bias: -1.514841, T: 240708, Avg. loss: 0.039259
Total training time: 71.78 seconds.
-- Epoch 79
Norm: 18.06, NNZs: 1044740, Bias: -1.513580, T: 243794, Avg. loss: 0.039020
Total training time: 72.72 seconds.
-- Epoch 80
Norm: 18.05, NNZs: 1044740, Bias: -1.510524, T: 246880, Avg. loss: 0.038789
Total training time: 73.66 seconds.
-- Epoch 81
Norm: 18.04, NNZs: 1044740, Bias: -1.509298, T: 249966, Avg. loss: 0.038563
Total training time: 74.60 seconds.
-- Epoch 82
Norm: 18.03, NNZs: 1044740, Bias: -1.506275, T: 253052, Avg. loss: 0.038341
Total training time: 75.54 seconds.
-- Epoch 83
Norm: 18.04, NNZs: 1044742, Bias: -1.501767, T: 256138, Avg. loss: 0.038123
Total training time: 76.47 seconds.
-- Epoch 84
Norm: 18.02, NNZs: 1044756, Bias: -1.501372, T: 259224, Avg. loss: 0.037914
Total training time: 77.41 seconds.
-- Epoch 85
Norm: 18.01, NNZs: 1044757, Bias: -1.501027, T: 262310, Avg. loss: 0.037705
Total training time: 78.36 seconds.
-- Epoch 86
Norm: 18.02, NNZs: 1044757, Bias: -1.497025, T: 265396, Avg. loss: 0.037504
Total training time: 79.30 seconds.
-- Epoch 87
Norm: 18.01, NNZs: 1044757, Bias: -1.495250, T: 268482, Avg. loss: 0.037307
Total training time: 80.24 seconds.
-- Epoch 88
Norm: 18.01, NNZs: 1044764, Bias: -1.493154, T: 271568, Avg. loss: 0.037112
Total training time: 81.19 seconds.
-- Epoch 89
Norm: 18.00, NNZs: 1044764, Bias: -1.491409, T: 274654, Avg. loss: 0.036925
Total training time: 82.13 seconds.
-- Epoch 90
Norm: 18.00, NNZs: 1044764, Bias: -1.488794, T: 277740, Avg. loss: 0.036740
Total training time: 83.07 seconds.
-- Epoch 91
Norm: 18.00, NNZs: 1044764, Bias: -1.486056, T: 280826, Avg. loss: 0.036559
Total training time: 84.02 seconds.
-- Epoch 92
Norm: 18.00, NNZs: 1044764, Bias: -1.483858, T: 283912, Avg. loss: 0.036384
Total training time: 84.95 seconds.
-- Epoch 93
Norm: 17.99, NNZs: 1044764, Bias: -1.482195, T: 286998, Avg. loss: 0.036210
Total training time: 85.91 seconds.
-- Epoch 94
Norm: 17.96, NNZs: 1044764, Bias: -1.483267, T: 290084, Avg. loss: 0.036040
Total training time: 86.85 seconds.
-- Epoch 95
Norm: 17.97, NNZs: 1044764, Bias: -1.480666, T: 293170, Avg. loss: 0.035873
Total training time: 87.79 seconds.
-- Epoch 96
Norm: 17.96, NNZs: 1044764, Bias: -1.479862, T: 296256, Avg. loss: 0.035712
Total training time: 88.74 seconds.
-- Epoch 97
Norm: 17.96, NNZs: 1044765, Bias: -1.476211, T: 299342, Avg. loss: 0.035549
Total training time: 89.68 seconds.
-- Epoch 98
Norm: 17.95, NNZs: 1044767, Bias: -1.474277, T: 302428, Avg. loss: 0.035394
Total training time: 90.63 seconds.
-- Epoch 99
Norm: 17.95, NNZs: 1044767, Bias: -1.473787, T: 305514, Avg. loss: 0.035241
Total training time: 91.59 seconds.
-- Epoch 100
Norm: 17.97, NNZs: 1044767, Bias: -1.469052, T: 308600, Avg. loss: 0.035090
Total training time: 92.52 seconds.
-- Epoch 1
Norm: 63.57, NNZs: 395248, Bias: -0.776395, T: 3086, Avg. loss: 0.638981
Total training time: 0.85 seconds.
-- Epoch 2
Norm: 45.96, NNZs: 784434, Bias: -0.778416, T: 6172, Avg. loss: 0.368070
Total training time: 1.69 seconds.
-- Epoch 3
Norm: 35.18, NNZs: 794445, Bias: -0.844667, T: 9258, Avg. loss: 0.256250
Total training time: 2.53 seconds.
-- Epoch 4
Norm: 28.61, NNZs: 808485, Bias: -0.829537, T: 12344, Avg. loss: 0.196031
Total training time: 3.37 seconds.
-- Epoch 5
Norm: 24.51, NNZs: 812184, Bias: -0.816307, T: 15430, Avg. loss: 0.159101
Total training time: 4.21 seconds.
-- Epoch 6
Norm: 21.87, NNZs: 818614, Bias: -0.814460, T: 18516, Avg. loss: 0.134097
Total training time: 5.05 seconds.
-- Epoch 7
Norm: 20.16, NNZs: 823616, Bias: -0.808006, T: 21602, Avg. loss: 0.116260
Total training time: 5.89 seconds.
-- Epoch 8
Norm: 19.10, NNZs: 827316, Bias: -0.793359, T: 24688, Avg. loss: 0.102802
Total training time: 6.73 seconds.
-- Epoch 9
Norm: 18.41, NNZs: 829751, Bias: -0.791027, T: 27774, Avg. loss: 0.092364
Total training time: 7.58 seconds.
-- Epoch 10
Norm: 17.90, NNZs: 832835, Bias: -0.788420, T: 30860, Avg. loss: 0.084044
Total training time: 8.42 seconds.
-- Epoch 11
Norm: 17.48, NNZs: 833481, Bias: -0.776385, T: 33946, Avg. loss: 0.077169
Total training time: 9.27 seconds.
-- Epoch 12
Norm: 17.22, NNZs: 836799, Bias: -0.779732, T: 37032, Avg. loss: 0.071465
Total training time: 10.12 seconds.
-- Epoch 13
Norm: 16.94, NNZs: 855966, Bias: -0.778083, T: 40118, Avg. loss: 0.066569
Total training time: 10.97 seconds.
-- Epoch 14
Norm: 16.76, NNZs: 903481, Bias: -0.777494, T: 43204, Avg. loss: 0.062396
Total training time: 11.82 seconds.
-- Epoch 15
Norm: 16.63, NNZs: 920310, Bias: -0.775015, T: 46290, Avg. loss: 0.058831
Total training time: 12.68 seconds.
-- Epoch 16
Norm: 16.50, NNZs: 921408, Bias: -0.768577, T: 49376, Avg. loss: 0.055662
Total training time: 13.54 seconds.
-- Epoch 17
Norm: 16.40, NNZs: 931189, Bias: -0.773960, T: 52462, Avg. loss: 0.052890
Total training time: 14.40 seconds.
-- Epoch 18
Norm: 16.30, NNZs: 931992, Bias: -0.767719, T: 55548, Avg. loss: 0.050418
Total training time: 15.26 seconds.
-- Epoch 19
Norm: 16.22, NNZs: 932060, Bias: -0.769375, T: 58634, Avg. loss: 0.048202
Total training time: 16.11 seconds.
-- Epoch 20
Norm: 16.16, NNZs: 932395, Bias: -0.765379, T: 61720, Avg. loss: 0.046198
Total training time: 16.97 seconds.
-- Epoch 21
Norm: 16.10, NNZs: 932703, Bias: -0.768804, T: 64806, Avg. loss: 0.044394
Total training time: 17.83 seconds.
-- Epoch 22
Norm: 16.05, NNZs: 932892, Bias: -0.767373, T: 67892, Avg. loss: 0.042752
Total training time: 18.69 seconds.
-- Epoch 23
Norm: 16.00, NNZs: 933095, Bias: -0.764462, T: 70978, Avg. loss: 0.041241
Total training time: 19.54 seconds.
-- Epoch 24
Norm: 15.95, NNZs: 946498, Bias: -0.764921, T: 74064, Avg. loss: 0.039854
Total training time: 20.40 seconds.
-- Epoch 25
Norm: 15.92, NNZs: 949401, Bias: -0.766935, T: 77150, Avg. loss: 0.038589
Total training time: 21.27 seconds.
-- Epoch 26
Norm: 15.88, NNZs: 949444, Bias: -0.766333, T: 80236, Avg. loss: 0.037425
Total training time: 22.12 seconds.
-- Epoch 27
Norm: 15.86, NNZs: 949653, Bias: -0.764734, T: 83322, Avg. loss: 0.036339
Total training time: 22.98 seconds.
-- Epoch 28
Norm: 15.83, NNZs: 949663, Bias: -0.762676, T: 86408, Avg. loss: 0.035332
Total training time: 23.84 seconds.
-- Epoch 29
Norm: 15.81, NNZs: 949733, Bias: -0.763269, T: 89494, Avg. loss: 0.034394
Total training time: 24.70 seconds.
-- Epoch 30
Norm: 15.78, NNZs: 949810, Bias: -0.764355, T: 92580, Avg. loss: 0.033518
Total training time: 25.56 seconds.
-- Epoch 31
Norm: 15.75, NNZs: 949885, Bias: -0.759970, T: 95666, Avg. loss: 0.032691
Total training time: 26.42 seconds.
-- Epoch 32
Norm: 15.73, NNZs: 950035, Bias: -0.763623, T: 98752, Avg. loss: 0.031920
Total training time: 27.28 seconds.
-- Epoch 33
Norm: 15.71, NNZs: 950053, Bias: -0.762051, T: 101838, Avg. loss: 0.031196
Total training time: 28.14 seconds.
-- Epoch 34
Norm: 15.69, NNZs: 950110, Bias: -0.761077, T: 104924, Avg. loss: 0.030517
Total training time: 29.00 seconds.
-- Epoch 35
Norm: 15.68, NNZs: 959169, Bias: -0.759743, T: 108010, Avg. loss: 0.029873
Total training time: 29.86 seconds.
-- Epoch 36
Norm: 15.66, NNZs: 1005386, Bias: -0.760078, T: 111096, Avg. loss: 0.029262
Total training time: 30.73 seconds.
-- Epoch 37
Norm: 15.64, NNZs: 1005651, Bias: -0.757991, T: 114182, Avg. loss: 0.028684
Total training time: 31.59 seconds.
-- Epoch 38
Norm: 15.63, NNZs: 1005651, Bias: -0.758120, T: 117268, Avg. loss: 0.028140
Total training time: 32.45 seconds.
-- Epoch 39
Norm: 15.62, NNZs: 1005666, Bias: -0.757327, T: 120354, Avg. loss: 0.027625
Total training time: 33.30 seconds.
-- Epoch 40
Norm: 15.61, NNZs: 1006835, Bias: -0.755822, T: 123440, Avg. loss: 0.027133
Total training time: 34.17 seconds.
-- Epoch 41
Norm: 15.60, NNZs: 1006886, Bias: -0.755314, T: 126526, Avg. loss: 0.026662
Total training time: 35.04 seconds.
-- Epoch 42
Norm: 15.59, NNZs: 1006908, Bias: -0.758849, T: 129612, Avg. loss: 0.026216
Total training time: 35.90 seconds.
-- Epoch 43
Norm: 15.58, NNZs: 1006909, Bias: -0.758931, T: 132698, Avg. loss: 0.025786
Total training time: 36.76 seconds.
-- Epoch 44
Norm: 15.57, NNZs: 1006909, Bias: -0.755203, T: 135784, Avg. loss: 0.025381
Total training time: 37.62 seconds.
-- Epoch 45
Norm: 15.56, NNZs: 1006909, Bias: -0.755827, T: 138870, Avg. loss: 0.024993
Total training time: 38.48 seconds.
-- Epoch 46
Norm: 15.55, NNZs: 1006950, Bias: -0.756522, T: 141956, Avg. loss: 0.024620
Total training time: 39.60 seconds.
-- Epoch 47
Norm: 15.54, NNZs: 1006950, Bias: -0.755859, T: 145042, Avg. loss: 0.024263
Total training time: 40.46 seconds.
-- Epoch 48
Norm: 15.53, NNZs: 1006958, Bias: -0.757915, T: 148128, Avg. loss: 0.023923
Total training time: 41.32 seconds.
-- Epoch 49
Norm: 15.52, NNZs: 1006958, Bias: -0.755363, T: 151214, Avg. loss: 0.023595
Total training time: 42.19 seconds.
-- Epoch 50
Norm: 15.52, NNZs: 1006958, Bias: -0.756787, T: 154300, Avg. loss: 0.023282
Total training time: 43.06 seconds.
-- Epoch 51
Norm: 15.51, NNZs: 1007034, Bias: -0.752983, T: 157386, Avg. loss: 0.022976
Total training time: 43.92 seconds.
-- Epoch 52
Norm: 15.50, NNZs: 1007044, Bias: -0.754439, T: 160472, Avg. loss: 0.022684
Total training time: 44.78 seconds.
-- Epoch 53
Norm: 15.49, NNZs: 1007049, Bias: -0.756421, T: 163558, Avg. loss: 0.022403
Total training time: 45.65 seconds.
-- Epoch 54
Norm: 15.49, NNZs: 1007054, Bias: -0.755766, T: 166644, Avg. loss: 0.022135
Total training time: 46.51 seconds.
-- Epoch 55
Norm: 15.48, NNZs: 1007057, Bias: -0.754606, T: 169730, Avg. loss: 0.021873
Total training time: 47.38 seconds.
-- Epoch 56
Norm: 15.48, NNZs: 1007057, Bias: -0.753732, T: 172816, Avg. loss: 0.021623
Total training time: 48.24 seconds.
-- Epoch 57
Norm: 15.48, NNZs: 1007057, Bias: -0.755653, T: 175902, Avg. loss: 0.021382
Total training time: 49.11 seconds.
-- Epoch 58
Norm: 15.47, NNZs: 1007057, Bias: -0.755519, T: 178988, Avg. loss: 0.021149
Total training time: 49.98 seconds.
-- Epoch 59
Norm: 15.46, NNZs: 1007063, Bias: -0.756032, T: 182074, Avg. loss: 0.020920
Total training time: 50.86 seconds.
-- Epoch 60
Norm: 15.46, NNZs: 1007063, Bias: -0.755887, T: 185160, Avg. loss: 0.020702
Total training time: 51.72 seconds.
-- Epoch 61
Norm: 15.46, NNZs: 1007068, Bias: -0.754467, T: 188246, Avg. loss: 0.020492
Total training time: 52.58 seconds.
-- Epoch 62
Norm: 15.45, NNZs: 1007144, Bias: -0.755110, T: 191332, Avg. loss: 0.020285
Total training time: 53.45 seconds.
-- Epoch 63
Norm: 15.45, NNZs: 1007147, Bias: -0.754974, T: 194418, Avg. loss: 0.020086
Total training time: 54.32 seconds.
-- Epoch 64
Norm: 15.45, NNZs: 1007151, Bias: -0.754349, T: 197504, Avg. loss: 0.019894
Total training time: 55.20 seconds.
-- Epoch 65
Norm: 15.44, NNZs: 1007151, Bias: -0.754107, T: 200590, Avg. loss: 0.019709
Total training time: 56.07 seconds.
-- Epoch 66
Norm: 15.44, NNZs: 1007163, Bias: -0.754650, T: 203676, Avg. loss: 0.019529
Total training time: 56.94 seconds.
-- Epoch 67
Norm: 15.44, NNZs: 1007163, Bias: -0.753802, T: 206762, Avg. loss: 0.019353
Total training time: 57.80 seconds.
-- Epoch 68
Norm: 15.43, NNZs: 1008007, Bias: -0.753997, T: 209848, Avg. loss: 0.019183
Total training time: 58.68 seconds.
-- Epoch 69
Norm: 15.43, NNZs: 1008022, Bias: -0.754760, T: 212934, Avg. loss: 0.019016
Total training time: 59.55 seconds.
-- Epoch 70
Norm: 15.42, NNZs: 1008024, Bias: -0.755771, T: 216020, Avg. loss: 0.018854
Total training time: 60.41 seconds.
-- Epoch 71
Norm: 15.42, NNZs: 1008033, Bias: -0.752346, T: 219106, Avg. loss: 0.018698
Total training time: 61.28 seconds.
-- Epoch 72
Norm: 15.42, NNZs: 1008039, Bias: -0.754019, T: 222192, Avg. loss: 0.018547
Total training time: 62.15 seconds.
-- Epoch 73
Norm: 15.42, NNZs: 1008039, Bias: -0.752735, T: 225278, Avg. loss: 0.018400
Total training time: 63.01 seconds.
-- Epoch 74
Norm: 15.41, NNZs: 1008039, Bias: -0.753769, T: 228364, Avg. loss: 0.018257
Total training time: 63.88 seconds.
-- Epoch 75
Norm: 15.41, NNZs: 1008039, Bias: -0.752808, T: 231450, Avg. loss: 0.018117
Total training time: 64.75 seconds.
-- Epoch 76
Norm: 15.41, NNZs: 1008083, Bias: -0.753752, T: 234536, Avg. loss: 0.017980
Total training time: 65.62 seconds.
-- Epoch 77
Norm: 15.40, NNZs: 1008083, Bias: -0.754202, T: 237622, Avg. loss: 0.017847
Total training time: 66.49 seconds.
-- Epoch 78
Norm: 15.40, NNZs: 1008083, Bias: -0.754319, T: 240708, Avg. loss: 0.017717
Total training time: 67.36 seconds.
-- Epoch 79
Norm: 15.40, NNZs: 1008087, Bias: -0.752903, T: 243794, Avg. loss: 0.017591
Total training time: 68.23 seconds.
-- Epoch 80
Norm: 15.40, NNZs: 1008091, Bias: -0.752774, T: 246880, Avg. loss: 0.017468
Total training time: 69.10 seconds.
-- Epoch 81
Norm: 15.39, NNZs: 1008105, Bias: -0.753050, T: 249966, Avg. loss: 0.017348
Total training time: 69.97 seconds.
-- Epoch 82
Norm: 15.39, NNZs: 1008105, Bias: -0.751515, T: 253052, Avg. loss: 0.017230
Total training time: 70.84 seconds.
-- Epoch 83
Norm: 15.39, NNZs: 1008105, Bias: -0.753302, T: 256138, Avg. loss: 0.017116
Total training time: 71.71 seconds.
-- Epoch 84
Norm: 15.39, NNZs: 1008107, Bias: -0.753282, T: 259224, Avg. loss: 0.017004
Total training time: 72.59 seconds.
-- Epoch 85
Norm: 15.39, NNZs: 1008107, Bias: -0.752609, T: 262310, Avg. loss: 0.016895
Total training time: 73.47 seconds.
-- Epoch 86
Norm: 15.38, NNZs: 1008107, Bias: -0.752838, T: 265396, Avg. loss: 0.016789
Total training time: 74.34 seconds.
-- Epoch 87
Norm: 15.38, NNZs: 1008107, Bias: -0.753020, T: 268482, Avg. loss: 0.016684
Total training time: 75.21 seconds.
-- Epoch 88
Norm: 15.37, NNZs: 1008833, Bias: -0.753572, T: 271568, Avg. loss: 0.016581
Total training time: 76.09 seconds.
-- Epoch 89
Norm: 15.38, NNZs: 1008833, Bias: -0.752248, T: 274654, Avg. loss: 0.016481
Total training time: 76.96 seconds.
-- Epoch 90
Norm: 15.37, NNZs: 1008833, Bias: -0.752837, T: 277740, Avg. loss: 0.016385
Total training time: 77.83 seconds.
-- Epoch 91
Norm: 15.37, NNZs: 1008876, Bias: -0.753409, T: 280826, Avg. loss: 0.016289
Total training time: 78.70 seconds.
-- Epoch 92
Norm: 15.37, NNZs: 1008898, Bias: -0.753082, T: 283912, Avg. loss: 0.016194
Total training time: 79.57 seconds.
-- Epoch 93
Norm: 15.36, NNZs: 1008898, Bias: -0.752565, T: 286998, Avg. loss: 0.016103
Total training time: 80.45 seconds.
-- Epoch 94
Norm: 15.36, NNZs: 1008898, Bias: -0.751389, T: 290084, Avg. loss: 0.016014
Total training time: 81.32 seconds.
-- Epoch 95
Norm: 15.37, NNZs: 1008898, Bias: -0.751699, T: 293170, Avg. loss: 0.015926
Total training time: 82.19 seconds.
-- Epoch 96
Norm: 15.36, NNZs: 1008898, Bias: -0.751833, T: 296256, Avg. loss: 0.015841
Total training time: 83.06 seconds.
-- Epoch 97
Norm: 15.36, NNZs: 1008898, Bias: -0.751286, T: 299342, Avg. loss: 0.015757
Total training time: 83.94 seconds.
-- Epoch 98
Norm: 15.36, NNZs: 1008898, Bias: -0.751715, T: 302428, Avg. loss: 0.015676
Total training time: 84.81 seconds.
-- Epoch 99
Norm: 15.36, NNZs: 1008898, Bias: -0.751920, T: 305514, Avg. loss: 0.015595
Total training time: 85.68 seconds.
-- Epoch 100
Norm: 15.36, NNZs: 1008898, Bias: -0.751872, T: 308600, Avg. loss: 0.015517
Total training time: 86.55 seconds.
-- Epoch 1
Norm: 40.10, NNZs: 253763, Bias: -0.835905, T: 3086, Avg. loss: 0.225260
Total training time: 0.85 seconds.
-- Epoch 2
Norm: 26.44, NNZs: 364895, Bias: -0.813172, T: 6172, Avg. loss: 0.132161
Total training time: 1.70 seconds.
-- Epoch 3
Norm: 21.75, NNZs: 387910, Bias: -0.826581, T: 9258, Avg. loss: 0.097308
Total training time: 2.55 seconds.
-- Epoch 4
Norm: 18.06, NNZs: 392025, Bias: -0.822172, T: 12344, Avg. loss: 0.078356
Total training time: 3.40 seconds.
-- Epoch 5
Norm: 16.13, NNZs: 408847, Bias: -0.808067, T: 15430, Avg. loss: 0.065448
Total training time: 4.26 seconds.
-- Epoch 6
Norm: 14.45, NNZs: 420055, Bias: -0.824321, T: 18516, Avg. loss: 0.055781
Total training time: 5.11 seconds.
-- Epoch 7
Norm: 13.37, NNZs: 424487, Bias: -0.820839, T: 21602, Avg. loss: 0.048929
Total training time: 5.96 seconds.
-- Epoch 8
Norm: 12.59, NNZs: 428112, Bias: -0.818330, T: 24688, Avg. loss: 0.043673
Total training time: 6.82 seconds.
-- Epoch 9
Norm: 11.87, NNZs: 432880, Bias: -0.821291, T: 27774, Avg. loss: 0.039448
Total training time: 7.68 seconds.
-- Epoch 10
Norm: 11.53, NNZs: 441707, Bias: -0.821978, T: 30860, Avg. loss: 0.036118
Total training time: 8.54 seconds.
-- Epoch 11
Norm: 11.19, NNZs: 442421, Bias: -0.817799, T: 33946, Avg. loss: 0.033405
Total training time: 9.40 seconds.
-- Epoch 12
Norm: 10.86, NNZs: 443389, Bias: -0.824530, T: 37032, Avg. loss: 0.031131
Total training time: 10.27 seconds.
-- Epoch 13
Norm: 10.65, NNZs: 446551, Bias: -0.824829, T: 40118, Avg. loss: 0.029202
Total training time: 11.14 seconds.
-- Epoch 14
Norm: 10.54, NNZs: 448493, Bias: -0.823376, T: 43204, Avg. loss: 0.027526
Total training time: 12.01 seconds.
-- Epoch 15
Norm: 10.43, NNZs: 451076, Bias: -0.824225, T: 46290, Avg. loss: 0.026068
Total training time: 12.88 seconds.
-- Epoch 16
Norm: 10.30, NNZs: 451744, Bias: -0.825191, T: 49376, Avg. loss: 0.024813
Total training time: 13.75 seconds.
-- Epoch 17
Norm: 10.25, NNZs: 452668, Bias: -0.823042, T: 52462, Avg. loss: 0.023690
Total training time: 14.62 seconds.
-- Epoch 18
Norm: 10.19, NNZs: 456407, Bias: -0.826030, T: 55548, Avg. loss: 0.022672
Total training time: 15.49 seconds.
-- Epoch 19
Norm: 10.05, NNZs: 457537, Bias: -0.829505, T: 58634, Avg. loss: 0.021773
Total training time: 16.36 seconds.
-- Epoch 20
Norm: 9.99, NNZs: 457841, Bias: -0.828603, T: 61720, Avg. loss: 0.020959
Total training time: 17.23 seconds.
-- Epoch 21
Norm: 9.95, NNZs: 475715, Bias: -0.826494, T: 64806, Avg. loss: 0.020199
Total training time: 18.11 seconds.
-- Epoch 22
Norm: 9.89, NNZs: 475983, Bias: -0.828695, T: 67892, Avg. loss: 0.019534
Total training time: 18.98 seconds.
-- Epoch 23
Norm: 9.87, NNZs: 476850, Bias: -0.827320, T: 70978, Avg. loss: 0.018918
Total training time: 19.85 seconds.
-- Epoch 24
Norm: 9.83, NNZs: 477454, Bias: -0.830433, T: 74064, Avg. loss: 0.018358
Total training time: 20.72 seconds.
-- Epoch 25
Norm: 9.79, NNZs: 477699, Bias: -0.831531, T: 77150, Avg. loss: 0.017843
Total training time: 21.60 seconds.
-- Epoch 26
Norm: 9.82, NNZs: 478073, Bias: -0.829856, T: 80236, Avg. loss: 0.017365
Total training time: 22.47 seconds.
-- Epoch 27
Norm: 9.75, NNZs: 483454, Bias: -0.832732, T: 83322, Avg. loss: 0.016919
Total training time: 23.35 seconds.
-- Epoch 28
Norm: 9.79, NNZs: 483821, Bias: -0.828461, T: 86408, Avg. loss: 0.016503
Total training time: 24.22 seconds.
-- Epoch 29
Norm: 9.74, NNZs: 484181, Bias: -0.829501, T: 89494, Avg. loss: 0.016117
Total training time: 25.10 seconds.
-- Epoch 30
Norm: 9.72, NNZs: 484243, Bias: -0.831333, T: 92580, Avg. loss: 0.015759
Total training time: 25.97 seconds.
-- Epoch 31
Norm: 9.68, NNZs: 484243, Bias: -0.832424, T: 95666, Avg. loss: 0.015425
Total training time: 26.85 seconds.
-- Epoch 32
Norm: 9.68, NNZs: 489314, Bias: -0.831564, T: 98752, Avg. loss: 0.015110
Total training time: 27.72 seconds.
-- Epoch 33
Norm: 9.64, NNZs: 489379, Bias: -0.835034, T: 101838, Avg. loss: 0.014810
Total training time: 28.60 seconds.
-- Epoch 34
Norm: 9.63, NNZs: 489379, Bias: -0.833958, T: 104924, Avg. loss: 0.014529
Total training time: 29.47 seconds.
-- Epoch 35
Norm: 9.62, NNZs: 489981, Bias: -0.831326, T: 108010, Avg. loss: 0.014264
Total training time: 30.35 seconds.
-- Epoch 36
Norm: 9.61, NNZs: 492166, Bias: -0.832735, T: 111096, Avg. loss: 0.014015
Total training time: 31.23 seconds.
-- Epoch 37
Norm: 9.60, NNZs: 495259, Bias: -0.834880, T: 114182, Avg. loss: 0.013777
Total training time: 32.10 seconds.
-- Epoch 38
Norm: 9.61, NNZs: 495785, Bias: -0.832244, T: 117268, Avg. loss: 0.013551
Total training time: 32.98 seconds.
-- Epoch 39
Norm: 9.62, NNZs: 495785, Bias: -0.832558, T: 120354, Avg. loss: 0.013338
Total training time: 33.86 seconds.
-- Epoch 40
Norm: 9.59, NNZs: 496460, Bias: -0.832942, T: 123440, Avg. loss: 0.013135
Total training time: 34.74 seconds.
-- Epoch 41
Norm: 9.58, NNZs: 496460, Bias: -0.833895, T: 126526, Avg. loss: 0.012945
Total training time: 35.61 seconds.
-- Epoch 42
Norm: 9.52, NNZs: 497758, Bias: -0.837518, T: 129612, Avg. loss: 0.012759
Total training time: 36.49 seconds.
-- Epoch 43
Norm: 9.56, NNZs: 497968, Bias: -0.835748, T: 132698, Avg. loss: 0.012583
Total training time: 37.37 seconds.
-- Epoch 44
Norm: 9.54, NNZs: 498093, Bias: -0.834062, T: 135784, Avg. loss: 0.012417
Total training time: 38.24 seconds.
-- Epoch 45
Norm: 9.54, NNZs: 498971, Bias: -0.835798, T: 138870, Avg. loss: 0.012257
Total training time: 39.12 seconds.
-- Epoch 46
Norm: 9.53, NNZs: 499026, Bias: -0.836409, T: 141956, Avg. loss: 0.012103
Total training time: 40.00 seconds.
-- Epoch 47
Norm: 9.53, NNZs: 499452, Bias: -0.837006, T: 145042, Avg. loss: 0.011956
Total training time: 40.88 seconds.
-- Epoch 48
Norm: 9.50, NNZs: 499452, Bias: -0.838292, T: 148128, Avg. loss: 0.011814
Total training time: 41.76 seconds.
-- Epoch 49
Norm: 9.53, NNZs: 500843, Bias: -0.835409, T: 151214, Avg. loss: 0.011680
Total training time: 42.63 seconds.
-- Epoch 50
Norm: 9.51, NNZs: 502672, Bias: -0.836441, T: 154300, Avg. loss: 0.011546
Total training time: 43.51 seconds.
-- Epoch 51
Norm: 9.51, NNZs: 502672, Bias: -0.835973, T: 157386, Avg. loss: 0.011420
Total training time: 44.39 seconds.
-- Epoch 52
Norm: 9.48, NNZs: 502672, Bias: -0.836389, T: 160472, Avg. loss: 0.011299
Total training time: 45.26 seconds.
-- Epoch 53
Norm: 9.48, NNZs: 503926, Bias: -0.838026, T: 163558, Avg. loss: 0.011182
Total training time: 46.14 seconds.
-- Epoch 54
Norm: 9.51, NNZs: 503964, Bias: -0.835943, T: 166644, Avg. loss: 0.011070
Total training time: 47.02 seconds.
-- Epoch 55
Norm: 9.48, NNZs: 504623, Bias: -0.838228, T: 169730, Avg. loss: 0.010963
Total training time: 47.90 seconds.
-- Epoch 56
Norm: 9.46, NNZs: 504957, Bias: -0.837424, T: 172816, Avg. loss: 0.010860
Total training time: 48.78 seconds.
-- Epoch 57
Norm: 9.47, NNZs: 505059, Bias: -0.838279, T: 175902, Avg. loss: 0.010760
Total training time: 49.66 seconds.
-- Epoch 58
Norm: 9.48, NNZs: 505059, Bias: -0.837495, T: 178988, Avg. loss: 0.010663
Total training time: 50.54 seconds.
-- Epoch 59
Norm: 9.49, NNZs: 505059, Bias: -0.835158, T: 182074, Avg. loss: 0.010568
Total training time: 51.42 seconds.
-- Epoch 60
Norm: 9.46, NNZs: 505447, Bias: -0.839021, T: 185160, Avg. loss: 0.010475
Total training time: 52.30 seconds.
-- Epoch 61
Norm: 9.45, NNZs: 505661, Bias: -0.839263, T: 188246, Avg. loss: 0.010387
Total training time: 53.18 seconds.
-- Epoch 62
Norm: 9.45, NNZs: 505661, Bias: -0.839133, T: 191332, Avg. loss: 0.010303
Total training time: 54.06 seconds.
-- Epoch 63
Norm: 9.45, NNZs: 505661, Bias: -0.838781, T: 194418, Avg. loss: 0.010220
Total training time: 54.93 seconds.
-- Epoch 64
Norm: 9.43, NNZs: 505720, Bias: -0.840754, T: 197504, Avg. loss: 0.010139
Total training time: 55.81 seconds.
-- Epoch 65
Norm: 9.44, NNZs: 505776, Bias: -0.840571, T: 200590, Avg. loss: 0.010061
Total training time: 56.69 seconds.
-- Epoch 66
Norm: 9.44, NNZs: 505776, Bias: -0.837919, T: 203676, Avg. loss: 0.009986
Total training time: 57.56 seconds.
-- Epoch 67
Norm: 9.45, NNZs: 505776, Bias: -0.838456, T: 206762, Avg. loss: 0.009913
Total training time: 58.44 seconds.
-- Epoch 68
Norm: 9.43, NNZs: 505776, Bias: -0.840169, T: 209848, Avg. loss: 0.009842
Total training time: 59.32 seconds.
-- Epoch 69
Norm: 9.44, NNZs: 796718, Bias: -0.839952, T: 212934, Avg. loss: 0.009772
Total training time: 60.20 seconds.
-- Epoch 70
Norm: 9.43, NNZs: 796718, Bias: -0.839341, T: 216020, Avg. loss: 0.009705
Total training time: 61.07 seconds.
-- Epoch 71
Norm: 9.43, NNZs: 796718, Bias: -0.838209, T: 219106, Avg. loss: 0.009638
Total training time: 61.94 seconds.
-- Epoch 72
Norm: 9.44, NNZs: 796718, Bias: -0.839381, T: 222192, Avg. loss: 0.009576
Total training time: 62.82 seconds.
-- Epoch 73
Norm: 9.44, NNZs: 796718, Bias: -0.839684, T: 225278, Avg. loss: 0.009514
Total training time: 63.69 seconds.
-- Epoch 74
Norm: 9.41, NNZs: 796718, Bias: -0.841347, T: 228364, Avg. loss: 0.009454
Total training time: 64.57 seconds.
-- Epoch 75
Norm: 9.42, NNZs: 796718, Bias: -0.839861, T: 231450, Avg. loss: 0.009397
Total training time: 65.45 seconds.
-- Epoch 76
Norm: 9.42, NNZs: 796718, Bias: -0.840211, T: 234536, Avg. loss: 0.009341
Total training time: 66.32 seconds.
-- Epoch 77
Norm: 9.41, NNZs: 796718, Bias: -0.838824, T: 237622, Avg. loss: 0.009284
Total training time: 67.20 seconds.
-- Epoch 78
Norm: 9.41, NNZs: 796718, Bias: -0.839978, T: 240708, Avg. loss: 0.009230
Total training time: 68.08 seconds.
-- Epoch 79
Norm: 9.42, NNZs: 796718, Bias: -0.840776, T: 243794, Avg. loss: 0.009177
Total training time: 68.96 seconds.
-- Epoch 80
Norm: 9.42, NNZs: 796743, Bias: -0.839732, T: 246880, Avg. loss: 0.009125
Total training time: 69.84 seconds.
-- Epoch 81
Norm: 9.40, NNZs: 796743, Bias: -0.841977, T: 249966, Avg. loss: 0.009075
Total training time: 70.71 seconds.
-- Epoch 82
Norm: 9.40, NNZs: 796757, Bias: -0.841106, T: 253052, Avg. loss: 0.009026
Total training time: 71.58 seconds.
-- Epoch 83
Norm: 9.39, NNZs: 796757, Bias: -0.842521, T: 256138, Avg. loss: 0.008978
Total training time: 72.71 seconds.
-- Epoch 84
Norm: 9.40, NNZs: 796757, Bias: -0.840811, T: 259224, Avg. loss: 0.008932
Total training time: 73.59 seconds.
-- Epoch 85
Norm: 9.41, NNZs: 796757, Bias: -0.840719, T: 262310, Avg. loss: 0.008886
Total training time: 74.46 seconds.
-- Epoch 86
Norm: 9.40, NNZs: 796757, Bias: -0.841646, T: 265396, Avg. loss: 0.008841
Total training time: 75.34 seconds.
-- Epoch 87
Norm: 9.41, NNZs: 796757, Bias: -0.841524, T: 268482, Avg. loss: 0.008798
Total training time: 76.22 seconds.
-- Epoch 88
Norm: 9.40, NNZs: 797935, Bias: -0.840280, T: 271568, Avg. loss: 0.008754
Total training time: 77.09 seconds.
-- Epoch 89
Norm: 9.39, NNZs: 797935, Bias: -0.842498, T: 274654, Avg. loss: 0.008712
Total training time: 77.97 seconds.
-- Epoch 90
Norm: 9.39, NNZs: 797935, Bias: -0.842963, T: 277740, Avg. loss: 0.008672
Total training time: 78.85 seconds.
-- Epoch 91
Norm: 9.39, NNZs: 797935, Bias: -0.842045, T: 280826, Avg. loss: 0.008632
Total training time: 79.72 seconds.
-- Epoch 92
Norm: 9.39, NNZs: 797935, Bias: -0.842855, T: 283912, Avg. loss: 0.008593
Total training time: 80.60 seconds.
-- Epoch 93
Norm: 9.39, NNZs: 797935, Bias: -0.842017, T: 286998, Avg. loss: 0.008555
Total training time: 81.48 seconds.
-- Epoch 94
Norm: 9.39, NNZs: 797935, Bias: -0.842685, T: 290084, Avg. loss: 0.008518
Total training time: 82.35 seconds.
-- Epoch 95
Norm: 9.38, NNZs: 797935, Bias: -0.843959, T: 293170, Avg. loss: 0.008480
Total training time: 83.23 seconds.
-- Epoch 96
Norm: 9.39, NNZs: 797935, Bias: -0.843056, T: 296256, Avg. loss: 0.008444
Total training time: 84.11 seconds.
-- Epoch 97
Norm: 9.38, NNZs: 797935, Bias: -0.843356, T: 299342, Avg. loss: 0.008408
Total training time: 84.99 seconds.
-- Epoch 98
Norm: 9.38, NNZs: 797935, Bias: -0.842078, T: 302428, Avg. loss: 0.008374
Total training time: 85.86 seconds.
-- Epoch 99
Norm: 9.39, NNZs: 797935, Bias: -0.842275, T: 305514, Avg. loss: 0.008340
Total training time: 86.74 seconds.
-- Epoch 100
Norm: 9.38, NNZs: 797935, Bias: -0.842079, T: 308600, Avg. loss: 0.008307
Total training time: 87.61 seconds.
[Parallel(n_jobs=1)]: Done 15 out of 15 | elapsed: 24.0min finished
Out[6]:
SGDClassifier(alpha=0.0001, average=False, class_weight=None, epsilon=0.1,
eta0=0.0, fit_intercept=True, l1_ratio=0.15,
learning_rate='optimal', loss='modified_huber', n_iter=100,
n_jobs=1, penalty='l2', power_t=0.5, random_state=None,
shuffle=True, verbose=1, warm_start=False)
In [7]:
test_pred = SGD.predict(X_test)
In [8]:
print test_pred
test_ids = np.load("../data/features/test_ids.npy")
print test_ids
write_predictions(test_pred, test_ids, "../predictions/sgd_huber_100_big_tfidf.csv")
[10 5 8 ..., 10 8 8]
['e5b875f7e584b29fd9e85c1f232956849aabcb311'
'18abefbfb74285D709bcf665d594df11bf56e1984'
'47cd5265b1fc52021c025452e084c405a0a03df1e' ...,
'6abb75b149d8e39e30c8df2c19bfd96986f0e35b3'
'f0e968070037717da88665ab091ff2B4973528f30'
'7b2459e11cac9341a00fa7bDcd5b17618a0b97dc8']
In [17]:
from sklearn.linear_model import PassiveAggressiveClassifier
# Try an SGDClassifier learning directly from the sparse matrix
model = PassiveAggressiveClassifier(n_jobs=4, verbose=42, n_iter=20)
model.fit(X,Y)
-- Epoch 1
-- Epoch 1
-- Epoch 1
-- Epoch 1
Norm: 7.55, NNZs: 125613, Bias: -0.138381, T: 3086, Avg. loss: 0.046595
Total training time: 0.03 seconds.
Norm: 5.78, NNZs: 164319, Bias: -0.112992, T: 3086, Avg. loss: 0.120186
Total training time: 0.04 seconds.
-- Epoch 2
-- Epoch 2
Norm: 5.25, NNZs: 75659, Bias: -0.112442, T: 3086, Avg. loss: 0.035022
Total training time: 0.04 seconds.
-- Epoch 2
Norm: 9.22, NNZs: 132801, Bias: -0.179926, T: 6172, Avg. loss: 0.041148
Total training time: 0.06 seconds.
Norm: 5.13, NNZs: 144209, Bias: -0.137939, T: 3086, Avg. loss: 0.042037
Total training time: 0.06 seconds.
-- Epoch 3
-- Epoch 2
Norm: 8.61, NNZs: 182575, Bias: -0.142782, T: 6172, Avg. loss: 0.116928
Total training time: 0.07 seconds.
-- Epoch 3
Norm: 11.13, NNZs: 138897, Bias: -0.200858, T: 9258, Avg. loss: 0.038695Norm: 10.86, NNZs: 194803, Bias: -0.189226, T: 9258, Avg. loss: 0.114809
Total training time: 0.12 seconds.
Total training time: 0.12 seconds.
-- Epoch 4
Norm: 7.00, NNZs: 151584, Bias: -0.180608, T: 6172, Avg. loss: 0.037232
Total training time: 0.11 seconds.
-- Epoch 4
Norm: 7.32, NNZs: 155748, Bias: -0.132659, T: 6172, Avg. loss: 0.031583
Total training time: 0.12 seconds.
-- Epoch 3
-- Epoch 3
Norm: 13.00, NNZs: 201283, Bias: -0.198497, T: 12344, Avg. loss: 0.112699
Total training time: 0.16 seconds.
-- Epoch 5
Norm: 12.44, NNZs: 140909, Bias: -0.209754, T: 12344, Avg. loss: 0.036497
Total training time: 0.17 seconds.
Norm: 9.13, NNZs: 159582, Bias: -0.143230, T: 9258, Avg. loss: 0.029215
Total training time: 0.16 seconds.
-- Epoch 5
-- Epoch 4
Norm: 7.98, NNZs: 159699, Bias: -0.207358, T: 9258, Avg. loss: 0.035670
Total training time: 0.17 seconds.
Norm: 15.22, NNZs: 204819, Bias: -0.259705, T: 15430, Avg. loss: 0.111519
Total training time: 0.20 seconds.
Norm: 11.08, NNZs: 169450, Bias: -0.181081, T: 12344, Avg. loss: 0.027951-- Epoch 4
-- Epoch 6
Total training time: 0.21 seconds.
-- Epoch 5
Norm: 13.97, NNZs: 141832, Bias: -0.235442, T: 15430, Avg. loss: 0.034727
Total training time: 0.23 seconds.
-- Epoch 6
Norm: 12.23, NNZs: 170328, Bias: -0.191514, T: 15430, Avg. loss: 0.026484
Total training time: 0.25 seconds.
Norm: 16.87, NNZs: 206813, Bias: -0.288808, T: 18516, Avg. loss: 0.110610
Total training time: 0.26 seconds.
Norm: 9.22, NNZs: 172804, Bias: -0.264905, T: 12344, Avg. loss: 0.034566
Total training time: 0.25 seconds.
-- Epoch 6
-- Epoch 7
Norm: 15.17, NNZs: 143938, Bias: -0.257578, T: 18516, Avg. loss: 0.033563
Total training time: 0.26 seconds.
-- Epoch 7
-- Epoch 5
Norm: 13.37, NNZs: 172175, Bias: -0.217118, T: 18516, Avg. loss: 0.025669
Total training time: 0.28 seconds.
-- Epoch 7
Norm: 16.31, NNZs: 146074, Bias: -0.270363, T: 21602, Avg. loss: 0.032659
Total training time: 0.30 seconds.
-- Epoch 8
Norm: 18.79, NNZs: 210952, Bias: -0.344830, T: 21602, Avg. loss: 0.109655
Total training time: 0.33 seconds.
Norm: 14.36, NNZs: 173116, Bias: -0.225061, T: 21602, Avg. loss: 0.024868-- Epoch 8
Norm: 9.80, NNZs: 175408, Bias: -0.303223, T: 15430, Avg. loss: 0.033608
Total training time: 0.33 seconds.
Norm: 17.19, NNZs: 146259, Bias: -0.288096, T: 24688, Avg. loss: 0.031612
Total training time: 0.34 seconds.
-- Epoch 6
Total training time: 0.33 seconds.
-- Epoch 9
-- Epoch 8
Norm: 20.46, NNZs: 213597, Bias: -0.360011, T: 24688, Avg. loss: 0.108777
Total training time: 0.36 seconds.
Norm: 10.64, NNZs: 177735, Bias: -0.312725, T: 18516, Avg. loss: 0.033153
Total training time: 0.36 seconds.
-- Epoch 9
-- Epoch 7
Norm: 18.31, NNZs: 146783, Bias: -0.300341, T: 27774, Avg. loss: 0.030977
Total training time: 0.38 seconds.
-- Epoch 10
Norm: 15.55, NNZs: 174001, Bias: -0.231881, T: 24688, Avg. loss: 0.024131
Total training time: 0.37 seconds.
-- Epoch 9
Norm: 22.15, NNZs: 214774, Bias: -0.381537, T: 27774, Avg. loss: 0.107818
Total training time: 0.40 seconds.
-- Epoch 10
Norm: 11.52, NNZs: 182346, Bias: -0.343389, T: 21602, Avg. loss: 0.032644
Total training time: 0.39 seconds.
-- Epoch 8
Norm: 19.36, NNZs: 147399, Bias: -0.302230, T: 30860, Avg. loss: 0.030288
Total training time: 0.42 seconds.
Norm: 16.49, NNZs: 175029, Bias: -0.261609, T: 27774, Avg. loss: 0.023527
Total training time: 0.41 seconds.
-- Epoch 11
Norm: 23.96, NNZs: 215679, Bias: -0.404656, T: 30860, Avg. loss: 0.106963
Total training time: 0.43 seconds.
-- Epoch 10
-- Epoch 11
Norm: 12.34, NNZs: 184478, Bias: -0.368994, T: 24688, Avg. loss: 0.032283
Total training time: 0.42 seconds.
-- Epoch 9
Norm: 20.51, NNZs: 147614, Bias: -0.328488, T: 33946, Avg. loss: 0.029753
Total training time: 0.46 seconds.
Norm: 25.61, NNZs: 216396, Bias: -0.424627, T: 33946, Avg. loss: 0.106017
Total training time: 0.46 seconds.
-- Epoch 12
Norm: 17.28, NNZs: 176292, Bias: -0.269128, T: 30860, Avg. loss: 0.022978
Total training time: 0.45 seconds.
-- Epoch 12
Norm: 13.21, NNZs: 188577, Bias: -0.396467, T: 27774, Avg. loss: 0.031936
Total training time: 0.45 seconds.
-- Epoch 11
-- Epoch 10
Norm: 27.13, NNZs: 217088, Bias: -0.433000, T: 37032, Avg. loss: 0.105353
Total training time: 0.49 seconds.
Norm: 13.85, NNZs: 191080, Bias: -0.428029, T: 30860, Avg. loss: 0.031633
Total training time: 0.48 seconds.
Norm: 21.27, NNZs: 147700, Bias: -0.331995, T: 37032, Avg. loss: 0.029054
Total training time: 0.49 seconds.
-- Epoch 11
-- Epoch 13
-- Epoch 13
Norm: 18.11, NNZs: 176759, Bias: -0.276906, T: 33946, Avg. loss: 0.022376
Total training time: 0.49 seconds.
-- Epoch 12
Norm: 14.42, NNZs: 191998, Bias: -0.460404, T: 33946, Avg. loss: 0.031251
Total training time: 0.51 seconds.
-- Epoch 12
Norm: 28.63, NNZs: 217402, Bias: -0.460138, T: 40118, Avg. loss: 0.104656
Total training time: 0.52 seconds.
-- Epoch 14
Norm: 22.05, NNZs: 147800, Bias: -0.346405, T: 40118, Avg. loss: 0.028445
Total training time: 0.53 seconds.
-- Epoch 14
Norm: 18.85, NNZs: 176852, Bias: -0.281412, T: 37032, Avg. loss: 0.021928
Total training time: 0.53 seconds.
-- Epoch 13
Norm: 15.01, NNZs: 193141, Bias: -0.466874, T: 37032, Avg. loss: 0.030943
Total training time: 0.54 seconds.
-- Epoch 13
Norm: 30.13, NNZs: 217759, Bias: -0.483775, T: 43204, Avg. loss: 0.103850
Total training time: 0.55 seconds.
-- Epoch 15
Norm: 22.92, NNZs: 147857, Bias: -0.361740, T: 43204, Avg. loss: 0.028006
Total training time: 0.57 seconds.
Norm: 19.65, NNZs: 177130, Bias: -0.286754, T: 40118, Avg. loss: 0.021555
Total training time: 0.56 seconds.
-- Epoch 15
-- Epoch 14
Norm: 15.80, NNZs: 194048, Bias: -0.488759, T: 40118, Avg. loss: 0.030693
Total training time: 0.57 seconds.
-- Epoch 14
Norm: 31.42, NNZs: 217935, Bias: -0.515990, T: 46290, Avg. loss: 0.103128
Total training time: 0.58 seconds.
-- Epoch 16
Norm: 16.43, NNZs: 194806, Bias: -0.516277, T: 43204, Avg. loss: 0.030533
Total training time: 0.60 seconds.
Norm: 23.74, NNZs: 147997, Bias: -0.364666, T: 46290, Avg. loss: 0.027344
Total training time: 0.61 seconds.
-- Epoch 15
-- Epoch 16
Norm: 20.28, NNZs: 177212, Bias: -0.280141, T: 43204, Avg. loss: 0.021002
Total training time: 0.61 seconds.
Norm: 32.87, NNZs: 218037, Bias: -0.531316, T: 49376, Avg. loss: 0.102451
Total training time: 0.62 seconds.
-- Epoch 15
-- Epoch 17
Norm: 17.05, NNZs: 195213, Bias: -0.538795, T: 46290, Avg. loss: 0.030362
Total training time: 0.64 seconds.
Norm: 34.22, NNZs: 218445, Bias: -0.562803, T: 52462, Avg. loss: 0.101749
Total training time: 0.65 seconds.
-- Epoch 16
Norm: 24.41, NNZs: 148109, Bias: -0.376257, T: 49376, Avg. loss: 0.026785
Total training time: 0.65 seconds.
-- Epoch 18
-- Epoch 17
Norm: 20.74, NNZs: 177619, Bias: -0.293214, T: 46290, Avg. loss: 0.020484
Total training time: 0.65 seconds.
-- Epoch 16
Norm: 35.50, NNZs: 218778, Bias: -0.571215, T: 55548, Avg. loss: 0.101158
Total training time: 0.67 seconds.
Norm: 17.70, NNZs: 197336, Bias: -0.552810, T: 49376, Avg. loss: 0.030125
Total training time: 0.67 seconds.
-- Epoch 19
-- Epoch 17
Norm: 25.19, NNZs: 148164, Bias: -0.393347, T: 52462, Avg. loss: 0.026394
Total training time: 0.69 seconds.
-- Epoch 18
Norm: 21.30, NNZs: 178484, Bias: -0.319611, T: 49376, Avg. loss: 0.020198
Total training time: 0.68 seconds.
-- Epoch 17
Norm: 36.84, NNZs: 219295, Bias: -0.626140, T: 58634, Avg. loss: 0.100501
Total training time: 0.71 seconds.
-- Epoch 20
Norm: 18.18, NNZs: 198148, Bias: -0.581376, T: 52462, Avg. loss: 0.030019
Total training time: 0.70 seconds.
-- Epoch 18
Norm: 25.88, NNZs: 148223, Bias: -0.407307, T: 55548, Avg. loss: 0.025934
Total training time: 0.72 seconds.
-- Epoch 19
Norm: 21.97, NNZs: 178569, Bias: -0.304032, T: 52462, Avg. loss: 0.019885
Total training time: 0.72 seconds.
-- Epoch 18
Norm: 37.98, NNZs: 219635, Bias: -0.651349, T: 61720, Avg. loss: 0.099810
Total training time: 0.73 seconds.
-- Epoch 1
Norm: 18.54, NNZs: 198513, Bias: -0.610919, T: 55548, Avg. loss: 0.029785
Total training time: 0.73 seconds.
-- Epoch 19
Norm: 26.50, NNZs: 148291, Bias: -0.408269, T: 58634, Avg. loss: 0.025503
Total training time: 0.76 seconds.
Norm: 4.77, NNZs: 57103, Bias: -0.117284, T: 3086, Avg. loss: 0.047042
Total training time: 0.02 seconds.
-- Epoch 2
Norm: 22.58, NNZs: 178623, Bias: -0.314288, T: 55548, Avg. loss: 0.019605
Total training time: 0.76 seconds.
-- Epoch 20
Norm: 19.20, NNZs: 198869, Bias: -0.630483, T: 58634, Avg. loss: 0.029658
Total training time: 0.76 seconds.
-- Epoch 19
-- Epoch 20
Norm: 7.52, NNZs: 62731, Bias: -0.160376, T: 6172, Avg. loss: 0.043775
Total training time: 0.05 seconds.
-- Epoch 3
Norm: 19.97, NNZs: 198990, Bias: -0.649799, T: 61720, Avg. loss: 0.029454
Total training time: 0.79 seconds.
Norm: 27.22, NNZs: 148393, Bias: -0.416649, T: 61720, Avg. loss: 0.025107
Total training time: 0.80 seconds.
-- Epoch 1
-- Epoch 1
Norm: 23.14, NNZs: 178688, Bias: -0.327487, T: 58634, Avg. loss: 0.019361
Total training time: 0.80 seconds.
-- Epoch 20
Norm: 9.66, NNZs: 72087, Bias: -0.207689, T: 9258, Avg. loss: 0.041709
Total training time: 0.08 seconds.
[Parallel(n_jobs=4)]: Done 1 tasks | elapsed: 0.7s
[Parallel(n_jobs=4)]: Done 2 tasks | elapsed: 0.8s
[Parallel(n_jobs=4)]: Done 3 tasks | elapsed: 0.8s
[Parallel(n_jobs=4)]: Done 4 tasks | elapsed: 0.9s
-- Epoch 4
Norm: 5.63, NNZs: 135322, Bias: -0.115125, T: 3086, Avg. loss: 0.036669
Total training time: 0.02 seconds.
-- Epoch 2
Norm: 7.53, NNZs: 171739, Bias: -0.145867, T: 3086, Avg. loss: 0.043442
Total training time: 0.04 seconds.
-- Epoch 2Norm: 23.85, NNZs: 178723, Bias: -0.321923, T: 61720, Avg. loss: 0.019125
Norm: 11.52, NNZs: 80865, Bias: -0.244189, T: 12344, Avg. loss: 0.039950
Total training time: 0.84 seconds.Total training time: 0.11 seconds.
-- Epoch 5
-- Epoch 1
Norm: 7.56, NNZs: 152761, Bias: -0.179906, T: 6172, Avg. loss: 0.032229
Total training time: 0.05 seconds.
-- Epoch 3
Norm: 13.14, NNZs: 82053, Bias: -0.285887, T: 15430, Avg. loss: 0.038661
Total training time: 0.14 seconds.
Norm: 8.83, NNZs: 158628, Bias: -0.208310, T: 9258, Avg. loss: 0.029973
Total training time: 0.08 seconds.
-- Epoch 6
-- Epoch 4
Norm: 10.25, NNZs: 188905, Bias: -0.233700, T: 6172, Avg. loss: 0.035793
Total training time: 0.08 seconds.
Norm: 6.44, NNZs: 110961, Bias: -0.124772, T: 3086, Avg. loss: 0.043867
Total training time: 0.04 seconds.
-- Epoch 3
-- Epoch 2
Norm: 14.40, NNZs: 82526, Bias: -0.301868, T: 18516, Avg. loss: 0.037195
Total training time: 0.17 seconds.
-- Epoch 7
Norm: 9.83, NNZs: 163783, Bias: -0.235602, T: 12344, Avg. loss: 0.028541
Total training time: 0.11 seconds.
-- Epoch 5
Norm: 11.80, NNZs: 189402, Bias: -0.296523, T: 9258, Avg. loss: 0.031332
Total training time: 0.12 seconds.
Norm: 9.10, NNZs: 114630, Bias: -0.174806, T: 6172, Avg. loss: 0.038068
Total training time: 0.08 seconds.
Norm: 15.83, NNZs: 83074, Bias: -0.340314, T: 21602, Avg. loss: 0.036146
Total training time: 0.19 seconds.
-- Epoch 4
-- Epoch 8
-- Epoch 3
Norm: 10.89, NNZs: 165191, Bias: -0.269543, T: 15430, Avg. loss: 0.027473
Total training time: 0.14 seconds.
-- Epoch 6
Norm: 17.21, NNZs: 83501, Bias: -0.357866, T: 24688, Avg. loss: 0.035254
Total training time: 0.22 seconds.
-- Epoch 9
Norm: 10.86, NNZs: 116850, Bias: -0.209307, T: 9258, Avg. loss: 0.034280
Total training time: 0.12 seconds.
Norm: 11.89, NNZs: 168391, Bias: -0.309804, T: 18516, Avg. loss: 0.026769
Total training time: 0.17 seconds.
-- Epoch 7
-- Epoch 4
Norm: 13.12, NNZs: 190206, Bias: -0.333667, T: 12344, Avg. loss: 0.028289
Total training time: 0.17 seconds.
-- Epoch 5
Norm: 18.27, NNZs: 84290, Bias: -0.382119, T: 27774, Avg. loss: 0.034436
Total training time: 0.26 seconds.
-- Epoch 10
Norm: 12.75, NNZs: 168713, Bias: -0.325040, T: 21602, Avg. loss: 0.026026
Total training time: 0.20 seconds.
-- Epoch 8
Norm: 12.29, NNZs: 117741, Bias: -0.239852, T: 12344, Avg. loss: 0.031776
Total training time: 0.16 seconds.
-- Epoch 5
Norm: 14.17, NNZs: 190898, Bias: -0.383946, T: 15430, Avg. loss: 0.026131
Total training time: 0.22 seconds.
Norm: 19.43, NNZs: 84569, Bias: -0.402913, T: 30860, Avg. loss: 0.033658
Total training time: 0.29 seconds.
-- Epoch 6
-- Epoch 11
Norm: 13.66, NNZs: 169562, Bias: -0.362919, T: 24688, Avg. loss: 0.025580
Total training time: 0.23 seconds.
-- Epoch 9
Norm: 13.07, NNZs: 118481, Bias: -0.266576, T: 15430, Avg. loss: 0.029860
Total training time: 0.20 seconds.
Norm: 20.46, NNZs: 85020, Bias: -0.418672, T: 33946, Avg. loss: 0.032972
Total training time: 0.32 seconds.
-- Epoch 6
Norm: 14.54, NNZs: 170222, Bias: -0.388985, T: 27774, Avg. loss: 0.025126
Total training time: 0.26 seconds.
-- Epoch 12
-- Epoch 10
Norm: 15.02, NNZs: 191046, Bias: -0.422014, T: 18516, Avg. loss: 0.024483
Total training time: 0.26 seconds.
-- Epoch 7
Norm: 13.90, NNZs: 118777, Bias: -0.291369, T: 18516, Avg. loss: 0.028516
Total training time: 0.24 seconds.
Norm: 21.51, NNZs: 85213, Bias: -0.434518, T: 37032, Avg. loss: 0.032274
Total training time: 0.36 seconds.
-- Epoch 7
Norm: 15.41, NNZs: 171050, Bias: -0.420134, T: 30860, Avg. loss: 0.024751
Total training time: 0.30 seconds.
-- Epoch 13
-- Epoch 11
Norm: 15.52, NNZs: 191150, Bias: -0.474972, T: 21602, Avg. loss: 0.023024
Total training time: 0.30 seconds.
-- Epoch 8
Norm: 14.77, NNZs: 119125, Bias: -0.325508, T: 21602, Avg. loss: 0.027464
Total training time: 0.28 seconds.
Norm: 16.24, NNZs: 172060, Bias: -0.437492, T: 33946, Avg. loss: 0.024310
Total training time: 0.33 seconds.
-- Epoch 8
Norm: 22.46, NNZs: 85336, Bias: -0.456109, T: 40118, Avg. loss: 0.031723
Total training time: 0.40 seconds.
-- Epoch 12
-- Epoch 14
Norm: 16.39, NNZs: 191307, Bias: -0.492087, T: 24688, Avg. loss: 0.021861
Total training time: 0.34 seconds.
-- Epoch 9
Norm: 15.52, NNZs: 119499, Bias: -0.342131, T: 24688, Avg. loss: 0.026560
Total training time: 0.32 seconds.
Norm: 17.07, NNZs: 172839, Bias: -0.455013, T: 37032, Avg. loss: 0.023959
Total training time: 0.37 seconds.
Norm: 23.30, NNZs: 86849, Bias: -0.472047, T: 43204, Avg. loss: 0.031120
Total training time: 0.44 seconds.
-- Epoch 9
-- Epoch 13
-- Epoch 15
Norm: 17.01, NNZs: 191438, Bias: -0.537543, T: 27774, Avg. loss: 0.021070
Total training time: 0.38 seconds.
-- Epoch 10
Norm: 16.25, NNZs: 119707, Bias: -0.367343, T: 27774, Avg. loss: 0.025772
Total training time: 0.36 seconds.
Norm: 17.94, NNZs: 177399, Bias: -0.496531, T: 40118, Avg. loss: 0.023602
Total training time: 0.41 seconds.
Norm: 24.28, NNZs: 87013, Bias: -0.487143, T: 46290, Avg. loss: 0.030634
Total training time: 0.48 seconds.
-- Epoch 10
-- Epoch 14
-- Epoch 16
Norm: 17.65, NNZs: 191438, Bias: -0.558938, T: 30860, Avg. loss: 0.020122
Total training time: 0.42 seconds.
-- Epoch 11
Norm: 16.98, NNZs: 119994, Bias: -0.386402, T: 30860, Avg. loss: 0.025110
Norm: 18.68, NNZs: 177676, Bias: -0.500565, T: 43204, Avg. loss: 0.023131
Total training time: 0.45 seconds.
Total training time: 0.40 seconds.
Norm: 25.15, NNZs: 87430, Bias: -0.501629, T: 49376, Avg. loss: 0.030153
Total training time: 0.52 seconds.
-- Epoch 15
-- Epoch 11
-- Epoch 17
Norm: 18.48, NNZs: 191948, Bias: -0.601507, T: 33946, Avg. loss: 0.019562
Total training time: 0.45 seconds.
-- Epoch 12
Norm: 17.76, NNZs: 120203, Bias: -0.398813, T: 33946, Avg. loss: 0.024452
Total training time: 0.44 seconds.
Norm: 19.53, NNZs: 178067, Bias: -0.536095, T: 46290, Avg. loss: 0.022870
Total training time: 0.49 seconds.
Norm: 26.03, NNZs: 88487, Bias: -0.518156, T: 52462, Avg. loss: 0.029692
Total training time: 0.55 seconds.
-- Epoch 12
-- Epoch 16
-- Epoch 18
Norm: 19.20, NNZs: 191989, Bias: -0.645841, T: 37032, Avg. loss: 0.019044
Total training time: 0.49 seconds.
-- Epoch 13
Norm: 18.55, NNZs: 120426, Bias: -0.430043, T: 37032, Avg. loss: 0.023980
Total training time: 0.48 seconds.
Norm: 20.25, NNZs: 178516, Bias: -0.559605, T: 49376, Avg. loss: 0.022563
Total training time: 0.53 seconds.
Norm: 26.77, NNZs: 88578, Bias: -0.529122, T: 55548, Avg. loss: 0.029226
Total training time: 0.59 seconds.
-- Epoch 13
-- Epoch 17
-- Epoch 19
Norm: 19.70, NNZs: 191999, Bias: -0.676037, T: 40118, Avg. loss: 0.018486
Total training time: 0.53 seconds.
-- Epoch 14
Norm: 19.24, NNZs: 120656, Bias: -0.442397, T: 40118, Avg. loss: 0.023483
Total training time: 0.51 seconds.
Norm: 21.03, NNZs: 178825, Bias: -0.582264, T: 52462, Avg. loss: 0.022311
Total training time: 0.56 seconds.
Norm: 27.57, NNZs: 88795, Bias: -0.535025, T: 58634, Avg. loss: 0.028820
Total training time: 0.63 seconds.
-- Epoch 14
-- Epoch 18
-- Epoch 20
Norm: 20.25, NNZs: 192487, Bias: -0.695844, T: 43204, Avg. loss: 0.017903
Total training time: 0.57 seconds.
-- Epoch 15
Norm: 21.73, NNZs: 179226, Bias: -0.606356, T: 55548, Avg. loss: 0.022016
Total training time: 0.59 seconds.
Norm: 20.06, NNZs: 120716, Bias: -0.463605, T: 43204, Avg. loss: 0.023175
Total training time: 0.54 seconds.
Norm: 28.35, NNZs: 88931, Bias: -0.550882, T: 61720, Avg. loss: 0.028465
Total training time: 0.66 seconds.
-- Epoch 19
-- Epoch 15
Norm: 20.76, NNZs: 192523, Bias: -0.737590, T: 46290, Avg. loss: 0.017450
Total training time: 0.60 seconds.
-- Epoch 1
-- Epoch 16
Norm: 20.83, NNZs: 120854, Bias: -0.481450, T: 46290, Avg. loss: 0.022737
Total training time: 0.57 seconds.
Norm: 22.32, NNZs: 180617, Bias: -0.621721, T: 58634, Avg. loss: 0.021721
Total training time: 0.62 seconds.
[Parallel(n_jobs=4)]: Done 5 tasks | elapsed: 1.4s
[Parallel(n_jobs=4)]: Done 6 tasks | elapsed: 1.5s
[Parallel(n_jobs=4)]: Done 7 tasks | elapsed: 1.5s
[Parallel(n_jobs=4)]: Done 8 tasks | elapsed: 1.6s
Norm: 21.27, NNZs: 192523, Bias: -0.768249, T: 49376, Avg. loss: 0.017036
Total training time: 0.62 seconds.
-- Epoch 20
-- Epoch 16
-- Epoch 17
Norm: 17.26, NNZs: 179921, Bias: 0.054885, T: 3086, Avg. loss: 0.379791
Total training time: 0.03 seconds.
-- Epoch 2
Norm: 23.05, NNZs: 181732, Bias: -0.640700, T: 61720, Avg. loss: 0.021388
Total training time: 0.65 seconds.
Norm: 21.75, NNZs: 192523, Bias: -0.794348, T: 52462, Avg. loss: 0.016664
Total training time: 0.65 seconds.
Norm: 21.61, NNZs: 121756, Bias: -0.495703, T: 49376, Avg. loss: 0.022391
Total training time: 0.60 seconds.
-- Epoch 18
-- Epoch 1
-- Epoch 17
Norm: 24.26, NNZs: 199880, Bias: 0.092845, T: 6172, Avg. loss: 0.338764
Total training time: 0.06 seconds.
-- Epoch 3
Norm: 22.15, NNZs: 193170, Bias: -0.824890, T: 55548, Avg. loss: 0.016280
Total training time: 0.67 seconds.
Norm: 22.25, NNZs: 122093, Bias: -0.507598, T: 52462, Avg. loss: 0.021986
Total training time: 0.63 seconds.
-- Epoch 19
-- Epoch 18
Norm: 3.98, NNZs: 119747, Bias: -0.097996, T: 3086, Avg. loss: 0.025528
Total training time: 0.04 seconds.
-- Epoch 2
Norm: 28.19, NNZs: 207993, Bias: 0.080277, T: 9258, Avg. loss: 0.318131
Total training time: 0.10 seconds.
Norm: 22.60, NNZs: 193389, Bias: -0.860632, T: 58634, Avg. loss: 0.015974
Total training time: 0.70 seconds.
-- Epoch 4
Norm: 22.88, NNZs: 122149, Bias: -0.523237, T: 55548, Avg. loss: 0.021645
Total training time: 0.66 seconds.
-- Epoch 20
-- Epoch 19
Norm: 5.19, NNZs: 120683, Bias: -0.105031, T: 6172, Avg. loss: 0.023144
Total training time: 0.07 seconds.
-- Epoch 3
Norm: 23.10, NNZs: 193406, Bias: -0.890322, T: 61720, Avg. loss: 0.015649
Total training time: 0.73 seconds.
Norm: 23.58, NNZs: 122381, Bias: -0.540829, T: 58634, Avg. loss: 0.021352
Total training time: 0.68 seconds.
-- Epoch 1
Norm: 31.81, NNZs: 214237, Bias: 0.110182, T: 12344, Avg. loss: 0.304635
Total training time: 0.14 seconds.
-- Epoch 20
-- Epoch 5
Norm: 13.96, NNZs: 111289, Bias: -0.128534, T: 3086, Avg. loss: 0.104556
Total training time: 0.03 seconds.
Norm: 6.09, NNZs: 121605, Bias: -0.123187, T: 9258, Avg. loss: 0.022393
Total training time: 0.11 seconds.
Norm: 35.00, NNZs: 217858, Bias: 0.128803, T: 15430, Avg. loss: 0.293941
Total training time: 0.17 seconds.
-- Epoch 2
-- Epoch 4
-- Epoch 6
Norm: 24.25, NNZs: 122449, Bias: -0.551205, T: 61720, Avg. loss: 0.021079
Total training time: 0.72 seconds.
-- Epoch 1
Norm: 17.68, NNZs: 118296, Bias: -0.170776, T: 6172, Avg. loss: 0.075644
Total training time: 0.06 seconds.
Norm: 38.11, NNZs: 221803, Bias: 0.103495, T: 18516, Avg. loss: 0.285830
Total training time: 0.20 seconds.
-- Epoch 3
-- Epoch 7
Norm: 7.11, NNZs: 122508, Bias: -0.120374, T: 12344, Avg. loss: 0.021582
Total training time: 0.15 seconds.
-- Epoch 5
Norm: 4.43, NNZs: 122635, Bias: -0.136562, T: 3086, Avg. loss: 0.038590
Total training time: 0.03 seconds.
-- Epoch 2
Norm: 20.03, NNZs: 123116, Bias: -0.208258, T: 9258, Avg. loss: 0.062622
Total training time: 0.09 seconds.
-- Epoch 4
Norm: 41.25, NNZs: 223819, Bias: 0.143381, T: 21602, Avg. loss: 0.278759
Total training time: 0.23 seconds.
-- Epoch 8
Norm: 8.08, NNZs: 123350, Bias: -0.149308, T: 15430, Avg. loss: 0.021336
Total training time: 0.18 seconds.
-- Epoch 6
Norm: 6.27, NNZs: 135275, Bias: -0.196787, T: 6172, Avg. loss: 0.036198
Total training time: 0.07 seconds.
-- Epoch 3
Norm: 21.93, NNZs: 125368, Bias: -0.232580, T: 12344, Avg. loss: 0.054708
Total training time: 0.12 seconds.
-- Epoch 5
Norm: 43.64, NNZs: 225102, Bias: 0.145950, T: 24688, Avg. loss: 0.273223
Total training time: 0.27 seconds.
-- Epoch 9
Norm: 8.99, NNZs: 123962, Bias: -0.152150, T: 18516, Avg. loss: 0.020978
Total training time: 0.23 seconds.
Norm: 23.49, NNZs: 197197, Bias: -0.251478, T: 15430, Avg. loss: 0.049232
Total training time: 0.15 seconds.
-- Epoch 7
-- Epoch 6
Norm: 8.10, NNZs: 147494, Bias: -0.253617, T: 9258, Avg. loss: 0.035141
Total training time: 0.11 seconds.
-- Epoch 4
Norm: 46.23, NNZs: 226723, Bias: 0.154517, T: 27774, Avg. loss: 0.268186
Total training time: 0.32 seconds.
Norm: 24.85, NNZs: 197642, Bias: -0.273113, T: 18516, Avg. loss: 0.045086
Total training time: 0.18 seconds.
-- Epoch 10
-- Epoch 7
Norm: 10.21, NNZs: 124235, Bias: -0.174640, T: 21602, Avg. loss: 0.020580
Total training time: 0.27 seconds.
-- Epoch 8
Norm: 10.05, NNZs: 153358, Bias: -0.300442, T: 12344, Avg. loss: 0.033966
Total training time: 0.16 seconds.
-- Epoch 5
Norm: 25.98, NNZs: 198867, Bias: -0.294621, T: 21602, Avg. loss: 0.041610
Total training time: 0.22 seconds.
-- Epoch 8
Norm: 48.73, NNZs: 228073, Bias: 0.140815, T: 30860, Avg. loss: 0.263191
Total training time: 0.36 seconds.
-- Epoch 11
Norm: 11.24, NNZs: 124452, Bias: -0.171303, T: 24688, Avg. loss: 0.020181
Total training time: 0.32 seconds.
-- Epoch 9
Norm: 11.72, NNZs: 155093, Bias: -0.356987, T: 15430, Avg. loss: 0.033239
Total training time: 0.21 seconds.
-- Epoch 6
Norm: 27.02, NNZs: 199543, Bias: -0.313513, T: 24688, Avg. loss: 0.038958
Total training time: 0.28 seconds.
-- Epoch 9
Norm: 12.18, NNZs: 124626, Bias: -0.182191, T: 27774, Avg. loss: 0.019822
Total training time: 0.36 seconds.
-- Epoch 10
Norm: 51.06, NNZs: 229198, Bias: 0.133059, T: 33946, Avg. loss: 0.258760
Total training time: 0.42 seconds.
-- Epoch 12
Norm: 13.31, NNZs: 158115, Bias: -0.401990, T: 18516, Avg. loss: 0.032422
Total training time: 0.26 seconds.
-- Epoch 7
Norm: 27.99, NNZs: 200260, Bias: -0.331259, T: 27774, Avg. loss: 0.036673
Total training time: 0.33 seconds.
Norm: 12.89, NNZs: 124773, Bias: -0.182816, T: 30860, Avg. loss: 0.019544
Total training time: 0.41 seconds.
-- Epoch 10
-- Epoch 11
Norm: 53.41, NNZs: 229657, Bias: 0.136785, T: 37032, Avg. loss: 0.254805
Total training time: 0.47 seconds.
Norm: 14.79, NNZs: 161112, Bias: -0.455908, T: 21602, Avg. loss: 0.031552
Total training time: 0.30 seconds.
-- Epoch 13
-- Epoch 8
Norm: 28.69, NNZs: 200284, Bias: -0.341337, T: 30860, Avg. loss: 0.034679
Total training time: 0.38 seconds.
Norm: 13.81, NNZs: 125078, Bias: -0.187740, T: 33946, Avg. loss: 0.019260
Total training time: 0.46 seconds.
Norm: 55.62, NNZs: 230320, Bias: 0.123497, T: 40118, Avg. loss: 0.251150
Total training time: 0.52 seconds.
-- Epoch 11
-- Epoch 12
-- Epoch 14
Norm: 15.97, NNZs: 162284, Bias: -0.481097, T: 24688, Avg. loss: 0.030750
Total training time: 0.35 seconds.
-- Epoch 9
Norm: 29.28, NNZs: 200768, Bias: -0.344554, T: 33946, Avg. loss: 0.032918
Total training time: 0.42 seconds.
Norm: 58.06, NNZs: 230430, Bias: 0.115743, T: 43204, Avg. loss: 0.247922
Total training time: 0.56 seconds.
-- Epoch 12
-- Epoch 15
Norm: 14.61, NNZs: 125208, Bias: -0.194707, T: 37032, Avg. loss: 0.019022
Total training time: 0.51 seconds.
-- Epoch 13
Norm: 17.25, NNZs: 164104, Bias: -0.532449, T: 27774, Avg. loss: 0.030104
Total training time: 0.40 seconds.
-- Epoch 10
Norm: 29.94, NNZs: 200841, Bias: -0.367645, T: 37032, Avg. loss: 0.031440
Total training time: 0.46 seconds.
-- Epoch 13
Norm: 60.22, NNZs: 230825, Bias: 0.100202, T: 46290, Avg. loss: 0.244781
Total training time: 0.60 seconds.
-- Epoch 16
Norm: 15.25, NNZs: 125673, Bias: -0.211541, T: 40118, Avg. loss: 0.018723
Total training time: 0.56 seconds.
-- Epoch 14
Norm: 18.34, NNZs: 166056, Bias: -0.559797, T: 30860, Avg. loss: 0.029522
Total training time: 0.45 seconds.
-- Epoch 11
Norm: 30.61, NNZs: 200853, Bias: -0.380334, T: 40118, Avg. loss: 0.030217
Total training time: 0.50 seconds.
-- Epoch 14
Norm: 62.34, NNZs: 231738, Bias: 0.094116, T: 49376, Avg. loss: 0.241809
Total training time: 0.65 seconds.
Norm: 15.97, NNZs: 125814, Bias: -0.200610, T: 43204, Avg. loss: 0.018476
Total training time: 0.60 seconds.
-- Epoch 17
-- Epoch 15
Norm: 19.33, NNZs: 166746, Bias: -0.600310, T: 33946, Avg. loss: 0.028775
Total training time: 0.49 seconds.
-- Epoch 12
Norm: 31.21, NNZs: 200893, Bias: -0.378789, T: 43204, Avg. loss: 0.029055
Total training time: 0.54 seconds.
-- Epoch 15
Norm: 64.24, NNZs: 232130, Bias: 0.107547, T: 52462, Avg. loss: 0.238857
Total training time: 0.69 seconds.
-- Epoch 18
Norm: 16.74, NNZs: 125983, Bias: -0.221371, T: 46290, Avg. loss: 0.018235
Total training time: 0.64 seconds.
-- Epoch 16
Norm: 20.43, NNZs: 167263, Bias: -0.630100, T: 37032, Avg. loss: 0.028224
Total training time: 0.53 seconds.
-- Epoch 13
Norm: 31.78, NNZs: 201243, Bias: -0.400927, T: 46290, Avg. loss: 0.028051
Total training time: 0.59 seconds.
Norm: 66.13, NNZs: 232379, Bias: 0.095914, T: 55548, Avg. loss: 0.236210
Total training time: 0.72 seconds.
-- Epoch 16
Norm: 17.38, NNZs: 126084, Bias: -0.228337, T: 49376, Avg. loss: 0.017953
Total training time: 0.67 seconds.
-- Epoch 19
-- Epoch 17
Norm: 21.38, NNZs: 167481, Bias: -0.654408, T: 40118, Avg. loss: 0.027617
Total training time: 0.59 seconds.
Norm: 32.25, NNZs: 201736, Bias: -0.408840, T: 49376, Avg. loss: 0.027064
Total training time: 0.63 seconds.
Norm: 68.15, NNZs: 233140, Bias: 0.106301, T: 58634, Avg. loss: 0.233569
Total training time: 0.77 seconds.
-- Epoch 14
-- Epoch 17
Norm: 17.89, NNZs: 126168, Bias: -0.227317, T: 52462, Avg. loss: 0.017721
Total training time: 0.72 seconds.
-- Epoch 20
-- Epoch 18
Norm: 69.68, NNZs: 233734, Bias: 0.119130, T: 61720, Avg. loss: 0.230943
Total training time: 0.81 seconds.
Norm: 18.54, NNZs: 126237, Bias: -0.239312, T: 55548, Avg. loss: 0.017522
Total training time: 0.76 seconds.
-- Epoch 19
-- Epoch 1
Norm: 32.69, NNZs: 202034, Bias: -0.420348, T: 52462, Avg. loss: 0.026171
Total training time: 0.68 seconds.
-- Epoch 18
Norm: 22.42, NNZs: 167601, Bias: -0.693532, T: 43204, Avg. loss: 0.027133
Total training time: 0.65 seconds.
-- Epoch 15
[Parallel(n_jobs=4)]: Done 16 out of 15 | elapsed: 2.2s remaining: -0.1s
[Parallel(n_jobs=4)]: Done 16 out of 15 | elapsed: 2.3s remaining: -0.1s
[Parallel(n_jobs=4)]: Done 16 out of 15 | elapsed: 2.4s remaining: -0.1s
Norm: 19.15, NNZs: 126304, Bias: -0.257922, T: 58634, Avg. loss: 0.017318
Total training time: 0.79 seconds.
-- Epoch 20
Norm: 16.99, NNZs: 120622, Bias: -0.288076, T: 3086, Avg. loss: 0.190011
Total training time: 0.04 seconds.
-- Epoch 2
Norm: 33.16, NNZs: 202317, Bias: -0.428273, T: 55548, Avg. loss: 0.025384
Total training time: 0.73 seconds.
-- Epoch 19
Norm: 23.18, NNZs: 168430, Bias: -0.708947, T: 46290, Avg. loss: 0.026629
Total training time: 0.70 seconds.
-- Epoch 16
Norm: 19.79, NNZs: 126370, Bias: -0.260907, T: 61720, Avg. loss: 0.017141
Total training time: 0.83 seconds.
-- Epoch 1
Norm: 21.49, NNZs: 124552, Bias: -0.345108, T: 6172, Avg. loss: 0.150839
Total training time: 0.08 seconds.
-- Epoch 3
Norm: 33.54, NNZs: 202500, Bias: -0.431745, T: 58634, Avg. loss: 0.024636
Total training time: 0.79 seconds.
Norm: 23.89, NNZs: 168732, Bias: -0.739428, T: 49376, Avg. loss: 0.026162
Total training time: 0.75 seconds.
Norm: 4.65, NNZs: 112943, Bias: -0.063152, T: 3086, Avg. loss: 0.061934
Total training time: 0.04 seconds.
-- Epoch 20
-- Epoch 17
-- Epoch 2
Norm: 24.34, NNZs: 125943, Bias: -0.400297, T: 9258, Avg. loss: 0.132543
Total training time: 0.11 seconds.
-- Epoch 4
Norm: 6.44, NNZs: 116004, Bias: -0.071132, T: 6172, Avg. loss: 0.060214
Total training time: 0.07 seconds.
Norm: 26.88, NNZs: 128132, Bias: -0.454860, T: 12344, Avg. loss: 0.121961
Total training time: 0.14 seconds.
-- Epoch 3
-- Epoch 5
Norm: 33.93, NNZs: 202502, Bias: -0.445693, T: 61720, Avg. loss: 0.023944
Total training time: 0.83 seconds.
Norm: 24.58, NNZs: 168848, Bias: -0.755637, T: 52462, Avg. loss: 0.025660
Total training time: 0.79 seconds.
-- Epoch 1
-- Epoch 18
Norm: 8.50, NNZs: 119354, Bias: -0.067998, T: 9258, Avg. loss: 0.058256
Total training time: 0.10 seconds.
-- Epoch 4
Norm: 29.06, NNZs: 130767, Bias: -0.492980, T: 15430, Avg. loss: 0.114439
Total training time: 0.17 seconds.
-- Epoch 6
Norm: 6.39, NNZs: 38373, Bias: -0.058019, T: 3086, Avg. loss: 0.034359
Total training time: 0.04 seconds.
Norm: 25.32, NNZs: 169145, Bias: -0.783026, T: 55548, Avg. loss: 0.025262
Total training time: 0.84 seconds.
-- Epoch 2
Norm: 9.91, NNZs: 123613, Bias: -0.065427, T: 12344, Avg. loss: 0.057547
Total training time: 0.13 seconds.
-- Epoch 19
-- Epoch 5
Norm: 30.81, NNZs: 131666, Bias: -0.522188, T: 18516, Avg. loss: 0.108598
Total training time: 0.20 seconds.
-- Epoch 7
Norm: 11.52, NNZs: 124643, Bias: -0.065988, T: 15430, Avg. loss: 0.056621Norm: 8.38, NNZs: 39305, Bias: -0.078471, T: 6172, Avg. loss: 0.029883
Total training time: 0.09 seconds.
Total training time: 0.17 seconds.
Norm: 32.79, NNZs: 136173, Bias: -0.563929, T: 21602, Avg. loss: 0.104146
Total training time: 0.24 seconds.
-- Epoch 6
-- Epoch 8
-- Epoch 3
Norm: 25.94, NNZs: 169618, Bias: -0.798919, T: 58634, Avg. loss: 0.024811
Total training time: 0.89 seconds.
-- Epoch 20
Norm: 12.76, NNZs: 125861, Bias: -0.059752, T: 18516, Avg. loss: 0.055537
Total training time: 0.20 seconds.
Norm: 34.16, NNZs: 139788, Bias: -0.582036, T: 24688, Avg. loss: 0.100189
Total training time: 0.28 seconds.
-- Epoch 7
-- Epoch 9
Norm: 9.10, NNZs: 40003, Bias: -0.070389, T: 9258, Avg. loss: 0.027003
Total training time: 0.13 seconds.
-- Epoch 4
Norm: 26.39, NNZs: 169755, Bias: -0.815149, T: 61720, Avg. loss: 0.024343
Total training time: 0.94 seconds.
Norm: 14.19, NNZs: 126668, Bias: -0.059407, T: 21602, Avg. loss: 0.054872
Total training time: 0.24 seconds.
Norm: 35.75, NNZs: 140606, Bias: -0.625720, T: 27774, Avg. loss: 0.096780
Total training time: 0.32 seconds.
-- Epoch 8
Norm: 10.23, NNZs: 40350, Bias: -0.077548, T: 12344, Avg. loss: 0.025573
Total training time: 0.17 seconds.
-- Epoch 10
-- Epoch 5
Norm: 15.72, NNZs: 127409, Bias: -0.071362, T: 24688, Avg. loss: 0.054077
Total training time: 0.28 seconds.
Norm: 37.09, NNZs: 140766, Bias: -0.639303, T: 30860, Avg. loss: 0.093913
Total training time: 0.35 seconds.
-- Epoch 9
Norm: 11.17, NNZs: 40508, Bias: -0.088963, T: 15430, Avg. loss: 0.024367
Total training time: 0.20 seconds.
-- Epoch 11
-- Epoch 6
Norm: 17.21, NNZs: 128811, Bias: -0.069810, T: 27774, Avg. loss: 0.053357
Total training time: 0.31 seconds.
Norm: 38.40, NNZs: 141879, Bias: -0.655668, T: 33946, Avg. loss: 0.091096
Total training time: 0.38 seconds.
-- Epoch 10
Norm: 11.81, NNZs: 40609, Bias: -0.086161, T: 18516, Avg. loss: 0.023316
Total training time: 0.23 seconds.
-- Epoch 12
-- Epoch 7
Norm: 18.17, NNZs: 129603, Bias: -0.064541, T: 30860, Avg. loss: 0.052668
Total training time: 0.34 seconds.
Norm: 39.77, NNZs: 142218, Bias: -0.675478, T: 37032, Avg. loss: 0.088853
Total training time: 0.42 seconds.
-- Epoch 11
Norm: 12.69, NNZs: 40667, Bias: -0.111582, T: 21602, Avg. loss: 0.022629
Total training time: 0.27 seconds.
-- Epoch 13
-- Epoch 8
[Parallel(n_jobs=4)]: Done 16 out of 15 | elapsed: 2.5s remaining: -0.2s
Norm: 19.52, NNZs: 130246, Bias: -0.058023, T: 33946, Avg. loss: 0.052161
Total training time: 0.38 seconds.
Norm: 40.74, NNZs: 142850, Bias: -0.703940, T: 40118, Avg. loss: 0.086770
Total training time: 0.46 seconds.
-- Epoch 12
Norm: 13.23, NNZs: 40818, Bias: -0.087900, T: 24688, Avg. loss: 0.022145
Total training time: 0.31 seconds.
-- Epoch 14
-- Epoch 9
Norm: 20.80, NNZs: 131729, Bias: -0.064334, T: 37032, Avg. loss: 0.051542
Total training time: 0.42 seconds.
Norm: 41.85, NNZs: 142958, Bias: -0.716650, T: 43204, Avg. loss: 0.084812
Total training time: 0.49 seconds.
-- Epoch 13
Norm: 13.53, NNZs: 40933, Bias: -0.092750, T: 27774, Avg. loss: 0.021465
Total training time: 0.34 seconds.
-- Epoch 15
-- Epoch 10
Norm: 21.88, NNZs: 131825, Bias: -0.077474, T: 40118, Avg. loss: 0.050901
Total training time: 0.45 seconds.
Norm: 42.89, NNZs: 143206, Bias: -0.749313, T: 46290, Avg. loss: 0.082909
Total training time: 0.53 seconds.
-- Epoch 14
Norm: 14.24, NNZs: 40966, Bias: -0.093801, T: 30860, Avg. loss: 0.021145
Total training time: 0.38 seconds.
-- Epoch 16
-- Epoch 11
Norm: 23.01, NNZs: 131909, Bias: -0.076904, T: 43204, Avg. loss: 0.050475
Total training time: 0.49 seconds.
Norm: 44.02, NNZs: 143356, Bias: -0.743375, T: 49376, Avg. loss: 0.081376
Total training time: 0.57 seconds.
-- Epoch 15
-- Epoch 17
Norm: 14.83, NNZs: 41011, Bias: -0.097276, T: 33946, Avg. loss: 0.020717
Total training time: 0.42 seconds.
-- Epoch 12
Norm: 23.98, NNZs: 134833, Bias: -0.095332, T: 46290, Avg. loss: 0.049863
Total training time: 0.53 seconds.
Norm: 44.97, NNZs: 143524, Bias: -0.764066, T: 52462, Avg. loss: 0.079908
Total training time: 0.60 seconds.
-- Epoch 16
Norm: 15.03, NNZs: 41046, Bias: -0.101251, T: 37032, Avg. loss: 0.020372
Total training time: 0.45 seconds.
-- Epoch 18
-- Epoch 13
Norm: 25.01, NNZs: 135123, Bias: -0.081742, T: 49376, Avg. loss: 0.049485
Total training time: 0.56 seconds.
Norm: 45.90, NNZs: 143621, Bias: -0.774208, T: 55548, Avg. loss: 0.078544
Total training time: 0.64 seconds.
-- Epoch 17
Norm: 15.46, NNZs: 41077, Bias: -0.102860, T: 40118, Avg. loss: 0.020123
Total training time: 0.49 seconds.
-- Epoch 19
-- Epoch 14
Norm: 26.07, NNZs: 136108, Bias: -0.080801, T: 52462, Avg. loss: 0.048961
Total training time: 0.60 seconds.
Norm: 46.95, NNZs: 144049, Bias: -0.797482, T: 58634, Avg. loss: 0.077391
Total training time: 0.68 seconds.
-- Epoch 18
-- Epoch 20
Norm: 15.90, NNZs: 41087, Bias: -0.104447, T: 43204, Avg. loss: 0.019908
Total training time: 0.53 seconds.
-- Epoch 15
Norm: 27.11, NNZs: 136187, Bias: -0.086820, T: 55548, Avg. loss: 0.048565
Total training time: 0.64 seconds.
Norm: 47.88, NNZs: 144232, Bias: -0.818237, T: 61720, Avg. loss: 0.076270
Total training time: 0.71 seconds.
-- Epoch 19
Norm: 16.22, NNZs: 41123, Bias: -0.108924, T: 46290, Avg. loss: 0.019647
Total training time: 0.57 seconds.
-- Epoch 16
Norm: 28.09, NNZs: 136447, Bias: -0.091359, T: 58634, Avg. loss: 0.048094
Total training time: 0.67 seconds.
-- Epoch 20
Norm: 16.70, NNZs: 41146, Bias: -0.124716, T: 49376, Avg. loss: 0.019483
Total training time: 0.60 seconds.
-- Epoch 17
Norm: 28.96, NNZs: 136708, Bias: -0.086382, T: 61720, Avg. loss: 0.047732
Total training time: 0.70 seconds.
Norm: 17.23, NNZs: 41198, Bias: -0.121802, T: 52462, Avg. loss: 0.019314
Total training time: 0.63 seconds.
-- Epoch 18
Norm: 17.71, NNZs: 41212, Bias: -0.122078, T: 55548, Avg. loss: 0.019084
Total training time: 0.66 seconds.
-- Epoch 19
Norm: 18.12, NNZs: 41229, Bias: -0.123928, T: 58634, Avg. loss: 0.018849
Total training time: 0.68 seconds.
-- Epoch 20
Norm: 18.52, NNZs: 41248, Bias: -0.134498, T: 61720, Avg. loss: 0.018661
Total training time: 0.71 seconds.
[Parallel(n_jobs=4)]: Done 16 out of 15 | elapsed: 2.9s remaining: -0.2s
[Parallel(n_jobs=4)]: Done 16 out of 15 | elapsed: 3.0s remaining: -0.2s
[Parallel(n_jobs=4)]: Done 16 out of 15 | elapsed: 3.1s remaining: -0.2s
[Parallel(n_jobs=4)]: Done 15 out of 15 | elapsed: 3.1s finished
Out[17]:
PassiveAggressiveClassifier(C=1.0, class_weight=None, fit_intercept=True,
loss='hinge', n_iter=20, n_jobs=4, random_state=None,
shuffle=True, verbose=42, warm_start=False)
In [18]:
test_pred = model.predict(X_test)
In [19]:
print test_pred
test_ids = np.load("../data/features/test_ids.npy")
print test_ids
write_predictions(test_pred, test_ids, "../predictions/passive_basic.csv")
[10 8 8 ..., 10 8 8]
['298379101ad17b816ffeb88e8ba9ce915b7a46fc9'
'cb56d8fd4accec76a5608a000d65711d1cfa9cc3e'
'21ead3c92f31d801b1a887c1b0dc12d503f7204d6' ...,
'E96d65723d24aa91a9fa54f92754444f99491d2e1'
'107e0ba3d61f2650b09ef02a30f0bab0b82c1933d'
'16a64eeb54Ca49adf9608e2206db5aedc22038a09']
In [ ]:
Content source: sandias42/mlware
Similar notebooks: