Compiling...
Training...
epoch 1 / 100 in 119.0s: loss 2.318504, train: 0.134, val 0.157, lr 9.500000e-05 mom 9.100000e-01
epoch 2 / 100 in 118.9s: loss 2.300581, train: 0.166, val 0.146, lr 9.025000e-05 mom 9.190000e-01
epoch 3 / 100 in 119.0s: loss 2.292756, train: 0.206, val 0.191, lr 8.573750e-05 mom 9.270999e-01
epoch 4 / 100 in 119.0s: loss 2.275991, train: 0.248, val 0.232, lr 8.145062e-05 mom 9.343899e-01
epoch 5 / 100 in 119.0s: loss 2.255572, train: 0.265, val 0.253, lr 7.737809e-05 mom 9.409509e-01
epoch 6 / 100 in 119.0s: loss 2.229092, train: 0.292, val 0.258, lr 7.350919e-05 mom 9.468558e-01
epoch 7 / 100 in 119.0s: loss 2.200565, train: 0.289, val 0.285, lr 6.983373e-05 mom 9.521703e-01
epoch 8 / 100 in 119.0s: loss 2.173981, train: 0.307, val 0.299, lr 6.634204e-05 mom 9.569532e-01
epoch 9 / 100 in 119.0s: loss 2.142996, train: 0.318, val 0.311, lr 6.302494e-05 mom 9.612579e-01
epoch 10 / 100 in 118.9s: loss 2.109364, train: 0.335, val 0.338, lr 5.987370e-05 mom 9.651321e-01
epoch 11 / 100 in 118.9s: loss 2.075525, train: 0.367, val 0.372, lr 5.688001e-05 mom 9.686189e-01
epoch 12 / 100 in 118.9s: loss 2.042083, train: 0.369, val 0.379, lr 5.403601e-05 mom 9.717571e-01
epoch 13 / 100 in 119.0s: loss 2.003143, train: 0.355, val 0.374, lr 5.133421e-05 mom 9.745814e-01
epoch 14 / 100 in 119.0s: loss 1.968326, train: 0.382, val 0.401, lr 4.876750e-05 mom 9.771232e-01
epoch 15 / 100 in 118.9s: loss 1.935849, train: 0.400, val 0.416, lr 4.632913e-05 mom 9.794109e-01
epoch 16 / 100 in 119.0s: loss 1.896845, train: 0.394, val 0.410, lr 4.401267e-05 mom 9.814698e-01
epoch 17 / 100 in 118.9s: loss 1.870250, train: 0.405, val 0.429, lr 4.181203e-05 mom 9.833229e-01
epoch 18 / 100 in 118.9s: loss 1.837316, train: 0.415, val 0.439, lr 3.972143e-05 mom 9.849906e-01
epoch 19 / 100 in 118.9s: loss 1.807514, train: 0.432, val 0.434, lr 3.773536e-05 mom 9.864916e-01
epoch 20 / 100 in 118.9s: loss 1.771687, train: 0.423, val 0.464, lr 3.584859e-05 mom 9.878424e-01
epoch 21 / 100 in 118.9s: loss 1.737611, train: 0.438, val 0.467, lr 3.405616e-05 mom 9.890581e-01
epoch 22 / 100 in 118.9s: loss 1.711730, train: 0.448, val 0.477, lr 3.235336e-05 mom 9.901523e-01
epoch 23 / 100 in 119.0s: loss 1.673019, train: 0.477, val 0.499, lr 3.073569e-05 mom 9.911371e-01
epoch 24 / 100 in 118.9s: loss 1.644735, train: 0.460, val 0.488, lr 2.919891e-05 mom 9.920233e-01
epoch 25 / 100 in 119.0s: loss 1.610350, train: 0.485, val 0.493, lr 2.773896e-05 mom 9.928210e-01
epoch 26 / 100 in 119.0s: loss 1.587085, train: 0.500, val 0.503, lr 2.635201e-05 mom 9.935389e-01
epoch 27 / 100 in 118.9s: loss 1.553481, train: 0.500, val 0.513, lr 2.503441e-05 mom 9.941850e-01
epoch 28 / 100 in 118.9s: loss 1.533502, train: 0.517, val 0.536, lr 2.378269e-05 mom 9.947665e-01
epoch 29 / 100 in 118.9s: loss 1.506634, train: 0.499, val 0.532, lr 2.259355e-05 mom 9.952899e-01
epoch 30 / 100 in 118.9s: loss 1.482524, train: 0.516, val 0.526, lr 2.146388e-05 mom 9.957609e-01
epoch 31 / 100 in 118.9s: loss 1.463194, train: 0.539, val 0.535, lr 2.039068e-05 mom 9.961848e-01
epoch 32 / 100 in 119.0s: loss 1.448789, train: 0.546, val 0.535, lr 1.937115e-05 mom 9.965663e-01
epoch 33 / 100 in 118.9s: loss 1.430224, train: 0.544, val 0.549, lr 1.840259e-05 mom 9.969097e-01
epoch 34 / 100 in 119.0s: loss 1.404319, train: 0.567, val 0.552, lr 1.748246e-05 mom 9.972187e-01
epoch 35 / 100 in 118.9s: loss 1.385945, train: 0.540, val 0.545, lr 1.660834e-05 mom 9.974968e-01
epoch 36 / 100 in 119.0s: loss 1.367607, train: 0.561, val 0.569, lr 1.577792e-05 mom 9.977472e-01
epoch 37 / 100 in 118.9s: loss 1.341838, train: 0.583, val 0.562, lr 1.498903e-05 mom 9.979725e-01
epoch 38 / 100 in 118.9s: loss 1.329648, train: 0.580, val 0.552, lr 1.423957e-05 mom 9.981753e-01
epoch 39 / 100 in 119.0s: loss 1.310204, train: 0.592, val 0.573, lr 1.352760e-05 mom 9.983577e-01
epoch 40 / 100 in 118.9s: loss 1.289379, train: 0.593, val 0.589, lr 1.285122e-05 mom 9.985219e-01
epoch 41 / 100 in 118.9s: loss 1.267939, train: 0.597, val 0.587, lr 1.220866e-05 mom 9.986697e-01
epoch 42 / 100 in 119.0s: loss 1.255105, train: 0.622, val 0.590, lr 1.159822e-05 mom 9.988028e-01
epoch 43 / 100 in 119.0s: loss 1.239694, train: 0.602, val 0.590, lr 1.101831e-05 mom 9.989225e-01
epoch 44 / 100 in 119.0s: loss 1.210926, train: 0.612, val 0.600, lr 1.046740e-05 mom 9.990303e-01
epoch 45 / 100 in 118.9s: loss 1.196522, train: 0.637, val 0.637, lr 9.944027e-06 mom 9.991273e-01
epoch 46 / 100 in 118.9s: loss 1.179403, train: 0.641, val 0.621, lr 9.446825e-06 mom 9.992145e-01
epoch 47 / 100 in 118.9s: loss 1.173354, train: 0.625, val 0.617, lr 8.974484e-06 mom 9.992931e-01
epoch 48 / 100 in 118.9s: loss 1.148145, train: 0.671, val 0.635, lr 8.525760e-06 mom 9.993638e-01
epoch 49 / 100 in 119.0s: loss 1.130034, train: 0.665, val 0.654, lr 8.099471e-06 mom 9.994274e-01
epoch 50 / 100 in 118.9s: loss 1.127878, train: 0.662, val 0.651, lr 7.694498e-06 mom 9.994847e-01
epoch 51 / 100 in 118.9s: loss 1.110297, train: 0.696, val 0.661, lr 7.309773e-06 mom 9.995362e-01
epoch 52 / 100 in 119.0s: loss 1.080579, train: 0.682, val 0.647, lr 6.944284e-06 mom 9.995826e-01
epoch 53 / 100 in 118.9s: loss 1.067140, train: 0.696, val 0.660, lr 6.597070e-06 mom 9.996243e-01
epoch 54 / 100 in 119.0s: loss 1.057995, train: 0.698, val 0.663, lr 6.267217e-06 mom 9.996619e-01
epoch 55 / 100 in 119.0s: loss 1.042966, train: 0.722, val 0.667, lr 5.953856e-06 mom 9.996957e-01
epoch 56 / 100 in 118.9s: loss 1.027454, train: 0.711, val 0.677, lr 5.656163e-06 mom 9.997261e-01
epoch 57 / 100 in 119.0s: loss 1.011541, train: 0.715, val 0.686, lr 5.373355e-06 mom 9.997535e-01
epoch 58 / 100 in 119.0s: loss 0.995829, train: 0.734, val 0.679, lr 5.104687e-06 mom 9.997782e-01
epoch 59 / 100 in 118.9s: loss 0.993285, train: 0.708, val 0.690, lr 4.849453e-06 mom 9.998003e-01
epoch 60 / 100 in 118.9s: loss 0.984133, train: 0.732, val 0.686, lr 4.606980e-06 mom 9.998203e-01
epoch 61 / 100 in 118.9s: loss 0.974277, train: 0.720, val 0.651, lr 4.376631e-06 mom 9.998382e-01
epoch 62 / 100 in 118.9s: loss 0.967135, train: 0.715, val 0.675, lr 4.157799e-06 mom 9.998544e-01
epoch 63 / 100 in 119.0s: loss 0.959195, train: 0.709, val 0.710, lr 3.949909e-06 mom 9.998689e-01
epoch 64 / 100 in 119.0s: loss 0.958395, train: 0.717, val 0.645, lr 3.752414e-06 mom 9.998820e-01
epoch 65 / 100 in 118.9s: loss 0.961230, train: 0.749, val 0.667, lr 3.564793e-06 mom 9.998938e-01
epoch 66 / 100 in 119.0s: loss 0.956396, train: 0.728, val 0.682, lr 3.386554e-06 mom 9.999000e-01
epoch 67 / 100 in 118.9s: loss 0.943995, train: 0.748, val 0.684, lr 3.217226e-06 mom 9.999000e-01
epoch 68 / 100 in 119.0s: loss 0.928266, train: 0.702, val 0.675, lr 3.056365e-06 mom 9.999000e-01
epoch 69 / 100 in 119.0s: loss 0.921137, train: 0.727, val 0.706, lr 2.903546e-06 mom 9.999000e-01
epoch 70 / 100 in 119.0s: loss 0.916508, train: 0.750, val 0.692, lr 2.758369e-06 mom 9.999000e-01
epoch 71 / 100 in 119.0s: loss 0.915388, train: 0.710, val 0.688, lr 2.620450e-06 mom 9.999000e-01
epoch 72 / 100 in 119.0s: loss 0.929153, train: 0.728, val 0.682, lr 2.489428e-06 mom 9.999000e-01
epoch 73 / 100 in 119.0s: loss 0.922188, train: 0.733, val 0.665, lr 2.364957e-06 mom 9.999000e-01
epoch 74 / 100 in 119.0s: loss 0.906357, train: 0.729, val 0.658, lr 2.246709e-06 mom 9.999000e-01
epoch 75 / 100 in 119.0s: loss 0.911330, train: 0.729, val 0.658, lr 2.134374e-06 mom 9.999000e-01
epoch 76 / 100 in 119.0s: loss 0.903888, train: 0.731, val 0.673, lr 2.027655e-06 mom 9.999000e-01
epoch 77 / 100 in 118.9s: loss 0.911090, train: 0.721, val 0.674, lr 1.926272e-06 mom 9.999000e-01
epoch 78 / 100 in 119.0s: loss 0.898858, train: 0.728, val 0.665, lr 1.829958e-06 mom 9.999000e-01
epoch 79 / 100 in 119.0s: loss 0.903461, train: 0.723, val 0.684, lr 1.738461e-06 mom 9.999000e-01
epoch 80 / 100 in 119.0s: loss 0.899644, train: 0.738, val 0.685, lr 1.651538e-06 mom 9.999000e-01
epoch 81 / 100 in 119.0s: loss 0.892099, train: 0.741, val 0.670, lr 1.568961e-06 mom 9.999000e-01
epoch 82 / 100 in 119.0s: loss 0.888836, train: 0.753, val 0.693, lr 1.490513e-06 mom 9.999000e-01
epoch 83 / 100 in 119.0s: loss 0.887223, train: 0.717, val 0.652, lr 1.415987e-06 mom 9.999000e-01
epoch 84 / 100 in 119.0s: loss 0.878957, train: 0.739, val 0.667, lr 1.345188e-06 mom 9.999000e-01
epoch 85 / 100 in 118.9s: loss 0.872763, train: 0.772, val 0.703, lr 1.277928e-06 mom 9.999000e-01
epoch 86 / 100 in 119.0s: loss 0.861406, train: 0.748, val 0.669, lr 1.214032e-06 mom 9.999000e-01
epoch 87 / 100 in 119.0s: loss 0.864802, train: 0.741, val 0.677, lr 1.153330e-06 mom 9.999000e-01
epoch 88 / 100 in 119.0s: loss 0.859530, train: 0.752, val 0.700, lr 1.095664e-06 mom 9.999000e-01
epoch 89 / 100 in 119.0s: loss 0.857563, train: 0.746, val 0.694, lr 1.040881e-06 mom 9.999000e-01
epoch 90 / 100 in 119.0s: loss 0.844187, train: 0.750, val 0.699, lr 9.888365e-07 mom 9.999000e-01
epoch 91 / 100 in 119.0s: loss 0.840757, train: 0.747, val 0.679, lr 9.393947e-07 mom 9.999000e-01
epoch 92 / 100 in 119.0s: loss 0.832068, train: 0.754, val 0.688, lr 8.924250e-07 mom 9.999000e-01
epoch 93 / 100 in 119.0s: loss 0.827147, train: 0.749, val 0.696, lr 8.478037e-07 mom 9.999000e-01
epoch 94 / 100 in 119.0s: loss 0.817345, train: 0.748, val 0.683, lr 8.054135e-07 mom 9.999000e-01
epoch 95 / 100 in 119.0s: loss 0.820755, train: 0.754, val 0.684, lr 7.651429e-07 mom 9.999000e-01
epoch 96 / 100 in 119.0s: loss 0.816936, train: 0.775, val 0.698, lr 7.268857e-07 mom 9.999000e-01
epoch 97 / 100 in 119.0s: loss 0.815445, train: 0.759, val 0.701, lr 6.905415e-07 mom 9.999000e-01
epoch 98 / 100 in 119.0s: loss 0.795261, train: 0.779, val 0.708, lr 6.560144e-07 mom 9.999000e-01
epoch 99 / 100 in 119.0s: loss 0.803294, train: 0.765, val 0.701, lr 6.232137e-07 mom 9.999000e-01
epoch 100 / 100 in 119.0s: loss 0.804475, train: 0.767, val 0.703, lr 5.920530e-07 mom 9.999000e-01
0.470 0.779017857143 0.709821428571 crp_filter_size=3 momentum_decay=0.9 num_fc=3 learning_rate=0.0001 batch_size=128 fc_num_units=256 learning_rate_decay=0.95 num_epochs=100 num_crp=3 reg=0.001 momentum=0.9 crp_num_filters=128