In [1]:
import tensorflow as tf
import simplejson
import matplotlib.pyplot as plt
%matplotlib inline
import threading
import tensorflow.contrib.slim as slim
from utils import data_utils, train_utils
import datetime
import os
import time
import pandas as pd
In [2]:
def argument_scope(H, phase):
'''
    Returns the scope for slim.arg_scope(): shared defaults (ReLU activation, batch norm,
    padding, and variance-scaling weight initializers) for the slim layers used in build_pred.
'''
padding = H['padding']
is_training = {'train': True, 'validate': False, 'test': False}[phase]
pool_kernel = [2, 2]
pool_stride = 2
params = {
"decay": 0.997,
"epsilon": 0.001,
}
with slim.arg_scope([slim.conv2d],
# slim.relu would raise an error here
activation_fn=tf.nn.relu,
padding=padding,
normalizer_fn=slim.batch_norm,
# normalizer_fn=None,
weights_initializer=tf.contrib.layers.variance_scaling_initializer()):
with slim.arg_scope([slim.batch_norm, slim.dropout], is_training=is_training):
with slim.arg_scope([slim.max_pool2d], stride=pool_stride, kernel_size=pool_kernel):
with slim.arg_scope([slim.conv2d_transpose],
activation_fn=None,
normalizer_fn=None,
padding=padding,
weights_initializer=tf.contrib.layers.variance_scaling_initializer()) as sc:
return sc
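Note that the params dict above (decay and epsilon) is defined but never handed to slim.batch_norm, so batch normalization runs with the library defaults. If those values are meant to apply, one option is to attach them through normalizer_params; the snippet below is only a sketch of that wiring, not the configuration used in this notebook.

# Sketch only: passing the batch-norm parameters along with the conv2d defaults.
with slim.arg_scope([slim.conv2d],
                    activation_fn=tf.nn.relu,
                    normalizer_fn=slim.batch_norm,
                    normalizer_params={"decay": 0.997, "epsilon": 0.001}):
    pass  # conv layers created in this scope would use these batch-norm settings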
In [3]:
def build_pred(x_in, H, phase):
'''
    Builds the U-Net-style prediction model: a five-block convolutional encoder, then four
    decoder blocks that upsample with transposed convolutions and concatenate the matching
    encoder features, ending in a 1x1 convolution with a sigmoid output.
'''
num_class = H['num_class']
conv_kernel_1 = [1, 1]
conv_kernel_3 = [3, 3]
pool_kernel = [2, 2]
pool_stride = 2
early_feature = {}
reuse = {'train': False, 'validate': True, 'test': False}[phase]
with slim.arg_scope(argument_scope(H, phase)):
scope_name = 'block_1'
x_input = x_in
num_outputs = 64
with tf.variable_scope(scope_name, reuse = reuse):
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_2'
x_input = slim.max_pool2d(layer_2)
num_outputs = 128
with tf.variable_scope(scope_name, reuse = reuse):
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_3'
x_input = slim.max_pool2d(layer_2)
num_outputs = 256
with tf.variable_scope(scope_name, reuse = reuse):
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_4'
x_input = slim.max_pool2d(layer_2)
num_outputs = 512
with tf.variable_scope(scope_name, reuse = reuse):
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_5'
x_input = slim.max_pool2d(layer_2)
num_outputs = 1024
with tf.variable_scope(scope_name, reuse = reuse):
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_6'
num_outputs = 512
with tf.variable_scope(scope_name, reuse = reuse):
trans_layer = slim.conv2d_transpose(
layer_2, num_outputs, pool_kernel, pool_stride, scope='conv_trans')
x_input = tf.concat([early_feature['block_4'], trans_layer], axis=3)
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_7'
num_outputs = 256
with tf.variable_scope(scope_name, reuse = reuse):
trans_layer = slim.conv2d_transpose(
layer_2, num_outputs, pool_kernel, pool_stride, scope='conv_trans')
x_input = tf.concat([early_feature['block_3'], trans_layer], axis=3)
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_8'
num_outputs = 128
with tf.variable_scope(scope_name, reuse = reuse):
trans_layer = slim.conv2d_transpose(
layer_2, num_outputs, pool_kernel, pool_stride, scope='conv_trans')
x_input = tf.concat([early_feature['block_2'], trans_layer], axis=3)
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'block_9'
num_outputs = 64
with tf.variable_scope(scope_name, reuse = reuse):
trans_layer = slim.conv2d_transpose(
layer_2, num_outputs, pool_kernel, pool_stride, scope='conv_trans')
x_input = tf.concat([early_feature['block_1'], trans_layer], axis=3)
layer_1 = slim.conv2d(x_input, num_outputs, conv_kernel_3, scope='conv1')
layer_2 = slim.conv2d(layer_1, num_outputs, conv_kernel_3, scope='conv2')
early_feature[scope_name] = layer_2
scope_name = 'pred'
with tf.variable_scope(scope_name, reuse = reuse):
# layer_1 = slim.conv2d(layer_2, num_class, conv_kernel_1, scope='conv1', activation_fn=None, normalizer_fn=None)
layer_1 = slim.conv2d(layer_2, 1, conv_kernel_1, scope='conv1', activation_fn=None, normalizer_fn=None)
early_feature[scope_name] = layer_1
# pred = tf.argmax(tf.nn.softmax(logits=layer_1), axis=3)
pred = tf.sigmoid(layer_1)
return tf.squeeze(layer_1), tf.squeeze(pred)
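As a quick sanity check on the architecture (an illustration only: the 4x256x256x3 input and the two-key hyperparameter dict are placeholders, not the project settings), building the model in a scratch graph shows the four max-pools and the four transposed convolutions bringing the output back to the input resolution, which is why im_width and im_height should be divisible by 16.

# Shape check in a throwaway graph; H_demo and the input size are assumptions.
with tf.Graph().as_default():
    H_demo = {'padding': 'SAME', 'num_class': 2}
    x_demo = tf.placeholder(tf.float32, [4, 256, 256, 3])
    logits_demo, pred_demo = build_pred(x_demo, H_demo, 'test')
    print logits_demo.get_shape(), pred_demo.get_shape()  # both (4, 256, 256)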
In [4]:
def build_loss(x_in, y_in, H, phase):
'''
    Builds the training loss (cross entropy, dice, jaccard, or a cross-entropy combo) and the
    thresholded-Jaccard accuracy, both evaluated on the central valid_size x valid_size crop.
    When apply_class_balancing is set, the positive weight uses the module-level class_weight
    computed in a later cell.
'''
im_width = H['im_width']
im_height = H['im_height']
batch_size = H['batch_size']
start_ind = H['start_ind']
valid_size = H['valid_size']
num_class = H['num_class']
epsilon = H['epsilon']
apply_class_balancing = H['apply_class_balancing']
logits, pred = build_pred(x_in, H, phase)
y_crop = tf.cast(tf.slice(y_in, begin=[0, start_ind, start_ind], size=[-1, valid_size, valid_size]), tf.float32)
logits_crop = tf.slice(logits,
begin=[0, start_ind, start_ind],
size=[-1, valid_size, valid_size])
pred_crop = tf.cast(tf.slice(pred,
begin=[0, start_ind, start_ind],
size=[-1, valid_size, valid_size]), tf.float32)
# formulation of weighted cross entropy loss, dice index: https://arxiv.org/pdf/1707.03237.pdf
if H['loss_function'] == 'cross_entropy':
if apply_class_balancing:
loss = tf.reduce_mean(
tf.nn.weighted_cross_entropy_with_logits(
targets=y_crop, logits=logits_crop, pos_weight=1. / class_weight))
else:
loss = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(labels=y_crop, logits=logits_crop))
elif H['loss_function'] == 'dice':
intersection = tf.reduce_sum(tf.multiply(y_crop, pred_crop))
union = tf.reduce_sum(tf.square(y_crop)) + tf.reduce_sum(tf.square(pred_crop))
loss = 1. - 2 * intersection / (union + tf.constant(epsilon))
elif H['loss_function'] == 'jaccard':
intersection = tf.reduce_sum(tf.multiply(y_crop, pred_crop))
union = tf.reduce_sum(y_crop) + tf.reduce_sum(pred_crop) - intersection
loss = 1. - intersection / (union + tf.constant(epsilon))
elif H['loss_function'] == 'combo-jaccard':
if apply_class_balancing:
cen_loss = tf.reduce_mean(
tf.nn.weighted_cross_entropy_with_logits(
targets=y_crop, logits=logits_crop, pos_weight=1. / class_weight))
else:
cen_loss = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(labels=y_crop, logits=logits_crop))
intersection = tf.reduce_sum(tf.multiply(y_crop, pred_crop))
union = tf.reduce_sum(y_crop) + tf.reduce_sum(pred_crop) - intersection
jaccard_loss = - tf.log((intersection + tf.constant(epsilon)) / (union + tf.constant(epsilon)))
loss = cen_loss + jaccard_loss
elif H['loss_function'] == 'combo-dice':
if apply_class_balancing:
cen_loss = tf.reduce_mean(
tf.nn.weighted_cross_entropy_with_logits(
targets=y_crop, logits=logits_crop, pos_weight=1. / class_weight))
else:
cen_loss = tf.reduce_mean(tf.nn.sigmoid_cross_entropy_with_logits(labels=y_crop, logits=logits_crop))
        intersection = tf.reduce_sum(tf.multiply(y_crop, pred_crop))
        # soft dice, matching the 'dice' branch above: 2|y*p| / (|y|^2 + |p|^2)
        denominator = tf.reduce_sum(tf.square(y_crop)) + tf.reduce_sum(tf.square(pred_crop))
        dice_loss = - tf.log((2. * intersection + tf.constant(epsilon)) / (denominator + tf.constant(epsilon)))
loss = cen_loss + dice_loss
pred_thres = tf.cast(tf.greater(pred_crop, 0.5), tf.float32)
inter = tf.reduce_sum(tf.multiply(tf.cast(y_crop, tf.float32), pred_thres))
uni = tf.reduce_sum(tf.cast(y_crop, tf.float32)) + tf.reduce_sum(pred_thres) - inter
jaccard = inter / (uni + tf.constant(epsilon))
return loss, jaccard, logits_crop, pred_crop
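For intuition on the overlap-based terms, here is a tiny numpy illustration (not part of the graph; the 2x2 arrays and the 1e-7 standing in for H['epsilon'] are made-up values). The soft Jaccard used above is intersection / (|y| + |p| - intersection), and the reported accuracy is the same ratio after thresholding the prediction at 0.5.

import numpy as np
y_demo = np.array([[1., 1.], [0., 0.]])
p_demo = np.array([[0.9, 0.8], [0.1, 0.2]])
inter = (y_demo * p_demo).sum()              # 1.7
union = y_demo.sum() + p_demo.sum() - inter  # 2.0 + 2.0 - 1.7 = 2.3
print 1. - inter / (union + 1e-7)            # soft jaccard loss, about 0.26
p_thres = (p_demo > 0.5).astype(np.float32)
inter_t = (y_demo * p_thres).sum()
print inter_t / (y_demo.sum() + p_thres.sum() - inter_t)  # thresholded jaccard accuracy = 1.0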
In [5]:
def build(queues, H):
'''
    Builds the train and validate graphs from the input queues and returns the per-phase loss
    and accuracy dicts, the train op, the merged summary op, the learning-rate placeholder,
    and the global step.
'''
im_width = H['im_width']
im_height = H['im_height']
num_class = H['num_class']
num_channel = H['num_channel']
batch_size = H['batch_size']
log_dir = H['log_dir']
norm_threshold = H['norm_threshold']
loss, accuracy, x_in, y_in, logits, pred = {}, {}, {}, {}, {}, {}
for phase in ['train', 'validate']:
x_in[phase], y_in[phase] = queues[phase].dequeue_many(batch_size)
loss[phase], accuracy[phase], logits[phase], pred[phase] = build_loss(x_in[phase], y_in[phase], H, phase)
learning_rate = tf.placeholder(dtype=tf.float32)
opt = tf.train.AdamOptimizer(learning_rate=learning_rate, beta1=0.8, beta2=0.99)
global_step = tf.Variable(0, trainable=False)
tvars = tf.trainable_variables()
grads= tf.gradients(loss['train'], tvars)
grads, norm = tf.clip_by_global_norm(grads, norm_threshold)
update_ops = tf.get_collection(tf.GraphKeys.UPDATE_OPS)
with tf.control_dependencies(update_ops):
train_op = opt.apply_gradients(zip(grads, tvars), global_step = global_step)
for phase in ['train', 'validate']:
tf.summary.scalar(name=phase + '/loss', tensor=loss[phase])
tf.summary.scalar(name=phase + '/accuracy', tensor=accuracy[phase])
mean, var = tf.nn.moments(logits[phase], axes=[0, 1, 2])
tf.summary.scalar(name=phase + '/logits/mean', tensor=mean)
tf.summary.scalar(name=phase + '/logits/variance', tensor=var)
mean, var = tf.nn.moments(pred[phase], axes=[0, 1, 2])
tf.summary.scalar(name=phase + '/pred/mean', tensor=mean)
tf.summary.scalar(name=phase + '/pred/variance', tensor=var)
summary_op = tf.summary.merge_all()
return loss, accuracy, train_op, summary_op, learning_rate, global_step
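Two details of build() are easy to miss: wrapping apply_gradients in the UPDATE_OPS control dependency is what keeps the batch-norm moving averages updating during training, and tf.clip_by_global_norm rescales all gradients jointly rather than per tensor. A rough numpy equivalent of that clipping (illustration only; the threshold 5.0 is a made-up value, not the norm_threshold from hypes):

import numpy as np
grads_demo = [np.array([3., 4.]), np.array([12.])]
global_norm = np.sqrt(sum((g ** 2).sum() for g in grads_demo))  # sqrt(9 + 16 + 144) = 13.0
scale = min(1., 5.0 / global_norm)                              # only shrink when the norm exceeds the threshold
clipped = [g * scale for g in grads_demo]
print global_norm, [list(g) for g in clipped]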
In [6]:
hypes = './hypes/hypes.json'
with open(hypes, 'r') as f:
H = simplejson.load(f)
# H['loss_function'] = 'dice'
im_width = H['im_width']
im_height = H['im_height']
num_class = H['num_class']
num_channel = H['num_channel']
queue_size = H['queue_size']
save_iter = H['save_iter']
print_iter = H['print_iter']
class_type = H['class_type']
train_iter = H['train_iter']
lr = H['lr']
lr_decay_iter = H['lr_decay_iter']
log_dir = H['log_dir']
batch_size = H['batch_size']
now = datetime.datetime.now()
now_path = str(now.month) + '-' + str(now.day) + '_' + str(now.hour) + '-' + str(now.minute) + '_' + H['loss_function']
ckpt_path = os.path.join(log_dir, now_path, 'ckpt', 'ckpt')
hypes_path = os.path.join(log_dir, now_path, 'hypes')
summary_path = os.path.join(log_dir, now_path, 'summary')
for path in [ckpt_path, hypes_path, summary_path]:
if not os.path.exists(path):
os.makedirs(path)
with open(os.path.join(hypes_path, 'hypes.json'), 'w') as f:
simplejson.dump(H, f)
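For reference, these are the keys this notebook reads from hypes.json, shown here with placeholder values only (the actual settings live in ./hypes/hypes.json):

# Assumed structure; every value below is a stand-in, not the configuration used here.
H_example = {
    "im_width": 256, "im_height": 256, "num_channel": 3, "num_class": 2,
    "padding": "SAME", "start_ind": 0, "valid_size": 256,
    "loss_function": "combo-jaccard", "apply_class_balancing": False, "epsilon": 1e-7,
    "batch_size": 8, "queue_size": 64, "class_type": 0,
    "lr": 1e-3, "lr_decay_iter": 10000, "train_iter": 30000, "norm_threshold": 5.0,
    "print_iter": 100, "save_iter": 1000, "log_dir": "./log",
}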
In [7]:
H
Out[7]:
In [8]:
class_weight = data_utils.calculate_class_weights()[data_utils.CLASSES[class_type + 1]]
In [9]:
def enqueue_thread(sess, data_gen, coord, phase, enqueue_op):
    '''
    Feeder loop for the `phase` queue: each generator item is a stack of crops whose leading
    dimension is split into single (image, label) examples by enqueue_many.
    '''
    while not coord.should_stop():
        img, label = data_gen.next()
        sess.run(enqueue_op, feed_dict={x_in[phase]: img, y_in[phase]: label})
In [10]:
x_in, y_in, queues, enqueue_op = {}, {}, {}, {}
shape = ((im_width, im_height, num_channel),
(im_width, im_height))
for phase in ['train', 'validate']:
x_in[phase] = tf.placeholder(dtype=tf.float32)
y_in[phase] = tf.placeholder(dtype=tf.float32)
queues[phase] = tf.FIFOQueue(capacity=queue_size, shapes=shape, dtypes=(tf.float32,tf.float32))
enqueue_op[phase] = queues[phase].enqueue_many([x_in[phase], y_in[phase]])
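The queue plumbing relies on a detail worth stating: enqueue_many splits its input along the leading dimension into individual examples, while dequeue_many(batch_size) inside build() stacks them back into fixed-size batches, so the feeding threads and the training step can use different chunk sizes. A minimal illustration in a throwaway graph (all shapes and values below are made up):

with tf.Graph().as_default():
    q = tf.FIFOQueue(capacity=8, shapes=((2, 2), ()), dtypes=(tf.float32, tf.float32))
    enq = q.enqueue_many(([[[1., 1.], [1., 1.]], [[2., 2.], [2., 2.]]], [0., 1.]))
    deq = q.dequeue_many(2)
    with tf.Session() as s:
        s.run(enq)
        imgs_demo, labels_demo = s.run(deq)  # imgs_demo.shape == (2, 2, 2), labels_demo.shape == (2,)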
In [ ]:
loss, accuracy, train_op, summary_op, learning_rate, global_step = build(queues, H)
data_gen = {}
for phase in ['train', 'validate']:
is_train = {'train': True, 'validate': False}[phase]
data_gen[phase] = train_utils.input_data(crop_per_img=1, class_id=class_type, reflection=True,
rotation=360, train=is_train, crop_size=im_width)
# Run the generator once to make sure the data is loaded into the memory
# This will take a few minutes
data_gen[phase].next()
In [ ]:
config = tf.ConfigProto()
config.gpu_options.allow_growth = True
coord = tf.train.Coordinator()
threads = {}
saver = tf.train.Saver(max_to_keep = train_iter / save_iter + 1)
with tf.Session(config=config).as_default() as sess:
summary_writer = tf.summary.FileWriter(logdir = summary_path, flush_secs = 10)
summary_writer.add_graph(sess.graph)
for phase in ['train', 'validate']:
threads[phase] = threading.Thread(
target=enqueue_thread,
args=(sess, data_gen[phase], coord, phase, enqueue_op[phase]))
threads[phase].start()
sess.run(tf.global_variables_initializer())
start = time.time()
for step in xrange(train_iter):
if step and step % lr_decay_iter == 0:
lr *= 0.1
if step % print_iter == 0 or step == (train_iter - 1):
dt = (time.time() - start) / batch_size / print_iter
start = time.time()
_, train_loss, train_accuracy, validate_loss, validate_accuracy, summaries = \
sess.run([train_op, loss['train'], accuracy['train'], loss['validate'], accuracy['validate'], summary_op],
feed_dict = {learning_rate: lr})
summary_writer.add_summary(summaries, global_step = global_step.eval())
str0 = 'Global step ({0}): LR: {1:0.5f}; '.format(global_step.eval(), lr)
str1 = 'Train loss {0:.2f}; '.format(train_loss)
str2 = 'Train accuracy {}%; '.format(int(100 * train_accuracy))
str3 = 'Validate loss {0:.2f}; '.format(validate_loss)
str4 = 'Validate accuracy {}%; '.format(int(100 * validate_accuracy))
str5 = 'Time / image: {0:0.1f}ms'.format(1000 * dt if step else 0)
print str0 + str1 + str2 + str3 + str4 + str5 + '\n'
else:
sess.run([train_op, loss['train']], feed_dict = {learning_rate: lr})
if step % save_iter == 0 or step == (train_iter - 1):
saver.save(sess, ckpt_path, global_step = global_step.eval())
In [ ]:
# coord.request_stop()
# coord.join(threads.values())