In [1]:
import numpy as np

In [2]:
from keras.models import Model

from keras.layers import Input, Flatten, Dropout, Reshape, Permute, Activation
from keras.layers import Conv2D, Dense, Conv2DTranspose, Cropping2D
from keras.layers import MaxPool2D, Add
from keras.applications import vgg16, vgg19

  from ._conv import register_converters as _register_converters
Using TensorFlow backend.


In [3]:
# crop o1 wrt o2
def crop( o1 , o2 , i  ):
    """Trim two feature maps to a common spatial size.

    The spatial size of each tensor is obtained by wrapping it in a
    throw-away ``Model(i, tensor)`` and reading ``output_shape``; axes 1 and 2
    are treated as height and width respectively.

    For each axis the larger tensor is cropped at its trailing edge (right
    columns / bottom rows). When the sizes are already equal, a zero-size
    ``Cropping2D`` is still applied to ``o2``.

    Args:
        o1: first tensor, reachable from ``i``.
        o2: second tensor, reachable from ``i``.
        i: input tensor of the graph that both ``o1`` and ``o2`` belong to.

    Returns:
        Tuple ``(o1, o2)`` with matching height and width.
    """
    # Shapes are taken up front, before any cropping is applied.
    shape_b = Model(i, o2).output_shape
    height_b, width_b = shape_b[1], shape_b[2]

    shape_a = Model(i, o1).output_shape
    height_a, width_a = shape_a[1], shape_a[2]

    extra_cols = abs(width_a - width_b)
    extra_rows = abs(height_b - height_a)

    # Width: drop surplus columns from the right side of the wider tensor.
    trim_cols = Cropping2D(cropping=((0, 0), (0, extra_cols)))
    if width_a > width_b:
        o1 = trim_cols(o1)
    else:
        o2 = trim_cols(o2)

    # Height: drop surplus rows from the bottom of the taller tensor.
    trim_rows = Cropping2D(cropping=((0, extra_rows), (0, 0)))
    if height_a > height_b:
        o1 = trim_rows(o1)
    else:
        o2 = trim_rows(o2)

    return o1, o2

In [4]:
# Backbone: VGG16 with ImageNet weights. The classifier head is included,
# although the cells below only read the block*_pool feature maps and the
# model input from it.
vgg16_model = vgg16.VGG16(
    include_top=True,
    weights='imagenet',
    input_tensor=None,
    input_shape=None,
    pooling=None,
    classes=1000,
)

In [5]:
# Print the layer-by-layer table (name, output shape, parameter count) of the backbone.
vgg16_model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         (None, 224, 224, 3)       0         
_________________________________________________________________
block1_conv1 (Conv2D)        (None, 224, 224, 64)      1792      
_________________________________________________________________
block1_conv2 (Conv2D)        (None, 224, 224, 64)      36928     
_________________________________________________________________
block1_pool (MaxPooling2D)   (None, 112, 112, 64)      0         
_________________________________________________________________
block2_conv1 (Conv2D)        (None, 112, 112, 128)     73856     
_________________________________________________________________
block2_conv2 (Conv2D)        (None, 112, 112, 128)     147584    
_________________________________________________________________
block2_pool (MaxPooling2D)   (None, 56, 56, 128)       0         
__________

In [6]:
# Output tensors of the five VGG16 pooling layers, block1_pool .. block5_pool.
layer1, layer2, layer3, layer4, layer5 = map(
    lambda pool_name: vgg16_model.get_layer(pool_name).output,
    ('block1_pool', 'block2_pool', 'block3_pool', 'block4_pool', 'block5_pool'),
)

In [7]:
# Pooling outputs in block order; the model builders index this list from the
# end, so layers[-1] is the block5_pool output.
layers = [
    layer1,
    layer2,
    layer3,
    layer4,
    layer5,
]

In [8]:
def fcn8(num_class,feature_layers,model_input):
    """Build an FCN-8s-style segmentation model with two skip connections.

    The deepest feature map is scored and upsampled 2x, fused with the scored
    second-deepest map, upsampled 2x again, fused with the scored
    third-deepest map and finally upsampled 8x. The per-pixel class scores are
    flattened over the spatial axes and passed through a softmax.

    The code assumes ``channels_last`` tensors (height and width are read from
    axes 1 and 2 of the output shape) and a fully defined spatial input size.

    Args:
        num_class: number of output classes (channels of every score map).
        feature_layers: sequence of backbone feature tensors ordered from
            shallow to deep; the last three entries are used.
        model_input: input tensor of the backbone that produced
            ``feature_layers``.

    Returns:
        A ``Model`` mapping ``model_input`` to a tensor of shape
        ``(batch, outHeight * outWidth, num_class)`` with a softmax over the
        last axis. The spatial size of the final score map is attached to the
        model as ``model.outHeight`` and ``model.outWidth``.
    """
    # Convolutional replacement for the dense classifier head.
    out = feature_layers[-1]
    out = Conv2D(4096, (7,7),
                activation='relu', padding='same')(out)
    out = Dropout(0.5)(out)
    out = Conv2D(4096, (1,1),
                activation='relu', padding='same')(out)
    out = Dropout(0.5)(out)

    # Score the deepest features, then upsample 2x in BOTH spatial dimensions.
    # (Previously strides=(2,32): width was upsampled 32x and then almost
    # entirely discarded by the crop against the next feature map.)
    out = Conv2D(num_class, (1,1),
                kernel_initializer='he_normal')(out)
    out = Conv2DTranspose(num_class,
                          kernel_size=(4,4),strides=(2,2),
                          use_bias=False)(out)

    # First skip connection: scored second-deepest feature map.
    out2 = feature_layers[-2]
    out2 = Conv2D(num_class, (1,1),
                kernel_initializer='he_normal')(out2)

    # The transposed convolution overshoots slightly; trim before adding.
    out, out2 = crop(out, out2, model_input)
    out = Add()([out, out2])

    # Second 2x upsampling and second skip connection.
    out = Conv2DTranspose(num_class,
                          kernel_size=(4,4),strides=(2,2),
                          use_bias=False)(out)
    out3 = feature_layers[-3]
    out3 = Conv2D(num_class, (1,1),
                kernel_initializer='he_normal')(out3)

    out3, out = crop(out3, out, model_input)
    out = Add()([out3, out])

    # Final 8x upsampling of the fused score map.
    out = Conv2DTranspose(num_class,
                          kernel_size=(16,16),strides=(8,8),
                          use_bias=False)(out)

    # Read the resulting spatial size from the graph instead of assuming it
    # equals the input size.
    out_shape = Model(model_input, out).output_shape
    outHeight = out_shape[1]
    outWidth = out_shape[2]

    # Flatten (H, W, C) -> (H*W, C). With channels-last data the class axis is
    # already last, so a plain reshape keeps every pixel's scores together.
    # (The former Reshape((-1, H*W)) + Permute((2,1)) pair is the
    # channels-first idiom and interleaved pixels and classes here.)
    out = Reshape((outHeight * outWidth, num_class))(out)
    out = Activation('softmax')(out)
    model = Model(model_input, out)
    model.outHeight = outHeight
    model.outWidth = outWidth

    return model

In [9]:
def fcn16(num_class,feature_layers,model_input):
    """Build a single-stream FCN segmentation model on the deepest feature map.

    The deepest feature map is passed through a convolutional classifier head,
    scored per class and upsampled in one step by a stride-32 transposed
    convolution. The per-pixel class scores are then flattened over the
    spatial axes and passed through a softmax.

    NOTE(review): despite the name, no intermediate feature map is fused in
    and the upsampling stride is 32, i.e. only ``feature_layers[-1]`` is used.
    Confirm whether a stride-16 variant with a skip connection was intended.

    The code assumes ``channels_last`` tensors (height and width are read from
    axes 1 and 2 of the output shape) and a fully defined spatial input size.

    Args:
        num_class: number of output classes (channels of the score map).
        feature_layers: sequence of backbone feature tensors; only the last
            entry is used.
        model_input: input tensor of the backbone that produced
            ``feature_layers``.

    Returns:
        A ``Model`` mapping ``model_input`` to a tensor of shape
        ``(batch, outHeight * outWidth, num_class)`` with a softmax over the
        last axis. The spatial size of the final score map is attached to the
        model as ``model.outHeight`` and ``model.outWidth``.
    """
    # Convolutional replacement for the dense classifier head.
    out = feature_layers[-1]
    out = Conv2D(4096, (7,7),
                activation='relu', padding='same')(out)
    out = Dropout(0.5)(out)
    out = Conv2D(4096, (1,1),
                activation='relu', padding='same')(out)
    out = Dropout(0.5)(out)

    # Per-class scores followed by a single 32x learned upsampling.
    out = Conv2D(num_class, (1,1),
                kernel_initializer='he_normal')(out)
    out = Conv2DTranspose(num_class,
                          kernel_size=(64,64),strides=(32,32),
                          use_bias=False)(out)

    # Read the resulting spatial size from the graph instead of assuming it
    # equals the input size.
    out_shape = Model(model_input, out).output_shape
    outHeight = out_shape[1]
    outWidth = out_shape[2]

    # Flatten (H, W, C) -> (H*W, C). With channels-last data the class axis is
    # already last, so a plain reshape keeps every pixel's scores together.
    # (The former Reshape((-1, H*W)) + Permute((2,1)) pair is the
    # channels-first idiom and interleaved pixels and classes here.)
    out = Reshape((outHeight * outWidth, num_class))(out)
    out = Activation('softmax')(out)
    model = Model(model_input, out)
    model.outHeight = outHeight
    model.outWidth = outWidth

    return model

In [10]:
# Build the single-stream model on the VGG16 features with 1000 output classes.
fcn16_model = fcn16(
    num_class=1000,
    feature_layers=layers,
    model_input=vgg16_model.input,
)

In [11]:
# Build the skip-connection model on the VGG16 features with 1000 output classes.
fcn8_model = fcn8(
    num_class=1000,
    feature_layers=layers,
    model_input=vgg16_model.input,
)

In [12]:
# Print the layer table of the single-stream model to inspect the output shapes it produces.
fcn16_model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
input_1 (InputLayer)         (None, 224, 224, 3)       0         
_________________________________________________________________
block1_conv1 (Conv2D)        (None, 224, 224, 64)      1792      
_________________________________________________________________
block1_conv2 (Conv2D)        (None, 224, 224, 64)      36928     
_________________________________________________________________
block1_pool (MaxPooling2D)   (None, 112, 112, 64)      0         
_________________________________________________________________
block2_conv1 (Conv2D)        (None, 112, 112, 128)     73856     
_________________________________________________________________
block2_conv2 (Conv2D)        (None, 112, 112, 128)     147584    
_________________________________________________________________
block2_pool (MaxPooling2D)   (None, 56, 56, 128)       0         
__________

In [13]:
# Print the layer table of the skip-connection model; because the graph branches,
# the table also lists which layer each layer is connected to.
fcn8_model.summary()

__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input_1 (InputLayer)            (None, 224, 224, 3)  0                                            
__________________________________________________________________________________________________
block1_conv1 (Conv2D)           (None, 224, 224, 64) 1792        input_1[0][0]                    
__________________________________________________________________________________________________
block1_conv2 (Conv2D)           (None, 224, 224, 64) 36928       block1_conv1[0][0]               
__________________________________________________________________________________________________
block1_pool (MaxPooling2D)      (None, 112, 112, 64) 0           block1_conv2[0][0]               
__________________________________________________________________________________________________
block2_con