In [None]:
# Keras model 

In [32]:
import numpy as np 
import tensorflow as tf
import os 

In [33]:
# Root of the preprocessed sketch dataset. Set the SKETCH_DATA_DIR environment
# variable to point the notebook at another location; when it is unset (or
# empty) the original author's local path is used.
ROOT_DIR = (os.environ.get('SKETCH_DATA_DIR')
            or '/Users/joshua.newnham/Documents/Shared Playground Data/Sketches/preprocessed/')
VALID_DIR = os.path.join(ROOT_DIR, "valid")
TRAIN_DIR = os.path.join(ROOT_DIR, "train")
# File the training checkpoint callback writes the model weights to.
WEIGHTS_FILE = "sketch_classifier.h5"

# Images are resized to TARGET_SIZE and read as single-channel (grayscale),
# hence the trailing 1 in the network input shape.
TARGET_SIZE = (256,256)
INPUT_SHAPE = TARGET_SIZE + (1,)
# Misspelled legacy name for INPUT_SHAPE; kept because other cells reference it.
INPUT_SHARE = INPUT_SHAPE
NUM_CLASSES = 22

# Upper bound on epochs; training also uses an early-stopping callback.
EPOCHS = 1000 
BATCH_SIZE = 32

In [34]:
def count_files(full_path):
    """Count the image files found directly inside each sub-directory of ``full_path``.

    Only one directory level is inspected: files lying directly in
    ``full_path`` and files nested deeper than one sub-directory are ignored.
    A file counts as an image when its extension (case-insensitive) is
    ``.png``, ``.jpg`` or ``.jpeg``.

    Args:
        full_path: directory whose immediate sub-directories hold the images.

    Returns:
        The number of image files found, as an int.
    """
    image_extensions = ('.png', '.jpg', '.jpeg')

    def is_image(file_name):
        # Compare the actual extension. A substring test on the path would also
        # accept names such as "png_notes.txt", or every file stored under a
        # directory whose path happens to contain "jpg" or "png".
        return os.path.splitext(file_name)[1].lower() in image_extensions

    count = 0
    for d in os.listdir(full_path):
        sub_full_path = os.path.join(full_path, d)
        if not os.path.isdir(sub_full_path):
            continue

        for f in os.listdir(sub_full_path):
            img_path = os.path.join(sub_full_path, f)
            if os.path.isfile(img_path) and is_image(f):
                count += 1

    return count

In [35]:
# Number of images in the training and validation splits (in that order);
# train() divides these by BATCH_SIZE to get the steps per epoch.
NUM_TRAIN_FILES, NUM_VALID_FILES = map(count_files, (TRAIN_DIR, VALID_DIR))

In [56]:
def create_model():
    """Build and compile the sketch-classification CNN.

    The network is four convolution stages (conv -> ReLU -> 2x2 max-pool),
    with dropout after stages 3 and 4, followed by a flatten, a 256-unit
    dense layer with ReLU and a NUM_CLASSES-unit dense layer with softmax.
    Activations are kept as separate layers rather than being fused into the
    conv/dense layers.

    Returns:
        A ``tf.keras`` Sequential model compiled with categorical
        cross-entropy loss, the Adam optimizer and an accuracy metric.
    """
    layers = tf.keras.layers

    def conv_stage(index, filters, kernel, stride, **conv_kwargs):
        """Return the [conv, relu, maxpool] layers of stage ``index``."""
        return [
            layers.Conv2D(filters,
                          kernel_size=(kernel, kernel),
                          strides=(stride, stride),
                          padding='same',
                          activation=None,
                          name="conv{}".format(index),
                          **conv_kwargs),
            layers.Activation('relu', name="relu{}".format(index)),
            layers.MaxPooling2D(2, 2, name="maxpool{}".format(index)),
        ]

    # Feature extractor: only the first stage uses a 7x7 kernel with stride 3
    # and declares the input shape; the rest are 5x5, stride 1.
    stack = conv_stage(1, 16, 7, 3, input_shape=INPUT_SHARE)
    stack += conv_stage(2, 32, 5, 1)
    stack += conv_stage(3, 64, 5, 1)
    stack.append(layers.Dropout(0.4, name="dropout1"))
    stack += conv_stage(4, 128, 5, 1)
    stack.append(layers.Dropout(0.4, name='dropout2'))

    # Classifier head. Flatten is deliberately left unnamed so it keeps its
    # auto-generated name.
    stack += [
        layers.Flatten(),
        layers.Dense(256, activation=None, name='fc1'),
        layers.Activation('relu', name="relu5"),
        layers.Dense(NUM_CLASSES, activation=None, name='fc2'),
        layers.Activation('softmax', name="output"),
    ]

    model = tf.keras.models.Sequential()
    for layer in stack:
        model.add(layer)

    model.compile(loss='categorical_crossentropy',
                  optimizer='adam',
                  metrics=['accuracy'])

    return model

In [57]:
def train(model):
    """Fit ``model`` on the images under TRAIN_DIR, validating on VALID_DIR.

    Both splits are streamed from disk as grayscale batches of BATCH_SIZE
    images resized to TARGET_SIZE, with pixel values multiplied by 1/255.
    A checkpoint callback writes weights to WEIGHTS_FILE and an
    early-stopping callback monitors ``val_loss`` with a patience of 5.

    Args:
        model: a compiled Keras model; it is trained in place.

    Returns:
        A ``(history, model)`` tuple: the object returned by
        ``fit_generator`` and the same model instance that was passed in.
    """
    keras = tf.keras
    image_source = keras.preprocessing.image.ImageDataGenerator(rescale=1./255.)

    def batches_from(directory):
        # One iterator per split; both share the same preprocessing settings.
        return image_source.flow_from_directory(
            directory,
            target_size=TARGET_SIZE,
            batch_size=BATCH_SIZE,
            color_mode='grayscale')

    train_generator = batches_from(TRAIN_DIR)
    validation_generator = batches_from(VALID_DIR)

    callbacks = [
        # Weights-only checkpoint of the best val_loss, with period=2.
        keras.callbacks.ModelCheckpoint(WEIGHTS_FILE,
                                        monitor='val_loss',
                                        verbose=0,
                                        save_best_only=True,
                                        save_weights_only=True,
                                        mode='auto',
                                        period=2),
        keras.callbacks.EarlyStopping(monitor='val_loss', patience=5),
    ]

    # Step counts are truncated, so a trailing partial batch is not counted.
    train_steps = int(NUM_TRAIN_FILES/BATCH_SIZE)
    valid_steps = int(NUM_VALID_FILES/BATCH_SIZE)

    history = model.fit_generator(
        train_generator,
        steps_per_epoch=train_steps,
        epochs=EPOCHS,
        validation_data=validation_generator,
        validation_steps=valid_steps,
        callbacks=callbacks)

    return history, model

In [58]:
model = create_model() 
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv1 (Conv2D)               (None, 86, 86, 16)        800       
_________________________________________________________________
relu1 (Activation)           (None, 86, 86, 16)        0         
_________________________________________________________________
maxpool1 (MaxPooling2D)      (None, 43, 43, 16)        0         
_________________________________________________________________
conv2 (Conv2D)               (None, 43, 43, 32)        12832     
_________________________________________________________________
relu2 (Activation)           (None, 43, 43, 32)        0         
_________________________________________________________________
maxpool2 (MaxPooling2D)      (None, 21, 21, 32)        0         
_________________________________________________________________
conv3 (Conv2D)               (None, 21, 21, 64)        51264     
__________

In [59]:
history, model = train(model)

Found 3605 images belonging to 22 classes.
Found 176 images belonging to 22 classes.
Epoch 1/1000
Epoch 2/1000
Epoch 3/1000
Epoch 4/1000
Epoch 5/1000
Epoch 6/1000
Epoch 7/1000
Epoch 8/1000
Epoch 9/1000
Epoch 10/1000


## Export weights 

Export weights
The type of each entry in the array is given by `-dataType`. The number of entries is equal to:

`inputFeatureChannels * outputFeatureChannels * kernelHeight * kernelWidth`

The filter weights are laid out as a 4D tensor (array): `weight[ outputChannels ][ kernelHeight ][ kernelWidth ][ inputChannels / groups ]`

Note: For binary convolutions the layout of the weights is `weight[ outputChannels ][ kernelHeight ][ kernelWidth ][ floor((inputChannels/groups)+31) / 32 ]`, with each 32 sub input feature channel index specified in machine byte order, so that, for example, the 13th feature channel bit can be extracted using `bitmask = (1U << 13)`.

In [60]:
def export_conv_weights(name, wts_coef, bias_coef):
    """Write a convolution layer's weights (and bias) as raw binary files.

    The kernel is written to ``exports/<name>_conv.data`` with the output
    channel axis moved to the front, i.e. in
    ``[output_channels][axis0][axis1][input_channels]`` order, and the bias
    (if any) to ``exports/<name>_bias.data``. The ``exports`` directory is
    created when it does not exist yet.

    Args:
        name: layer name, used as the file-name prefix.
        wts_coef: 4-D numpy array whose last axis is the output channel axis
            (for a Keras Conv2D kernel: kernel_height, kernel_width,
            input_channels, output_channels).
        bias_coef: numpy array of per-output-channel biases, or None to skip
            the bias file.
    """
    export_dir = 'exports'
    wts_path = os.path.join(export_dir, "{}_conv.data".format(name))
    bias_path = os.path.join(export_dir, "{}_bias.data".format(name))

    # ndarray.tofile() does not create missing directories, so a fresh
    # checkout without an exports/ folder would fail on the first write.
    if not os.path.isdir(export_dir):
        os.makedirs(export_dir)

    print("Exporting weights for {}\n\t{}\n\t{}".format(name, wts_path, bias_path))

    print("\n")

    # [kernel_height, kernel_width, input_feature_channels, output_feature_channels]
    print("\tOriginal weights shape {}".format(wts_coef.shape))
    if bias_coef is not None:
        # [output_feature_channels]
        print("\tOriginal bias shape {}".format(bias_coef.shape))

    # [output_feature_channels, kernel_height, kernel_width, input_feature_channels]
    # tofile() writes in C order, so the transposed axis order is what lands on disk.
    wts_coef = wts_coef.transpose(3, 0, 1, 2)
    print("\tReshaped weights shape {}".format(wts_coef.shape))
    wts_coef.tofile(wts_path)

    if bias_coef is not None:
        bias_coef = np.squeeze(bias_coef)
        print("\tReshaped bias_coef shape {}".format(bias_coef.shape))
        bias_coef.tofile(bias_path)

    print("\n")

In [61]:
def export_dense_weights(name, wts_coef, bias_coef, kernel_width, kernel_height):
    """
    Write a dense (fully connected) layer's weights and bias as raw binary files.

    A fully connected layer in a Convolutional Neural Network (CNN) is one where every input channel is connected 
    to every output channel. The kernel width is equal to the width of the source image, and the 
    kernel height is equal to the height of the source image. The width and height of the output is 1 x 1.
    
    A fully connected layer takes an MPSImage object with dimensions 
    source.width x source.height x Ni, convolves it with Weights[No][source.width][source.height][Ni], 
    and produces a 1 x 1 x No output.
    
    Thus, the following conditions must be true:
    - kernelWidth == source.width
    - kernelHeight == source.height
    - clipRect.size.width == 1
    - clipRect.size.height == 1
    
    You can think of a fully connected layer as a matrix multiplication where the image is 
    flattened into a vector of length source.width*source.height*Ni, and the weights are arranged in a 
    matrix of dimension No x (source.width*source.height*Ni) to produce an output vector of length No.
    
    The value of the strideInPixelsX, strideInPixelsY, and groups properties must be 1. 
    The offset property is not applicable and it is ignored. Because the clip rectangle is 
    clamped to the destination image bounds, if the destination is 1 x 1, you do not need to set the 
    clipRect property.

    Args:
        name: layer name, used as the file-name prefix.
        wts_coef: 2-D numpy array of shape (flattened_inputs, output_channels).
        bias_coef: numpy array of per-output-channel biases, or None to skip
            the bias file.
        kernel_width: size of the first spatial axis the flattened input is
            split into (1 for a dense layer that follows another dense layer).
        kernel_height: size of the second spatial axis, same convention.

    The weights go to ``exports/<name>_conv.data`` (the ``_conv`` suffix is
    used for dense layers too) and the bias to ``exports/<name>_bias.data``.
    The ``exports`` directory is created when it does not exist yet.
    """
    export_dir = 'exports'
    wts_path = os.path.join(export_dir, "{}_conv.data".format(name))
    bias_path = os.path.join(export_dir, "{}_bias.data".format(name))

    # ndarray.tofile() does not create missing directories, so a fresh
    # checkout without an exports/ folder would fail on the first write.
    if not os.path.isdir(export_dir):
        os.makedirs(export_dir)

    print("Exporting weights for {}\n\t{}\n\t{}".format(name, wts_path, bias_path))

    output_feature_channels = wts_coef.shape[-1]

    # [flattened_inputs, output_feature_channels]
    print("\tOriginal weights shape {}".format(wts_coef.shape))

    # Split the flattened input axis back into (spatial, spatial, channels);
    # the channel count is inferred by the -1.
    wts_coef = np.reshape(wts_coef, [kernel_width, kernel_height, -1, output_feature_channels])

    if bias_coef is not None:
        # [output_feature_channels]
        print("\tOriginal bias shape {}".format(bias_coef.shape))

    # [output_feature_channels, spatial, spatial, input_feature_channels]
    # Only the last axis moves, and tofile() writes in C order, so for each
    # output channel the file holds the inputs in their original flattened
    # order regardless of how kernel_width / kernel_height split them.
    wts_coef = wts_coef.transpose(3, 0, 1, 2)
    print("\tReshaped weights shape {}".format(wts_coef.shape))
    wts_coef.tofile(wts_path)

    if bias_coef is not None:
        bias_coef = np.squeeze(bias_coef)
        print("\tReshaped bias_coef shape {}".format(bias_coef.shape))
        bias_coef.tofile(bias_path)

    print("\n")

In [62]:
# Export every layer that has weights. The spatial size of the tensor entering
# the Flatten layer is remembered so the first dense layer can be exported as a
# kernel of that size. Both stay None until a layer whose name contains
# "flatten" has been seen.
flatted_input_kernel_width = None
flatted_input_kernel_height = None

for layer in model.layers:        
    if "flatten" in layer.name:
        # Axes 1 and 2 of the Flatten input shape; the recorded run printed 5 and 5.
        # NOTE(review): presumably (batch, rows, cols, channels), which would make
        # axis 1 the height rather than the width - harmless while both are equal.
        flatted_input_kernel_width = layer.input_shape[1] # axis 1 of the Flatten input shape
        flatted_input_kernel_height = layer.input_shape[2] # axis 2 of the Flatten input shape
        print("flatted_input_kernel_width {} flatted_input_kernel_height {}".format(
            flatted_input_kernel_width, flatted_input_kernel_height))
        
    # Layers without weights (activations, pooling, dropout, flatten) are skipped.
    if len(layer.get_weights()) > 0:        
        name = layer.name         
        wts = layer.get_weights()
        
        # wts is [kernel] or [kernel, bias]; the bias is passed only when
        # exactly two arrays are present.
        if "conv" in name:            
            export_conv_weights(layer.name, wts[0], wts[1] if len(wts) == 2 else None)        
        else:
            # Any weighted layer whose name lacks "conv" is exported as a dense layer.
            export_dense_weights(layer.name, wts[0], wts[1] if len(wts) == 2 else None, 
                                flatted_input_kernel_width, flatted_input_kernel_height)        
            # After the first dense layer (the CNN -> fully connected transition) the
            # kernel size is reset, so every later dense layer is exported with a
            # 1x1 kernel.
            flatted_input_kernel_width, flatted_input_kernel_height = 1, 1             

conv1
conv2
conv3
conv4
flatted_input_kernel_width 5 flatted_input_kernel_height 5
fc1
fc2
