In [1]:
from __future__ import print_function
import numpy as np
# Seed NumPy's global random number generator with a fixed value so that
# NumPy-driven randomness repeats from run to run.
# NOTE(review): this seeds NumPy only; the TensorFlow backend may need its own
# seed for fully repeatable training - confirm.
np.random.seed(1337)

In [2]:
import keras
from keras.datasets import cifar10
from keras.models import Model
from keras.layers import Dense, Activation, Input, MaxPooling2D, Flatten
from keras.layers import Conv2D

Using TensorFlow backend.


In [3]:
# Hyperparameters, kept together in one cell so they are easy to find and tune.
num_classes = 10  # number of label categories; used for one-hot encoding and the output layer
batch_size = 32   # presumably the mini-batch size passed to training - not used in the cells shown here
epochs = 5        # presumably the number of training passes - not used in the cells shown here

In [4]:
# Load CIFAR-10: the data comes already shuffled and split into train and test sets.
(x_train, y_train), (x_test, y_test) = cifar10.load_data()

# Cast the images to float32 and divide by 255 in a single expression
# (assumes 8-bit pixel values, which this rescales to the range [0, 1]).
x_train = x_train.astype('float32') / 255
x_test = x_test.astype('float32') / 255

# Quick sanity check on what was loaded.
print('x_train shape: ', x_train.shape)
print(x_train.shape[0], 'train samples')
print(x_test.shape[0], 'test samples')

x_train shape:  (50000, 32, 32, 3)
50000 train samples
10000 test samples


In [5]:
# Convert the integer class vectors to binary (one-hot) class matrices with
# `num_classes` columns.
#
# Each assignment rebinds the label array to its own encoded version, so running
# this cell a second time would one-hot encode labels that are already encoded
# and silently corrupt them. The guard skips arrays whose last dimension is
# already `num_classes`, which makes the cell safe to re-run.
if y_train.shape[-1] != num_classes:
    y_train = keras.utils.to_categorical(y_train, num_classes)
if y_test.shape[-1] != num_classes:
    y_test = keras.utils.to_categorical(y_test, num_classes)

# Residual Connections

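Take a look at the residual connection diagram (Figure 2, "Residual learning: a building block") in He et al., "Deep Residual Learning for Image Recognition": https://arxiv.org/pdf/1512.03385.pdf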

In [6]:
#Input layer is the same as our typical CNN model
inputs = Input(shape=(32,32,3))

##----------------------New stuffs starts here---------------------

y = Conv2D(3, (3,3), padding='same')(inputs)

z = keras.layers.add([inputs, y])

##----------------------New stuffs ends here-----------------------

x = Conv2D(8, (3,3))(z) #Notice the 'z'
x = Activation('relu')(x)
x = MaxPooling2D(pool_size=(2,2))(x)
x = Flatten()(x)

x = Dense(num_classes)(x)

output = Activation('softmax')(x)

In [7]:
# Wrap the layer graph into a Keras Model running from `inputs` to the softmax `output`.
model = Model(inputs=[inputs], outputs=output)

In [8]:
# Print a layer-by-layer table: layer type, output shape, parameter count and
# which layers each one is connected to.
model.summary()

__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input_1 (InputLayer)            (None, 32, 32, 3)    0                                            
__________________________________________________________________________________________________
conv2d_1 (Conv2D)               (None, 32, 32, 3)    84          input_1[0][0]                    
__________________________________________________________________________________________________
add_1 (Add)                     (None, 32, 32, 3)    0           input_1[0][0]                    
                                                                 conv2d_1[0][0]                   
__________________________________________________________________________________________________
conv2d_2 (Conv2D)               (None, 30, 30, 8)    224         add_1[0][0]                      
__________