In [8]:
import numpy as np
# Seed NumPy's global RNG. NOTE(review): this presumably does not seed the
# Keras backend's own RNG (weight init, batch shuffling) — confirm if exact
# run-to-run reproducibility of training is required.
np.random.seed(123)  # for reproducibility
 
from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten,GlobalAveragePooling2D
from keras.layers import Convolution2D, MaxPooling2D
from keras.utils import np_utils
from keras.datasets import mnist

In [9]:
# Fetch MNIST as (images, integer labels) pairs for the train and test splits
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Preprocess input data: append a single channel axis -> (n, 28, 28, 1),
# cast to float32, then divide every pixel value by 255
X_train = X_train.reshape((len(X_train), 28, 28, 1)).astype('float32') / 255
X_test = X_test.reshape((len(X_test), 28, 28, 1)).astype('float32') / 255

In [10]:
# Preprocess class labels: one-hot encode the integer labels over 10 classes
Y_train, Y_test = (
    np_utils.to_categorical(labels, 10) for labels in (y_train, y_test)
)

In [11]:
# Define model architecture: five 3x3 convolutions with two 2x2 max-pools
# in between, followed by a small dense classifier head.
# Conv parameter count = filters * (in_channels * 3 * 3) + one bias per filter.
model = Sequential([
    Convolution2D(8, kernel_size=(3, 3), activation='relu',
                  input_shape=(28, 28, 1)),                    # 8*(1*3*3) + 8    = 80
    Convolution2D(16, kernel_size=(3, 3), activation='relu'),  # 16*(8*3*3) + 16  = 1168
    MaxPooling2D(pool_size=(2, 2)),
    Convolution2D(32, kernel_size=(3, 3), activation='relu'),  # 32*(16*3*3) + 32 = 4640
    Convolution2D(64, kernel_size=(3, 3), activation='relu'),  # 64*(32*3*3) + 64 = 18496
    MaxPooling2D(pool_size=(2, 2)),
    Convolution2D(128, kernel_size=(3, 3), activation='relu'),
    # Alternative to Flatten, currently disabled: GlobalAveragePooling2D()
    Flatten(),
    Dropout(0.25),
    Dense(32, activation='relu'),
    Dropout(0.5),
    Dense(10, activation='softmax'),
])

In [12]:
# Dense(32) parameter count: 512 flattened inputs x 32 units, plus 32 biases
32 * (512 + 1)

16416

In [13]:
# Print each layer's output shape and parameter count
model.summary()

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_5 (Conv2D)           (None, 26, 26, 8)         80        
                                                                 
 conv2d_6 (Conv2D)           (None, 24, 24, 16)        1168      
                                                                 
 max_pooling2d_2 (MaxPooling  (None, 12, 12, 16)       0         
 2D)                                                             
                                                                 
 conv2d_7 (Conv2D)           (None, 10, 10, 32)        4640      
                                                                 
 conv2d_8 (Conv2D)           (None, 8, 8, 64)          18496     
                                                                 
 max_pooling2d_3 (MaxPooling  (None, 4, 4, 64)         0         
 2D)                                                  

In [14]:
# Compile model: 'sgd' optimizer minimizing categorical cross-entropy,
# with accuracy reported as the tracked metric
model.compile(
    optimizer='sgd',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [15]:
# Fit model on training data: 2 epochs, mini-batches of 32, progress shown
model.fit(
    X_train,
    Y_train,
    batch_size=32,
    epochs=2,
    verbose=1,
)

Epoch 1/2
Epoch 2/2


<keras.callbacks.History at 0x7f780923bbb0>

In [16]:
# Evaluate model on test data (verbose=0 silences the progress output)
score = model.evaluate(x=X_test, y=Y_test, verbose=0)

In [17]:
score  # [test loss, test accuracy]

[0.12690097093582153, 0.9598000049591064]