In [1]:
import keras
from keras.models import Sequential
from keras.layers import Dense
from keras.utils import to_categorical

Using TensorFlow backend.


When working with convolutional neural networks in particular, we also need the convolution, pooling, and flatten layer classes.

In [2]:
from keras.layers.convolutional import Conv2D # to add convolutional layers
from keras.layers.convolutional import MaxPooling2D # to add pooling layers
from keras.layers import Flatten # to flatten data for fully connected layers

In [3]:
# import the MNIST dataset module bundled with Keras
from keras.datasets import mnist

# load data: the result is unpacked as an (inputs, labels) pair for training
# followed by an (inputs, labels) pair for testing
(X_train, y_train), (X_test, y_test) = mnist.load_data()

In [5]:
# Reshape to [samples][rows][cols][channels] with a single trailing channel,
# matching the input_shape=(28, 28, 1) given to the first Conv2D layer below,
# and cast to float32 ahead of the division in the normalization cell.
X_train = X_train.reshape((len(X_train), 28, 28, 1)).astype("float32")
X_test = X_test.reshape((len(X_test), 28, 28, 1)).astype("float32")

In [6]:
# sanity-check the reshape; the recorded output for this cell is (60000, 28, 28, 1)
X_train.shape

(60000, 28, 28, 1)

In [7]:
# Normalize both splits by dividing every pixel value by 255
# (assumes the raw intensities span 0-255 -- TODO confirm against the loader).
# NOTE: the results are bound back to the same names, so re-running this cell
# on its own divides the data by 255 a second time.
X_train, X_test = X_train / 255, X_test / 255

In [8]:
# One-hot encode the label vectors of both splits.
# NOTE: the encoded arrays replace the original label arrays under the same
# names, so this cell should only be run once per kernel session.
y_train, y_test = to_categorical(y_train), to_categorical(y_test)

# number of classes = width of the one-hot encoded test labels;
# used as the size of the model's softmax output layer
num_classes = y_test.shape[1]

In [12]:
# confirm the one-hot encoding; the recorded output for this cell is (10000, 10)
y_test.shape

(10000, 10)

Next, let's define a function that creates our model. Let's start with one set of convolutional and pooling layers.

In [13]:
def convolutional_model():
    """Build and compile a CNN with one convolution + pooling stage.

    Layer stack, in order:
      * Conv2D: 16 filters, 5x5 kernel, stride 1, ReLU, input shape (28, 28, 1)
      * MaxPooling2D: 2x2 window, stride 2
      * Flatten
      * Dense: 100 units, ReLU
      * Dense: ``num_classes`` units, softmax

    Reads the notebook-level ``num_classes`` variable for the output size.

    Returns:
        The Sequential model, compiled with the Adam optimizer,
        categorical cross-entropy loss and the accuracy metric.
    """
    model = Sequential([
        # convolution + pooling stage
        Conv2D(16, (5, 5), strides=(1, 1), activation='relu', input_shape=(28, 28, 1)),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
        # classifier head on the flattened feature maps
        Flatten(),
        Dense(100, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ])

    model.compile(
        optimizer='adam',
        loss='categorical_crossentropy',
        metrics=['accuracy'],
    )
    return model

In [14]:
# build the model
model = convolutional_model()

# fit the model; the test split is also passed as validation data, so the
# per-epoch val_* figures and the final evaluation use the same samples
model.fit(X_train, y_train, validation_data=(X_test, y_test), epochs=10, batch_size=200, verbose=2)

# evaluate the model; the model is compiled with metrics=['accuracy'],
# so scores[0] is the loss and scores[1] is the accuracy as a 0-1 fraction
scores = model.evaluate(X_test, y_test, verbose=0)
# report accuracy and error on the same scale (percent), with units, so the
# two numbers are directly comparable and match the later two-stage report
print("Accuracy: {} % \n Error: {} %".format(scores[1]*100, 100-scores[1]*100))

Instructions for updating:
Colocations handled automatically by placer.
Instructions for updating:
Use tf.cast instead.
Train on 60000 samples, validate on 10000 samples
Epoch 1/10
 - 29s - loss: 0.2948 - acc: 0.9169 - val_loss: 0.1040 - val_acc: 0.9694
Epoch 2/10
 - 26s - loss: 0.0866 - acc: 0.9750 - val_loss: 0.0681 - val_acc: 0.9774
Epoch 3/10
 - 26s - loss: 0.0582 - acc: 0.9830 - val_loss: 0.0506 - val_acc: 0.9837
Epoch 4/10
 - 26s - loss: 0.0448 - acc: 0.9864 - val_loss: 0.0461 - val_acc: 0.9844
Epoch 5/10
 - 26s - loss: 0.0353 - acc: 0.9888 - val_loss: 0.0388 - val_acc: 0.9865
Epoch 6/10
 - 26s - loss: 0.0288 - acc: 0.9915 - val_loss: 0.0392 - val_acc: 0.9865
Epoch 7/10
 - 26s - loss: 0.0241 - acc: 0.9924 - val_loss: 0.0369 - val_acc: 0.9882
Epoch 8/10
 - 26s - loss: 0.0193 - acc: 0.9945 - val_loss: 0.0407 - val_acc: 0.9872
Epoch 9/10
 - 26s - loss: 0.0167 - acc: 0.9952 - val_loss: 0.0366 - val_acc: 0.9875
Epoch 10/10
 - 27s - loss: 0.0134 - acc: 0.9962 - val_loss: 0.0344 - val_a

## Convolutional Neural Network with two sets of convolutional and pooling layers

In [15]:
def convolutional_model():
    """Build and compile a CNN with two convolution + pooling stages.

    NOTE: this reuses the name of the single-stage ``convolutional_model``
    defined earlier in the notebook, so once this cell runs the earlier
    definition is shadowed.

    Layer stack, in order:
      * Conv2D: 16 filters, 5x5 kernel, ReLU, input shape (28, 28, 1)
      * MaxPooling2D: 2x2 window, stride 2
      * Conv2D: 8 filters, 2x2 kernel, ReLU
      * MaxPooling2D: 2x2 window, stride 2
      * Flatten
      * Dense: 100 units, ReLU
      * Dense: ``num_classes`` units, softmax

    Reads the notebook-level ``num_classes`` variable for the output size.

    Returns:
        The Sequential model, compiled with the Adam optimizer,
        categorical cross-entropy loss and the accuracy metric.
    """
    stack = (
        # first convolution + pooling stage
        Conv2D(16, (5, 5), activation='relu', input_shape=(28, 28, 1)),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
        # second convolution + pooling stage
        Conv2D(8, (2, 2), activation='relu'),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),
        # classifier head on the flattened feature maps
        Flatten(),
        Dense(100, activation='relu'),
        Dense(num_classes, activation='softmax'),
    )

    model = Sequential()
    for layer in stack:
        model.add(layer)

    model.compile(
        loss='categorical_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return model

In [16]:
# instantiate the network returned by convolutional_model()
model = convolutional_model()

# train for 10 epochs in mini-batches of 200, printing one line per epoch;
# the test split is passed as the validation data
model.fit(
    x=X_train,
    y=y_train,
    batch_size=200,
    epochs=10,
    verbose=2,
    validation_data=(X_test, y_test),
)

# silent evaluation on the test split; index 1 of the result is the accuracy
scores = model.evaluate(x=X_test, y=y_test, verbose=0)
accuracy_pct = scores[1] * 100
print("Accuracy: {} % \n Error: {} %".format(accuracy_pct, 100 - accuracy_pct))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
 - 25s - loss: 0.4859 - acc: 0.8622 - val_loss: 0.1544 - val_acc: 0.9555
Epoch 2/10
 - 22s - loss: 0.1277 - acc: 0.9613 - val_loss: 0.0868 - val_acc: 0.9741
Epoch 3/10
 - 21s - loss: 0.0895 - acc: 0.9730 - val_loss: 0.0668 - val_acc: 0.9794
Epoch 4/10
 - 22s - loss: 0.0721 - acc: 0.9775 - val_loss: 0.0642 - val_acc: 0.9798
Epoch 5/10
 - 22s - loss: 0.0614 - acc: 0.9811 - val_loss: 0.0563 - val_acc: 0.9820
Epoch 6/10
 - 22s - loss: 0.0529 - acc: 0.9841 - val_loss: 0.0519 - val_acc: 0.9832
Epoch 7/10
 - 22s - loss: 0.0481 - acc: 0.9848 - val_loss: 0.0449 - val_acc: 0.9859
Epoch 8/10
 - 22s - loss: 0.0423 - acc: 0.9871 - val_loss: 0.0441 - val_acc: 0.9848
Epoch 9/10
 - 23s - loss: 0.0382 - acc: 0.9886 - val_loss: 0.0392 - val_acc: 0.9872
Epoch 10/10
 - 29s - loss: 0.0345 - acc: 0.9892 - val_loss: 0.0416 - val_acc: 0.9865
Accuracy: 98.65 % 
 Error: 1.3499999999999943 %
