# Problem 2

Use this notebook to write your code for Problem 2.

In [1]:
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline

In [2]:
# load MNIST data into Keras format
import keras
from keras.datasets import mnist

# Load the MNIST dataset as (images, labels) pairs for the train and test splits.
(x_train, y_train), (x_test, y_test) = mnist.load_data()

Using TensorFlow backend.


In [3]:
# Show the array shapes of the training and test images, one per line.
print(x_train.shape, x_test.shape, sep='\n')

(60000, 28, 28)
(10000, 28, 28)


In [4]:
# One-hot encode the digit labels for use with categorical cross-entropy.
# `keras.utils.to_categorical` is the public entry point; the `np_utils`
# submodule path is not available in newer Keras releases.
# `num_classes` is passed explicitly so both splits always get 10 columns
# instead of a width inferred from the largest label present in each array.
# NOTE: this cell rebinds y_train / y_test, so run it once per kernel session.
y_train = keras.utils.to_categorical(y_train, num_classes=10)
y_test = keras.utils.to_categorical(y_test, num_classes=10)

In [5]:
# Normalize: scale every pixel value by 1/255
# (assumes the raw images hold values in 0..255 — TODO confirm).
x_train = x_train / 255
x_test = x_test / 255

In [6]:
# Append a trailing singleton channel axis to each image stack,
# e.g. (N, 28, 28) -> (N, 28, 28, 1), to match the model's input_shape.
x_train = np.expand_dims(x_train, axis=-1)
x_test = np.expand_dims(x_test, axis=-1)

In [7]:
# Confirm the channel axis was added: show both shapes, one per line.
print(x_train.shape, x_test.shape, sep='\n')

(60000, 28, 28, 1)
(10000, 28, 28, 1)


In [8]:
from keras.models import Sequential
from keras.layers import Dense, Activation, Dropout
from keras.layers import Conv2D, MaxPooling2D, Flatten, BatchNormalization
from keras import regularizers

# Sample model: two conv -> ReLU -> max-pool -> dropout stages, then a small
# dense classifier ending in a 10-way softmax.
# Note: to see how 'same' and 'valid' padding differ, compare the layer output
# shapes printed below, or read the Keras documentation.
model = Sequential([
    # convolutional stage 1
    Conv2D(8, (3, 3), padding='same', input_shape=(28, 28, 1)),
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.50),

    # convolutional stage 2
    Conv2D(8, (3, 3), padding='same'),
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.50),

    # classifier head
    Flatten(),
    Dense(64),
    Activation('relu'),
    Dense(10),
    Activation('softmax'),
])

In [9]:
# Walk the layer stack and print each layer followed by its output shape.
# A leading `None` in a shape means the model accepts any batch size.
for layer in model.layers:
    print(layer)
    print(layer.output_shape)

<keras.layers.convolutional.Conv2D object at 0x0000017F471C9F98>
(None, 28, 28, 8)
<keras.layers.core.Activation object at 0x0000017F471E6CF8>
(None, 28, 28, 8)
<keras.layers.pooling.MaxPooling2D object at 0x0000017F471E6CC0>
(None, 14, 14, 8)
<keras.layers.core.Dropout object at 0x0000017F3D7CA668>
(None, 14, 14, 8)
<keras.layers.convolutional.Conv2D object at 0x0000017F471CB518>
(None, 14, 14, 8)
<keras.layers.core.Activation object at 0x0000017F47200978>
(None, 14, 14, 8)
<keras.layers.pooling.MaxPooling2D object at 0x0000017F47287B00>
(None, 7, 7, 8)
<keras.layers.core.Dropout object at 0x0000017F3A67C358>
(None, 7, 7, 8)
<keras.layers.core.Flatten object at 0x0000017F472879E8>
(None, 392)
<keras.layers.core.Dense object at 0x0000017F472875F8>
(None, 64)
<keras.layers.core.Activation object at 0x0000017F4725DB38>
(None, 64)
<keras.layers.core.Dense object at 0x0000017F472E4BE0>
(None, 10)
<keras.layers.core.Activation object at 0x0000017F472E46D8>
(None, 10)


In [10]:
# total number of parameters in the model defined above
model.count_params()

26466

In [11]:
# Multi-class classification setup: RMSprop optimizer, categorical
# cross-entropy loss, and accuracy tracked as a metric.
model.compile(
    loss='categorical_crossentropy',
    optimizer='rmsprop',
    metrics=['accuracy'],
)

In [12]:
# Train for 10 epochs in mini-batches of 32 samples. The test split is passed
# as validation data, so the per-epoch validation metrics are test metrics.
history = model.fit(
    x_train, y_train,
    batch_size=32,
    epochs=10,
    validation_data=(x_test, y_test),
)

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


Above, we output the training loss/accuracy as well as the validation (here, the TEST) loss and accuracy. To confirm that these are right, we can explicitly print out the training and test losses/accuracies.

In [13]:
# The model reports two evaluation values, labelled by the names shown here:
# 1. loss (categorical cross-entropy, as set in compile)
# 2. accuracy
model.metrics_names

['loss', 'acc']

In [14]:
# loss and accuracy of the sample model on the training split
model.evaluate(x_train, y_train)



[0.084354429868236186, 0.97668333333333335]

In [15]:
# loss and accuracy of the sample model on the test split
model.evaluate(x_test, y_test)



[0.079333119192719459, 0.97889999999999999]

Not bad! Let's see if you can do better.

In [28]:
# Model for Problem D.
# Stated budget: <= 200 hidden units and >= 2 hidden layers.
# NOTE(review): the two Dense(128) layers below total 256 units on their own,
# which exceeds the 200-unit budget stated above — confirm how hidden units
# are counted and shrink the dense layers if the budget applies to them.
model = Sequential([
    # convolutional stage 1
    Conv2D(8, (3, 3), padding='same', input_shape=(28, 28, 1)),
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.50),

    # convolutional stage 2
    Conv2D(8, (3, 3), padding='same'),
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.50),

    # classifier head: two 128-unit dense layers, then a 10-way softmax
    Flatten(),
    Dense(128),
    Activation('relu'),
    Dense(128),
    Activation('relu'),
    Dense(10),
    Activation('softmax'),
])

In [19]:
# Walk the layer stack and print each layer followed by its output shape.
# A leading `None` in a shape means the model accepts any batch size.
# NOTE(review): this cell's saved execution count (In [19]) is lower than that
# of the model-definition cell before it (In [28]); re-run it so the printed
# shapes describe the current model.
for layer in model.layers:
    print(layer)
    print(layer.output_shape)

<keras.layers.convolutional.Conv2D object at 0x0000017F48D5C940>
(None, 28, 28, 8)
<keras.layers.core.Activation object at 0x0000017F48D5C240>
(None, 28, 28, 8)
<keras.layers.pooling.MaxPooling2D object at 0x0000017F48D5CEB8>
(None, 14, 14, 8)
<keras.layers.core.Dropout object at 0x0000017F479F3F28>
(None, 14, 14, 8)
<keras.layers.convolutional.Conv2D object at 0x0000017F48D8DB38>
(None, 14, 14, 8)
<keras.layers.core.Activation object at 0x0000017F48D5CEF0>
(None, 14, 14, 8)
<keras.layers.pooling.MaxPooling2D object at 0x0000017F48DAC630>
(None, 7, 7, 8)
<keras.layers.core.Dropout object at 0x0000017F48D8D7F0>
(None, 7, 7, 8)
<keras.layers.core.Flatten object at 0x0000017F48E06A90>
(None, 392)
<keras.layers.core.Dense object at 0x0000017F48E066A0>
(None, 128)
<keras.layers.core.Activation object at 0x0000017F48DF5668>
(None, 128)
<keras.layers.core.Dense object at 0x0000017F48E5FF98>
(None, 128)
<keras.layers.core.Activation object at 0x0000017F48E4AA58>
(None, 128)
<keras.layers.core.

In [29]:
# Multi-class classification setup: RMSprop optimizer, categorical
# cross-entropy loss, and accuracy tracked as a metric.
model.compile(
    loss='categorical_crossentropy',
    optimizer='rmsprop',
    metrics=['accuracy'],
)

In [30]:
# Train for 15 epochs in mini-batches of 32 samples. The test split is passed
# as validation data, so the per-epoch validation metrics are test metrics.
history = model.fit(
    x_train, y_train,
    batch_size=32,
    epochs=15,
    validation_data=(x_test, y_test),
)

Train on 60000 samples, validate on 10000 samples
Epoch 1/15
Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


In [31]:
# loss and accuracy of the Problem D model on the training split
model.evaluate(x_train, y_train)



[0.05795507019907236, 0.98271666666666668]

In [32]:
# loss and accuracy of the Problem D model on the test split
model.evaluate(x_test, y_test)



[0.058383460562210533, 0.98370000000000002]

In [33]:
# Model for Problem E.
# Stated budget: <= 1000 hidden units and >= 3 hidden layers.
# NOTE(review): the three Dense(512) layers below total 1536 units on their
# own, which exceeds the 1000-unit budget stated above — confirm how hidden
# units are counted and shrink the dense layers if the budget applies to them.
model = Sequential([
    # convolutional stage 1
    Conv2D(8, (3, 3), padding='same', input_shape=(28, 28, 1)),
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.50),

    # convolutional stage 2
    Conv2D(8, (3, 3), padding='same'),
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.50),

    # classifier head: three 512-unit dense layers, then a 10-way softmax
    Flatten(),
    Dense(512),
    Activation('relu'),
    Dense(512),
    Activation('relu'),
    Dense(512),
    Activation('relu'),
    Dense(10),
    Activation('softmax'),
])

In [34]:
# Walk the layer stack and print each layer followed by its output shape.
# A leading `None` in a shape means the model accepts any batch size.
for layer in model.layers:
    print(layer)
    print(layer.output_shape)

<keras.layers.convolutional.Conv2D object at 0x0000017F4A581518>
(None, 28, 28, 8)
<keras.layers.core.Activation object at 0x0000017F4A05F0F0>
(None, 28, 28, 8)
<keras.layers.pooling.MaxPooling2D object at 0x0000017F4A05FCF8>
(None, 14, 14, 8)
<keras.layers.core.Dropout object at 0x0000017F4A05FEB8>
(None, 14, 14, 8)
<keras.layers.convolutional.Conv2D object at 0x0000017F4A581908>
(None, 14, 14, 8)
<keras.layers.core.Activation object at 0x0000017F4A05FF60>
(None, 14, 14, 8)
<keras.layers.pooling.MaxPooling2D object at 0x0000017F4A565F60>
(None, 7, 7, 8)
<keras.layers.core.Dropout object at 0x0000017F4A592940>
(None, 7, 7, 8)
<keras.layers.core.Flatten object at 0x0000017F4A220DA0>
(None, 392)
<keras.layers.core.Dense object at 0x0000017F4A073AC8>
(None, 512)
<keras.layers.core.Activation object at 0x0000017F4A232E80>
(None, 512)
<keras.layers.core.Dense object at 0x0000017F4A2B17F0>
(None, 512)
<keras.layers.core.Activation object at 0x0000017F4A2DCDA0>
(None, 512)
<keras.layers.core.

In [35]:
# Multi-class classification setup: RMSprop optimizer, categorical
# cross-entropy loss, and accuracy tracked as a metric.
model.compile(
    loss='categorical_crossentropy',
    optimizer='rmsprop',
    metrics=['accuracy'],
)

In [36]:
# Train for 20 epochs in mini-batches of 32 samples. The test split is passed
# as validation data, so the per-epoch validation metrics are test metrics.
history = model.fit(
    x_train, y_train,
    batch_size=32,
    epochs=20,
    validation_data=(x_test, y_test),
)

Train on 60000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [37]:
# loss and accuracy of the Problem E model on the training split
model.evaluate(x_train, y_train)



[0.085722427699466544, 0.97606666666666664]

In [32]:
# Loss and accuracy on the test split.
# NOTE(review): this cell's saved execution count (In [32]) and its recorded
# output are identical to the Problem D test evaluation earlier in the
# notebook, so the numbers shown appear to predate the Problem E training run.
# Re-run this cell after training the Problem E model before reporting them.
model.evaluate(x=x_test, y=y_test)



[0.058383460562210533, 0.98370000000000002]