<a href="https://colab.research.google.com/github/swilsonmfc/deeplearning/blob/master/MnistKerasClassification.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# MNIST Classification
* Simple convnet to classify handwritten digits

In [0]:
from keras.datasets import mnist

from keras import layers
from keras import models
from keras import metrics
from keras import losses

from keras.utils import to_categorical

Using TensorFlow backend.


# Data

In [0]:
# Load the MNIST train/test splits (images plus integer digit labels).
(train_img, train_labels), (test_img, test_labels) = mnist.load_data()

# Add a trailing channel axis for Conv2D and divide by 255 so the pixel
# values become float32 fractions. Using -1 lets NumPy infer the sample
# count instead of hard-coding 60000 / 10000, so this cell keeps working
# if the data is subset for a quick experiment.
train_img = train_img.reshape((-1, 28, 28, 1))
train_img = train_img.astype('float32') / 255

test_img = test_img.reshape((-1, 28, 28, 1))
test_img = test_img.astype('float32') / 255

# One-hot encode the labels. Pinning num_classes keeps both label matrices
# 10 columns wide even if a split happens not to contain every digit.
train_labels = to_categorical(train_labels, num_classes=10)
test_labels  = to_categorical(test_labels, num_classes=10)

Downloading data from https://s3.amazonaws.com/img-datasets/mnist.npz


# Model
* Convnet taking in tensors (img_height, img_width, img_channels)
* For mnist these are (28, 28, 1)
* Image height, Image width 28 X 28
* Grey scale (1 channel)
* By contrast color images have 3 channels (RGB)
* To get our Convnet to output classes we:
 * Flatten our convnet
 * Pass through a dense layer
 * Output a size 10 softmax dense layer
 * The softmax gives us the probability that the image belongs to each digit class 0-9

In [0]:
# Convnet for 28x28x1 inputs: three 3x3 convolutions (32, 64, 64 filters)
# with max pooling after the first two, followed by a flatten, a 64-unit
# dense layer and a 10-way softmax output.
model = models.Sequential([
    layers.Conv2D(filters=32, kernel_size=(3, 3), activation='relu',
                  input_shape=(28, 28, 1)),
    layers.MaxPooling2D(pool_size=2, strides=2),
    layers.Conv2D(filters=64, kernel_size=(3, 3), activation='relu'),
    layers.MaxPooling2D(pool_size=2, strides=2),
    layers.Conv2D(filters=64, kernel_size=(3, 3), activation='relu'),
    layers.Flatten(),
    layers.Dense(units=64, activation='relu'),
    layers.Dense(units=10, activation='softmax'),
])
model.summary()





Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_1 (Conv2D)            (None, 26, 26, 32)        320       
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 13, 13, 32)        0         
_________________________________________________________________
conv2d_2 (Conv2D)            (None, 11, 11, 64)        18496     
_________________________________________________________________
max_pooling2d_2 (MaxPooling2 (None, 5, 5, 64)          0         
_________________________________________________________________
conv2d_3 (Conv2D)            (None, 3, 3, 64)          36928     
_________________________________________________________________
flatten_1 (Flatten)          (None, 576)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 64)           

# Compile & Fit
* Normally, we'd add a validation set
* Look for our training stop point
* Output graphs etc
* Here we're just going to train and look at loss and accuracy on the test set
* Timing:
 * On a CPU ~ 5 minutes
 * On a GPU ~ 45 seconds
* Overall we're really accurate without much effort (almost 99%)


In [0]:
# Configure training: RMSprop optimizer, categorical cross-entropy loss
# (labels are one-hot encoded), and accuracy reported as the metric.
compile_args = dict(
    optimizer='rmsprop',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)
model.compile(**compile_args)

# Train for 5 epochs in mini-batches of 64 samples.
model.fit(x=train_img, y=train_labels, batch_size=64, epochs=5)

# Score the trained model on the held-out test split and report both numbers.
loss, acc = model.evaluate(x=test_img, y=test_labels)
for label, value in (('Test Loss', loss), ('Test Accuracy', acc)):
    print(label, value)



Instructions for updating:
Use tf.where in 2.0, which has the same broadcast rule as np.where

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Test Loss 0.03472860807276611
Test Accuracy 0.9895
