# MNIST

## Keras MLP example

In [1]:
from tensorflow.keras.utils import to_categorical
from tensorflow.keras.datasets import mnist
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Dropout
from tensorflow.keras.optimizers import RMSprop

## Parameters

In [2]:
batch_size = 128   # samples per gradient update; passed to model.fit
num_classes = 10   # width of the one-hot label vectors and of the softmax output layer
epochs = 20        # number of training epochs requested from model.fit

## Data

In [3]:
# Load the MNIST train/test splits through the Keras dataset helper.
(x_train, y_train), (x_test, y_test) = mnist.load_data()

# Flatten every image into one row. The sample count is read from the array
# itself (instead of hard-coding 60000 / 10000) so the cell keeps working if a
# subset or a different split is used; -1 lets NumPy infer the feature count,
# which must match the model's input_shape of (784,).
x_train = x_train.reshape(len(x_train), -1)
x_test = x_test.reshape(len(x_test), -1)

# Cast to float32 and divide by 255 (presumably rescaling 0-255 pixel
# intensities to the [0, 1] range -- confirm against the dataset docs).
x_train = x_train.astype('float32') / 255
x_test = x_test.astype('float32') / 255

In [4]:
# Sanity check: display the (samples, features) shape of the flattened training set.
x_train.shape

(60000, 784)

In [5]:
# Sanity check: display the (samples, features) shape of the flattened test set.
x_test.shape

(10000, 784)

In [6]:
# Convert integer class vectors to binary (one-hot) class matrices.
# The ndim guard makes this cell safe to re-run: calling to_categorical on
# labels that are already one-hot would add another axis and break training.
if y_train.ndim == 1:
    y_train = to_categorical(y_train, num_classes)
if y_test.ndim == 1:
    y_test = to_categorical(y_test, num_classes)

## Building the Architecture

In [7]:
# MLP: two 512-unit ReLU hidden layers, each followed by dropout at rate 0.2,
# ending in a softmax layer with one unit per class.
model = Sequential([
    Dense(512, activation='relu', input_shape=(784,)),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

In [8]:
# Print the layer-by-layer output shapes and parameter counts.
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 512)               401920    
_________________________________________________________________
dropout (Dropout)            (None, 512)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 512)               262656    
_________________________________________________________________
dropout_1 (Dropout)          (None, 512)               0         
_________________________________________________________________
dense_2 (Dense)              (None, 10)                5130      
Total params: 669,706
Trainable params: 669,706
Non-trainable params: 0
_________________________________________________________________


In [9]:
# Configure training: Adam optimizer, categorical cross-entropy loss (labels
# are one-hot encoded), and accuracy tracked as the reported metric.
model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

## Training

In [10]:
# Train on the whole training set; fit returns a History object, which is
# what the cell displays once training finishes.
model.fit(
    x_train,
    y_train,
    epochs=epochs,
    batch_size=batch_size,
)

Train on 60000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


<tensorflow.python.keras.callbacks.History at 0x7fb10c1027b8>

## Test & evaluation

In [11]:
# evaluate returns the loss followed by the compiled metrics (accuracy here);
# unpack by name and display only the test accuracy.
test_loss, test_accuracy = model.evaluate(x_test, y_test, verbose=0)
test_accuracy

0.9815

In [12]:
import pandas as pd

In [13]:
# Predicted digit per test sample. Sequential.predict_classes is no longer
# available in recent TensorFlow releases; taking the argmax over the
# predicted class probabilities yields the same labels on every version.
preds = pd.Series(model.predict(x_test).argmax(axis=-1), name='preds')

# y_test is one-hot encoded, so argmax along each row recovers the integer
# label (vectorised replacement for the per-row list search).
reals = pd.Series(y_test.argmax(axis=1), name='reals')

# Confusion matrix: rows are the true digits, columns the predicted digits.
pd.crosstab(reals, preds)

preds,0,1,2,3,4,5,6,7,8,9
reals,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
0,971,2,0,2,1,0,2,1,0,1
1,0,1130,2,1,0,0,1,0,1,0
2,3,0,1012,5,3,0,1,4,3,1
3,0,0,4,993,0,3,0,3,2,5
4,1,1,1,0,967,0,5,0,0,7
5,2,0,0,9,0,872,2,3,1,3
6,2,3,0,1,9,4,935,0,4,0
7,0,3,10,0,0,0,0,1008,2,5
8,4,1,3,5,7,5,0,2,940,7
9,1,2,0,4,13,1,0,1,0,987
