# MNIST database of handwritten digits. 1st version of a Keras Neural Network (no hidden layers).

## Dataset source: <http://yann.lecun.com/exdb/mnist/>

In [0]:
import numpy as np
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers.core import Dense, Activation
from keras.optimizers import SGD
from keras.utils import np_utils

In [0]:
# Fix the seed of NumPy's global random generator so that NumPy-driven
# randomness is repeatable from one run of the notebook to the next.
# NOTE(review): only NumPy is seeded here; whether the Keras backend draws its
# random numbers from NumPy depends on the backend in use — confirm.
SEED = 123
np.random.seed(SEED)

In [0]:
# --- Network and training configuration ---

# Width of the output layer: one unit per digit class.
NB_CLASSES = 10
# Note: no N_HIDDEN constant is defined because this first model has no hidden layers.

# Optimisation settings.
OPTIMIZER = SGD()   # Stochastic Gradient Descent with the library's default arguments
NB_EPOCH = 200      # number of training epochs
BATCH_SIZE = 128    # batch size handed to fit()
VERBOSE = 1         # verbosity level used for the fit/evaluate logs

# Fraction of the training data reserved for validation.
VALIDATION_SPLIT = 0.2

In [0]:
# Load MNIST through Keras. load_data() yields a (train, test) pair, each of
# which is an (images, labels) tuple; unpack them into separate arrays.
train_split, test_split = mnist.load_data()
X_train, y_train = train_split
X_test, y_test = test_split

In [47]:
# Display the shape of the raw training images before any reshaping.
X_train.shape # X_train holds 60000 images, each a 28x28 grid of values

(60000, 28, 28)

In [0]:
# Flatten every 28x28 image into one row of 784 values so it can be fed to a
# Dense layer.
RESHAPED = 28 * 28  # input features per image (784 pixel values)

# The number of rows is read from each array instead of being hard-coded as
# 60000 / 10000, so the cell keeps working on a subset or a different split.
# Cast to float32 so the pixel values can later be scaled to fractions.
X_train = X_train.reshape(X_train.shape[0], RESHAPED).astype('float32')
X_test = X_test.reshape(X_test.shape[0], RESHAPED).astype('float32')

In [49]:
# Normalize the pixel values by the maximum 8-bit intensity so they lie in [0, 1].
# The division happens in place, so it is guarded: re-running this cell must
# not divide arrays that are already normalized by 255 a second time.
PIXEL_MAX = 255
if X_train.max() > 1:
    X_train /= PIXEL_MAX
if X_test.max() > 1:
    X_test /= PIXEL_MAX

# Build each message as a single string: print(a, b) shows a tuple when the
# notebook runs on Python 2, whereas one formatted string prints the same
# plain text on Python 2 and Python 3.
print('{} training set'.format(X_train.shape[0]))
print('{} testing set'.format(X_test.shape[0]))

(60000, 'training set')
(10000, 'testing set')


In [0]:
# One-hot encode the integer class labels: every label vector becomes a
# binary class matrix with NB_CLASSES columns.
Y_train, Y_test = (
    np_utils.to_categorical(labels, NB_CLASSES)
    for labels in (y_train, y_test)
)

In [0]:
# Build the model as a linear stack of layers, passing the layers to
# Sequential as a list rather than appending them one by one.
model = Sequential([
    # Output layer: NB_CLASSES neurons fed directly by the RESHAPED inputs
    Dense(NB_CLASSES, input_shape=(RESHAPED,)),
    # Final stage: softmax over the NB_CLASSES outputs
    Activation('softmax'),
])

In [52]:
# Print the layer-by-layer summary of the model (layer types, output shapes
# and parameter counts).
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_2 (Dense)              (None, 10)                7850      
_________________________________________________________________
activation_2 (Activation)    (None, 10)                0         
Total params: 7,850
Trainable params: 7,850
Non-trainable params: 0
_________________________________________________________________


In [0]:
# Configure the model for training: categorical cross-entropy loss against the
# one-hot targets, the optimizer from the configuration cell, and accuracy
# reported as an additional metric.
model.compile(
    optimizer=OPTIMIZER,
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [54]:
# Train the model, holding out VALIDATION_SPLIT of the training data for
# validation; the returned object is kept in `history`.
history = model.fit(
    X_train,
    Y_train,
    epochs=NB_EPOCH,
    batch_size=BATCH_SIZE,
    validation_split=VALIDATION_SPLIT,
    verbose=VERBOSE,
)

Train on 48000 samples, validate on 12000 samples
Epoch 1/200
Epoch 2/200
Epoch 3/200
Epoch 4/200
Epoch 5/200
Epoch 6/200
Epoch 7/200
Epoch 8/200

Epoch 9/200
Epoch 10/200
Epoch 11/200
Epoch 12/200
Epoch 13/200
Epoch 14/200
Epoch 15/200
Epoch 16/200

Epoch 17/200
Epoch 18/200
Epoch 19/200
Epoch 20/200
Epoch 21/200
Epoch 22/200
Epoch 23/200
Epoch 24/200
 9984/48000 [=====>........................] - ETA: 0s - loss: 0.3556 - acc: 0.9047

Epoch 25/200
Epoch 26/200
Epoch 27/200
Epoch 28/200
Epoch 29/200
Epoch 30/200
Epoch 31/200
Epoch 32/200

Epoch 33/200
Epoch 34/200
Epoch 35/200
Epoch 36/200
Epoch 37/200
Epoch 38/200
Epoch 39/200
Epoch 40/200
10368/48000 [=====>........................] - ETA: 0s - loss: 0.3339 - acc: 0.9048

Epoch 41/200
Epoch 42/200
Epoch 43/200
Epoch 44/200
Epoch 45/200
Epoch 46/200
Epoch 47/200
Epoch 48/200
10240/48000 [=====>........................] - ETA: 0s - loss: 0.3225 - acc: 0.9065

Epoch 49/200
Epoch 50/200
Epoch 51/200
Epoch 52/200
Epoch 53/200
Epoch 54/200
Epoch 55/200
Epoch 56/200
 7552/48000 [===>..........................] - ETA: 0s - loss: 0.3307 - acc: 0.9084

Epoch 57/200
Epoch 58/200
Epoch 59/200
Epoch 60/200
Epoch 61/200
Epoch 62/200
Epoch 63/200
Epoch 64/200
 7808/48000 [===>..........................] - ETA: 0s - loss: 0.3053 - acc: 0.9155

Epoch 65/200
Epoch 66/200
Epoch 67/200
Epoch 68/200
Epoch 69/200
Epoch 70/200
Epoch 71/200
Epoch 72/200
 7936/48000 [===>..........................] - ETA: 0s - loss: 0.3080 - acc: 0.9171

Epoch 73/200
Epoch 74/200
Epoch 75/200
Epoch 76/200
Epoch 77/200
Epoch 78/200
Epoch 79/200
Epoch 80/200
10112/48000 [=====>........................] - ETA: 0s - loss: 0.2962 - acc: 0.9173

Epoch 81/200
Epoch 82/200
Epoch 83/200
Epoch 84/200
Epoch 85/200
Epoch 86/200
Epoch 87/200
Epoch 88/200
10368/48000 [=====>........................] - ETA: 0s - loss: 0.2970 - acc: 0.9157

Epoch 89/200
Epoch 90/200
Epoch 91/200
Epoch 92/200
Epoch 93/200
Epoch 94/200
Epoch 95/200
Epoch 96/200
 6528/48000 [===>..........................] - ETA: 1s - loss: 0.3074 - acc: 0.9156

Epoch 97/200
Epoch 98/200
Epoch 99/200
Epoch 100/200
Epoch 101/200
Epoch 102/200
Epoch 103/200
Epoch 104/200

Epoch 105/200
Epoch 106/200
Epoch 107/200
Epoch 108/200
Epoch 109/200
Epoch 110/200
Epoch 111/200
Epoch 112/200
 7808/48000 [===>..........................] - ETA: 0s - loss: 0.3022 - acc: 0.9143

Epoch 113/200
Epoch 114/200
Epoch 115/200
Epoch 116/200
Epoch 117/200
Epoch 118/200
Epoch 119/200
Epoch 120/200
 7808/48000 [===>..........................] - ETA: 0s - loss: 0.2846 - acc: 0.9182

Epoch 121/200
Epoch 122/200
Epoch 123/200
Epoch 124/200
Epoch 125/200
Epoch 126/200
Epoch 127/200
Epoch 128/200
 7808/48000 [===>..........................] - ETA: 0s - loss: 0.2924 - acc: 0.9187

Epoch 129/200
Epoch 130/200
Epoch 131/200
Epoch 132/200
Epoch 133/200
Epoch 134/200
Epoch 135/200
Epoch 136/200
10368/48000 [=====>........................] - ETA: 0s - loss: 0.2823 - acc: 0.9243

Epoch 137/200
Epoch 138/200
Epoch 139/200
Epoch 140/200
Epoch 141/200
Epoch 142/200
Epoch 143/200
Epoch 144/200
 5120/48000 [==>...........................] - ETA: 0s - loss: 0.2844 - acc: 0.9256

Epoch 145/200
Epoch 146/200
Epoch 147/200
Epoch 148/200
Epoch 149/200
Epoch 150/200
Epoch 151/200
Epoch 152/200
 7552/48000 [===>..........................] - ETA: 0s - loss: 0.2881 - acc: 0.9216

Epoch 153/200
Epoch 154/200
Epoch 155/200
Epoch 156/200
Epoch 157/200
Epoch 158/200
Epoch 159/200
Epoch 160/200
 5120/48000 [==>...........................] - ETA: 0s - loss: 0.2816 - acc: 0.9201

Epoch 161/200
Epoch 162/200
Epoch 163/200
Epoch 164/200
Epoch 165/200
Epoch 166/200
Epoch 167/200
Epoch 168/200
 7552/48000 [===>..........................] - ETA: 0s - loss: 0.2771 - acc: 0.9249

Epoch 169/200
Epoch 170/200
Epoch 171/200
Epoch 172/200
Epoch 173/200
Epoch 174/200
Epoch 175/200
Epoch 176/200
 2560/48000 [>.............................] - ETA: 1s - loss: 0.2832 - acc: 0.9156

Epoch 177/200
Epoch 178/200
Epoch 179/200
Epoch 180/200
Epoch 181/200
Epoch 182/200
Epoch 183/200
Epoch 184/200
 2688/48000 [>.............................] - ETA: 1s - loss: 0.2885 - acc: 0.9226

Epoch 185/200
Epoch 186/200
Epoch 187/200
Epoch 188/200
Epoch 189/200
Epoch 190/200
Epoch 191/200
Epoch 192/200
10112/48000 [=====>........................] - ETA: 0s - loss: 0.2732 - acc: 0.9253

Epoch 193/200
Epoch 194/200
Epoch 195/200
Epoch 196/200
Epoch 197/200
Epoch 198/200
Epoch 199/200
Epoch 200/200
10496/48000 [=====>........................] - ETA: 0s - loss: 0.2656 - acc: 0.9241



In [58]:
# Evaluate the trained model on the test set. `score` holds two values: the
# loss first, then the accuracy metric requested at compile time.
score = model.evaluate(X_test, Y_test, verbose=VERBOSE)
test_loss, test_accuracy = score

# Format each line as a single string: print("label", value) prints a tuple
# when the notebook runs on Python 2 and a doubled space on Python 3, whereas
# one formatted string prints the same plain text on both.
print("Test score: {}".format(test_loss))
print("Test accuracy: {}".format(test_accuracy))

('Test score: ', 0.27685544392764566)
('Test accuracy: ', 0.9225)
