In [39]:
from __future__ import print_function
import numpy as np
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers.core import Dense, Activation, Dropout #Add Dropout layer
from keras.optimizers import SGD
from keras.utils import np_utils

In [40]:
# Seed NumPy's global random number generator for reproducibility
np.random.seed(seed=1671)

In [41]:
# --- Network architecture ---
N_HIDDEN = 128           # width passed to each hidden Dense layer
NB_CLASSES = 10          # number of categories (digits) in the MNIST data set
DROPOUT = 0.3            # dropout constant handed to the Dropout layers

# --- Training settings ---
NB_EPOCH = 20
BATCH_SIZE = 128
VALIDATION_SPLIT = 0.2   # split between training and validation sets
OPTIMIZER = SGD()        # stochastic gradient descent, constructed with no arguments
VERBOSE = 1

In [42]:
# Load MNIST; load_data() hands back a (train, test) pair of (images, labels)
train_split, test_split = mnist.load_data()
X_train, y_train = train_split
X_test, y_test = test_split
# Show the shape of the raw training images
X_train.shape

(60000, 28, 28)

In [43]:
# Data massaging to get to a usable format:
# each 28 x 28 image is flattened into one row of RESHAPED (= 784) values,
# converted to float32 and divided by 255.
#
# NOTE: this cell reassigns X_train / X_test, so running it a second time
# without re-running the load cell divides the data by 255 again.
RESHAPED = 784


def _flatten_and_scale(images, n_features):
    """Return `images` as a float32 array of shape (n_samples, n_features) / 255.

    The number of rows is taken from `images.shape[0]` instead of a
    hard-coded sample count, so the same code works for any split size.
    """
    flat = images.reshape(images.shape[0], n_features)
    return flat.astype('float32') / 255


X_train = _flatten_and_scale(X_train, RESHAPED)
X_test = _flatten_and_scale(X_test, RESHAPED)
print(X_train.shape[0], 'training samples')
print(X_test.shape[0], 'testing samples')

60000 training samples
10000 testing samples


In [44]:
# One-hot encode both label vectors into binary class matrices with
# NB_CLASSES columns (a generator expression keeps the loop variable local)
Y_train, Y_test = (
    np_utils.to_categorical(labels, NB_CLASSES)
    for labels in (y_train, y_test)
)

In [45]:
# Multi-layer perceptron: two hidden Dense -> ReLU -> Dropout stages (added to
# test their effect on accuracy) followed by a softmax output over NB_CLASSES.
model = Sequential([
    # Hidden stage 1 -- the input shape is specified only on the first layer
    Dense(N_HIDDEN, input_shape=(RESHAPED,)),
    Activation('relu'),
    Dropout(DROPOUT),
    # Hidden stage 2
    Dense(N_HIDDEN),
    Activation('relu'),
    Dropout(DROPOUT),
    # Output layer: one unit per class, normalised with softmax
    Dense(NB_CLASSES),
    Activation('softmax'),
])
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_36 (Dense)             (None, 128)               100480    
_________________________________________________________________
activation_37 (Activation)   (None, 128)               0         
_________________________________________________________________
dropout_1 (Dropout)          (None, 128)               0         
_________________________________________________________________
dense_37 (Dense)             (None, 128)               16512     
_________________________________________________________________
activation_38 (Activation)   (None, 128)               0         
_________________________________________________________________
dropout_2 (Dropout)          (None, 128)               0         
_________________________________________________________________
dense_38 (Dense)             (None, 10)                1290      
__________

In [46]:
# Attach the loss, optimizer and accuracy metric to the model
model.compile(
    optimizer=OPTIMIZER,
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

# Train, holding out VALIDATION_SPLIT of the training data for validation
history = model.fit(
    X_train, Y_train,
    epochs=NB_EPOCH,
    batch_size=BATCH_SIZE,
    validation_split=VALIDATION_SPLIT,
    verbose=VERBOSE,
)

# Evaluate on the test set; the first two entries of `score` are reported
# as the test score and the test accuracy respectively
score = model.evaluate(X_test, Y_test, verbose=VERBOSE)
test_score, test_accuracy = score[0], score[1]
print("Test score:", test_score)
print("Test accuracy:", test_accuracy)

Train on 48000 samples, validate on 12000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Test score: 0.199432100251
Test accuracy: 0.9401
