In [1]:
import os

import numpy
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.utils import np_utils

Using TensorFlow backend.


In [2]:
from keras.datasets import mnist

# Load the MNIST train and test splits through Keras, then unpack each split
# into its image array and label array.
train_split, test_split = mnist.load_data()
X_train, y_train = train_split
X_test, y_test = test_split

# Quick sanity check on what was loaded.
print('X_train shape:', X_train.shape)
print(len(X_train), 'train samples')
print(len(X_test), 'test samples')

X_train shape: (60000, 28, 28)
60000 train samples
10000 test samples


In [3]:
# Uncomment to inspect the first training image and the first five training labels
# X_train[0]
# y_train[0:5]

In [4]:
# NOTE: this cell overwrites X_train / X_test / y_train / y_test in place, so
# re-running it on its own would scale the inputs twice. Re-run the
# data-loading cell first.

# Each image is a 28x28 pixel image represented as a rank 2 matrix.
# Flatten every image into one vector. The vector length is derived from the
# per-image shape (28 * 28 = 784 here) rather than hard-coded.
num_pixels = int(numpy.prod(X_train.shape[1:]))
X_train = X_train.reshape(X_train.shape[0], num_pixels).astype('float32')
X_test = X_test.reshape(X_test.shape[0], num_pixels).astype('float32')

# Images represent a vector of float values ranging from 0-255.
# Normalize inputs to the standard 0-1 scale.
X_train = X_train / 255
X_test = X_test / 255

# Each Y category is represented as a 0-9 scalar.
# Best practice is to one-hot encode. The class count is computed once from
# both splits and passed explicitly, so the encoded train and test labels
# always have the same width even if one split lacks the highest label.
num_classes = int(max(y_train.max(), y_test.max())) + 1
y_train = np_utils.to_categorical(y_train, num_classes)
y_test = np_utils.to_categorical(y_test, num_classes)

In [5]:
# Uncomment to inspect the first five training labels after one-hot encoding
# y_train[0:5]

In [6]:
# Seed NumPy's global random number generator with a fixed value so that
# NumPy-driven randomness repeats from run to run.
# NOTE(review): only NumPy is seeded here. The TensorFlow backend reported at
# import time presumably keeps its own RNG state — confirm whether it also
# needs seeding for the training results to be reproducible.
seed = 42
numpy.random.seed(seed)

In [7]:
def FF_model(input_dim=None, n_classes=None, hidden_units=256):
    """Build and compile a feed-forward classifier with one hidden layer.

    The network is: Dense(hidden_units, relu) -> Dense(n_classes, softmax),
    both layers using the 'normal' weight initializer. It is compiled with
    categorical cross-entropy loss, the Adam optimizer and an accuracy metric.

    Args:
        input_dim: Length of each flattened input vector. Defaults to the
            notebook-level ``num_pixels``.
        n_classes: Number of output classes. Defaults to the notebook-level
            ``num_classes``.
        hidden_units: Width of the hidden layer.

    Returns:
        The compiled ``Sequential`` model, not yet trained.
    """
    # Fall back to the notebook-level values so existing `FF_model()` calls
    # keep behaving exactly as before.
    if input_dim is None:
        input_dim = num_pixels
    if n_classes is None:
        n_classes = num_classes

    # create model
    model = Sequential()
    model.add(Dense(hidden_units, input_dim=input_dim, init='normal', activation='relu'))
    model.add(Dense(n_classes, init='normal', activation='softmax'))
    # Compile model
    model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

In [8]:
# Build a fresh, untrained network.
model = FF_model()

# Train for 10 epochs in mini-batches of 200. The test split is passed as
# validation data, so the per-epoch val_* figures are measured on it.
holdout = (X_test, y_test)
model.fit(
    X_train,
    y_train,
    validation_data=holdout,
    nb_epoch=10,
    batch_size=200,
    verbose=2,
)

# Score the trained model on the test split. scores[1] is read as the
# accuracy, and the error rate is reported as its complement in percent.
scores = model.evaluate(X_test, y_test, verbose=0)
error_pct = 100 - scores[1] * 100
print("Baseline Error: %.2f%%" % error_pct)

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
2s - loss: 0.3926 - acc: 0.8963 - val_loss: 0.1964 - val_acc: 0.9424
Epoch 2/10
2s - loss: 0.1613 - acc: 0.9540 - val_loss: 0.1314 - val_acc: 0.9624
Epoch 3/10
2s - loss: 0.1140 - acc: 0.9678 - val_loss: 0.1034 - val_acc: 0.9685
Epoch 4/10
2s - loss: 0.0863 - acc: 0.9750 - val_loss: 0.0903 - val_acc: 0.9735
Epoch 5/10
2s - loss: 0.0682 - acc: 0.9805 - val_loss: 0.0829 - val_acc: 0.9760
Epoch 6/10
2s - loss: 0.0546 - acc: 0.9846 - val_loss: 0.0737 - val_acc: 0.9758
Epoch 7/10
2s - loss: 0.0440 - acc: 0.9880 - val_loss: 0.0700 - val_acc: 0.9782
Epoch 8/10
2s - loss: 0.0365 - acc: 0.9905 - val_loss: 0.0676 - val_acc: 0.9784
Epoch 9/10
2s - loss: 0.0300 - acc: 0.9923 - val_loss: 0.0637 - val_acc: 0.9800
Epoch 10/10
2s - loss: 0.0248 - acc: 0.9939 - val_loss: 0.0642 - val_acc: 0.9795
Baseline Error: 2.05%


In [9]:
# Once we like our model and training results,
# serialize the model so other apps can use it.
model_dir = "./models"
# Create the output directory first: open() below raises if ./models does not
# exist, which is the case on a fresh checkout.
os.makedirs(model_dir, exist_ok=True)

# serialize model architecture to JSON
model_json = model.to_json()
json_path = os.path.join(model_dir, "model.json")
with open(json_path, "w") as json_file:
    json_file.write(model_json)

# serialize weights to HDF5
weights_path = os.path.join(model_dir, "weights.h5")
model.save_weights(weights_path)
print("Saved model to disk")

Saved model to disk
