In [31]:
from keras.datasets import mnist
import matplotlib.pyplot as plt
import numpy
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.utils import np_utils


# Load the MNIST train and test splits; each split is an (images, labels) pair.
(X_train,y_train),(X_test,y_test) = mnist.load_data()

In [32]:
# Fix NumPy's global RNG seed so NumPy-driven randomness is repeatable.
# NOTE(review): only NumPy is seeded here; whether that also covers the Keras
# backend's own random number generator depends on the backend -- confirm.
seed = 7
numpy.random.seed(seed)

In [33]:
# Inspect the raw training array's dimensions before any reshaping.
X_train.shape

(60000, 28, 28)

In [34]:
# Reload the raw arrays first so this cell is idempotent: everything below
# overwrites X_train / y_train in place, so re-running the cell (or running it
# after the CNN preprocessing cell) without a reload would scale the pixels
# twice, one-hot encode already-encoded labels, or compute a wrong num_pixels.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Flatten each 2-D image into a 1-D vector (28 * 28 = 784 values per image).
num_pixels = X_train.shape[1] * X_train.shape[2]

X_train = X_train.reshape(X_train.shape[0], num_pixels).astype('float32')
X_test = X_test.reshape(X_test.shape[0], num_pixels).astype('float32')

# Scale the pixel values (0 - 255) into the range 0 - 1.
X_train = X_train / 255
X_test = X_test / 255

# One-hot encode the output classes. The number of classes is taken from the
# training labels and passed explicitly for the test labels, so both label
# matrices are guaranteed to have the same width.
y_train = np_utils.to_categorical(y_train)
num_classes = y_train.shape[1]

y_test = np_utils.to_categorical(y_test, num_classes=num_classes)

In [45]:
def baseline_model():
    """Build and compile the fully connected baseline classifier.

    The network has one hidden ReLU layer with ``num_pixels`` units (taking
    ``num_pixels`` inputs) followed by a softmax output layer with
    ``num_classes`` units. Both sizes are read from notebook-level globals,
    so the preprocessing cell must have been run first.

    Returns:
        The compiled ``Sequential`` model (categorical cross-entropy loss,
        Adam optimizer, accuracy metric).
    """
    hidden_layer = Dense(
        num_pixels,
        input_dim=num_pixels,
        kernel_initializer='normal',
        activation='relu',
    )
    output_layer = Dense(
        num_classes,
        kernel_initializer='normal',
        activation='softmax',
    )

    model = Sequential([hidden_layer, output_layer])
    model.compile(
        optimizer='adam',
        loss='categorical_crossentropy',
        metrics=['accuracy'],
    )
    return model
    

In [46]:
# Build the baseline network and train it.
# NOTE: the test split doubles as validation data here, so the per-epoch
# val_* figures and the final score below are computed on the same samples.
model = baseline_model()
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    epochs=10,
    batch_size=200,
    verbose=2,
)

# scores[1] is the accuracy metric requested at compile time; report its
# complement as the classification error in percent.
scores = model.evaluate(X_test, y_test, verbose=2)
print("Baseline Error: %.2f%%" % (100 - scores[1]*100))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
 - 1s - loss: 0.2856 - acc: 0.9188 - val_loss: 0.1415 - val_acc: 0.9584
Epoch 2/10
 - 1s - loss: 0.1119 - acc: 0.9675 - val_loss: 0.1010 - val_acc: 0.9707
Epoch 3/10
 - 1s - loss: 0.0720 - acc: 0.9791 - val_loss: 0.0798 - val_acc: 0.9763
Epoch 4/10
 - 1s - loss: 0.0507 - acc: 0.9850 - val_loss: 0.0757 - val_acc: 0.9768
Epoch 5/10
 - 1s - loss: 0.0364 - acc: 0.9903 - val_loss: 0.0663 - val_acc: 0.9802
Epoch 6/10
 - 1s - loss: 0.0269 - acc: 0.9928 - val_loss: 0.0647 - val_acc: 0.9806
Epoch 7/10
 - 1s - loss: 0.0195 - acc: 0.9956 - val_loss: 0.0649 - val_acc: 0.9806
Epoch 8/10
 - 1s - loss: 0.0147 - acc: 0.9968 - val_loss: 0.0601 - val_acc: 0.9813
Epoch 9/10
 - 1s - loss: 0.0113 - acc: 0.9977 - val_loss: 0.0650 - val_acc: 0.9805
Epoch 10/10
 - 1s - loss: 0.0081 - acc: 0.9985 - val_loss: 0.0601 - val_acc: 0.9819
Baseline Error: 1.81%


In [4]:
## Trying to implement the same task using a Convolutional Neural Network


In [6]:
import numpy
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.layers import Flatten
from keras.layers.convolutional import Conv2D
from keras.layers.convolutional import MaxPooling2D
from keras.utils import np_utils
from keras import backend as K
# Use channels-first image tensors: (channels, rows, cols).
# `set_image_data_format('channels_first')` is the Keras 2 spelling of the
# legacy `set_image_dim_ordering('th')` call, which later Keras releases removed.
K.set_image_data_format('channels_first')


# Fix NumPy's global RNG seed so NumPy-driven randomness is repeatable.
seed = 7
numpy.random.seed(seed)

In [11]:
# Start from the raw arrays so this cell can be re-run safely.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Reshape the data to [samples, channels, 28, 28] (channels-first layout;
# 1 channel = grayscale, a colour image would have 3).
X_train = X_train.reshape(X_train.shape[0], 1, 28, 28).astype('float32')
X_test = X_test.reshape(X_test.shape[0], 1, 28, 28).astype('float32')

# Normalise the inputs from 0 - 255 to 0 - 1.
X_train = X_train / 255
X_test = X_test / 255

# One-hot encode the outputs. The class count comes from the training labels
# and is passed explicitly for the test labels, so both label matrices are
# guaranteed to have the same width.
y_train = np_utils.to_categorical(y_train)
num_class = y_train.shape[1]

y_test = np_utils.to_categorical(y_test, num_classes=num_class)


In [25]:
def baseline_cnn():
    """Build and compile a small convolutional classifier.

    Layers, in order: a 5x5 convolution with 24 filters (ReLU), 2x2 max
    pooling, 20% dropout, flatten, a 128-unit ReLU dense layer, and a softmax
    output layer with ``num_class`` units (``num_class`` is a notebook-level
    global set by the preprocessing cell).

    The input shape is hard-coded as channels-first ``(1, 28, 28)``, so the
    convolution and pooling layers are told the layout explicitly instead of
    depending on a global backend setting made in another cell.

    Returns:
        The compiled ``Sequential`` model (categorical cross-entropy loss,
        Adam optimizer, accuracy metric).
    """
    model = Sequential()
    model.add(Conv2D(24, (5, 5),
                     input_shape=(1, 28, 28),
                     data_format='channels_first',
                     activation='relu'))
    model.add(MaxPooling2D(pool_size=(2, 2), data_format='channels_first'))
    model.add(Dropout(0.2))
    model.add(Flatten())
    model.add(Dense(128, activation='relu'))
    model.add(Dense(num_class, activation='softmax'))

    model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

In [28]:
# Build the CNN and train it.
# NOTE: the test split doubles as validation data here, so the per-epoch
# val_* figures and the final score below are computed on the same samples.
model = baseline_cnn()
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    epochs=10,
    batch_size=200,
    verbose=1,
)

# scores[1] is the accuracy metric requested at compile time; report its
# complement as the classification error in percent.
scores = model.evaluate(X_test, y_test, verbose=0)
print("CNN error :%.2f%%" %(100 - scores[1]*100))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
CNN error :1.04%
