## MNIST dataset with Keras

In this project I predict the handwritten digit shown in each image, using its pixel values as the feature variables.

In [1]:
# NumPy, with its global random generator pinned to a fixed seed

import numpy

# A fixed seed makes NumPy's global RNG produce the same sequence on every run.
# NOTE(review): only NumPy is seeded here; confirm whether the Keras backend
# needs its own seed for fully reproducible training.
numpy.random.seed(seed=1337)

In [2]:
# importing required libraries

import keras #-----------------------------> Deep learning framework
from keras.models import Sequential #------> Defining model
from keras.layers import Dense #-----------> To add layers in neural net
from keras.optimizers import SGD #---------> Optimizer used when compiling the model
from keras.datasets import mnist #---------> importing mnist dataset

In [3]:
# Constants shared by the data-preparation, model and training cells

# The digits 0-9 give ten target classes.
num_classes = 10

# batch_size: number of training samples processed per step.
# epochs: number of full passes over the training dataset.
batch_size, epochs = 128, 20

In [4]:
# Load the MNIST data, which arrives already split into a training set and a
# test set; each split unpacks into an (images, labels) pair.

(x_train, y_train), (x_test, y_test) = mnist.load_data()

In [5]:
# Shapes of the four arrays returned by the loader, printed on one line
print(*(split.shape for split in (x_train, y_train, x_test, y_test)))

(60000, 28, 28) (60000,) (10000, 28, 28) (10000,)


In [6]:
# Flatten every image into a single feature row (28x28 = 784 for MNIST).
# The sample count is read from the array and the feature count is inferred
# with -1, so the cell no longer depends on the hard-coded 60000/10000/784.
x_train = x_train.reshape(x_train.shape[0], -1)
x_test = x_test.reshape(x_test.shape[0], -1)

# Work in float32 so the scaling below produces fractional values.
x_train = x_train.astype('float32')
x_test = x_test.astype('float32')

# Normalize pixel intensities from 0-255 down to 0-1.
# NOTE: x_train/x_test are rebound here, so re-running this cell without
# re-loading the data would divide by 255 a second time.
x_train /= 255
x_test /= 255

print(x_train.shape[0], 'train samples')
print(x_test.shape[0], 'test samples')

60000 train samples
10000 test samples


In [7]:
# Training features and training labels, one shape per line
print(x_train.shape, y_train.shape, sep='\n')

(60000, 784)
(60000,)


In [8]:
# Peek at the first training label (still an integer class id at this point)
y_train[0]

5

In [9]:
# One-hot encode the integer class labels into binary class matrices,
# e.g. 4 becomes [0, 0, 0, 0, 1, 0, 0, 0, 0, 0]

y_train = keras.utils.to_categorical(y_train, num_classes=num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes=num_classes)

# The label arrays are overwritten with their encoded form.

In [10]:
# The first training label again, now in its encoded form
y_train[0]

array([0., 0., 0., 0., 0., 1., 0., 0., 0., 0.], dtype=float32)

That's called a one-hot vector. 

In [11]:
# Start from an empty Sequential model; the layers are added in the next cell
model = Sequential()

In [12]:
# Two sigmoid hidden layers of 512 units each, followed by a softmax output
# layer with one unit per class. The first layer declares the 784-feature input.
# The sigmoid function maps any real number into the range 0-1.

model.add(Dense(units=512, activation='sigmoid', input_shape=(784,)))
model.add(Dense(units=512, activation='sigmoid'))
model.add(Dense(units=num_classes, activation='softmax'))

In [13]:
# What does the model look like?
# Prints each layer with its output shape and parameter count.

model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 512)               401920    
_________________________________________________________________
dense_1 (Dense)              (None, 512)               262656    
_________________________________________________________________
dense_2 (Dense)              (None, 10)                5130      
Total params: 669,706
Trainable params: 669,706
Non-trainable params: 0
_________________________________________________________________


In [14]:
# Configure training: categorical cross-entropy as the loss, an SGD optimizer
# built with its default arguments, and accuracy tracked as a metric.

model.compile(
    optimizer=SGD(),
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [15]:
# Train the network and keep what fit() returns in `history`.
# NOTE: the test split is also passed as validation data, so the validation
# metrics are computed on the same samples as the final evaluation.

history = model.fit(
    x=x_train,
    y=y_train,
    batch_size=batch_size,
    epochs=epochs,
    verbose=1,
    validation_data=(x_test, y_test),
)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [16]:
# Score the trained model on the test images and their one-hot labels

score = model.evaluate(x=x_test, y=y_test)



In [17]:
# Accuracy: the model was compiled with metrics=['accuracy'], so index 1 of the
# evaluate result is the accuracy (index 0 holds the loss value)

score[1]

0.880299985408783