In [6]:
from __future__ import print_function

import tensorflow as tf
from keras.datasets import mnist
import keras
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Dropout, Flatten
from tensorflow.keras.optimizers import RMSprop

In [7]:
# Training hyperparameters, kept together so they are easy to tune.
num_classes = 10   # number of target classes (digits 0-9)
epochs = 20        # full passes over the training set
batch_size = 128   # samples per gradient update

In [25]:
# Load the MNIST train/test split (images and integer digit labels).
(x_train, y_train), (x_test, y_test) = mnist.load_data()

# Flatten every image into a single feature vector. The sample count is taken
# from the array itself instead of being hard-coded (60000 / 10000), so this
# cell keeps working if the data is subsampled or the split changes.
x_train = x_train.reshape(x_train.shape[0], -1)
x_test = x_test.reshape(x_test.shape[0], -1)

# Cast to float32 and divide by 255 to rescale the pixel intensities
# (8-bit grayscale values per the Keras MNIST documentation) into [0, 1].
x_train = x_train.astype('float32') / 255
x_test = x_test.astype('float32') / 255

In [26]:
# Report how many samples each split contains.
for images, caption in ((x_train, 'train samples'), (x_test, 'test samples')):
    print(len(images), caption)

60000 train samples
10000 test samples


In [30]:
# One-hot encode the integer class labels into vectors of length num_classes,
# the target format expected by the categorical cross-entropy loss.
#
# The ndim guard makes this cell idempotent: the labels are overwritten in
# place, so without it a second run would one-hot encode the already encoded
# 2-D labels again and produce a rank-3 array.
if y_train.ndim == 1:
    y_train = keras.utils.to_categorical(y_train, num_classes)

if y_test.ndim == 1:
    y_test = keras.utils.to_categorical(y_test, num_classes)

In [31]:
# Sanity check: show the first training label after one-hot encoding
# (a length-10 vector with a single 1 marking the class).
y_train[0]

array([0., 0., 0., 0., 0., 1., 0., 0., 0., 0.], dtype=float32)

In [32]:
# Sanity check: confirm which container type holds the encoded labels.
type(y_train)

numpy.ndarray

## BUILD THE MODEL

In [14]:
model = Sequential()

# Sequential() creates an empty model: a linear stack to which the input, hidden and output layers are added one by one

In [16]:
# Build the whole network in a single expression. Constructing the model here
# (instead of calling model.add on a model created in another cell) makes the
# cell idempotent: re-running it always yields the same architecture rather
# than stacking a second copy of every layer onto the existing model.
model = Sequential([
    # First hidden layer: 512 ReLU units. It is the only hidden layer wired
    # directly to the input, so it declares the input size: input_shape=(784,)
    # means every unit receives the 784 features of one sample.
    Dense(512, activation='relu', input_shape=(784,)),

    # Dropout regularisation: during training each unit's output is zeroed
    # with probability 0.2.
    Dropout(0.2),

    # Second hidden layer: 512 ReLU units. Its input size (512) is inferred
    # from the output of the previous layer.
    Dense(512, activation='relu'),

    Dropout(0.2),

    # Output layer: one softmax unit per class.
    Dense(num_classes, activation='softmax'),
])

model.summary()


Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 512)               401920    
_________________________________________________________________
dropout (Dropout)            (None, 512)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 512)               262656    
_________________________________________________________________
dropout_1 (Dropout)          (None, 512)               0         
_________________________________________________________________
dense_2 (Dense)              (None, 10)                5130      
Total params: 669,706
Trainable params: 669,706
Non-trainable params: 0
_________________________________________________________________


Param # calculation

in HL1:
    
    param # = no of neurons in IL * no of neurons in HL1 + no of neurons in HL1 (one bias per neuron)

    784 * 512 + 512 = 401920    
    
    
in HL2:

    512 * 512 + 512 = 262656


in OL:

    512 * 10 + 10 = 5130


## COMPILE THE MODEL

In [17]:
# Configure training: RMSprop optimiser with its default settings,
# categorical cross-entropy loss (matches the one-hot targets and the softmax
# output), and accuracy reported as the tracked metric.
model.compile(
    optimizer=RMSprop(),
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [18]:
# RMSprop is a variant of gradient descent that scales each parameter's update by a running average of its recent squared gradients

## FIT THE MODEL

In [33]:
# Train the network. `history` keeps the per-epoch metrics returned by fit.
# NOTE: the test split is also passed as validation data, so the validation
# figures printed during training and the final test score come from the
# same samples.
history = model.fit(
    x_train,
    y_train,
    epochs=epochs,
    batch_size=batch_size,
    validation_data=(x_test, y_test),
    verbose=1,
)

# Final evaluation on the test split; returns the loss followed by the
# metrics configured at compile time.
score = model.evaluate(x_test, y_test, verbose=0)

Train on 60000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [34]:
# `score` holds the evaluation results: the loss first, then the accuracy
# metric requested when the model was compiled.
test_loss, test_accuracy = score
print('Test Loss: ', test_loss)
print('Test Score: ', test_accuracy)

Test Loss:  0.12168892770384618
Test Score:  0.9838
