In [1]:
import tensorflow as tf
import numpy as np
from tensorflow import keras

In [2]:
# Hyperparameters for the network and its training run

# -- architecture --
NB_CLASSES = 10          # one output unit per digit class (width of the one-hot labels)
N_HIDDEN = 128           # units in each hidden dense layer
DROPOUT = 0.3            # dropout rate applied after each hidden layer

# -- training loop --
EPOCHS = 200             # number of passes over the training data
BATCH_SIZE = 128         # samples per gradient update
VERBOSE = 0              # verbosity flag handed to fit()
VALIDATION_SPLIT = 0.2   # share of the training data passed to fit() as validation_split

In [3]:
# Fetch MNIST through Keras; load_data() hands back a (train, test) pair,
# each of which is itself an (images, labels) pair.
mnist = keras.datasets.mnist
train_split, test_split = mnist.load_data()
X_train, Y_train = train_split
X_test, Y_test = test_split

In [4]:
# Inspect the dimensions of the raw training image array
X_train.shape

(60000, 28, 28)

In [5]:
# Flatten every 28x28 image into a 784-long float32 vector.
# The row count is inferred with -1 instead of being hard-coded (60000 / 10000),
# so the cell keeps working if the arrays are subsampled or replaced by a
# split of a different size.
RESHAPED = 784 #28x28
X_train = X_train.reshape(-1, RESHAPED).astype('float32')
X_test = X_test.reshape(-1, RESHAPED).astype('float32')

In [6]:
# Scale the pixel values into [0,1] by dividing by 255.
# NOTE: the division happens in place, so running this cell a second time
# divides the already-scaled arrays again.
for pixels in (X_train, X_test):
    pixels /= 255

In [7]:
# Replace the label arrays with their one-hot encoding, NB_CLASSES columns wide
one_hot = tf.keras.utils.to_categorical
Y_train = one_hot(Y_train, num_classes=NB_CLASSES)
Y_test = one_hot(Y_test, num_classes=NB_CLASSES)

In [8]:
# Build the model: two ReLU hidden layers of N_HIDDEN units, each followed by
# dropout, then a softmax layer with one unit per class.
#
# Only the first layer declares input_shape. A Sequential model takes each later
# layer's input from the layer before it, so the input_shape=(RESHAPED,) that
# used to be repeated on layers 2 and 3 had no effect and was misleading
# (dense_layer_2 has 128*128 + 128 = 16512 parameters, i.e. 128 inputs, not 784).
model = tf.keras.models.Sequential([
    keras.layers.Dense(N_HIDDEN,
                       input_shape=(RESHAPED,),
                       name='dense_layer_1',
                       activation='relu'),
    keras.layers.Dropout(DROPOUT),
    keras.layers.Dense(N_HIDDEN,
                       name='dense_layer_2',
                       activation='relu'),
    keras.layers.Dropout(DROPOUT),
    keras.layers.Dense(NB_CLASSES,
                       name='dense_layer_3',
                       activation='softmax'),
])
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_layer_1 (Dense)        (None, 128)               100480    
_________________________________________________________________
dropout (Dropout)            (None, 128)               0         
_________________________________________________________________
dense_layer_2 (Dense)        (None, 128)               16512     
_________________________________________________________________
dropout_1 (Dropout)          (None, 128)               0         
_________________________________________________________________
dense_layer_3 (Dense)        (None, 10)                1290      
Total params: 118,282
Trainable params: 118,282
Non-trainable params: 0
_________________________________________________________________


In [9]:
# Configure training: categorical cross-entropy loss (the labels are one-hot),
# the Adam optimizer, and accuracy as the reported metric.
model.compile(
    loss='categorical_crossentropy',
    optimizer='Adam',
    metrics=['accuracy'],
)

In [10]:
# Train the model.
# The History object returned by fit() is bound to `history` so the per-epoch
# metrics stay available after the run; previously the return value was left
# unbound. It is still the cell's last expression, so the displayed result is
# unchanged.
history = model.fit(X_train, Y_train,
                    batch_size=BATCH_SIZE,
                    epochs=EPOCHS,
                    verbose=VERBOSE,
                    validation_split=VALIDATION_SPLIT)
history

<tensorflow.python.keras.callbacks.History at 0x24dda430df0>

In [11]:
# Score the trained model on the test arrays; evaluate() yields the loss
# followed by the compiled metric (accuracy), which is then reported.
test_metrics = model.evaluate(X_test, Y_test)
test_loss, test_acc = test_metrics
print('Test accuracy -->', test_acc)

Test accuracy --> 0.9805999994277954
