# In [None]:
import tensorflow as tf
import numpy as np
from tensorflow import keras

# For reproducibility, seed every random generator this script relies on.
# np.random.seed only seeds NumPy's global generator; TensorFlow's random
# ops have a separate global seed, set with tf.random.set_seed.
SEED = 1671
np.random.seed(SEED)
tf.random.set_seed(SEED)

# Network and training hyperparameters.
EPOCHS1L = 200           # epochs for the 1-layer network
EPOCHS = 50              # epochs for the (commented-out) multi-layer networks
BATCH_SIZE = 128         # batch_size passed to model.fit
VERBOSE = 1              # verbose flag passed to model.fit
NB_CLASSES = 10          # number of outputs = number of digits
N_HIDDEN = 128           # units per hidden layer in the multi-layer variants
VALIDATION_SPLIT = 0.2   # fraction of TRAIN reserved for VALIDATION

DROPOUT = 0.3            # dropout rate used by the multi-layer DROPOUT variant

# Load the MNIST dataset.
# The two prints below let you verify the train/test split, which is
# expected to be 60,000 and 10,000 samples respectively.
# NOTE: the labels are NOT one-hot encoded here; they stay as integer class
# ids, which is what the 'sparse_categorical_crossentropy' loss used at
# compile time expects.
mnist = keras.datasets.mnist
(X_train, Y_train), (X_test, Y_test) = mnist.load_data()
print(X_train.shape[0], 'train samples')
print(X_test.shape[0], 'test samples')


# Normalize pixel values into [0, 1].
X_train, X_test = X_train / 255.0, X_test / 255.0

# Flatten every 28x28 image into one row of 784 values.
RESHAPED = 784   # 28x28 input
# -1 lets NumPy infer the number of samples instead of hard-coding
# 60000 / 10000, so the script keeps working on a subset of the data.
X_train = X_train.reshape(-1, RESHAPED)
X_test = X_test.reshape(-1, RESHAPED)
Y_train = Y_train.astype('float32')
Y_test = Y_test.astype('float32')

### 1-layer NN: a single softmax layer mapping the RESHAPED inputs
### directly to NB_CLASSES outputs.
model = tf.keras.models.Sequential([
    keras.layers.Dense(
        NB_CLASSES,
        input_shape=(RESHAPED,),
        name='dense_layer',
        activation='softmax',
    ),
])


### multi-layer NN (alternative: uncomment to replace the model above)
#model = tf.keras.models.Sequential([
#    keras.layers.Dense(N_HIDDEN, input_shape=(RESHAPED,), name='dense_layer', activation='relu'),
#    keras.layers.Dense(N_HIDDEN, name='dense_layer_2', activation='relu'),
#    keras.layers.Dense(NB_CLASSES, name='dense_layer_3', activation='softmax'),
#])

### multi-layer NN with DROPOUT (alternative: uncomment to replace the model above)
#model = tf.keras.models.Sequential([
#    keras.layers.Dense(N_HIDDEN, input_shape=(RESHAPED,), name='dense_layer', activation='relu'),
#    keras.layers.Dropout(DROPOUT),
#    keras.layers.Dense(N_HIDDEN, name='dense_layer_2', activation='relu'),
#    keras.layers.Dropout(DROPOUT),
#    keras.layers.Dense(NB_CLASSES, name='dense_layer_3', activation='softmax'),
#])


# Print a summary of the model.
model.summary()

# Compile the model -- 1st try: SGD optimizer.
# Accuracy is tracked as the only metric.
model.compile(
    optimizer='SGD',
    loss='sparse_categorical_crossentropy',
    metrics=['accuracy'],
)

# Compile the model -- 2nd try: RMSProp optimizer.
#model.compile(
#    optimizer='RMSProp',
#    loss='sparse_categorical_crossentropy',
#    metrics=['accuracy'],
#)

# Compile the model -- 3rd try: Adam optimizer.
#model.compile(
#    optimizer='Adam',
#    loss='sparse_categorical_crossentropy',
#    metrics=['accuracy'],
#)

# Train the single-layer perceptron for EPOCHS1L epochs, holding out
# VALIDATION_SPLIT of the training data for validation.
model.fit(
    x=X_train,
    y=Y_train,
    batch_size=BATCH_SIZE,
    epochs=EPOCHS1L,
    verbose=VERBOSE,
    validation_split=VALIDATION_SPLIT,
)

# Train the multi-layer perceptron (use together with one of the
# multi-layer models; runs for EPOCHS epochs instead).
#model.fit(
#    x=X_train,
#    y=Y_train,
#    batch_size=BATCH_SIZE,
#    epochs=EPOCHS,
#    verbose=VERBOSE,
#    validation_split=VALIDATION_SPLIT,
#)

# Evaluate the trained model on the held-out test set; evaluate() yields
# the loss followed by the metrics requested at compile time.
test_loss, test_acc = model.evaluate(x=X_test, y=Y_test)
print('Test accuracy:', test_acc)

# Run the model on the test inputs to obtain its predictions.
predictions = model.predict(x=X_test)