# Implementing a Multi-Layer Perceptron with Keras

In [6]:
import tensorflow

In [8]:
# Show the installed TensorFlow version so the results can be tied to it.
print(tensorflow.__version__)

1.14.0


In [7]:
# Show the version of the Keras API bundled inside TensorFlow (tensorflow.keras).
print(tensorflow.keras.__version__)

2.2.4-tf


In [3]:

from tensorflow.keras.datasets import mnist #since keras is actually a part of tensorflow
import matplotlib.pyplot as plt

  _np_qint8 = np.dtype([("qint8", np.int8, 1)])
  _np_quint8 = np.dtype([("quint8", np.uint8, 1)])
  _np_qint16 = np.dtype([("qint16", np.int16, 1)])
  _np_quint16 = np.dtype([("quint16", np.uint16, 1)])
  _np_qint32 = np.dtype([("qint32", np.int32, 1)])
  np_resource = np.dtype([("resource", np.ubyte, 1)])
  _np_qint8 = np.dtype([("qint8", np.int8, 1)])
  _np_quint8 = np.dtype([("quint8", np.uint8, 1)])
  _np_qint16 = np.dtype([("qint16", np.int16, 1)])
  _np_quint16 = np.dtype([("quint16", np.uint16, 1)])
  _np_qint32 = np.dtype([("qint32", np.int32, 1)])
  np_resource = np.dtype([("resource", np.ubyte, 1)])


In [9]:
import numpy as np
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.layers import Dropout
from tensorflow.keras.utils import to_categorical #np_utils is not supported in keras > 2.0 

In [10]:
# Load the MNIST dataset (downloaded on first use if it is not available locally).
# load_data() returns two (images, labels) pairs: the training split and the test split.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz


In [11]:
# Flatten each 28*28 image into a single 784-element vector.
# The vector length is computed from every axis after the sample axis rather
# than from shape[1] * shape[2], so re-running this cell on already-flattened
# data is a harmless no-op instead of an IndexError on the missing third axis.
num_pixels = int(np.prod(X_train.shape[1:]))
# The test split is reshaped with the training-derived length on purpose:
# a mismatch between the two splits fails loudly here.
X_train = X_train.reshape(X_train.shape[0], num_pixels).astype('float32')
X_test = X_test.reshape(X_test.shape[0], num_pixels).astype('float32')

In [12]:
# Rescale the inputs/predictors from the 0-255 range down to 0-1.
# NOTE: this cell is not idempotent; running it a second time divides
# the already-scaled data by 255 again.
X_train, X_test = (pixels / 255 for pixels in (X_train, X_test))

In [14]:
# One-hot encode the class labels with tensorflow.keras.utils.to_categorical.
# The guard makes the cell safe to re-run: labels that are already encoded
# (2-D) are left alone instead of being encoded a second time.
if y_train.ndim == 1:
    # Use one shared class count for both splits so the encoded matrices
    # always have the same width, even if a split lacks the highest label.
    num_classes = int(max(y_train.max(), y_test.max())) + 1
    y_train = to_categorical(y_train, num_classes)
    y_test = to_categorical(y_test, num_classes)
# Width of the one-hot matrix == number of output classes.
num_classes = y_train.shape[1]

### Baseline: one hidden layer with as many neurons as there are inputs (784)

In [15]:
# define baseline model
def baseline_model(input_dim=None, hidden_units=None, n_classes=None):
    """Build and compile a multi-layer perceptron with one hidden layer.

    The network is a ReLU hidden layer followed by a softmax output layer,
    compiled with categorical cross-entropy loss and the Adam optimizer.

    Args:
        input_dim: Length of each flattened input vector. Defaults to the
            notebook-level ``num_pixels``.
        hidden_units: Number of neurons in the hidden layer. Defaults to
            ``input_dim`` (as many neurons as inputs).
        n_classes: Number of output classes. Defaults to the notebook-level
            ``num_classes``.

    Returns:
        The compiled ``Sequential`` model, tracking accuracy as its metric.
    """
    # Resolve defaults at call time from the notebook globals so existing
    # zero-argument calls build exactly the same network as before.
    if input_dim is None:
        input_dim = num_pixels
    if hidden_units is None:
        hidden_units = input_dim
    if n_classes is None:
        n_classes = num_classes

    # create model
    model = Sequential()
    model.add(Dense(hidden_units, input_dim=input_dim, kernel_initializer='normal', activation='relu'))
    model.add(Dense(n_classes, kernel_initializer='normal', activation='softmax'))
    # Compile model
    model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

In [16]:
# Build a fresh baseline network for this run.
model = baseline_model()

# Train for 10 epochs with mini-batches of 200 samples. The test split is
# passed as validation data, so the per-epoch val_* figures are measured on
# the same samples as the final evaluation below.
model.fit(
    x=X_train,
    y=y_train,
    batch_size=200,
    epochs=10,
    verbose=2,
    validation_data=(X_test, y_test),
)

# Final evaluation on the test split; index 1 of the result is the accuracy
# metric requested at compile time, reported here as an error percentage.
scores = model.evaluate(x=X_test, y=y_test, verbose=0)
print("Baseline Error: %.2f%%" % (100 - scores[1] * 100))

Instructions for updating:
Call initializer instance with the dtype argument instead of passing it to the constructor
Train on 60000 samples, validate on 10000 samples
Epoch 1/10
60000/60000 - 4s - loss: 0.2787 - acc: 0.9209 - val_loss: 0.1354 - val_acc: 0.9615
Epoch 2/10
60000/60000 - 4s - loss: 0.1093 - acc: 0.9683 - val_loss: 0.0960 - val_acc: 0.9709
Epoch 3/10
60000/60000 - 3s - loss: 0.0708 - acc: 0.9797 - val_loss: 0.0752 - val_acc: 0.9769
Epoch 4/10
60000/60000 - 4s - loss: 0.0507 - acc: 0.9853 - val_loss: 0.0693 - val_acc: 0.9785
Epoch 5/10
60000/60000 - 3s - loss: 0.0360 - acc: 0.9894 - val_loss: 0.0673 - val_acc: 0.9794
Epoch 6/10
60000/60000 - 3s - loss: 0.0253 - acc: 0.9932 - val_loss: 0.0606 - val_acc: 0.9811
Epoch 7/10
60000/60000 - 3s - loss: 0.0194 - acc: 0.9950 - val_loss: 0.0624 - val_acc: 0.9798
Epoch 8/10
60000/60000 - 4s - loss: 0.0145 - acc: 0.9965 - val_loss: 0.0605 - val_acc: 0.9809
Epoch 9/10
60000/60000 - 4s - loss: 0.0104 - acc: 0.9979 - val_loss: 0.0610 - va