In [1]:
# Baseline MLP for MNIST dataset

import numpy
from tensorflow.keras.datasets import mnist
from tensorflow.keras.layers import Dense
from tensorflow.keras.models import Sequential
from tensorflow.keras.utils import set_random_seed
from tensorflow.keras.utils import to_categorical
# Fix random seeds for reproducibility.
# Seeding NumPy alone does not make a Keras run repeatable; set_random_seed
# seeds Python's `random`, NumPy and TensorFlow in a single call.
seed = 7
set_random_seed(seed)
# load data
(X_train, y_train), (X_test, y_test) = mnist.load_data()
# flatten each 2-D image (rows x cols) into one vector of pixels per image
num_pixels = X_train.shape[1] * X_train.shape[2]
X_train = X_train.reshape((X_train.shape[0], num_pixels)).astype('float32')
X_test = X_test.reshape((X_test.shape[0], num_pixels)).astype('float32')
# normalize inputs from 0-255 to 0-1
X_train = X_train / 255
X_test = X_test / 255
# one hot encode outputs
# Compute the class count once and pass it to both calls so the train and
# test encodings always have the same width, even if one split happens to
# be missing the highest label.
num_classes = int(max(y_train.max(), y_test.max())) + 1
y_train = to_categorical(y_train, num_classes=num_classes)
y_test = to_categorical(y_test, num_classes=num_classes)
# define baseline model
def baseline_model():
    """Build and compile the baseline multi-layer perceptron.

    The network has one ReLU hidden layer with ``num_pixels`` units fed by
    ``num_pixels`` inputs, followed by a softmax output layer with
    ``num_classes`` units. Both sizes are read from module-level variables.

    Returns:
        The compiled ``Sequential`` model (categorical cross-entropy loss,
        Adam optimizer, accuracy metric).
    """
    hidden_layer = Dense(
        num_pixels,
        input_shape=(num_pixels,),
        kernel_initializer='normal',
        activation='relu',
    )
    output_layer = Dense(
        num_classes,
        kernel_initializer='normal',
        activation='softmax',
    )
    network = Sequential([hidden_layer, output_layer])
    network.compile(
        loss='categorical_crossentropy',
        optimizer='adam',
        metrics=['accuracy'],
    )
    return network
# Instantiate the compiled baseline network.
model = baseline_model()
# Train for 10 epochs in mini-batches of 200; the test split is passed as
# validation data so each epoch line also reports val_loss / val_accuracy.
model.fit(
    x=X_train,
    y=y_train,
    batch_size=200,
    epochs=10,
    verbose=2,
    validation_data=(X_test, y_test),
)
# Score the trained model on the test split; scores[1] is the accuracy
# metric requested at compile time (scores[0] is the loss).
scores = model.evaluate(X_test, y_test, verbose=0)
error_percent = 100 - scores[1] * 100
print("Baseline Error: %.2f%%" % error_percent)

2023-02-11 23:04:06.792508: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  SSE4.1
To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.
2023-02-11 23:06:00.501797: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations:  SSE4.1
To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.
2023-02-11 23:06:00.721647: I tensorflow/core/common_runtime/process_util.cc:146] Creating new thread pool with default inter op setting: 2. Tune using inter_op_parallelism_threads for best performance.


Epoch 1/10
300/300 - 26s - loss: 0.2793 - accuracy: 0.9212 - val_loss: 0.1398 - val_accuracy: 0.9598 - 26s/epoch - 88ms/step
Epoch 2/10
300/300 - 10s - loss: 0.1090 - accuracy: 0.9686 - val_loss: 0.1000 - val_accuracy: 0.9689 - 10s/epoch - 33ms/step
Epoch 3/10
300/300 - 13s - loss: 0.0713 - accuracy: 0.9791 - val_loss: 0.0786 - val_accuracy: 0.9745 - 13s/epoch - 43ms/step
Epoch 4/10
300/300 - 11s - loss: 0.0495 - accuracy: 0.9862 - val_loss: 0.0745 - val_accuracy: 0.9757 - 11s/epoch - 36ms/step
Epoch 5/10
300/300 - 12s - loss: 0.0373 - accuracy: 0.9895 - val_loss: 0.0663 - val_accuracy: 0.9798 - 12s/epoch - 40ms/step
Epoch 6/10
300/300 - 10s - loss: 0.0263 - accuracy: 0.9929 - val_loss: 0.0621 - val_accuracy: 0.9802 - 10s/epoch - 35ms/step
Epoch 7/10
300/300 - 11s - loss: 0.0195 - accuracy: 0.9950 - val_loss: 0.0618 - val_accuracy: 0.9811 - 11s/epoch - 38ms/step
Epoch 8/10
300/300 - 13s - loss: 0.0146 - accuracy: 0.9967 - val_loss: 0.0544 - val_accuracy: 0.9829 - 13s/epoch - 43ms/step
