In [103]:
import tensorflow as tf
import tensorflow_datasets as tfds
import numpy as np

Data

In [104]:
# download and load dataset and information of dataset
mnist_dataset, mnist_info = tfds.load(name = 'mnist', with_info = True, as_supervised = True)
# getting train and test data
mnist_train, mnist_test = mnist_dataset['train'], mnist_dataset['test']
# getting validation data
num_validation_samples = 0.1 * mnist_info.splits['train'].num_examples
num_validation_samples = tf.cast(num_validation_samples, tf.int64)

num_test_samples = mnist_info.splits['test'].num_examples
num_test_samples = tf.cast(num_test_samples, tf.int64)

# Scaling/transforming the input data

def scale(image, label):
    image = tf.cast(image, tf.float32)
    image  /= 255.
    return image, label


# dataset.map(function) applies custom transformation to a given dataset. 
# It takes as input a function which determines the transformation 
scaled_train_and_validation_data = mnist_train.map(scale)
test_data = mnist_test.map(scale)

# Shuffle the data 

BUFFER_SIZE = 10000
shuffled_train_and_validation_data = scaled_train_and_validation_data.shuffle(BUFFER_SIZE)

# validation, train data

validation_data = shuffled_train_and_validation_data.take(num_validation_samples)
train_data = shuffled_train_and_validation_data.skip(num_validation_samples)

BATCH_SIZE = 100
# dataset.batch(batch_size) method that combines consecutive elements of a dataset into batches
train_data = train_data.batch(BATCH_SIZE)
validation_data = validation_data.batch(num_validation_samples)
test_data = test_data.batch(num_test_samples)

validation_inputs, validation_targets = next(iter(validation_data))


Model


Outline the model

In [105]:
input_size = 784
output_size = 10
hidden_layer_size = 150 

model = tf.keras.Sequential([
    tf.keras.layers.Flatten(input_shape = (28,28,1)),
    tf.keras.layers.Dense(hidden_layer_size, activation = 'relu'),
    tf.keras.layers.Dense(hidden_layer_size, activation = 'relu'),
    tf.keras.layers.Dense(hidden_layer_size, activation = 'relu'),
    tf.keras.layers.Dense(output_size, activation = 'softmax')
])



The optimizer and loss function

In [106]:
model.compile(optimizer = 'adam', loss = 'sparse_categorical_crossentropy', metrics = ['accuracy'])



Training

In [107]:
epochs = 10
verbose = 2

model.fit(train_data, epochs = epochs, verbose = verbose, validation_steps = 1, validation_data=(validation_inputs, validation_targets))

Epoch 1/10
540/540 - 40s - loss: 0.2896 - accuracy: 0.9133 - val_loss: 0.0000e+00 - val_accuracy: 0.0000e+00
Epoch 2/10
540/540 - 35s - loss: 0.1102 - accuracy: 0.9665 - val_loss: 0.1012 - val_accuracy: 0.9670
Epoch 3/10
540/540 - 41s - loss: 0.0771 - accuracy: 0.9756 - val_loss: 0.0843 - val_accuracy: 0.9757
Epoch 4/10
540/540 - 38s - loss: 0.0595 - accuracy: 0.9812 - val_loss: 0.0695 - val_accuracy: 0.9778
Epoch 5/10
540/540 - 12s - loss: 0.0431 - accuracy: 0.9861 - val_loss: 0.0484 - val_accuracy: 0.9860
Epoch 6/10
540/540 - 12s - loss: 0.0385 - accuracy: 0.9876 - val_loss: 0.0493 - val_accuracy: 0.9850
Epoch 7/10
540/540 - 12s - loss: 0.0319 - accuracy: 0.9899 - val_loss: 0.0374 - val_accuracy: 0.9895
Epoch 8/10
540/540 - 12s - loss: 0.0267 - accuracy: 0.9916 - val_loss: 0.0438 - val_accuracy: 0.9863
Epoch 9/10
540/540 - 12s - loss: 0.0249 - accuracy: 0.9923 - val_loss: 0.0338 - val_accuracy: 0.9903
Epoch 10/10
540/540 - 12s - loss: 0.0229 - accuracy: 0.9923 - val_loss: 0.0274 - va

<tensorflow.python.keras.callbacks.History at 0x7f69e7f4f610>

In [108]:
test_loss , test_accuracy = model.evaluate(test_data)
print(test_loss, test_accuracy)

0.08561475574970245 0.978
