# import the relevant packages


In [1]:
import numpy as np
import tensorflow as tf
import tensorflow_datasets as tfds

  from .autonotebook import tqdm as notebook_tqdm


# load the data

In [2]:
mnist_dataset,mnist_info = tfds.load(name='mnist',with_info=True,as_supervised=True)

In [38]:
mnist_train,mnist_test = mnist_dataset['train'],mnist_dataset['test']
num_validation_samples = 0.1*mnist_info.splits['train'].num_examples
num_validation_samples = tf.cast(num_validation_samples,tf.int64)
num_test_samples = mnist_info.splits['test'].num_examples
num_test_samples = tf.cast(num_test_samples,tf.int64)


def scale(image,label):
    image = tf.cast(image,tf.float32)
    image /=255.
    
    return image,label

scaled_train_and_validation_data = mnist_train.map(scale)
test_data = mnist_test.map(scale)

BUFFER_SIZE = 10000
shuffled_train_and_validation_data=scaled_train_and_validation_data.shuffle(BUFFER_SIZE)
validation_data = shuffled_train_and_validation_data.take(num_validation_samples)
train_data = shuffled_train_and_validation_data.skip(num_validation_samples)
BATCH_SIZE = 150
train_data = train_data.batch(BATCH_SIZE)
validation_data = validation_data.batch(num_validation_samples)
test_data = test_data.batch(num_test_samples)
validation_inputs,validation_targets = next(iter(validation_data))

# model


In [35]:
input_size = 784
output_size = 10
hidden_layer_size = 5000
model = tf.keras.Sequential([
    tf.keras.layers.Flatten(input_shape=(28,28,1)),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(hidden_layer_size,activation='relu'),
    tf.keras.layers.Dense(output_size,activation='softmax')
])

# optimizer and loss function

In [36]:
model.compile(optimizer='adam',loss='sparse_categorical_crossentropy',metrics=['accuracy'])

In [39]:
NUM_EPOCHS = 10
model.fit(train_data,epochs=NUM_EPOCHS,validation_data=(validation_inputs,validation_targets),verbose = 2)

Epoch 1/10
360/360 - 2s - loss: 0.0172 - accuracy: 0.9949 - val_loss: 0.0267 - val_accuracy: 0.9928 - 2s/epoch - 4ms/step
Epoch 2/10
360/360 - 1s - loss: 0.0103 - accuracy: 0.9974 - val_loss: 0.0211 - val_accuracy: 0.9937 - 1s/epoch - 4ms/step
Epoch 3/10
360/360 - 1s - loss: 0.0077 - accuracy: 0.9981 - val_loss: 0.0166 - val_accuracy: 0.9947 - 1s/epoch - 4ms/step
Epoch 4/10
360/360 - 1s - loss: 0.0057 - accuracy: 0.9986 - val_loss: 0.0141 - val_accuracy: 0.9953 - 1s/epoch - 4ms/step
Epoch 5/10
360/360 - 1s - loss: 0.0048 - accuracy: 0.9990 - val_loss: 0.0118 - val_accuracy: 0.9965 - 1s/epoch - 4ms/step
Epoch 6/10
360/360 - 1s - loss: 0.0033 - accuracy: 0.9994 - val_loss: 0.0099 - val_accuracy: 0.9975 - 1s/epoch - 4ms/step
Epoch 7/10
360/360 - 2s - loss: 0.0033 - accuracy: 0.9994 - val_loss: 0.0076 - val_accuracy: 0.9982 - 2s/epoch - 4ms/step
Epoch 8/10
360/360 - 1s - loss: 0.0026 - accuracy: 0.9996 - val_loss: 0.0062 - val_accuracy: 0.9985 - 1s/epoch - 4ms/step
Epoch 9/10
360/360 - 1s 

<keras.callbacks.History at 0x17d84462ed0>

# test the model

In [40]:
test_loss,test_accuracy = model.evaluate(test_data)



In [41]:
print('test loss:{0:.2f}. test accuracy:{1:.2f}%'.format(test_loss,test_accuracy*100))

test loss:0.08. test accuracy:98.35%
