In [None]:
import tensorflow as tf
import pandas as pd
import numpy as np
from tensorflow import keras
import tensorflow_datasets as tfds

In [None]:
# Load MNIST through tensorflow_datasets. as_supervised=True yields
# (image, label) pairs; with_info=True also returns the dataset metadata.
mnist_dataset, mnist_info = tfds.load(name='mnist', with_info=True, as_supervised=True)

mnist_train, mnist_test = mnist_dataset['train'], mnist_dataset['test']

# Reserve 10% of the training split for validation. The product is a float,
# so cast it to an integer count usable by take()/skip()/batch().
num_validation = 0.1 * mnist_info.splits['train'].num_examples
num_validation = tf.cast(num_validation, tf.int64)

# Number of examples in the TEST split (must be read from 'test', not 'train',
# so the value really describes the dataset it is later used to batch).
num_test_samples = mnist_info.splits['test'].num_examples
num_test_samples = tf.cast(num_test_samples, tf.int64)

def scale(image, label):
  """Return (image cast to float32 and divided by 255, label unchanged).

  Intended to be passed to Dataset.map so every (image, label) pair is
  rescaled the same way.
  """
  scaled_image = tf.cast(image, tf.float32) / 255.
  return scaled_image, label

# Apply the same scaling to the training and test splits (train first, then test).
scaled_train_data, test_data = (
    split.map(scale) for split in (mnist_train, mnist_test)
)

In [None]:
Buffer_size = 10000

# Shuffle ONCE with a fixed order before splitting. With the default
# reshuffle_each_iteration=True the dataset is reshuffled every time it is
# iterated, so take()/skip() would pick different elements on every epoch and
# validation samples would leak into the training batches.
scaled_shuffled_train_data = scaled_train_data.shuffle(
    Buffer_size, reshuffle_each_iteration=False)

# First num_validation elements of the fixed order form the validation set.
validation_data = scaled_shuffled_train_data.take(num_validation)

# Everything after them is training data. Reshuffling here (after the split)
# keeps a fresh sample order each epoch without touching the validation set.
train_data = scaled_shuffled_train_data.skip(num_validation).shuffle(Buffer_size)

In [None]:
Batch_size = 100

# Training uses mini-batches of Batch_size examples.
train_data = train_data.batch(Batch_size)

# Validation and test are not used for weight updates, so each is batched with
# a single large batch size (num_validation / num_test_samples respectively).
validation_data = validation_data.batch(num_validation)
test_data = test_data.batch(num_test_samples)

# Pull the first validation batch out of the dataset and unpack it into
# inputs and targets.
validation_batch = next(iter(validation_data))
validation_inputs, validation_targets = validation_batch

# **Model**

In [None]:
input_size = 784          # not referenced in this cell; the input shape is given to Flatten below
output_size = 10          # width of the final softmax layer
hidden_layer_size = 100   # width of each hidden layer

# Build the network layer by layer: flatten the (28, 28, 1) input, pass it
# through two ReLU hidden layers of equal width, and finish with a softmax layer.
model = keras.Sequential()
model.add(keras.layers.Flatten(input_shape=(28, 28, 1)))
model.add(keras.layers.Dense(hidden_layer_size, activation='relu'))
model.add(keras.layers.Dense(hidden_layer_size, activation='relu'))
model.add(keras.layers.Dense(output_size, activation='softmax'))

*Optimizer and the loss function*


In [None]:
# Configure training: Adam optimizer, sparse categorical cross-entropy loss
# (targets are passed as-is from the dataset, not one-hot encoded here),
# and accuracy reported as the metric.
model.compile(
    loss='sparse_categorical_crossentropy',
    optimizer='Adam',
    metrics=['accuracy'],
)

## **Training**

In [None]:
num_epochs = 5

# Validation is supplied as an (inputs, targets) pair taken from the
# pre-extracted validation batch; verbose=2 prints one summary line per epoch.
validation_pair = (validation_inputs, validation_targets)
model.fit(
    train_data,
    validation_data=validation_pair,
    epochs=num_epochs,
    verbose=2,
)

Epoch 1/5
540/540 - 5s - loss: 0.3298 - accuracy: 0.9069 - val_loss: 0.1728 - val_accuracy: 0.9462 - 5s/epoch - 9ms/step
Epoch 2/5
540/540 - 6s - loss: 0.1372 - accuracy: 0.9604 - val_loss: 0.1145 - val_accuracy: 0.9652 - 6s/epoch - 10ms/step
Epoch 3/5
540/540 - 4s - loss: 0.0978 - accuracy: 0.9706 - val_loss: 0.0933 - val_accuracy: 0.9710 - 4s/epoch - 7ms/step
Epoch 4/5
540/540 - 5s - loss: 0.0765 - accuracy: 0.9758 - val_loss: 0.0727 - val_accuracy: 0.9780 - 5s/epoch - 10ms/step
Epoch 5/5
540/540 - 4s - loss: 0.0609 - accuracy: 0.9811 - val_loss: 0.0701 - val_accuracy: 0.9777 - 4s/epoch - 7ms/step


<keras.src.callbacks.History at 0x7a0fe9ec7e50>

**WHAT HAPPENS INSIDE AN EPOCH**


1.   At the beginning of each epoch, the training loss will be set to 0
2.   The algorithm will iterate over a preset number of batches, all from train_data
3.   The weights and biases will be updated as many times as there are batches
4.   We will get a value for the loss function, indicating how the training is going
5.   We will also see a training accuracy
6.   At the end of the epoch, the algorithm will forward propagate the whole validation set

**When we reach the maximum number of epochs, the training will be over.**




In [None]:
# Evaluate the trained model on the batched test data; with the single
# 'accuracy' metric compiled in, the result unpacks into (loss, accuracy).
evaluation_results = model.evaluate(test_data)
test_loss, test_acc = evaluation_results





In [None]:
# Report the test loss and the test accuracy (as a percentage), both to two decimals.
report_template = 'Test loss = {0:.2f}. Test accuracy: {1:.2f}%'
test_accuracy_percent = test_acc*100
print(report_template.format(test_loss, test_accuracy_percent))

Test loss = 0.09. Test accuracy: 97.20%
