In [None]:
# Importing the relevant packages
import datetime  # use it for LOG
import os

import tensorflow as tf
import tensorflow_datasets as tfds



## Downloading and preprocessing the data

In [None]:

# Shuffle buffer size; chosen to exceed the number of MNIST training examples
# so the whole training split fits in the shuffle buffer.
BUFFER_SIZE = 70_000
# Number of examples per training mini-batch.
BATCH_SIZE = 128
# Maximum number of training epochs (early stopping may end training sooner).
NUM_EPOCHS = 20

In [None]:
# Load MNIST through TensorFlow Datasets, requesting the dataset metadata
# (`with_info=True`) and (image, label) pairs (`as_supervised=True`).
mnist_dataset, mnist_info = tfds.load(
    name='mnist',
    with_info=True,
    as_supervised=True,
)

In [None]:
# Pull the 'train' and 'test' splits out of the loaded dataset.
mnist_train = mnist_dataset['train']
mnist_test = mnist_dataset['test']

In [None]:
# Creating a function to scale our data
def scale(image, label):
    """Cast `image` to float32 and divide it by 255; `label` is returned unchanged.

    Returns:
        A `(scaled_image, label)` tuple.
    """
    scaled_image = tf.cast(image, tf.float32) / 255.
    return scaled_image, label

In [None]:
# Apply `scale` to every (image, label) element of both splits.
train_and_validation_data = mnist_train.map(map_func=scale)
test_data = mnist_test.map(map_func=scale)

In [None]:
# Validation set size: 10% of the training split, stored as an int64 tensor
# because it is later used as a count for `take`/`skip` and as a batch size.
num_validation_samples = tf.cast(
    0.1 * mnist_info.splits['train'].num_examples,
    tf.int64,
)

In [None]:
# Test set size as an int64 tensor; later used as the test batch size.
num_test_samples = tf.cast(
    mnist_info.splits['test'].num_examples,
    tf.int64,
)

In [None]:
# Shuffle once and keep that order for every later iteration.
# With the default reshuffle_each_iteration=True the dataset is reshuffled each
# time it is iterated (i.e. every epoch), so the `take`/`skip` split performed
# afterwards would select different examples each epoch: validation examples
# would leak into training and `val_loss` would be measured on data the model
# has already been trained on.
# Trade-off: the training examples are also visited in the same order each epoch.
train_and_validation_data = train_and_validation_data.shuffle(
    BUFFER_SIZE,
    reshuffle_each_iteration=False,
)

In [None]:
# Split the shuffled data: the first `num_validation_samples` elements form
# the validation set and all remaining elements form the training set.
validation_data = train_and_validation_data.take(count=num_validation_samples)
train_data = train_and_validation_data.skip(count=num_validation_samples)

In [None]:
# Batch the datasets: mini-batches of BATCH_SIZE for training, while the
# validation and test sets each use a batch size equal to their sample count.
train_data = train_data.batch(batch_size=BATCH_SIZE)
validation_data = validation_data.batch(batch_size=num_validation_samples)
test_data = test_data.batch(batch_size=num_test_samples)

## Creating the model and training it

In [None]:
# SAME

In [None]:

# Convolutional classifier: two conv + max-pool stages, then a dense layer
# with 10 outputs and no activation (raw logits).
model = tf.keras.Sequential([
    tf.keras.layers.Conv2D(
        filters=50,
        kernel_size=5,
        activation='relu',
        input_shape=(28, 28, 1),
    ),
    tf.keras.layers.MaxPooling2D(pool_size=(2, 2)),
    tf.keras.layers.Conv2D(filters=50, kernel_size=3, activation='relu'),
    tf.keras.layers.MaxPooling2D(pool_size=(2, 2)),
    tf.keras.layers.Flatten(),
    tf.keras.layers.Dense(units=10),
])

In [None]:
# Print the layer-by-layer summary, limited to 75 characters per line.
model.summary(line_length=75)

In [None]:
# Loss for integer class labels; `from_logits=True` because the model's final
# Dense layer has no activation.
loss_fn = tf.keras.losses.SparseCategoricalCrossentropy(
    from_logits=True,
)

In [None]:
# Configure training: Adam optimizer, the loss defined above, accuracy metric.
model.compile(
    optimizer='adam',
    loss=loss_fn,
    metrics=['accuracy'],
)

In [None]:
# Early stopping to limit overfitting: watch the validation loss and stop
# once it has not improved for `patience` consecutive epochs.
early_stopping = tf.keras.callbacks.EarlyStopping(
    monitor='val_loss',
    mode='auto',
    min_delta=0,
    patience=2,
    verbose=0,
    restore_best_weights=True,  # keep the weights from the best epoch
)

In [None]:
# Log the training process for later inspection in TensorBoard.
# Each run gets its own timestamped directory, so repeated runs (e.g. with
# different parameters) are kept as separate trials.
# The path is built with os.path.join so it uses the platform's separator: a
# hard-coded "logs\\fit\\" prefix only forms a directory hierarchy on Windows
# and elsewhere would not end up under the "logs/fit" directory that the
# TensorBoard cell reads from.
log_dir = os.path.join(
    "logs",
    "fit",
    datetime.datetime.now().strftime("%Y%m%d-%H%M%S"),
)

# A callback is an operation Keras invokes during training (for example at
# the end of each epoch); this one writes TensorBoard logs to `log_dir`,
# including histograms every epoch (histogram_freq=1).
tensorboard_callback = tf.keras.callbacks.TensorBoard(log_dir=log_dir, histogram_freq=1)

In [None]:
# Train the network with both callbacks attached: TensorBoard logging and
# early stopping on the validation loss.
model.fit(
    x=train_data,
    epochs=NUM_EPOCHS,
    callbacks=[tensorboard_callback, early_stopping],
    validation_data=validation_data,
    verbose=2,  # one summary line per epoch
)

## Testing the model

In [None]:
# Evaluate the trained model on the test set; returns the loss followed by
# the compiled metric (accuracy).
test_loss, test_accuracy = model.evaluate(x=test_data)

In [None]:
# Report the test loss (4 decimals) and the test accuracy as a percentage.
summary_template = 'Test loss: {0:.4f}. Test accuracy: {1:.2f}%'
print(summary_template.format(test_loss, test_accuracy*100.))

## Visualizing in Tensorboard

In [None]:
# Load the TensorBoard notebook extension, then open TensorBoard on the
# "logs/fit" directory to visualize the logged training runs.
%load_ext tensorboard
%tensorboard --logdir "logs/fit" 
