In [None]:
import numpy as np
import matplotlib.pyplot as plt 
import tensorflow as tf
from tensorflow.keras.datasets import mnist
from tensorflow.keras.models import Model, Sequential
from tensorflow.keras.layers import Dense, Conv2D,Flatten,MaxPool2D,Input
from tensorflow.keras.utils import to_categorical



<h1>We load and preprocess our data</h1>

In [None]:
# Load the MNIST train/test split.
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Give every image an explicit channel axis -> (N, 28, 28, 1), cast to
# float32 and divide by 255.0 to rescale the pixel values.
X_train = X_train.reshape(-1, 28, 28, 1).astype(np.float32) / 255.0
X_test = X_test.reshape(-1, 28, 28, 1).astype(np.float32) / 255.0

# One-hot encode the labels into 10 classes (digits 0-9).
y_train = to_categorical(y_train, num_classes=10)
y_test = to_categorical(y_test, num_classes=10)

<h1>We define our first model</h1>

In [None]:
model = Sequential([
    # Expected input: one 28x28 image with a single channel.
    Input(shape=(28, 28, 1)),

    # First convolutional layer: 32 kernels of size 3x3. No padding is
    # requested, so the 28x28 input yields 32 feature maps of size 26x26
    # (output shape 26x26x32). Each kernel learns to respond to one local
    # pattern, e.g. an edge.
    # The ReLU activation adds non-linearity; without it the stacked layers
    # would only compose linear operations.
    Conv2D(filters=32, kernel_size=(3, 3), activation='relu'),

    # Max pooling keeps the strongest response in each 2x2 window, which
    # shrinks the feature maps.
    MaxPool2D(pool_size=(2, 2)),

    # Second convolutional layer: 64 kernels of size 3x3; 'same' padding
    # keeps the spatial size unchanged before the next pooling step.
    Conv2D(filters=64, kernel_size=(3, 3), padding='same', activation='relu'),
    MaxPool2D(pool_size=(2, 2)),

    # Flatten the feature maps into a single vector for the dense layers.
    Flatten(),
    Dense(units=128, activation='relu'),

    # Softmax turns the 10 outputs into class probabilities, one per
    # digit (0-9).
    Dense(units=10, activation='softmax'),
])

*Let's compile our model*
''
    

In [None]:
# Configure training: Adam optimizer, categorical cross-entropy loss
# (the loss that matches one-hot encoded labels) and accuracy as the
# reported metric.
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

*We can now train our model*

In [None]:
# Train for 5 epochs with mini-batches of 64 samples; 10% of the training
# data is held out for validation. The returned History object keeps the
# per-epoch metrics used by the cells below.
history = model.fit(
    x=X_train,
    y=y_train,
    batch_size=64,
    epochs=5,
    validation_split=0.1,
)

In [None]:
# Print the per-epoch training loss and accuracy recorded during fit().
for caption, metric_key in (('Our loss', 'loss'), ('Our accuracy', 'accuracy')):
    print(caption, history.history[metric_key])

In [None]:
# Let's visualize the performance

In [None]:
# Plot the training and validation loss recorded for each epoch.
# An explicit figure/axes pair is used instead of the implicit pyplot
# state so the cell does not depend on whichever figure is current.
fig, ax = plt.subplots()
ax.plot(history.history['loss'], label='train loss')
ax.plot(history.history['val_loss'], label='validation loss')
# Title fixed: this figure shows the loss, not the precision.
ax.set_title('The fluctuation of the loss')
ax.set_xlabel('Epoch')
ax.set_ylabel('loss')
ax.legend()
plt.show()

In [None]:
# Plot the training and validation accuracy recorded for each epoch.
ax = plt.gca()  # the current axes, i.e. what the pyplot helpers draw on
for metric_key, legend_text in (
    ('accuracy', 'train accuracy'),
    ('val_accuracy', 'validation accuracy'),
):
    ax.plot(history.history[metric_key], label=legend_text)
ax.set_title('The fluctuation of the accuracy')
ax.set_xlabel('Epoch')
ax.set_ylabel('accuracy')
ax.legend()
plt.show()