In [1]:
import tensorflow as tf

In [2]:
(X_train, y_train), (X_test, y_test) = tf.keras.datasets.mnist.load_data()

In [3]:
X_train = X_train.reshape(-1, 28, 28, 1)
X_test = X_test.reshape(-1, 28, 28, 1)

In [4]:
X_train = X_train.astype('float32')
X_test = X_test.astype('float32')

In [5]:
X_train /= 255
X_test /= 255

In [6]:
# one hot encoding of training and test labels
y_train = tf.keras.utils.to_categorical(y_train)
y_test = tf.keras.utils.to_categorical(y_test)

In [7]:
from sklearn.model_selection import train_test_split
X_train, X_validate, y_train, y_validate = train_test_split(X_train, y_train, test_size=0.2, random_state=13)

In [8]:
batch_size = 64
epochs = 20
num_classes = 10

In [9]:
from tensorflow.keras.models import Sequential, Model
from tensorflow.keras.layers import Dense, Dropout, Flatten, Conv2D, MaxPool2D, LeakyReLU

In [10]:
cnn = Sequential()

In [11]:
cnn.add(Conv2D(32, kernel_size=3, activation='linear', input_shape=(28, 28, 1), padding='same'))
cnn.add(LeakyReLU(alpha=0.1))
cnn.add(MaxPool2D((2, 2), padding='same'))

In [12]:
cnn.add(Dropout(0.25))

In [13]:
cnn.add(Conv2D(64, 3, activation='linear', padding='same'))
cnn.add(LeakyReLU(alpha=0.1))
cnn.add(MaxPool2D((2, 2), padding='same'))

In [14]:
cnn.add(Dropout(0.25))

In [15]:
cnn.add(Conv2D(128, 3, activation='linear', padding='same'))
cnn.add(LeakyReLU(alpha=0.1))                  
cnn.add(MaxPool2D(pool_size=(2, 2), padding='same'))

In [16]:
cnn.add(Dropout(0.4))

In [17]:
cnn.add(Flatten())
cnn.add(Dense(128, activation='linear'))
cnn.add(LeakyReLU(alpha=0.1))

In [18]:
cnn.add(Dropout(0.3))

In [19]:
cnn.add(Dense(num_classes, activation='softmax'))

In [20]:
cnn.compile(loss=tf.keras.losses.categorical_crossentropy, optimizer=tf.keras.optimizers.Adam(), metrics=['accuracy'])

In [21]:
cnn.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d (Conv2D)              (None, 28, 28, 32)        320       
_________________________________________________________________
leaky_re_lu (LeakyReLU)      (None, 28, 28, 32)        0         
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 14, 14, 32)        0         
_________________________________________________________________
dropout (Dropout)            (None, 14, 14, 32)        0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 14, 14, 64)        18496     
_________________________________________________________________
leaky_re_lu_1 (LeakyReLU)    (None, 14, 14, 64)        0         
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 7, 7, 64)          0

In [22]:
cnn.fit(X_train, y_train, batch_size=batch_size, epochs=epochs, verbose=1, validation_data=(X_validate, y_validate))

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


<tensorflow.python.keras.callbacks.History at 0x1b37fd61af0>

In [23]:
cnn.save('mnist.h5py')

Instructions for updating:
This property should not be used in TensorFlow 2.0, as updates are applied automatically.
Instructions for updating:
This property should not be used in TensorFlow 2.0, as updates are applied automatically.
INFO:tensorflow:Assets written to: mnist.h5py\assets


In [24]:
test_eval = cnn.evaluate(X_test, y_test, verbose=1)
print('Test loss:', test_eval[0])
print('Test accuracy:', test_eval[1])

Test loss: 0.02041202411055565
Test accuracy: 0.9940000176429749
