In [1]:
import numpy as np
from tensorflow import keras
import os
import cv2
from os import listdir
from os.path import isfile
from os.path import join
import time

import tensorflow as tf
import tensorflow.keras as keras
from tensorflow.keras.utils import to_categorical
from keras.models import Sequential
from keras.layers import *
from keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.callbacks import ReduceLROnPlateau
from tensorflow.keras.callbacks import EarlyStopping
from sklearn.model_selection import train_test_split

# Data Processing

In [2]:
# Load MNIST and add an explicit trailing channel axis so the arrays match the
# (28, 28, 1) input shape declared by the models in this notebook.
(train_data, train_label), (test_data, test_label) = keras.datasets.mnist.load_data()
train_data = train_data.reshape(-1, 28, 28, 1)
test_data = test_data.reshape(-1, 28, 28, 1)

# One-hot encode the 10 digit classes (needed for categorical_crossentropy).
train_label = to_categorical(train_label, 10)
test_label = to_categorical(test_label, 10)

# Training generator: scale pixels to [0, 1] and apply random shift / shear /
# zoom augmentation on the fly.
train_datagen = ImageDataGenerator(rescale=1./255,
                                   #rotation_range = 15,
                                   width_shift_range=0.2,
                                   height_shift_range=0.2,
                                   shear_range=0.2,
                                   zoom_range=0.2)

# Validation/test generator: rescaling only, no augmentation.
test_datagen = ImageDataGenerator(rescale=1./255)

# No ImageDataGenerator.fit() calls here: fit() only computes dataset statistics
# for featurewise_center / featurewise_std_normalization / zca_whitening, and
# none of those options is enabled on either generator.

# Halve the learning rate when val_loss has not improved for 2 epochs,
# never going below 1e-5.
LR_function = ReduceLROnPlateau(monitor='val_loss',
                                patience=2,
                                verbose=1,
                                factor=0.5,
                                min_lr=0.00001)

# Stop training when val_loss has not improved for 6 epochs.
# NOTE(review): restore_best_weights is left at its default, so the model keeps
# the weights of the last epoch run rather than the best one - confirm intended.
EarlyStop = EarlyStopping(monitor='val_loss',
                          patience=6,
                          verbose=1,
                          mode='min')

# Sanity check of the prepared array shapes.
print(train_data.shape)
print(train_label.shape)

(60000, 28, 28, 1)
(60000, 10)


# CNN-Mnist

In [9]:
# CNN for 28x28x1 MNIST digits.
#
# The network is four convolutional stages followed by a dense head. Every
# convolution is 3x3, "same"-padded, He-normal initialised with ReLU, and is
# followed by batch normalisation. Each stage ends with 2x2 max pooling and
# dropout (0.3).
model = Sequential()

# Number of filters of each conv layer, grouped by stage (conv1..conv9).
conv_stages = [
    (128, 128),        # conv1, conv2 -> pooling1
    (256, 256),        # conv3, conv4 -> pooling2
    (256, 512, 512),   # conv5, conv6, conv7 -> pooling3
    (512, 512),        # conv8, conv9 -> pooling4
]

is_first_layer = True
for stage_filters in conv_stages:
    for filters in stage_filters:
        # Only the very first layer declares the model's input shape.
        extra_kwargs = {"input_shape": (28, 28, 1)} if is_first_layer else {}
        model.add(Conv2D(filters, (3, 3), padding="same",
                         kernel_initializer="he_normal", activation='relu',
                         **extra_kwargs))
        model.add(BatchNormalization())
        is_first_layer = False
    model.add(MaxPooling2D(pool_size=(2, 2)))
    model.add(Dropout(0.3))

model.add(Flatten())

# Dense head: two hidden layers, each with batch normalisation and dropout.
for units in (512, 256):
    model.add(Dense(units, kernel_initializer="he_normal", activation='relu'))
    model.add(BatchNormalization())
    model.add(Dropout(0.3))

# 10-way softmax over the digit classes.
model.add(Dense(10, activation='softmax'))

# summary() prints the table itself and returns None, so it is not wrapped in
# print() (which would emit a stray "None" line).
model.summary()

Model: "sequential_2"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d_18 (Conv2D)           (None, 28, 28, 128)       1280      
_________________________________________________________________
batch_normalization_22 (Batc (None, 28, 28, 128)       512       
_________________________________________________________________
conv2d_19 (Conv2D)           (None, 28, 28, 128)       147584    
_________________________________________________________________
batch_normalization_23 (Batc (None, 28, 28, 128)       512       
_________________________________________________________________
max_pooling2d_8 (MaxPooling2 (None, 14, 14, 128)       0         
_________________________________________________________________
dropout_12 (Dropout)         (None, 14, 14, 128)       0         
_________________________________________________________________
conv2d_20 (Conv2D)           (None, 14, 14, 256)      

# CNN Training and Validation

In [10]:
# Training configuration for the CNN.
epoch = 50
batch_size = 32

model.compile(
    loss="categorical_crossentropy",
    optimizer="Adam",
    metrics=["accuracy"]
)

# Batch iterators: augmented training batches, rescale-only validation batches.
# NOTE(review): the MNIST test split is used as the validation set, so the
# LR schedule and early stopping are driven by test data.
train_flow = train_datagen.flow(train_data, train_label, batch_size=batch_size)
val_flow = test_datagen.flow(test_data, test_label, batch_size=batch_size)

# Step counts must be integers. len() of a flow iterator is the number of
# batches per pass (including a final partial batch), whereas the previous
# `shape[0] / batch_size` produced floats (e.g. 10000 / 32 = 312.5).
history = model.fit(train_flow,
                    steps_per_epoch=len(train_flow),
                    validation_data=val_flow,
                    validation_steps=len(val_flow),
                    epochs=epoch,
                    callbacks=[LR_function, EarlyStop])

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50

Epoch 00011: ReduceLROnPlateau reducing learning rate to 0.0005000000237487257.
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50

Epoch 00017: ReduceLROnPlateau reducing learning rate to 0.0002500000118743628.
Epoch 18/50
Epoch 19/50

Epoch 00019: ReduceLROnPlateau reducing learning rate to 0.0001250000059371814.
Epoch 20/50
Epoch 21/50
Epoch 22/50

Epoch 00022: ReduceLROnPlateau reducing learning rate to 6.25000029685907e-05.
Epoch 23/50
Epoch 24/50

Epoch 00024: ReduceLROnPlateau reducing learning rate to 3.125000148429535e-05.
Epoch 25/50
Epoch 26/50

Epoch 00026: ReduceLROnPlateau reducing learning rate to 1.5625000742147677e-05.
Epoch 00026: early stopping


# BP-Mnist

In [3]:
# Fully connected (BP) baseline for 28x28x1 MNIST digits: flatten the image,
# then two hidden dense layers and a 10-way softmax output.
model = Sequential()

model.add(Flatten(input_shape=[28, 28, 1]))

# Hidden layers: He-normal initialised ReLU units, each followed by batch
# normalisation and dropout (0.3).
for units in (512, 256):
    model.add(Dense(units, kernel_initializer="he_normal", activation='relu'))
    model.add(BatchNormalization())
    model.add(Dropout(0.3))

model.add(Dense(10, activation='softmax'))

# summary() prints the table itself and returns None, so it is not wrapped in
# print() (which would emit a stray "None" line).
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
flatten (Flatten)            (None, 784)               0         
_________________________________________________________________
dense (Dense)                (None, 512)               401920    
_________________________________________________________________
batch_normalization (BatchNo (None, 512)               2048      
_________________________________________________________________
dropout (Dropout)            (None, 512)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 256)               131328    
_________________________________________________________________
batch_normalization_1 (Batch (None, 256)               1024      
_________________________________________________________________
dropout_1 (Dropout)          (None, 256)               0

# BP Training and Validation

In [4]:
# Training configuration for the fully connected (BP) model.
epoch = 50
batch_size = 32

model.compile(
    loss="categorical_crossentropy",
    optimizer="Adam",
    metrics=["accuracy"]
)

# Batch iterators: augmented training batches, rescale-only validation batches.
# NOTE(review): the MNIST test split is used as the validation set, so the
# LR schedule and early stopping are driven by test data.
train_flow = train_datagen.flow(train_data, train_label, batch_size=batch_size)
val_flow = test_datagen.flow(test_data, test_label, batch_size=batch_size)

# Step counts must be integers. len() of a flow iterator is the number of
# batches per pass (including a final partial batch), whereas the previous
# `shape[0] / batch_size` produced floats (e.g. 10000 / 32 = 312.5).
history = model.fit(train_flow,
                    steps_per_epoch=len(train_flow),
                    validation_data=val_flow,
                    validation_steps=len(val_flow),
                    epochs=epoch,
                    callbacks=[LR_function, EarlyStop])

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50

Epoch 00023: ReduceLROnPlateau reducing learning rate to 0.0005000000237487257.
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50

Epoch 00027: ReduceLROnPlateau reducing learning rate to 0.0002500000118743628.
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50

Epoch 00031: ReduceLROnPlateau reducing learning rate to 0.0001250000059371814.
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50

Epoch 00043: ReduceLROnPlateau reducing learning rate to 6.25000029685907e-05.
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50

Epoch 00047: ReduceLROnPlateau reducing learning rate to 3.125000148429535e-05.
Epoch 48/50
Epoch 49/50

Epoch 00049: Red