**Alexnet implementation with adaptive learning rates and momentum**

In [1]:
import tensorflow as tf
from tensorflow.keras import datasets, layers, models
import matplotlib.pyplot as plt
import numpy as np
from keras.optimizers import SGD
import time

**Loading the dataset**

In [2]:
(X_train, y_train), (X_test,y_test) = datasets.cifar10.load_data()
X_train.shape

Downloading data from https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz


(50000, 32, 32, 3)

In [3]:
y_train = y_train.reshape(-1,)
y_test = y_test.reshape(-1,)

In [4]:
classes = ["airplane","automobile","bird","cat","deer","dog","frog","horse","ship","truck"]

**Visualizing images**

In [5]:
def plot_sample(X, y, index):
    plt.figure(figsize = (15,2))
    plt.imshow(X[index])
    plt.xlabel(classes[y[index]])

**Normalising the dataset**

In [6]:
X_train = X_train / 255.0
X_test = X_test / 255.0

**Training the model**

In [26]:
cnn = models.Sequential([
    layers.Conv2D(filters=32, kernel_size=(3, 3),activation='relu', input_shape=(32, 32, 3)),
    layers.BatchNormalization(),
    layers.MaxPooling2D((2, 2)),
    layers.Dropout(0.2),
    
    layers.Conv2D(filters=64, kernel_size=(3, 3), activation='relu'),
    layers.BatchNormalization(),
    layers.MaxPooling2D((2, 2)),
    layers.Dropout(0.3),

    layers.Conv2D(filters=192, kernel_size=(3, 3), activation='relu'),
    layers.BatchNormalization(),
    layers.MaxPooling2D((2, 2)),
    layers.Dropout(0.4),
    
    layers.Flatten(),
    layers.Dense(64, activation='relu'),
    layers.BatchNormalization(),
    layers.Dense(10, activation='softmax')
])

**Model summary**

In [None]:
cnn.summary()

In [27]:
cnn.compile(optimizer=SGD(learning_rate=0.1, momentum=0.9),
              loss='sparse_categorical_crossentropy',
              metrics=['accuracy'])

In [28]:
start_time = time.time() 
cnn.fit(X_train, y_train, epochs=20)
end_time = time.time()
time_taken = end_time - start_time
print('Time taken:',time_taken)    

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


<tensorflow.python.keras.callbacks.History at 0x7f9c2e650410>

**Score**

In [29]:
cnn.evaluate(X_test,y_test)



[0.7911699414253235, 0.7272999882698059]

**Classification report ie score on each class and final score**

In [30]:
from sklearn.metrics import confusion_matrix , classification_report
import numpy as np
y_pred = cnn.predict(X_test)
y_pred_classes = [np.argmax(element) for element in y_pred]

print("Classification Report: \n", classification_report(y_test, y_pred_classes))

Classification Report: 
               precision    recall  f1-score   support

           0       0.85      0.69      0.76      1000
           1       0.88      0.86      0.87      1000
           2       0.67      0.54      0.60      1000
           3       0.52      0.66      0.58      1000
           4       0.50      0.88      0.64      1000
           5       0.74      0.56      0.64      1000
           6       0.84      0.77      0.80      1000
           7       0.85      0.67      0.75      1000
           8       0.83      0.85      0.84      1000
           9       0.88      0.80      0.84      1000

    accuracy                           0.73     10000
   macro avg       0.76      0.73      0.73     10000
weighted avg       0.76      0.73      0.73     10000

