# AlexNet

#### AlexNet on CIFAR10 data

### Download the CIFAR10 data and do data preprocessing 

In [2]:
# Load tensorflow
import tensorflow as tf

# Loads the CIFAR dataset
(x_train, y_train), (x_test, y_test) = tf.keras.datasets.cifar10.load_data()

# Display our data shape/dimensions
print('x_train shape:', x_train.shape)
print(x_train.shape[0], 'train samples')
print(x_test.shape[0], 'test samples')

# Now we one hot encode outputs
num_classes = 10
y_train = tf.keras.utils.to_categorical(y_train, num_classes)
y_test = tf.keras.utils.to_categorical(y_test, num_classes)

Downloading data from https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz
x_train shape: (50000, 32, 32, 3)
50000 train samples
10000 test samples


<br>

### AlexNet Architecture

In [3]:
l2_reg = 0

# Initialize model
model = tf.keras.models.Sequential()

# 1st Conv Layer 
model.add(tf.keras.layers.Conv2D(filters=96, 
                                 kernel_size=(11, 11), 
                                 input_shape=x_train.shape[1:], # (32, 32, 3)
                                 padding='same',
                                 strides=(1,1), 
                                 kernel_regularizer=tf.keras.regularizers.l2(l2_reg)))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('relu'))
model.add(tf.keras.layers.MaxPooling2D(pool_size=(2, 2)))

# 2nd Conv Layer 
model.add(tf.keras.layers.Conv2D(filters=256, 
                                 kernel_size=(5, 5), 
                                 padding='same',
                                 strides=(1,1)))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('relu'))
model.add(tf.keras.layers.MaxPooling2D(pool_size=(2, 2)))

# 3rd Conv Layer 
model.add(tf.keras.layers.ZeroPadding2D((1, 1)))
model.add(tf.keras.layers.Conv2D(filters=512, 
                                 kernel_size=(3, 3), 
                                 padding='same',
                                 strides=(1,1)))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('relu'))
model.add(tf.keras.layers.MaxPooling2D(pool_size=(2, 2)))

# 4th Conv Layer 
model.add(tf.keras.layers.ZeroPadding2D((1, 1)))
model.add(tf.keras.layers.Conv2D(filters=1024, 
                                 kernel_size=(3, 3), 
                                 padding='same',
                                 strides=(1,1)))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('relu'))

# 5th Conv Layer 
model.add(tf.keras.layers.ZeroPadding2D((1, 1)))
model.add(tf.keras.layers.Conv2D(filters=1024, 
                                 kernel_size=(3, 3), 
                                 padding='same',
                                 strides=(1,1)))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('relu'))
model.add(tf.keras.layers.MaxPooling2D(pool_size=(2, 2)))

# 1st FC Layer
model.add(tf.keras.layers.Flatten())
model.add(tf.keras.layers.Dense(units=3072))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('relu'))
model.add(tf.keras.layers.Dropout(0.5))

# 2nd FC Layer
model.add(tf.keras.layers.Dense(units=4096))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('relu'))
model.add(tf.keras.layers.Dropout(0.5))

# 3rd FC Layer
model.add(tf.keras.layers.Dense(units=num_classes))
model.add(tf.keras.layers.BatchNormalization())
model.add(tf.keras.layers.Activation('softmax'))

print(model.summary())

model.compile(loss = 'categorical_crossentropy',
              optimizer = tf.keras.optimizers.Adadelta(),
              metrics = ['accuracy'])


Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
conv2d (Conv2D)              (None, 32, 32, 96)        34944     
_________________________________________________________________
batch_normalization (BatchNo (None, 32, 32, 96)        384       
_________________________________________________________________
activation (Activation)      (None, 32, 32, 96)        0         
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 16, 16, 96)        0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 16, 16, 256)       614656    
_________________________________________________________________
batch_normalization_1 (Batch (None, 16, 16, 256)       1024      
_________________________________________________________________
activation_1 (Activation)    (None, 16, 16, 256)       0

<br>

### Train

In [5]:
# Training Parameters
batch_size = 32
epochs = 5

history = model.fit(x_train, 
                    y_train,
                    batch_size=batch_size,
                    epochs=epochs,
                    validation_split=0.1,
                    shuffle=True)

# Evaluate the performance of our trained model
scores = model.evaluate(x_test, y_test, verbose=1)
print('Test loss:', scores[0])
print('Test accuracy:', scores[1])

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Test loss: 1.4650583267211914
Test accuracy: 0.5123000144958496


<br>

---

<br>