## Dive into Deep Learning 8.1.5 (#4-5)

In [None]:
import torch
from torch import nn
from d2l import torch as d2l
import matplotlib.pyplot as plt

In [None]:
class AlexNet(d2l.Classifier):
    """AlexNet-style convolutional classifier.

    Five convolutional layers interleaved with three max-pooling layers
    feed a fully connected head of two 4096-unit layers (each followed by
    ReLU and dropout) and a final ``num_classes``-unit output layer.
    Lazy layers are used, so input channel/feature counts are inferred on
    the first forward pass.

    Args:
        lr: Learning rate, recorded through ``save_hyperparameters()``.
        num_classes: Number of units in the output layer.
    """
    def __init__(self, lr=0.1, num_classes=10):
        super().__init__()
        self.save_hyperparameters()

        # Convolutional feature extractor.
        conv_stack = [
            nn.LazyConv2d(96, kernel_size=11, stride=4, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.LazyConv2d(256, kernel_size=5, padding=2),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=3, stride=2),
            nn.LazyConv2d(384, kernel_size=3, padding=1),
            nn.ReLU(),
            nn.LazyConv2d(384, kernel_size=3, padding=1),
            nn.ReLU(),
            nn.LazyConv2d(256, kernel_size=3, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=3, stride=2),
        ]

        # Fully connected classifier with dropout after each hidden layer.
        dense_head = [
            nn.LazyLinear(4096),
            nn.ReLU(),
            nn.Dropout(p=0.5),
            nn.LazyLinear(4096),
            nn.ReLU(),
            nn.Dropout(p=0.5),
            nn.LazyLinear(num_classes),
        ]

        self.net = nn.Sequential(*conv_stack, nn.Flatten(), *dense_head)
        self.net.apply(d2l.init_cnn)

In [None]:
class LeNet(d2l.Classifier):  #@save
    """LeNet-5 convolutional classifier.

    Two sigmoid-activated convolution + average-pooling stages are followed
    by a fully connected head of 120, 84 and ``num_classes`` units. Lazy
    layers infer their input sizes on the first forward pass.

    Args:
        lr: Learning rate, recorded through ``save_hyperparameters()``.
        num_classes: Number of units in the output layer.
    """
    def __init__(self, lr=0.1, num_classes=10):
        super().__init__()
        self.save_hyperparameters()

        # Convolutional stages: conv -> sigmoid -> 2x2 average pooling.
        conv_stages = [
            nn.LazyConv2d(6, kernel_size=5, padding=2),
            nn.Sigmoid(),
            nn.AvgPool2d(kernel_size=2, stride=2),
            nn.LazyConv2d(16, kernel_size=5),
            nn.Sigmoid(),
            nn.AvgPool2d(kernel_size=2, stride=2),
        ]

        # Fully connected head.
        dense_head = [
            nn.LazyLinear(120),
            nn.Sigmoid(),
            nn.LazyLinear(84),
            nn.Sigmoid(),
            nn.LazyLinear(num_classes),
        ]

        self.net = nn.Sequential(*conv_stages, nn.Flatten(), *dense_head)

In [None]:
# Inspect AlexNet with a (1, 1, 224, 224) input shape; layer_summary is a d2l
# helper that presumably reports each layer's output shape.
alexnet_for_summary = AlexNet()
alexnet_for_summary.layer_summary((1, 1, 224, 224))

### 8.1.5 Exercises (#4)

In [None]:
# Exercise 4 baseline: AlexNet for 10 epochs on Fashion-MNIST resized to
# 224x224. `data` and `trainer` are reused by later cells.
data = d2l.FashionMNIST(batch_size=128, resize=(224, 224))
trainer = d2l.Trainer(max_epochs=10, num_gpus=1)
model_Alex_10 = AlexNet(lr=0.01)
trainer.fit(model_Alex_10, data)

# Use the last recorded validation accuracy as the figure title.
val_points_Alex_10 = model_Alex_10.board.data['val_acc']
acc_Alex_10 = val_points_Alex_10[-1].y
plt.title(f"AlexNet (10 epochs): {acc_Alex_10*100:.2f}%")
plt.ylabel('Loss/Accuracy')
plt.xlabel('Number of Epochs')
plt.show()

In [None]:
# LeNet comparison run: same 10-epoch trainer and dataset as the AlexNet
# baseline.
model_LeNet_10 = LeNet(lr=0.01)
trainer.fit(model_LeNet_10, data)

# Use the last recorded validation accuracy as the figure title.
val_points_LeNet_10 = model_LeNet_10.board.data['val_acc']
acc_LeNet_10 = val_points_LeNet_10[-1].y
plt.title(f"LeNet (10 epochs): {acc_LeNet_10*100:.2f}%")
plt.ylabel('Loss/Accuracy')
plt.xlabel('Number of Epochs')
plt.show()

In [None]:
# AlexNet for 20 epochs; `trainer_epoch20` is kept as a separate trainer so
# the 10-epoch `trainer` stays available.
trainer_epoch20 = d2l.Trainer(max_epochs=20, num_gpus=1)
model_Alex_20 = AlexNet(lr=0.01)
trainer_epoch20.fit(model_Alex_20, data)

# Use the last recorded validation accuracy as the figure title.
val_points_Alex_20 = model_Alex_20.board.data['val_acc']
acc_Alex_20 = val_points_Alex_20[-1].y
plt.title(f"AlexNet (20 epochs): {acc_Alex_20*100:.2f}%")
plt.ylabel('Loss/Accuracy')
plt.xlabel('Number of Epochs')
plt.show()

In [None]:
# LeNet comparison run for 20 epochs.
# Fit with the 20-epoch trainer: the plain `trainer` is configured with
# max_epochs=10, which would make the "20 epochs" title below wrong.
model_LeNet_20 = LeNet(lr=0.01)
trainer_epoch20.fit(model_LeNet_20, data)

# Use the last recorded validation accuracy as the figure title.
acc_LeNet_20 = model_LeNet_20.board.data['val_acc'][-1].y
plt.title(f"LeNet (20 epochs): {acc_LeNet_20*100:.2f}%")
plt.xlabel('Number of Epochs')
plt.ylabel('Loss/Accuracy')
plt.show()

In [None]:
# AlexNet for 30 epochs; `trainer_epoch30` is kept as a separate trainer so
# the 10-epoch `trainer` stays available.
trainer_epoch30 = d2l.Trainer(max_epochs=30, num_gpus=1)
model_Alex_30 = AlexNet(lr=0.01)
trainer_epoch30.fit(model_Alex_30, data)

# Use the last recorded validation accuracy as the figure title.
val_points_Alex_30 = model_Alex_30.board.data['val_acc']
acc_Alex_30 = val_points_Alex_30[-1].y
plt.title(f"AlexNet (30 epochs): {acc_Alex_30*100:.2f}%")
plt.ylabel('Loss/Accuracy')
plt.xlabel('Number of Epochs')
plt.show()

In [None]:
# LeNet comparison run for 30 epochs.
# Fit with the 30-epoch trainer: the plain `trainer` is configured with
# max_epochs=10, which would make the "30 epochs" title below wrong.
model_LeNet_30 = LeNet(lr=0.01)
trainer_epoch30.fit(model_LeNet_30, data)

# Use the last recorded validation accuracy as the figure title.
acc_LeNet_30 = model_LeNet_30.board.data['val_acc'][-1].y
plt.title(f"LeNet (30 epochs): {acc_LeNet_30*100:.2f}%")
plt.xlabel('Number of Epochs')
plt.ylabel('Loss/Accuracy')
plt.show()

### 8.1.5 Exercises (#5-1)

In [None]:
class SimpleAlexNet(d2l.Classifier):
    """Simplified AlexNet: one conv/pool stage and a small dense head.

    The network is a single 16-channel 3x3 convolution with ReLU and 2x2
    max pooling, followed by a 256-unit hidden layer and a
    ``num_classes``-unit output layer.

    Lazy layers are used (as in the other models in this file) so that the
    input channel count and the flattened feature size are inferred on the
    first forward pass. The non-lazy ``nn.Conv2d`` / ``nn.Linear`` require
    both input and output sizes and raise ``TypeError`` when given only one.

    Args:
        lr: Learning rate, recorded through ``save_hyperparameters()``.
        num_classes: Number of units in the output layer.
    """
    def __init__(self, lr=0.1, num_classes=10):
        super().__init__()
        self.save_hyperparameters()
        self.net = nn.Sequential(
            nn.LazyConv2d(16, kernel_size=3, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.Flatten(),
            nn.LazyLinear(256),
            nn.ReLU(),
            nn.LazyLinear(num_classes)
        )
        self.net.apply(d2l.init_cnn)

In [None]:
# Exercise 5-1: train the simplified AlexNet for 10 epochs on the existing
# `data`; `trainer` is rebound to a fresh 10-epoch trainer.
trainer = d2l.Trainer(max_epochs=10, num_gpus=1)
model_SimpleAlex_10 = SimpleAlexNet(lr=0.01)
trainer.fit(model_SimpleAlex_10, data)

# Use the last recorded validation accuracy as the figure title.
val_points_SimpleAlex_10 = model_SimpleAlex_10.board.data['val_acc']
acc_SimpleAlex_10 = val_points_SimpleAlex_10[-1].y
plt.title(f"Simple AlexNet (10 epochs): {acc_SimpleAlex_10*100:.2f}%")
plt.ylabel('Loss/Accuracy')
plt.xlabel('Number of Epochs')
plt.show()

### 8.1.5 Exercises (#5-2)

In [None]:
class BetterAlexNet(d2l.Classifier):
    """AlexNet-style model intended for 28x28 images.

    Three 3x3 convolutions (16, 32 and 64 channels) with ReLU, the first
    two followed by 2x2 max pooling, feed a 128-unit hidden layer and a
    ``num_classes``-unit output layer.

    Lazy layers are used (as in the other models in this file) so that the
    input channel counts and the flattened feature size are inferred on the
    first forward pass. The non-lazy ``nn.Conv2d`` / ``nn.Linear`` require
    both input and output sizes and raise ``TypeError`` when given only one.

    Args:
        lr: Learning rate, recorded through ``save_hyperparameters()``.
        num_classes: Number of units in the output layer.
    """
    def __init__(self, lr=0.1, num_classes=10):
        super().__init__()
        self.save_hyperparameters()
        self.net = nn.Sequential(
            nn.LazyConv2d(16, kernel_size=3, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.LazyConv2d(32, kernel_size=3, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.LazyConv2d(64, kernel_size=3, padding=1),
            nn.ReLU(),
            nn.Flatten(),
            nn.LazyLinear(128),
            nn.ReLU(),
            nn.LazyLinear(num_classes)
        )
        self.net.apply(d2l.init_cnn)

In [None]:
# Exercise 5-2: BetterAlexNet is meant to work directly on 28x28 images, so
# train it on Fashion-MNIST at 28x28 rather than on the 224x224-resized
# `data` used for the AlexNet runs. A separate name keeps `data` untouched.
data_28x28 = d2l.FashionMNIST(batch_size=128, resize=(28, 28))
model_BetterAlex_10 = BetterAlexNet(lr=0.01)
trainer = d2l.Trainer(max_epochs=10, num_gpus=1)
trainer.fit(model_BetterAlex_10, data_28x28)

# Use the last recorded validation accuracy as the figure title.
acc_BetterAlex_10 = model_BetterAlex_10.board.data['val_acc'][-1].y
plt.title(f"Better AlexNet (10 epochs): {acc_BetterAlex_10*100:.2f}%")
plt.xlabel('Number of Epochs')
plt.ylabel('Loss/Accuracy')
plt.show()