## AP21110011538

## Write a Python program to realize the working principles of popular architectures such as AlexNet, GoogleNet, and VGGNet.

In [5]:
import torch
import torch.nn as nn
import torch.nn.functional as F

# 1. Simplified AlexNet Implementation
class SimpleAlexNet(nn.Module):
    """Simplified AlexNet: five convolutions, three max pools, three linear layers.

    The first linear layer expects 256 * 6 * 6 features, which is what the
    convolutional stack produces for a (3, 224, 224) input; all shape
    comments below assume that input size. The network returns raw scores
    for 1000 classes (no softmax is applied).
    """

    def __init__(self):
        super().__init__()
        # Shapes are (channels, height, width) for a (3, 224, 224) input.
        self.conv1 = nn.Conv2d(3, 96, kernel_size=11, stride=4, padding=2)  # Output: (96, 55, 55)
        self.pool1 = nn.MaxPool2d(kernel_size=3, stride=2)                  # Output: (96, 27, 27)
        self.conv2 = nn.Conv2d(96, 256, kernel_size=5, padding=2)           # Output: (256, 27, 27)
        self.pool2 = nn.MaxPool2d(kernel_size=3, stride=2)                  # Output: (256, 13, 13)
        self.conv3 = nn.Conv2d(256, 384, kernel_size=3, padding=1)          # Output: (384, 13, 13)
        self.conv4 = nn.Conv2d(384, 384, kernel_size=3, padding=1)          # Output: (384, 13, 13)
        self.conv5 = nn.Conv2d(384, 256, kernel_size=3, padding=1)          # Output: (256, 13, 13)
        self.pool3 = nn.MaxPool2d(kernel_size=3, stride=2)                  # Output: (256, 6, 6)
        self.fc1 = nn.Linear(256 * 6 * 6, 4096)
        self.fc2 = nn.Linear(4096, 4096)
        self.fc3 = nn.Linear(4096, 1000)  # Output: 1000 classes

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Compute class scores for a batch of images.

        Args:
            x: Input batch of shape (N, 3, 224, 224).

        Returns:
            Tensor of shape (N, 1000) holding unnormalized class scores.
        """
        x = self.pool1(F.relu(self.conv1(x)))
        x = self.pool2(F.relu(self.conv2(x)))
        x = F.relu(self.conv3(x))
        x = F.relu(self.conv4(x))
        x = self.pool3(F.relu(self.conv5(x)))

        # Flatten everything except the batch dimension. Unlike .view(),
        # torch.flatten also accepts non-contiguous activations.
        x = torch.flatten(x, 1)

        # F.dropout defaults to training=True, so the module's mode must be
        # passed explicitly; otherwise dropout would stay active after
        # model.eval() and make inference non-deterministic.
        x = F.relu(self.fc1(x))
        x = F.dropout(x, p=0.5, training=self.training)
        x = F.relu(self.fc2(x))
        x = F.dropout(x, p=0.5, training=self.training)
        return self.fc3(x)

# 2. Simplified VGGNet Implementation (VGG16)
class SimpleVGGNet(nn.Module):
    """VGG16-style network built from stacked 3x3 convolutions.

    The feature extractor has five stages; each stage is a run of
    3x3 convolution + ReLU pairs followed by a 2x2 max pool that halves the
    spatial size. The classifier expects 512 * 7 * 7 features, i.e. a
    (3, 224, 224) input, and returns scores for 1000 classes.
    """

    # (output channels, number of 3x3 convolutions) for each stage.
    # For a 224x224 input the stage outputs are 112, 56, 28, 14 and 7 pixels wide.
    _STAGES = ((64, 2), (128, 2), (256, 3), (512, 3), (512, 3))

    def __init__(self):
        super().__init__()

        feature_modules = []
        channels_in = 3
        for channels_out, conv_count in self._STAGES:
            for _ in range(conv_count):
                feature_modules.append(
                    nn.Conv2d(channels_in, channels_out, kernel_size=3, padding=1)
                )
                feature_modules.append(nn.ReLU())
                channels_in = channels_out
            # Each stage ends by halving height and width.
            feature_modules.append(nn.MaxPool2d(kernel_size=2, stride=2))
        self.conv_layers = nn.Sequential(*feature_modules)

        hidden_units = 4096
        self.fc_layers = nn.Sequential(
            nn.Linear(512 * 7 * 7, hidden_units),
            nn.ReLU(),
            nn.Dropout(0.5),
            nn.Linear(hidden_units, hidden_units),
            nn.ReLU(),
            nn.Dropout(0.5),
            nn.Linear(hidden_units, 1000),  # Output: 1000 classes
        )

    def forward(self, x):
        """Return (N, 1000) class scores for an (N, 3, 224, 224) batch."""
        features = self.conv_layers(x)
        flattened = features.view(features.shape[0], -1)  # Flatten
        return self.fc_layers(flattened)

# 3. Simplified GoogleNet Implementation
class SimpleGoogleNet(nn.Module):
    """Heavily simplified GoogleNet: only the convolutional stem plus one linear layer.

    No Inception modules are implemented here; the two conv/pool stages are
    followed directly by a single linear classifier. The classifier expects
    192 * 28 * 28 features, which the stem produces for a (3, 224, 224)
    input, and returns scores for 1000 classes.
    """

    def __init__(self):
        super().__init__()
        # Shapes are (channels, height, width) for a (3, 224, 224) input.
        self.conv1 = nn.Conv2d(
            in_channels=3, out_channels=64, kernel_size=7, stride=2, padding=3
        )  # Output: (64, 112, 112)
        self.pool1 = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)  # Output: (64, 56, 56)
        self.conv2 = nn.Conv2d(
            in_channels=64, out_channels=192, kernel_size=3, padding=1
        )  # Output: (192, 56, 56)
        self.pool2 = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)  # Output: (192, 28, 28)
        # A real GoogleNet would place its Inception modules here.
        self.fc = nn.Linear(192 * 28 * 28, 1000)  # Simplified final layer

    def forward(self, x):
        """Return (N, 1000) class scores for an (N, 3, 224, 224) batch."""
        stem_stages = ((self.conv1, self.pool1), (self.conv2, self.pool2))
        for conv, pool in stem_stages:
            x = pool(F.relu(conv(x)))
        flattened = x.view(x.shape[0], -1)  # Flatten
        return self.fc(flattened)

# Function to display the simplified model summaries
def print_simplified_model_summary():
    """Print the output shape of each simplified model for one random sample.

    A single random (1, 3, 224, 224) tensor is passed through SimpleAlexNet,
    SimpleVGGNet and SimpleGoogleNet in turn; for each model a header line
    and the resulting output shape are written to stdout.
    """
    x = torch.randn(1, 3, 224, 224)  # Sample input

    model_specs = (
        ("Simple AlexNet", SimpleAlexNet),
        ("Simple VGGNet (VGG16)", SimpleVGGNet),
        ("Simple GoogleNet", SimpleGoogleNet),
    )

    # Only the output shapes are needed, so skip autograd bookkeeping.
    with torch.no_grad():
        for title, model_cls in model_specs:
            print(f"\n=== {title} ===")
            model = model_cls()
            model.eval()  # inference mode: disables nn.Dropout layers
            output = model(x)
            print("Output Shape:", output.shape)
            # These models hold hundreds of MB of weights each; release one
            # before constructing the next to keep peak memory down.
            del model, output

# Script entry point: print the model summaries only when this file is run
# directly, not when it is imported as a module.
if __name__ == "__main__":
    print_simplified_model_summary()



=== Simple AlexNet ===
Output Shape: torch.Size([1, 1000])

=== Simple VGGNet (VGG16) ===
Output Shape: torch.Size([1, 1000])

=== Simple GoogleNet ===
Output Shape: torch.Size([1, 1000])
