In [1]:
import torch
import torch.nn as nn
import torch.nn.functional as F

class MLP(nn.Module):
    """Fully connected classifier: 784 -> 100 -> 50 -> 10 with ReLU in between.

    The forward pass returns the raw output of the last linear layer; no
    softmax or other normalisation is applied.
    """

    def __init__(self):
        super().__init__()
        self.fc1 = nn.Linear(784, 100)
        self.fc2 = nn.Linear(100, 50)
        self.fc3 = nn.Linear(50, 10)

    def forward(self, x):
        """Map ``x`` to a ``(rows, 10)`` tensor of class scores.

        ``x`` is reinterpreted as rows of 784 values each, so any tensor
        whose element count is a multiple of 784 is accepted (for example
        ``(N, 1, 28, 28)``, ``(N, 784)`` or a single ``(784,)`` vector).
        """
        # reshape() behaves like view() for contiguous tensors but also
        # accepts non-contiguous ones (e.g. a transposed/permuted batch),
        # where view() would raise a RuntimeError.
        x = x.reshape(-1, self.fc1.in_features)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        return self.fc3(x)

class CNN(nn.Module):
    """Small convolutional classifier for single-channel images.

    Three stages of 3x3 convolution (no padding) -> ReLU -> 2x2 max-pool are
    followed by two linear layers that produce 10 raw class scores (no
    softmax is applied).

    ``fc1`` expects 5 * 3 * 3 = 45 features per sample, i.e. a 3x3 feature
    map after the third pooling step. With these layers that holds for
    input heights/widths from 38 to 45 pixels.

    NOTE(review): a 28x28 input (the 784-value size ``MLP`` is built for)
    shrinks to 5 x 1 x 1 = 5 features here and is rejected by ``fc1``.
    Confirm the intended input resolution; if it is 28x28, ``fc1`` should
    take 5 input features instead of 45.
    """

    def __init__(self):
        super().__init__()
        self.conv1 = nn.Conv2d(1, 3, 3)   # input channels, output channels, kernel size
        self.pool = nn.MaxPool2d(2, 2)    # kernel size, stride
        self.conv2 = nn.Conv2d(3, 5, 3)
        self.conv3 = nn.Conv2d(5, 5, 3)
        self.fc1 = nn.Linear(5 * 3 * 3, 30)
        self.fc2 = nn.Linear(30, 10)

    def forward(self, x):
        """Return a ``(N, 10)`` tensor of class scores for a batch ``x``.

        ``x`` is either a batch ``(N, 1, H, W)`` or one un-batched image
        ``(1, H, W)``; the latter is treated as a batch of one.

        Raises:
            RuntimeError: if the feature map reaching ``fc1`` does not hold
                45 values per sample (input resolution does not match).
        """
        if x.dim() == 3:
            # Promote a single image to a batch of one so the per-sample
            # flatten below still yields one row.
            x = x.unsqueeze(0)

        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = self.pool(F.relu(self.conv3(x)))

        # Flatten each sample on its own. Inferring the batch size with
        # view(-1, 45) would silently merge several samples into one row
        # whenever the spatial size is not 3x3 (e.g. nine 5x1x1 maps).
        x = x.flatten(start_dim=1)
        x = F.relu(self.fc1(x))
        return self.fc2(x)

# Build one network of each kind (MLP first, then CNN).
mlp_model, cnn_model = MLP(), CNN()

# Show the layer layout of both models, each under its own heading.
print("MLP Architecture:", mlp_model, sep="\n")
print("\nCNN Architecture:", cnn_model, sep="\n")


MLP Architecture:
MLP(
  (fc1): Linear(in_features=784, out_features=100, bias=True)
  (fc2): Linear(in_features=100, out_features=50, bias=True)
  (fc3): Linear(in_features=50, out_features=10, bias=True)
)

CNN Architecture:
CNN(
  (conv1): Conv2d(1, 3, kernel_size=(3, 3), stride=(1, 1))
  (pool): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (conv2): Conv2d(3, 5, kernel_size=(3, 3), stride=(1, 1))
  (conv3): Conv2d(5, 5, kernel_size=(3, 3), stride=(1, 1))
  (fc1): Linear(in_features=45, out_features=30, bias=True)
  (fc2): Linear(in_features=30, out_features=10, bias=True)
)
