In [31]:
import torch
import torch.nn as nn
from torch.nn import Conv2d, MaxPool2d, Flatten, Linear, Sequential



# 二、激活函数的使用场景
## 1. 隐藏层（卷积层/全连接层后）
目的：引入非线性，增强模型表达能力。

常用激活函数：ReLU、Leaky ReLU、GELU、Swish。

In [36]:
class CNN(nn.Module):
    """Small CNN for 3-channel 32x32 images that produces 10 output scores.

    Every layer is stored as its own attribute and applied one after another
    in ``forward``. Three conv + max-pool stages are followed by a flatten and
    two fully connected layers. No activation function is applied between
    layers.
    """

    def __init__(self):
        super().__init__()
        # The 5x5 convolutions use padding=2, so they keep the spatial size;
        # each 2x2 max-pool halves it.
        self.conv1 = nn.Conv2d(in_channels=3, out_channels=32, kernel_size=5, padding=2)
        self.maxpool = nn.MaxPool2d(kernel_size=2)
        self.conv2 = nn.Conv2d(in_channels=32, out_channels=32, kernel_size=5, padding=2)
        self.maxpool2 = nn.MaxPool2d(kernel_size=2)
        self.conv3 = nn.Conv2d(in_channels=32, out_channels=64, kernel_size=5, padding=2)
        self.maxpool3 = nn.MaxPool2d(kernel_size=2)

        self.flatten = nn.Flatten()
        # Spatial size after three poolings: 32 / 2 / 2 / 2 = 4.
        # The factor 64 is the out_channels of conv3.
        self.fc1 = nn.Linear(in_features=64 * 4 * 4, out_features=64)
        self.fc2 = nn.Linear(in_features=64, out_features=10)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Run ``x`` of shape (N, 3, 32, 32) through every layer; returns (N, 10)."""
        # nn.Flatten defaults to start_dim=1, so the batch dimension is kept.
        # The functional torch.flatten defaults to start_dim=0 and would need
        # an explicit start_dim of 1: torch.flatten(x, 1).
        pipeline = (
            self.conv1,
            self.maxpool,
            self.conv2,
            self.maxpool2,
            self.conv3,
            self.maxpool3,
            self.flatten,
            self.fc1,
            self.fc2,
        )
        for layer in pipeline:
            x = layer(x)
        return x


class CNN2(nn.Module):
    """The same layer stack as a single ``Sequential`` container.

    Three 5x5 conv + 2x2 max-pool stages, a flatten, and two linear layers
    ending in 10 outputs, all held in ``self.model1``. No activation function
    is applied between layers.
    """

    def __init__(self):
        super().__init__()
        # Convolutions use padding=2 and keep the spatial size; each pool halves it.
        feature_layers = [
            Conv2d(3, 32, kernel_size=5, padding=2),
            MaxPool2d(kernel_size=2),
            Conv2d(32, 32, kernel_size=5, padding=2),
            MaxPool2d(kernel_size=2),
            Conv2d(32, 64, kernel_size=5, padding=2),
            MaxPool2d(kernel_size=2),
        ]
        # 64 channels * 4 * 4 spatial positions feed the first linear layer.
        head_layers = [
            Flatten(),
            Linear(64 * 4 * 4, 64),
            Linear(64, 10),
        ]
        self.model1 = Sequential(*feature_layers, *head_layers)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Apply the whole sequential stack to ``x`` and return the result."""
        return self.model1(x)

In [38]:
# Instantiate the attribute-style model, show its structure, and push a dummy
# batch of ones (64 images, 3 channels, 32x32) through it.
cnn = CNN()
print(cnn)
# NOTE: `input` shadows the Python builtin; the name is kept because a later
# cell passes `input` to writer.add_graph.
input = torch.ones(64, 3, 32, 32)
output = cnn(input)
print(output.shape, output, sep="\n")


# Same check for the Sequential-based variant.
cnn2 = CNN2()
print(cnn2)
input2 = torch.ones(64, 3, 32, 32)
output2 = cnn2(input2)
print(output2.shape, output2, sep="\n")

CNN(
  (conv1): Conv2d(3, 32, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
  (maxpool): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (conv2): Conv2d(32, 32, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
  (maxpool2): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (conv3): Conv2d(32, 64, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
  (maxpool3): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (flatten): Flatten(start_dim=1, end_dim=-1)
  (fc1): Linear(in_features=1024, out_features=64, bias=True)
  (fc2): Linear(in_features=64, out_features=10, bias=True)
)
torch.Size([64, 10])
tensor([[ 0.0425,  0.0486, -0.0642, -0.0200, -0.1078, -0.0932, -0.1690,  0.0089,
         -0.0599,  0.0925],
        [ 0.0425,  0.0486, -0.0642, -0.0200, -0.1078, -0.0932, -0.1690,  0.0089,
         -0.0599,  0.0925],
        [ 0.0425,  0.0486, -0.0642, -0.0200, -0.1078, -0.0932, -0.1690,  0.0089,
         

In [39]:
from torch.utils.tensorboard import SummaryWriter
# Trace `cnn` on the dummy batch `input` and write its graph to ./log_seq for
# TensorBoard (view with: tensorboard --logdir=./log_seq).
# SummaryWriter is used as a context manager so it is closed even if
# add_graph raises while tracing the model; `writer` stays bound afterwards.
with SummaryWriter("./log_seq") as writer:
    writer.add_graph(cnn, input)
