In [1]:
import torch
from torch import nn
from d2l import torch as d2l

`trans_conv` 函数实现 2 维转置卷积操作（步幅为 1、无填充），其输出的大小为 $(h_\text{in} + h_k - 1) \times (w_\text{in} + w_k - 1)$

In [3]:
def trans_conv(X, K):
    """Compute the 2-D transposed convolution of ``X`` with kernel ``K``.

    Each element ``X[i, j]`` scales a full copy of ``K``; the scaled copy is
    accumulated into the output window whose top-left corner is ``(i, j)``.
    This corresponds to stride 1 with no padding.

    Args:
        X: 2-D input tensor of shape ``(h_in, w_in)``.
        K: 2-D kernel tensor of shape ``(h_k, w_k)``.

    Returns:
        Tensor of shape ``(h_in + h_k - 1, w_in + w_k - 1)`` on ``X``'s
        device. Its dtype is the promotion of the input dtypes with the
        default float dtype, so float64 inputs keep full precision while
        integer / float32 inputs still yield the default float dtype.

    Raises:
        ValueError: if ``K`` does not have exactly two dimensions.
    """
    h, w = K.shape
    # Promote with the default float dtype: never narrower than before
    # (ints and halves still give float32), but float64 is no longer
    # silently downcast by the in-place accumulation below.
    out_dtype = torch.promote_types(
        torch.result_type(X, K), torch.get_default_dtype()
    )
    # Output height and width; allocated next to X so the in-place add
    # does not mix devices.
    Y = torch.zeros(
        (X.shape[0] + h - 1, X.shape[1] + w - 1),
        dtype=out_dtype,
        device=X.device,
    )
    for i in range(X.shape[0]):
        for j in range(X.shape[1]):
            Y[i: i + h, j: j + w] += X[i, j] * K
    return Y

In [6]:
# Small 2x2 input and kernel, both holding the values 0..3 as float32.
X = torch.arange(4, dtype=torch.float32).view(2, 2)
K = X.clone()  # separate tensor with the same values, not an alias of X
X, K

(tensor([[0., 1.],
         [2., 3.]]),
 tensor([[0., 1.],
         [2., 3.]]))

In [7]:
# Sanity check on the 2x2 example: input and kernel are both 2x2, so the
# result is (2 + 2 - 1) x (2 + 2 - 1) = 3x3.
trans_conv(X, K)

tensor([[ 0.,  0.,  1.],
        [ 0.,  4.,  6.],
        [ 4., 12.,  9.]])

对于 4 维张量，可以直接使用高级 API `nn.ConvTranspose2d` 实现转置卷积。该层的卷积核参数本身是可学习的，这里为了与上面手写实现的结果对比，将其指定为固定的卷积核 `K`

In [11]:
# nn.ConvTranspose2d works on 4-D tensors, so give the 2x2 input and kernel
# two leading unit axes (batch/channel for X, in/out channels for K).
X, K = X.reshape(1, 1, 2, 2), K.reshape(1, 1, 2, 2)
tconv = nn.ConvTranspose2d(1, 1, kernel_size=2, bias=False)
# Copy the fixed kernel into the learnable parameter. Unlike assigning to
# `.data`, this keeps the parameter's own storage (no aliasing with K) and
# is the supported way to overwrite weights without recording autograd ops.
with torch.no_grad():
    tconv.weight.copy_(K)
tconv(X)

tensor([[[[ 0.,  0.,  1.],
          [ 0.,  4.,  6.],
          [ 4., 12.,  9.]]]], grad_fn=<ConvolutionBackward0>)

### 填充，步幅和多通道

填充为 1，步幅为 1 的情况。与常规卷积不同，转置卷积中的填充作用于输出：`padding=1` 会删除输出首尾各一行和一列，因此上面 $3 \times 3$ 的结果只剩下中心元素

In [12]:
# Same fixed kernel, now with padding=1: the printed result keeps only the
# centre element of the 3x3 stride-1 output.
tconv = nn.ConvTranspose2d(1, 1, kernel_size=2, padding=1, bias=False)
# Overwrite the weights via copy_ under no_grad instead of assigning `.data`,
# so the parameter does not end up sharing storage with K.
with torch.no_grad():
    tconv.weight.copy_(K)
tconv(X)

tensor([[[[4.]]]], grad_fn=<ConvolutionBackward0>)

填充为 0，步幅为 2 的情况

In [14]:
# Same fixed kernel with stride=2: each scaled 2x2 kernel copy is placed two
# positions apart, so the copies no longer overlap and the output is 4x4.
tconv = nn.ConvTranspose2d(1, 1, kernel_size=2, stride=2, bias=False)
# Overwrite the weights via copy_ under no_grad instead of assigning `.data`,
# so the parameter does not end up sharing storage with K.
with torch.no_grad():
    tconv.weight.copy_(K)
tconv(X)

tensor([[[[0., 0., 0., 1.],
          [0., 0., 2., 3.],
          [0., 2., 0., 3.],
          [4., 6., 6., 9.]]]], grad_fn=<ConvolutionBackward0>)

转置卷积与卷积在形状上互为逆操作：当二者的卷积核大小、填充和步幅相同，且输入、输出通道数互换时，转置卷积会把卷积输出的形状还原为卷积输入的形状（注意还原的只是形状，而不是数值）

In [19]:
# A (batch=1, channels=4, 20, 40) input; conv and tconv share kernel size,
# stride and padding but have their channel counts swapped.
X = torch.arange(1 * 4 * 20 * 40, dtype=torch.float32).reshape(1, 4, 20, 40)
conv = nn.Conv2d(in_channels=4, out_channels=10, kernel_size=2, stride=2, padding=1)
tconv = nn.ConvTranspose2d(in_channels=10, out_channels=4, kernel_size=2, stride=2, padding=1)
# The transposed convolution should map the conv output back to X's shape.
tconv(conv(X)).shape == X.shape

True

### 与矩阵变换的关系

In [22]:
# 3x3 input and 2x2 kernel used for the matrix-multiplication view below.
X = torch.arange(9.0).reshape(3, 3)
K = torch.arange(4.0).reshape(2, 2)
# Reference result from the d2l helper (presumably plain 2-D
# cross-correlation, stride 1, no padding — confirm against the d2l docs).
Y = d2l.corr2d(X, K)
Y, K

(tensor([[19., 25.],
         [37., 43.]]),
 tensor([[0., 1.],
         [2., 3.]]))

`kernel2matrix` 创建一个稀疏矩阵 W，其中非零元素来自卷积核 K

In [21]:
def kernel2matrix(K, in_shape=(3, 3)):
    """Build the matrix ``W`` that expresses cross-correlation with ``K`` as a matmul.

    For an input ``X`` of shape ``in_shape``, ``W @ X.reshape(-1)`` reshaped to
    ``(in_h - k_h + 1, in_w - k_w + 1)`` equals the stride-1, unpadded
    cross-correlation of ``X`` with ``K``. Row ``r * out_w + c`` of ``W`` holds
    the kernel entries at the flattened positions of the input window whose
    top-left corner is ``(r, c)``; every other entry is zero.

    Args:
        K: 2-D kernel tensor of shape ``(k_h, k_w)``.
        in_shape: ``(in_h, in_w)`` of the input the matrix will be applied to.
            Defaults to ``(3, 3)``, the size used in this notebook.

    Returns:
        Tensor of shape ``(out_h * out_w, in_h * in_w)`` on ``K``'s device,
        with ``K``'s dtype promoted to at least the default float dtype.

    Raises:
        ValueError: if ``K`` is not 2-D or is larger than ``in_shape``.
    """
    k_h, k_w = K.shape
    in_h, in_w = in_shape
    out_h, out_w = in_h - k_h + 1, in_w - k_w + 1
    if out_h <= 0 or out_w <= 0:
        raise ValueError(
            f"kernel of shape {(k_h, k_w)} does not fit in input of shape {(in_h, in_w)}"
        )
    # Integer and float32 kernels still give a default-float matrix;
    # float64 kernels keep their precision.
    dtype = torch.promote_types(K.dtype, torch.get_default_dtype())
    W = torch.zeros((out_h * out_w, in_h * in_w), dtype=dtype, device=K.device)
    for r in range(out_h):
        for c in range(out_w):
            # View one row of W as an image of the input and stamp the kernel
            # onto the window it covers; the write goes through to W.
            window = W[r * out_w + c].view(in_h, in_w)
            window[r:r + k_h, c:c + k_w] = K
    return W

# Matrix form of the 2x2 kernel for a 3x3 input: W is 4x9, one row per output
# element, with the kernel entries placed at that window's flattened positions.
W = kernel2matrix(K)
W

tensor([[0., 1., 0., 2., 3., 0., 0., 0., 0.],
        [0., 0., 1., 0., 2., 3., 0., 0., 0.],
        [0., 0., 0., 0., 1., 0., 2., 3., 0.],
        [0., 0., 0., 0., 0., 1., 0., 2., 3.]])

将 `W` 与展平成向量的 `X` 相乘，再变形为 $2 \times 2$，得到的结果与上面互相关运算得到的 `Y` 相同

In [27]:
# Cross-correlation as a matrix-vector product: flatten X, multiply by W,
# then fold the 4 results back into the 2x2 output.
(W @ X.flatten()).reshape(2, 2)

tensor([[19., 25.],
        [37., 43.]])

同理，转置卷积的结果与用转置后的权重矩阵 $W^\top$ 做矩阵乘法的结果相同，这印证了笔记 `原理.2` 中“为什么称为转置卷积”一节的内容

In [30]:
# Left: direct transposed convolution of Y with K.
# Right: the same result obtained by multiplying flattened Y with W transposed.
(
    trans_conv(Y, K),
    (W.T @ Y.flatten()).reshape(3, 3),
)

(tensor([[  0.,  19.,  25.],
         [ 38., 144., 118.],
         [ 74., 197., 129.]]),
 tensor([[  0.,  19.,  25.],
         [ 38., 144., 118.],
         [ 74., 197., 129.]]))