<a href="https://colab.research.google.com/github/Shuo-Zh/dl/blob/main/%E8%BD%AC%E7%BD%AE%E5%8D%B7%E7%A7%AF.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# 转置卷积

- 可以用来增大输入高宽
- 卷积不会增大输入的高宽，要么不变、要么减半
- Y[i:i+h, j:j+w] += X[i,j] * K （输入元素 * 卷积核）


# WHY 转置
### 卷积 Y = X * W
- 可以对 W 构造一个 V，使卷积等价于矩阵乘法 Y'= VX'
- 这里 Y', X' 是 Y,X 对应的向量版本

### 转置卷积 == Y' = V^T X'
### 如果卷积将 输入从（h, w） 变成(h', w')
- 同样超参数的转置卷积则将输入从 (h', w') 变成 (h, w)

In [1]:
!pip install d2l

Collecting d2l
  Downloading d2l-1.0.3-py3-none-any.whl (111 kB)
[?25l     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/111.7 kB[0m [31m?[0m eta [36m-:--:--[0m[2K     [91m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m[90m╺[0m[90m━━━━━━[0m [32m92.2/111.7 kB[0m [31m2.6 MB/s[0m eta [36m0:00:01[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m111.7/111.7 kB[0m [31m2.3 MB/s[0m eta [36m0:00:00[0m
[?25hCollecting jupyter==1.0.0 (from d2l)
  Downloading jupyter-1.0.0-py2.py3-none-any.whl (2.7 kB)
Collecting matplotlib==3.7.2 (from d2l)
  Downloading matplotlib-3.7.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (11.6 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m11.6/11.6 MB[0m [31m56.8 MB/s[0m eta [36m0:00:00[0m
Collecting pandas==2.0.3 (from d2l)
  Downloading pandas-2.0.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (12.3 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m12

In [2]:
import torch
from torch import nn
from d2l import torch as d2l

步幅为 1、无填充 --> 实现最基本的转置卷积运算

In [5]:
def trans_conv(X, K):
    """Compute a basic 2-D transposed convolution (stride 1, no padding).

    Each input element ``X[i, j]`` scales the whole kernel ``K``; the scaled
    kernel is accumulated into the output window whose top-left corner is
    ``(i, j)``.

    Args:
        X: 2-D input tensor of shape ``(n_h, n_w)``.
        K: 2-D kernel tensor of shape ``(k_h, k_w)``.

    Returns:
        Tensor of shape ``(n_h + k_h - 1, n_w + k_w - 1)`` on the device of
        ``X``. Its dtype is the default float dtype, widened when the inputs
        are wider (e.g. float64 inputs give a float64 result).
    """
    h, w = K.shape
    # Never narrower than the default-dtype buffer used historically, but wide
    # enough that float64/complex inputs are not silently downcast.
    out_dtype = torch.promote_types(
        torch.result_type(X, K), torch.get_default_dtype()
    )
    # Allocate next to X so inputs living on a non-CPU device also work.
    Y = torch.zeros(
        (X.shape[0] + h - 1, X.shape[1] + w - 1),
        dtype=out_dtype,
        device=X.device,
    )
    for i in range(X.shape[0]):
        for j in range(X.shape[1]):
            # Windows of neighbouring input elements overlap, hence "+=".
            Y[i: i + h, j: j + w] += X[i, j] * K
    return Y

In [6]:
# 2x2 input and 2x2 kernel, both holding [[0, 1], [2, 3]] as floats.
X = torch.arange(4.0).reshape(2, 2)
K = torch.arange(4.0).reshape(2, 2)
trans_conv(X, K)

tensor([[ 0.,  0.,  1.],
        [ 0.,  4.,  6.],
        [ 4., 12.,  9.]])

In [7]:
# Reshape to 4-D: batch size 1, 1 channel, 2x2 spatial size.
X, K = X.reshape(1, 1, 2, 2), K.reshape(1, 1, 2, 2)
# in_channels=1, out_channels=1, 2x2 kernel window; no bias term.
tconv = nn.ConvTranspose2d(1, 1, kernel_size=2, bias=False)
# Load the kernel values in place instead of rebinding the discouraged `.data` attribute.
with torch.no_grad():
    tconv.weight.copy_(K)
tconv(X)

tensor([[[[ 0.,  0.,  1.],
          [ 0.,  4.,  6.],
          [ 4., 12.,  9.]]]], grad_fn=<ConvolutionBackward0>)

## 填充、步幅和多通道

In [8]:
# padding=1: in a transposed convolution the padding is removed from the border
# of the output, so the 3x3 result shrinks to its single centre element.
tconv = nn.ConvTranspose2d(1, 1, kernel_size=2, padding=1, bias=False)
# Load the kernel values in place instead of rebinding the discouraged `.data` attribute.
with torch.no_grad():
    tconv.weight.copy_(K)
tconv(X)

tensor([[[[4.]]]], grad_fn=<ConvolutionBackward0>)

In [9]:
# stride=2: the scaled kernel windows are placed two steps apart, so they no
# longer overlap and the output grows to 4x4.
tconv = nn.ConvTranspose2d(1, 1, kernel_size=2, stride=2, bias=False)
# Load the kernel values in place instead of rebinding the discouraged `.data` attribute.
with torch.no_grad():
    tconv.weight.copy_(K)
tconv(X)

tensor([[[[0., 0., 0., 1.],
          [0., 0., 2., 3.],
          [0., 2., 0., 3.],
          [4., 6., 6., 9.]]]], grad_fn=<ConvolutionBackward0>)

In [10]:
# Multi-channel round trip: a convolution (10 -> 20 channels) followed by a
# transposed convolution (20 -> 10 channels) with the same kernel size, padding
# and stride brings the tensor back to the shape of the original input.
X = torch.rand(1, 10, 16, 16)
conv = nn.Conv2d(in_channels=10, out_channels=20, kernel_size=5, stride=3, padding=2)
tconv = nn.ConvTranspose2d(in_channels=20, out_channels=10, kernel_size=5, stride=3, padding=2)
tconv(conv(X)).shape == X.shape

True

## 与矩阵变换的联系

In [11]:
# 3x3 input holding 0..8 and a 2x2 kernel; d2l.corr2d is used here as the
# simplest form of convolution.
X = torch.arange(9.0).view(3, 3)
K = torch.tensor([1.0, 2.0, 3.0, 4.0]).view(2, 2)
Y = d2l.corr2d(X, K)
Y

tensor([[27., 37.],
        [57., 67.]])

In [12]:
# Rewrite the convolution kernel K as a sparse weight matrix W that is mostly zeros.
def kernel2matrix(K, input_shape=(3, 3)):
    """Unroll a 2-D kernel into the weight matrix of a stride-1, unpadded convolution.

    Multiplying the returned matrix with the row-major flattened input gives
    the flattened cross-correlation output; multiplying its transpose with a
    flattened output gives the corresponding transposed convolution.

    Args:
        K: 2-D kernel tensor of shape ``(k_h, k_w)``.
        input_shape: ``(in_h, in_w)`` of the input the matrix will be applied
            to. Defaults to ``(3, 3)``, the size used throughout this notebook.

    Returns:
        Tensor ``W`` of shape ``(out_h * out_w, in_h * in_w)`` where
        ``out_h = in_h - k_h + 1`` and ``out_w = in_w - k_w + 1``.

    Raises:
        ValueError: if the kernel does not fit inside ``input_shape``.
    """
    k_h, k_w = K.shape
    in_h, in_w = input_shape
    out_h, out_w = in_h - k_h + 1, in_w - k_w + 1
    if out_h <= 0 or out_w <= 0:
        raise ValueError(
            f"kernel of shape {(k_h, k_w)} does not fit into input of shape {(in_h, in_w)}"
        )
    W = torch.zeros((out_h * out_w, in_h * in_w))
    for i in range(out_h):
        for j in range(out_w):
            # Treat one row of W as an input-sized grid and write the kernel
            # into the window that output element (i, j) reads from.
            W[i * out_w + j].view(in_h, in_w)[i:i + k_h, j:j + k_w] = K
    return W

# Build the sparse weight matrix for the kernel K and display it.
W = kernel2matrix(K)
W

tensor([[1., 2., 0., 3., 4., 0., 0., 0., 0.],
        [0., 1., 2., 0., 3., 4., 0., 0., 0.],
        [0., 0., 0., 1., 2., 0., 3., 4., 0.],
        [0., 0., 0., 0., 1., 2., 0., 3., 4.]])

In [13]:
# Multiplying W with the flattened input reproduces the convolution output Y.
Y == (W @ X.flatten()).view(2, 2)

tensor([[True, True],
        [True, True]])

In [14]:
# Multiplying by the transposed weight matrix W.T is the transposed convolution:
# it maps the 2x2 convolution output back to the 3x3 input size.
Z = trans_conv(Y, K)
Z == (W.T @ Y.flatten()).view(3, 3)

tensor([[True, True, True],
        [True, True, True],
        [True, True, True]])