In [None]:
import torch
import platform
# Report the PyTorch and Python interpreter versions in use.
version_lines = (
    ("PyTorch version:{}", torch.__version__),
    ("Python version:{}", platform.python_version()),
)
for template, value in version_lines:
    print(template.format(value))

# 第11章 自动编码器

## 11.2.2 通过卷积变换实现自动编码器模型

In [None]:
import torch
import torchvision
from torchvision import datasets, transforms
#from torch.autograd import Variable
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline

# Use the first CUDA device when CUDA is available; otherwise fall back to CPU.
device_name = "cuda:0" if torch.cuda.is_available() else "cpu"
device = torch.device(device_name)

In [None]:
# Preprocessing pipeline: convert each image to a tensor, then normalize it
# with mean 0.5 and std 0.5.
to_tensor = transforms.ToTensor()
normalize = transforms.Normalize(mean=[0.5], std=[0.5])
transform = transforms.Compose([to_tensor, normalize])

# MNIST splits rooted at ./data; only the training split requests a download.
mnist_root = "./data"
dataset_train = datasets.MNIST(root=mnist_root, train=True,
                               transform=transform, download=True)
dataset_test = datasets.MNIST(root=mnist_root, train=False,
                              transform=transform)

# Both loaders yield shuffled mini-batches of 64 samples.
loader_options = {"batch_size": 64, "shuffle": True}
train_load = torch.utils.data.DataLoader(dataset=dataset_train, **loader_options)
test_load = torch.utils.data.DataLoader(dataset=dataset_test, **loader_options)

In [None]:
# Fetch one batch from the training loader and print its tensor shape.
images, label = next(iter(train_load))
print(images.shape)

# Constants used to undo the normalization before plotting.
mean = [0.5]
std = [0.5]

# Tile the batch into a single grid, move the first axis to the end for
# plt.imshow, and map the values back with value * std + mean.
grid = torchvision.utils.make_grid(images)
images_example = grid.numpy().transpose(1, 2, 0) * std + mean
plt.imshow(images_example)
plt.show()

In [None]:
# Add Gaussian noise scaled by 0.5 to the preview grid, clip the result to
# [0, 1], and display it.
gaussian_noise = np.random.randn(*images_example.shape)
noisy_images = np.clip(images_example + 0.5 * gaussian_noise, 0., 1.)
plt.imshow(noisy_images)
plt.show()

In [None]:
class AutoEncoder(torch.nn.Module):
    """Convolutional autoencoder: an encoder followed directly by a decoder.

    Encoder: two ``Conv2d(3x3, padding 1) -> ReLU -> MaxPool2d(2, stride 2)``
    stages taking the channel count 1 -> 64 -> 128.
    Decoder: two ``Upsample(x2, nearest) -> Conv2d(3x3, padding 1)`` stages
    taking the channel count 128 -> 64 -> 1, with a ReLU after the first
    convolution only (the final convolution has no activation).
    """

    def __init__(self):
        """Build the ``encoder`` and ``decoder`` sequential sub-modules."""
        super().__init__()
        nn = torch.nn

        encoder_layers = [
            nn.Conv2d(1, 64, kernel_size=3, stride=1, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),
            nn.Conv2d(64, 128, kernel_size=3, stride=1, padding=1),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2),
        ]
        self.encoder = nn.Sequential(*encoder_layers)

        decoder_layers = [
            nn.Upsample(scale_factor=2, mode="nearest"),
            nn.Conv2d(128, 64, kernel_size=3, stride=1, padding=1),
            nn.ReLU(),
            nn.Upsample(scale_factor=2, mode="nearest"),
            nn.Conv2d(64, 1, kernel_size=3, stride=1, padding=1),
        ]
        self.decoder = nn.Sequential(*decoder_layers)

    def forward(self, input):
        """Return ``decoder(encoder(input))``."""
        return self.decoder(self.encoder(input))

In [None]:
# Instantiate the autoencoder, move it to the selected device, and print
# its layer layout.
model = AutoEncoder().to(device)
print(model)

# Adam with its default settings, a mean-squared-error loss, and 5 epochs.
optimizer = torch.optim.Adam(model.parameters())
loss_f = torch.nn.MSELoss()
epoch_n = 5

In [None]:
# Train the autoencoder to reconstruct clean images from noise-corrupted
# copies. After each epoch, print the mean MSE over the whole training set.
for epoch in range(epoch_n):
    running_loss = 0.0
    print("Epoch {}/{}".format(epoch, epoch_n))
    print("-"*10)

    for data in train_load:
        # Labels are not needed: the clean image itself is the target.
        X_train, _ = data

        # Corrupt the batch with Gaussian noise scaled by 0.5.
        # NOTE(review): the loader's transform normalizes pixels with
        # mean 0.5 / std 0.5, yet the noisy input is clamped to [0, 1] --
        # confirm that this range is what the rest of the notebook expects.
        noisy_X_train = X_train + 0.5*torch.randn(X_train.shape)
        noisy_X_train = torch.clamp(noisy_X_train, 0., 1.)
        X_train, noisy_X_train = X_train.to(device), noisy_X_train.to(device)

        train_pre = model(noisy_X_train)
        loss = loss_f(train_pre, X_train)
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # loss_f averages over the batch, so weight the batch mean by the
        # batch size; dividing by the dataset size below then gives a true
        # dataset-wide mean even when the last batch is smaller.
        # .item() yields a plain Python float, so nothing accumulates on
        # the device.
        running_loss += loss.item() * X_train.size(0)
    print("Loss is:{:.4f}".format(running_loss/len(dataset_train)))