[ref1](https://github.com/L1aoXingyu/pytorch-beginner/blob/master/08-AutoEncoder/Variational_autoencoder.py)
[ref2](https://github.com/pytorch/examples/blob/master/vae/main.py)

In [27]:
import torch
import torchvision
from torch import nn
from torch import optim
import torch.nn.functional as F
from torch.autograd import Variable
from torch.utils.data import DataLoader
from torchvision import transforms
from torchvision.utils import save_image
from torchvision.datasets import MNIST
import os

# Run on the GPU when CUDA is available, otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Directory that receives the reconstruction images written during training.
# makedirs(exist_ok=True) creates it if missing and is a no-op if it is
# already there, avoiding the check-then-create race of exists() + mkdir().
os.makedirs('./vae_img', exist_ok=True)


def to_img(x):
    """Convert a batch of flattened images into image-shaped tensors.

    Every value is clamped into [0, 1] and the result is viewed as
    (x.size(0), 1, 28, 28), i.e. one single-channel 28x28 image per row.
    """
    batch = x.size(0)
    clipped = torch.clamp(x, min=0, max=1)
    return clipped.view(batch, 1, 28, 28)


# Training hyperparameters.
num_epochs = 100
batch_size = 128
learning_rate = 1e-3

# The only preprocessing step is the conversion to a tensor.
img_transform = transforms.Compose([transforms.ToTensor()])

# MNIST stored under ../../data (downloaded on first use), served in
# shuffled mini-batches of `batch_size` samples.
dataset = MNIST(root='../../data', transform=img_transform, download=True)
dataloader = DataLoader(dataset=dataset, batch_size=batch_size, shuffle=True)


class VAE(nn.Module):
    """Fully connected variational autoencoder.

    The encoder maps a flattened input to the mean and log-variance of a
    diagonal Gaussian over the latent code; the decoder maps a latent code
    back to per-element values in (0, 1) through a sigmoid.

    Args:
        input_dim: Number of elements in one flattened input sample.
        hidden_dim: Width of the hidden layer in encoder and decoder.
        latent_dim: Dimensionality of the latent code.

    The defaults (784, 400, 20) reproduce the original fixed architecture,
    and the layer attribute names are unchanged, so previously saved state
    dicts still load.
    """

    def __init__(self, input_dim=784, hidden_dim=400, latent_dim=20):
        super(VAE, self).__init__()

        self.input_dim = input_dim
        self.hidden_dim = hidden_dim
        self.latent_dim = latent_dim

        # Encoder: input -> hidden -> (mu, logvar)
        self.fc1 = nn.Linear(input_dim, hidden_dim)
        self.fc21 = nn.Linear(hidden_dim, latent_dim)  # mean head
        self.fc22 = nn.Linear(hidden_dim, latent_dim)  # log-variance head
        # Decoder: latent -> hidden -> input
        self.fc3 = nn.Linear(latent_dim, hidden_dim)
        self.fc4 = nn.Linear(hidden_dim, input_dim)

    def encode(self, x):
        """Return ``(mu, logvar)`` for a batch of flattened inputs."""
        h1 = F.relu(self.fc1(x))
        return self.fc21(h1), self.fc22(h1)

    def reparameterize(self, mu, logvar):
        """Sample ``z = mu + eps * std`` with ``eps ~ N(0, I)``.

        Writing the sample this way keeps it differentiable with respect
        to ``mu`` and ``logvar``.
        """
        std = torch.exp(0.5*logvar)  # logvar = log(sigma^2) -> sigma
        eps = torch.randn_like(std)
        return mu + eps*std

    def decode(self, z):
        """Map latent codes to reconstructions with values in (0, 1)."""
        h3 = F.relu(self.fc3(z))
        return torch.sigmoid(self.fc4(h3))

    def forward(self, x):
        """Encode, sample and decode a batch.

        ``x`` is flattened to ``(-1, input_dim)`` first, so image-shaped
        batches are accepted as long as each sample has ``input_dim``
        elements.

        Returns:
            Tuple ``(reconstruction, mu, logvar)``.
        """
        mu, logvar = self.encode(x.view(-1, self.input_dim))
        z = self.reparameterize(mu, logvar)
        return self.decode(z), mu, logvar


# Build the network, then move its parameters to the selected device.
model = VAE()
model = model.to(device)

def loss_function(recon_x, x, mu, logvar):
    """Return the VAE loss: reconstruction error plus KL divergence.

    Both terms are summed over every element of the batch (no averaging).

    Args:
        recon_x: Reconstructions of shape (batch, features), values in [0, 1].
        x: Target batch; it is flattened to ``(-1, features)`` so any layout
            with ``features`` elements per sample is accepted.
        mu: Mean of the approximate posterior.
        logvar: Log-variance of the approximate posterior.

    Returns:
        Scalar tensor ``BCE + KLD``.
    """
    # Flatten the targets to the reconstruction's feature width instead of
    # a hard-coded 784, so the loss also works for other input sizes.
    target = x.view(-1, recon_x.size(-1))
    BCE = F.binary_cross_entropy(recon_x, target, reduction='sum')

    # see Appendix B from VAE paper:
    # Kingma and Welling. Auto-Encoding Variational Bayes. ICLR, 2014
    # https://arxiv.org/abs/1312.6114
    # KL(q(z|x) || N(0, I)) = -0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    KLD = -0.5 * torch.sum(1 + logvar - mu.pow(2) - logvar.exp())
    return BCE + KLD


# Adam over all model parameters. Uses the `learning_rate` setting defined
# with the other hyperparameters instead of repeating the literal here.
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

for epoch in range(num_epochs):
    model.train()
    train_loss = 0  # summed loss over every sample seen in this epoch
    for batch_idx, (img, _) in enumerate(dataloader):
        img = img.to(device)
        optimizer.zero_grad()
        recon_batch, mu, logvar = model(img)
        loss = loss_function(recon_batch, img, mu, logvar)
        loss.backward()
        # .item() yields a plain Python float; no need to go through the
        # legacy `.data` attribute.
        batch_loss = loss.item()
        train_loss += batch_loss
        optimizer.step()
        if batch_idx % 100 == 0:
            # Progress line every 100 batches, with the per-sample loss of
            # the current batch.
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch,
                batch_idx * len(img),
                len(dataloader.dataset), 100. * batch_idx / len(dataloader),
                batch_loss / len(img)))

    print('====> Epoch: {} Average loss: {:.4f}'.format(
        epoch, train_loss / len(dataloader.dataset)))
    if epoch % 10 == 0:
        # Every 10th epoch, save the reconstructions of the epoch's last
        # batch; detach() drops the autograd graph before the CPU copy.
        save = to_img(recon_batch.detach().cpu())
        save_image(save, './vae_img/image_{}.png'.format(epoch))

# Persist the trained weights.
torch.save(model.state_dict(), './vae.pth')

====> Epoch: 0 Average loss: 164.9630
====> Epoch: 1 Average loss: 121.5355
====> Epoch: 2 Average loss: 114.5389
====> Epoch: 3 Average loss: 111.5229
====> Epoch: 4 Average loss: 109.7489
====> Epoch: 5 Average loss: 108.5419
====> Epoch: 6 Average loss: 107.6366
====> Epoch: 7 Average loss: 106.9689
====> Epoch: 8 Average loss: 106.4354
====> Epoch: 9 Average loss: 106.0675
====> Epoch: 10 Average loss: 105.6246
====> Epoch: 11 Average loss: 105.3050
====> Epoch: 12 Average loss: 105.0911
====> Epoch: 13 Average loss: 104.8341
====> Epoch: 14 Average loss: 104.5841
====> Epoch: 15 Average loss: 104.4130
====> Epoch: 16 Average loss: 104.2710
====> Epoch: 17 Average loss: 104.1574
====> Epoch: 18 Average loss: 103.9044
====> Epoch: 19 Average loss: 103.8022
====> Epoch: 20 Average loss: 103.6960
====> Epoch: 21 Average loss: 103.5524
====> Epoch: 22 Average loss: 103.4368
====> Epoch: 23 Average loss: 103.3474
====> Epoch: 24 Average loss: 103.2533
====> Epoch: 25 Average loss: 103.1… [output truncated; epoch 26 not captured]

====> Epoch: 27 Average loss: 102.9715
====> Epoch: 28 Average loss: 102.9075
====> Epoch: 29 Average loss: 102.7751
====> Epoch: 30 Average loss: 102.7350
====> Epoch: 31 Average loss: 102.6339
====> Epoch: 32 Average loss: 102.5770
====> Epoch: 33 Average loss: 102.4864
====> Epoch: 34 Average loss: 102.4352
====> Epoch: 35 Average loss: 102.3785
====> Epoch: 36 Average loss: 102.3329
====> Epoch: 37 Average loss: 102.2667
====> Epoch: 38 Average loss: 102.1989
====> Epoch: 39 Average loss: 102.1340
====> Epoch: 40 Average loss: 102.0654
====> Epoch: 41 Average loss: 102.0114
====> Epoch: 42 Average loss: 101.9591
====> Epoch: 43 Average loss: 101.9087
====> Epoch: 44 Average loss: 101.8665
====> Epoch: 45 Average loss: 101.8298
====> Epoch: 46 Average loss: 101.7452
====> Epoch: 47 Average loss: 101.6860
====> Epoch: 48 Average loss: 101.6223
====> Epoch: 49 Average loss: 101.6462
====> Epoch: 50 Average loss: 101.5912
====> Epoch: 51 Average loss: 101.5342
====> Epoch: 52 Average loss: … [output truncated; epochs 53-54 not captured]

====> Epoch: 55 Average loss: 101.4293
====> Epoch: 56 Average loss: 101.3241
====> Epoch: 57 Average loss: 101.3094
====> Epoch: 58 Average loss: 101.2768
====> Epoch: 59 Average loss: 101.2722
====> Epoch: 60 Average loss: 101.2097
====> Epoch: 61 Average loss: 101.2180
====> Epoch: 62 Average loss: 101.1330
====> Epoch: 63 Average loss: 101.1386
====> Epoch: 64 Average loss: 101.0730
====> Epoch: 65 Average loss: 101.0634
====> Epoch: 66 Average loss: 101.0736
====> Epoch: 67 Average loss: 101.0226
====> Epoch: 68 Average loss: 100.9368
====> Epoch: 69 Average loss: 100.9296
====> Epoch: 70 Average loss: 100.9181
====> Epoch: 71 Average loss: 100.8388
====> Epoch: 72 Average loss: 100.8650
====> Epoch: 73 Average loss: 100.8913
====> Epoch: 74 Average loss: 100.8010
====> Epoch: 75 Average loss: 100.7846
====> Epoch: 76 Average loss: 100.7856
====> Epoch: 77 Average loss: 100.7446
====> Epoch: 78 Average loss: 100.7153
====> Epoch: 79 Average loss: 100.7062
====> Epoch: 80 Average loss: … [output truncated; epochs 81-82 not captured]

====> Epoch: 83 Average loss: 100.5869
====> Epoch: 84 Average loss: 100.5951
====> Epoch: 85 Average loss: 100.5822
====> Epoch: 86 Average loss: 100.5493
====> Epoch: 87 Average loss: 100.5286
====> Epoch: 88 Average loss: 100.5135
====> Epoch: 89 Average loss: 100.4700
====> Epoch: 90 Average loss: 100.4572
====> Epoch: 91 Average loss: 100.4536
====> Epoch: 92 Average loss: 100.4448
====> Epoch: 93 Average loss: 100.4261
====> Epoch: 94 Average loss: 100.3949
====> Epoch: 95 Average loss: 100.3890
====> Epoch: 96 Average loss: 100.4004
====> Epoch: 97 Average loss: 100.3320
====> Epoch: 98 Average loss: 100.3246
====> Epoch: 99 Average loss: 100.3288
