In [10]:
import torch
import torchvision
from torch import nn
from torch import optim
import torch.nn.functional as F
from torch.autograd import Variable
from torch.utils.data import DataLoader
from torchvision import transforms
from torchvision.utils import save_image
from torchvision.datasets import MNIST
import os

In [11]:
def to_img(x):
    """Convert a batch of flattened outputs into image-shaped tensors.

    Values are clipped to the [0, 1] range, then every row is reshaped to a
    single-channel 28x28 image, so the result has shape (batch, 1, 28, 28).
    """
    batch = x.size(0)
    return x.clamp(min=0, max=1).view(batch, 1, 28, 28)

In [12]:
# Training hyperparameters shared by the cells below.
num_epochs = 10  # number of passes over the dataloader made by the training loop
batch_size = 100  # mini-batch size handed to the DataLoader
learning_rate = 1e-3  # optimizer step size (the Adam optimizer in this notebook runs at this value)

In [13]:
# Per-sample preprocessing: only the conversion to a tensor is applied.
# A Normalize step had been sketched here but is left disabled, so no
# mean/std normalisation happens.
img_transform = transforms.Compose([transforms.ToTensor()])

In [14]:
# MNIST is stored under ./data (downloaded on first use); every sample goes
# through `img_transform`. Batches are reshuffled on each pass.
dataset = MNIST(root='./data', transform=img_transform, download=True)
dataloader = DataLoader(dataset=dataset, batch_size=batch_size, shuffle=True)

In [15]:
class VAE(nn.Module):
    """Fully connected variational autoencoder for flattened 28x28 images.

    Encoder: 784 -> 400 (ReLU) -> two heads of size 20 (mean and
    log-variance of the latent Gaussian).
    Decoder: 20 -> 400 (ReLU) -> 784, returned without an output activation.
    """

    def __init__(self):
        super(VAE, self).__init__()

        self.fc1 = nn.Linear(784, 400)   # shared encoder hidden layer
        self.fc21 = nn.Linear(400, 20)   # latent mean head
        self.fc22 = nn.Linear(400, 20)   # latent log-variance head
        self.fc3 = nn.Linear(20, 400)    # decoder hidden layer
        self.fc4 = nn.Linear(400, 784)   # decoder output layer

    def encode(self, x):
        """Map a (batch, 784) input to the pair (mu, logvar), each (batch, 20)."""
        h1 = F.relu(self.fc1(x))
        return self.fc21(h1), self.fc22(h1)

    def reparametrize(self, mu, logvar):
        """Sample z = mu + eps * std with eps ~ N(0, I).

        The noise is drawn with ``torch.randn_like`` so that it always has the
        same device and dtype as ``logvar``. Choosing the device from
        ``torch.cuda.is_available()`` breaks whenever CUDA exists but the
        model/inputs are kept on the CPU.
        """
        std = torch.exp(0.5 * logvar)
        eps = torch.randn_like(std)
        return mu + eps * std

    def decode(self, z):
        """Map latent codes (batch, 20) to raw reconstructions (batch, 784).

        No sigmoid is applied, so the outputs are unbounded.
        """
        h3 = F.relu(self.fc3(z))
        return self.fc4(h3)

    def forward(self, x):
        """Return (reconstruction, mu, logvar) for a batch of flattened images."""
        mu, logvar = self.encode(x)
        z = self.reparametrize(mu, logvar)
        return self.decode(z), mu, logvar
    
    

In [1]:
class VAE(nn.Module):
    """Variational autoencoder with a deeper, ``nn.Sequential`` encoder.

    Encoder: 784 -> 400 -> 200 -> 100 -> 20 (ReLU between layers), followed by
    two linear heads producing the mean and log-variance of the latent code.
    Decoder: latent_dim -> 400 (ReLU) -> 784, without an output activation.

    Args:
        latent_dim: size of the latent code (default 20).
    """

    def __init__(self, latent_dim=20):
        super(VAE, self).__init__()

        # Each layer's input width must equal the previous layer's output width.
        self.encoder = nn.Sequential(
            nn.Linear(784, 400),
            nn.ReLU(),
            nn.Linear(400, 200),
            nn.ReLU(),
            nn.Linear(200, 100),
            nn.ReLU(),
            nn.Linear(100, 20)
        )

        self.em = nn.Linear(20, latent_dim)  # mu layer
        self.ev = nn.Linear(20, latent_dim)  # logvariance layer

        # Decoder layers used by `decode`.
        self.fc3 = nn.Linear(latent_dim, 400)
        self.fc4 = nn.Linear(400, 784)

    def encode(self, x):
        """Map a (batch, 784) input to (mu, logvar), each (batch, latent_dim)."""
        h1 = self.encoder(x)
        mu = self.em(h1)
        logvar = self.ev(h1)
        return mu, logvar

    def reparametrize(self, mu, logvar):
        """Sample z = mu + eps * std with eps ~ N(0, I).

        ``torch.randn_like`` keeps the noise on the same device and dtype as
        ``logvar`` regardless of whether CUDA happens to be installed.
        """
        std = torch.exp(0.5 * logvar)
        eps = torch.randn_like(std)
        return mu + eps * std

    def decode(self, z):
        """Map latent codes (batch, latent_dim) to raw reconstructions (batch, 784)."""
        h3 = F.relu(self.fc3(z))
        return self.fc4(h3)

    def forward(self, x):
        """Return (reconstruction, mu, logvar) for a batch of flattened images."""
        mu, logvar = self.encode(x)
        z = self.reparametrize(mu, logvar)
        return self.decode(z), mu, logvar

NameError: name 'nn' is not defined

In [25]:
# Train the model for `num_epochs` passes over `dataloader`.
# Inputs are sent to whatever device the model's parameters live on, rather
# than guessing from torch.cuda.is_available().
device = next(model.parameters()).device
for epoch in range(num_epochs):
    model.train()
    train_loss = 0.0  # summed loss over the epoch, kept as a plain Python float
    for batch_idx, data in enumerate(dataloader):
        img, _ = data  # labels are not used
        img = img.view(img.size(0), -1).to(device)  # flatten each image to one row
        optimizer.zero_grad()
        recon_batch, mu, logvar = model(img)
        loss = loss_function(recon_batch, img, mu, logvar)
        loss.backward()
        optimizer.step()
        # .item() extracts the scalar so no tensor is carried across iterations.
        batch_loss = loss.item()
        train_loss += batch_loss
        if batch_idx % 100 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch,
                batch_idx * len(img),
                len(dataloader.dataset), 100. * batch_idx / len(dataloader),
                batch_loss / len(img)))

    # The loss is a sum over samples, so dividing by the dataset size gives a
    # per-sample average for the epoch.
    print('====> Epoch: {} Average loss: {:.4f}'.format(
        epoch, train_loss / len(dataloader.dataset)))
    #if epoch % 10 == 0:
    #    save = to_img(recon_batch.cpu().data)
    #    save_image(save, './vae_img/image_{}.png'.format(epoch))

#torch.save(model.state_dict(), './vae.pth')



====> Epoch: 0 Average loss: 31.6393
====> Epoch: 1 Average loss: 31.4908
====> Epoch: 2 Average loss: 31.4310
====> Epoch: 3 Average loss: 31.3013
====> Epoch: 4 Average loss: 31.2201
====> Epoch: 5 Average loss: 31.1426
====> Epoch: 6 Average loss: 31.0446
====> Epoch: 7 Average loss: 30.9955
====> Epoch: 8 Average loss: 30.9269
====> Epoch: 9 Average loss: 30.8848


In [16]:
# Instantiate the VAE and place it on the GPU when CUDA is usable;
# otherwise it stays on the CPU.
model = VAE()
model = model.cuda() if torch.cuda.is_available() else model

In [17]:
# Squared error summed (not averaged) over every element of the batch.
# `reduction='sum'` replaces the deprecated `size_average=False` spelling.
reconstruction_function = nn.MSELoss(reduction='sum')



In [18]:
def loss_function(recon_x, x, mu, logvar):
    """
    VAE objective: summed reconstruction error plus KL divergence.

    recon_x: generating images
    x: origin images
    mu: latent mean
    logvar: latent log variance

    Returns a scalar tensor. Both terms are sums over the whole batch.
    """
    # Reconstruction term is a summed squared error (MSE), computed with the
    # functional API so this function does not depend on module-level state.
    recon_loss = F.mse_loss(recon_x, x, reduction='sum')
    # KL divergence to a standard normal:
    # KLD = -0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    kld = -0.5 * torch.sum(1 + logvar - mu.pow(2) - logvar.exp())
    return recon_loss + kld


def vae_loss(x, x_hat, mu, logvar):
    """VAE objective: summed reconstruction error plus KL divergence.

    x: original images
    x_hat: reconstructed images
    mu: latent mean
    logvar: latent log variance

    Returns a scalar tensor. Both terms are sums over the whole batch.
    """
    # Summed squared error. The functional form avoids building a new loss
    # module on every call and the deprecated `size_average` argument.
    recon_loss = F.mse_loss(x_hat, x, reduction='sum')
    # KLD = -0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    kld = -0.5 * torch.sum(1 + logvar - mu.pow(2) - logvar.exp())
    return recon_loss + kld

In [19]:
def loss_function(x_hat, x, mu, logvar):
    """VAE objective: summed reconstruction error plus KL divergence.

    x_hat: reconstructed images
    x: original images
    mu: latent mean
    logvar: latent log variance

    Returns a scalar tensor. Both terms are sums over the whole batch.
    """
    # Summed squared error. The functional form avoids building a new loss
    # module on every call and the deprecated `size_average` argument.
    recon_loss = F.mse_loss(x_hat, x, reduction='sum')
    # KLD = -0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    kld = -0.5 * torch.sum(1 + logvar - mu.pow(2) - logvar.exp())
    return recon_loss + kld

In [20]:
# Adam over all model parameters; the step size comes from the `learning_rate`
# hyperparameter instead of a second hard-coded copy of the same value.
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

In [26]:
# Sanity check on a single batch: save the inputs and run one forward pass.
# Take only the first (index, batch) pair from the loader.
batch_idx, data = next(enumerate(dataloader))
img, _ = data  # labels are not used
img = img.view(img.size(0), -1)  # flatten each image to one row
# The model may have been moved to the GPU; feed it inputs on the same device.
img = img.to(next(model.parameters()).device)

#img
save_before = to_img(img.cpu().data)
save_image(save_before, 'image_before{}.png'.format(0))

# Inference only: one forward pass is enough and no gradients are needed.
with torch.no_grad():
    recon_batch, mu, logvar = model(img)

In [27]:
# Write the reconstructions of the batch to disk: move them to the CPU,
# clip/reshape them with to_img, and save them as a single image file.
save_after = to_img(recon_batch.cpu().data)
save_image(save_after, 'image_after{}.png'.format(0))

In [21]:
# Train the model for `num_epochs` passes over `dataloader`.
# Inputs are sent to whatever device the model's parameters live on, rather
# than guessing from torch.cuda.is_available().
device = next(model.parameters()).device
for epoch in range(num_epochs):
    model.train()
    train_loss = 0.0  # summed loss over the epoch, kept as a plain Python float
    for batch_idx, data in enumerate(dataloader):
        img, _ = data  # labels are not used
        img = img.view(img.size(0), -1).to(device)  # flatten each image to one row
        optimizer.zero_grad()
        recon_batch, mu, logvar = model(img)
        loss = loss_function(recon_batch, img, mu, logvar)
        loss.backward()
        optimizer.step()
        # .item() extracts the scalar so no tensor is carried across iterations.
        batch_loss = loss.item()
        train_loss += batch_loss
        if batch_idx % 100 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch,
                batch_idx * len(img),
                len(dataloader.dataset), 100. * batch_idx / len(dataloader),
                batch_loss / len(img)))

    # The loss is a sum over samples, so dividing by the dataset size gives a
    # per-sample average for the epoch.
    print('====> Epoch: {} Average loss: {:.4f}'.format(
        epoch, train_loss / len(dataloader.dataset)))
    #if epoch % 10 == 0:
    #    save = to_img(recon_batch.cpu().data)
    #    save_image(save, './vae_img/image_{}.png'.format(epoch))

#torch.save(model.state_dict(), './vae.pth')



====> Epoch: 0 Average loss: 41.2877
====> Epoch: 1 Average loss: 34.9482
====> Epoch: 2 Average loss: 33.9798
====> Epoch: 3 Average loss: 33.3849
====> Epoch: 4 Average loss: 32.9356
====> Epoch: 5 Average loss: 32.5814
====> Epoch: 6 Average loss: 32.3406
====> Epoch: 7 Average loss: 32.0923
====> Epoch: 8 Average loss: 31.9354
====> Epoch: 9 Average loss: 31.7456
