In [34]:
import os
os.environ['CUDA_DEVICE_ORDER']='PCI_BUS_ID'
os.environ['CUDA_VISIBLE_DEVICES']='0'

In [35]:
import torch
import torch.nn as nn
import torch.nn.functional as F

import numpy as np
import random
import torchvision.datasets as datasets
import torchvision.transforms as transforms
import torchvision

import torch.optim as optim
from torchvision import datasets, transforms
from torch.autograd import Variable
from torchvision.utils import save_image


In [36]:
bs = 128

train_dataset = datasets.MNIST(root='./mnist_data/', train=True, transform=transforms.ToTensor(), download=True)
test_dataset = datasets.MNIST(root='./mnist_data/', train=False, transform=transforms.ToTensor(), download=False)

train_loader = torch.utils.data.DataLoader(dataset=train_dataset, batch_size=bs, shuffle=True)
test_loader = torch.utils.data.DataLoader(dataset=test_dataset, batch_size=bs, shuffle=False)

In [37]:
def train(epoch, device, weight):
    vae.train()
    train_loss = 0
    for batch_idx, (data, _) in enumerate(train_loader):
        data = data.to(device)
        optimizer.zero_grad()
        
        recon_batch, mu, log_var = vae(data)
        loss = loss_function(recon_batch, data, mu, log_var, weight)
        
        loss.backward()
        train_loss += loss.item()
        optimizer.step()
        
        if batch_idx % 100 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch, batch_idx * len(data), len(train_loader.dataset),
                100. * batch_idx / len(train_loader), loss.item() / len(data)))
    print('====> Epoch: {} Average loss: {:.4f}'.format(epoch, train_loss / len(train_loader.dataset)))

In [38]:
def test(device, weight):
    vae.eval()
    test_loss= 0
    with torch.no_grad():
        for data, _ in test_loader:
            data = data.to(device)
            recon, mu, log_var = vae(data)
            
            # sum up batch loss
            test_loss += loss_function(recon, data, mu, log_var, weight).item()
        
    test_loss /= len(test_loader.dataset)
    print('====> Test set loss: {:.4f}'.format(test_loss))

# Task 1: Design the autoencoder structured network for MNIST

In [39]:
# YOUR CODE!!

class VAE(nn.Module):
    def __init__(self, x_dim, h_dim1, h_dim2, z_dim):
        super(VAE, self).__init__()
        
        # encoder part
        
        #############################################################
    
        # YOUR CODE!!
        self.fc1 = nn.Linear(x_dim, h_dim1)
        self.fc2 = nn.Linear(h_dim1, h_dim2)
        self.fc3_1 = nn.Linear(h_dim2, z_dim)
        self.fc3_2 = nn.Linear(h_dim2, z_dim)

        #############################################################
        
        
        # decoder part
        
        #############################################################
    
        # YOUR CODE!!
        self.fc4 = nn.Linear(z_dim, h_dim2)
        self.fc5 = nn.Linear(h_dim2, h_dim1)
        self.fc6 = nn.Linear(h_dim1, x_dim)
        #############################################################
        
        
    def encoder(self, x):
        # return mu, log_var
        
        #############################################################
    
        # YOUR CODE!!
        h = F.relu(self.fc1(x))
        h = F.relu(self.fc2(h))
        return self.fc3_1(h), self.fc3_2(h) # mu, log_var
        #############################################################
    
    def sampling(self, mu, log_var):
        # return z sample
        
        #############################################################
    
        # YOUR CODE!!
        std = torch.exp(0.5*log_var)
        eps = torch.randn_like(std)
        return eps.mul(std).add_(mu) # return z sample
        #############################################################
        
    def decoder(self, z):
        # return generated img
        
        #############################################################
    
        # YOUR CODE!!
        h = F.relu(self.fc4(z))
        h = F.relu(self.fc5(h))
        return F.sigmoid(self.fc6(h))
        #############################################################
    
    def forward(self, x):
        mu, log_var = self.encoder(x.view(-1, 784))
        z = self.sampling(mu, log_var)
        return self.decoder(z), mu, log_var

In [40]:
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
device

device(type='cuda')

In [41]:
vae = VAE(x_dim=784, h_dim1= 512, h_dim2=256, z_dim=50)
if torch.cuda.is_available():
    vae.to(device)

In [42]:
vae

VAE(
  (fc1): Linear(in_features=784, out_features=512, bias=True)
  (fc2): Linear(in_features=512, out_features=256, bias=True)
  (fc3_1): Linear(in_features=256, out_features=50, bias=True)
  (fc3_2): Linear(in_features=256, out_features=50, bias=True)
  (fc4): Linear(in_features=50, out_features=256, bias=True)
  (fc5): Linear(in_features=256, out_features=512, bias=True)
  (fc6): Linear(in_features=512, out_features=784, bias=True)
)

# Task 2: Design the loss function for autoencoder with weight of KLD term

In [44]:
optimizer = optim.Adam(vae.parameters())

# #Without weight term

In [16]:

def loss_function(recon_x, x, mu, log_var, weight):
    # return reconstruction error + KL divergence losses
    
    #############################################################
    
    # YOUR CODE!!
    BCE = F.binary_cross_entropy(recon_x, x.view(-1, 784), reduction='sum')
    KLD = -0.5 * torch.sum(1 + log_var - mu.pow(2) - log_var.exp())
    return BCE + KLD
    #############################################################
    
    pass

In [17]:
from tqdm.autonotebook import tqdm

for epoch in tqdm(range(1, 51)):
    train(epoch, device, weight)
    test(device, weight)

HBox(children=(FloatProgress(value=0.0, max=50.0), HTML(value='')))



====> Epoch: 1 Average loss: 182.2670
====> Test set loss: 145.4146
====> Epoch: 2 Average loss: 134.3210
====> Test set loss: 125.1247
====> Epoch: 3 Average loss: 120.3644
====> Test set loss: 116.5673
====> Epoch: 4 Average loss: 114.8764
====> Test set loss: 112.1863
====> Epoch: 5 Average loss: 111.6404
====> Test set loss: 109.5952
====> Epoch: 6 Average loss: 109.4455
====> Test set loss: 107.8552
====> Epoch: 7 Average loss: 107.9190
====> Test set loss: 107.1804
====> Epoch: 8 Average loss: 106.6841
====> Test set loss: 105.9575
====> Epoch: 9 Average loss: 105.7612
====> Test set loss: 105.3365
====> Epoch: 10 Average loss: 104.9911
====> Test set loss: 104.6850
====> Epoch: 11 Average loss: 104.2200
====> Test set loss: 103.9184
====> Epoch: 12 Average loss: 103.4692
====> Test set loss: 103.2628
====> Epoch: 13 Average loss: 102.8044
====> Test set loss: 102.5894
====> Epoch: 14 Average loss: 102.3491
====> Test set loss: 102.3423
====> Epoch: 15 Average loss: 101.9024
====

====> Epoch: 26 Average loss: 99.0468
====> Test set loss: 100.1467
====> Epoch: 27 Average loss: 98.8758
====> Test set loss: 100.1053
====> Epoch: 28 Average loss: 98.7179
====> Test set loss: 99.9514
====> Epoch: 29 Average loss: 98.5609
====> Test set loss: 99.9086
====> Epoch: 30 Average loss: 98.4960
====> Test set loss: 99.8539
====> Epoch: 31 Average loss: 98.3548
====> Test set loss: 99.9583
====> Epoch: 32 Average loss: 98.2426
====> Test set loss: 99.8958
====> Epoch: 33 Average loss: 98.1405
====> Test set loss: 99.5314
====> Epoch: 34 Average loss: 97.9777
====> Test set loss: 99.6461
====> Epoch: 35 Average loss: 97.9503
====> Test set loss: 99.4080
====> Epoch: 36 Average loss: 97.8976
====> Test set loss: 99.5897
====> Epoch: 37 Average loss: 97.8074
====> Test set loss: 99.4181
====> Epoch: 38 Average loss: 97.6307
====> Test set loss: 99.1856
====> Epoch: 39 Average loss: 97.6076
====> Test set loss: 99.1253
====> Epoch: 40 Average loss: 97.5239
====> Test set loss: 9

# #With weight term

In [45]:
def loss_function(recon_x, x, mu, log_var, weight):
    # return reconstruction error + weight * KL divergence losses
    
    #############################################################
    
    # YOUR CODE!!
    BCE = F.binary_cross_entropy(recon_x, x.view(-1, 784), reduction='sum')
    KLD = -0.5 * torch.sum(1 + log_var - mu.pow(2) - log_var.exp())
    return BCE + weight*KLD
    #############################################################
    
    pass

In [46]:

# YOU HAVE TO CONTROL THE "weight" Variable!

###############################################

weight = 0.7 # change the value,

###############################################

for epoch in tqdm(range(1, 51)):
    train(epoch, device, weight)
    test(device, weight)

HBox(children=(FloatProgress(value=0.0, max=50.0), HTML(value='')))

====> Epoch: 1 Average loss: 177.5859
====> Test set loss: 137.9021
====> Epoch: 2 Average loss: 124.8393
====> Test set loss: 114.1375
====> Epoch: 3 Average loss: 111.1574
====> Test set loss: 106.9192
====> Epoch: 4 Average loss: 106.1756
====> Test set loss: 103.3382
====> Epoch: 5 Average loss: 102.6439
====> Test set loss: 100.8953
====> Epoch: 6 Average loss: 100.5310
====> Test set loss: 99.4027
====> Epoch: 7 Average loss: 99.0497
====> Test set loss: 97.9786
====> Epoch: 8 Average loss: 97.9548
====> Test set loss: 97.3842
====> Epoch: 9 Average loss: 97.0493
====> Test set loss: 96.3237
====> Epoch: 10 Average loss: 96.3197
====> Test set loss: 96.1948
====> Epoch: 11 Average loss: 95.6684
====> Test set loss: 95.4801
====> Epoch: 12 Average loss: 95.0806
====> Test set loss: 95.0970
====> Epoch: 13 Average loss: 94.5158
====> Test set loss: 94.7249
====> Epoch: 14 Average loss: 94.0908
====> Test set loss: 94.5079
====> Epoch: 15 Average loss: 93.7625
====> Test set loss: 9

====> Epoch: 26 Average loss: 91.4013
====> Test set loss: 92.7872
====> Epoch: 27 Average loss: 91.3030
====> Test set loss: 92.4349
====> Epoch: 28 Average loss: 91.1649
====> Test set loss: 92.6114
====> Epoch: 29 Average loss: 91.0124
====> Test set loss: 92.5491
====> Epoch: 30 Average loss: 90.9459
====> Test set loss: 92.3290
====> Epoch: 31 Average loss: 90.8264
====> Test set loss: 92.2155
====> Epoch: 32 Average loss: 90.7647
====> Test set loss: 92.3680
====> Epoch: 33 Average loss: 90.6174
====> Test set loss: 92.1141
====> Epoch: 34 Average loss: 90.5020
====> Test set loss: 92.3468
====> Epoch: 35 Average loss: 90.4450
====> Test set loss: 92.2921
====> Epoch: 36 Average loss: 90.3640
====> Test set loss: 92.0730
====> Epoch: 37 Average loss: 90.3156
====> Test set loss: 92.0582
====> Epoch: 38 Average loss: 90.2183
====> Test set loss: 91.9141
====> Epoch: 39 Average loss: 90.1002
====> Test set loss: 91.9501
====> Epoch: 40 Average loss: 90.0487
====> Test set loss: 91.

Convergence with weight = 0.7 is faster than no weight

# Task 3

In [47]:
with torch.no_grad():
    
    #########################################################
    
    # YOUR CODE!!
    
    
    #########################################################
    
            
    z = torch.tensor(z).to(device)
    sample = vae.decoder(z.float())
    
    if not os.exists('./samples'):
        os.makedirs('./samples')
    
    save_image(sample.view(64, 1, 28, 28), './samples/sample' + '.png')

NameError: name 'z' is not defined

In [63]:
with torch.no_grad():
    
    #########################################################
    
    # YOUR CODE!!
    z = torch.randn(64, 50).to(device)
    sample = vae.decoder(z).to(device)
    
    
    #########################################################
    
            
    #z = torch.tensor(z).to(device)
    #sample = vae.decoder(z.float())
    
    if not os.path.exists('./samples'):
        os.makedirs('./samples')
    
    save_image(sample.view(64, 1, 28, 28), './samples/sample_50D' + '.png')