[View in Colaboratory](https://colab.research.google.com/github/Alfo5123/DisRecGen/blob/master/VAE_baseline_CIFAR10_collab.ipynb)

# <center>VAE-baseline for CIFAR10 </center>

## Load Data

In [1]:
!pip3 install --upgrade torch torchvision

Requirement already up-to-date: torch in /usr/local/lib/python3.6/dist-packages (0.4.0)
Requirement already up-to-date: torchvision in /usr/local/lib/python3.6/dist-packages (0.2.1)
Requirement not upgraded as not directly required: six in /usr/local/lib/python3.6/dist-packages (from torchvision) (1.11.0)
Requirement not upgraded as not directly required: pillow>=4.1.1 in /usr/local/lib/python3.6/dist-packages (from torchvision) (5.1.0)
Requirement not upgraded as not directly required: numpy in /usr/local/lib/python3.6/dist-packages (from torchvision) (1.14.3)


In [0]:
import torch
import torch.nn as nn
from torch import optim
import torch.nn.functional as F
from torch.autograd import Variable

import torchvision
from torchvision import datasets, transforms
import matplotlib.pyplot as plt
from IPython.display import Image
from google.colab import files


In [3]:
# Fix PyTorch's global RNG seed so weight initialisation and sampling are repeatable
torch.manual_seed(seed=512)

<torch._C.Generator at 0x7f96604970f0>

In [4]:
# Fetch the CIFAR10 training split into ./data/cifar/ (downloaded only if missing)
cifar = datasets.CIFAR10(root='./data/cifar/', train=True, download=True)

Files already downloaded and verified


In [0]:
# Serve the CIFAR10 training split as shuffled mini-batches of 32 images.
# The only transform applied is ToTensor(), which yields float tensors scaled
# to [0, 1] -- no [-1, 1] normalisation is performed. That range matches the
# sigmoid output of the decoder and the binary cross-entropy reconstruction loss.
train_images = torch.utils.data.DataLoader(
    datasets.CIFAR10(
        './data/cifar/',
        train=True,
        download=False,
        transform=transforms.Compose([transforms.ToTensor()]),
    ),
    batch_size=32,
    shuffle=True,
)

## Model

We will use the architecture suggested by [Radford et al](https://arxiv.org/abs/1511.06434) for both the encoder and decoder, with convolutional layers in the encoder and fractionally-strided convolutions in the decoder. In each convolutional layer in the encoder we double the number of filters present in the previous layer and use a convolutional stride of 2. In each convolutional layer in the decoder we use a fractional stride of 2 and halve the number of filters on each layer.

In [0]:
class VAE(nn.Module):
    """Convolutional variational autoencoder for 3-channel 32x32 images.

    The encoder is a stack of strided convolutions that reduces a 3x32x32
    image to a 256-channel 1x1 feature map; the decoder mirrors it with
    transposed convolutions. Fully-connected layers map between the 256-d
    feature vector and the latent space.

    Args:
        image_size: Side length of the input images. Stored for reference
            only; the convolution stack is sized for 32x32 inputs.
        hidden_dim: Width of the fully-connected hidden layers.
        encoding_dim: Dimensionality of the latent code z.
    """

    def __init__(self, image_size, hidden_dim, encoding_dim):
        super().__init__()

        self.encoding_dim = encoding_dim
        self.image_size = image_size
        self.hidden_dim = hidden_dim

        # NOTE: the sub-modules are created in the same order as before
        # (decoder, encoder, linear layers) so that a fixed RNG seed yields
        # the same initial weights.

        # Decoder - fractionally-strided convolutions: 1x1 -> 4x4 -> 8x8 -> 16x16 -> 32x32
        self.decoder = nn.Sequential(
            nn.ConvTranspose2d(256, 128, 4, 1, 0, bias=False),
            nn.BatchNorm2d(128),
            nn.ReLU(True),
            nn.ConvTranspose2d(128, 64, 4, 2, 1, bias=False),
            nn.BatchNorm2d(64),
            nn.ReLU(True),
            nn.ConvTranspose2d(64, 32, 4, 2, 1, bias=False),
            nn.BatchNorm2d(32),
            nn.ReLU(True),
            nn.ConvTranspose2d(32, 3, 4, 2, 1, bias=False),
            nn.Sigmoid(),  # pixel values in [0, 1], as required by the BCE loss
        )

        # Encoder - strided convolutions: 32x32 -> 16x16 -> 8x8 -> 4x4 -> 1x1
        self.encoder = nn.Sequential(
            nn.Conv2d(3, 32, 4, 2, 1, bias=False),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Conv2d(32, 64, 4, 2, 1, bias=False),
            nn.BatchNorm2d(64),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Conv2d(64, 128, 4, 2, 1, bias=False),
            nn.BatchNorm2d(128),
            nn.LeakyReLU(0.2, inplace=True),
            nn.Conv2d(128, 256, 4, 2, 0, bias=False),
            nn.Sigmoid(),
        )

        # Fully-connected layers
        self.fc1 = nn.Linear(256, self.hidden_dim)                  # features -> hidden
        self.fc21 = nn.Linear(self.hidden_dim, self.encoding_dim)   # hidden -> mu
        self.fc22 = nn.Linear(self.hidden_dim, self.encoding_dim)   # hidden -> logvar
        self.fc3 = nn.Linear(self.encoding_dim, self.hidden_dim)    # z -> hidden
        self.fc4 = nn.Linear(self.hidden_dim, 256)                  # hidden -> features

    def encode(self, x):
        """Map a batch of images to the parameters of q(z|x).

        Args:
            x: Image batch of shape (batch, 3, 32, 32).

        Returns:
            Tuple (mu, logvar), each of shape (batch, encoding_dim).
        """
        features = self.encoder(x).view(x.size(0), -1)
        hidden = F.relu(self.fc1(features))
        return self.fc21(hidden), self.fc22(hidden)

    def reparameterize(self, mu, logvar):
        """Sample z = mu + eps * std with eps ~ N(0, I) (reparametrization trick)."""
        std = torch.exp(0.5 * logvar)
        eps = torch.randn_like(std)
        # eps.mul(std) is a fresh tensor, so the in-place add is safe
        return eps.mul(std).add_(mu)

    def decode(self, z):
        """Map latent codes of shape (batch, encoding_dim) to images (batch, 3, 32, 32)."""
        h3 = F.relu(self.fc3(z))
        # torch.sigmoid replaces the deprecated F.sigmoid
        h4 = torch.sigmoid(self.fc4(h3))
        # Reshape the 256-d vector to a 256-channel 1x1 map for the decoder
        return self.decoder(h4.view(z.size(0), -1, 1, 1))

    def forward(self, x):
        """Encode, sample a latent code and decode.

        Returns:
            Tuple (decoded, mu, logvar): the reconstruction and the
            parameters of the approximate posterior.
        """
        mu, logvar = self.encode(x)
        z = self.reparameterize(mu, logvar)
        decoded = self.decode(z)
        return decoded, mu, logvar

    
# Reconstruction + KL divergence losses summed over all elements and batch
def loss_function(recon_x, x, mu, logvar):
    """Negative ELBO of the VAE, summed over every element of the batch.

    Args:
        recon_x: Reconstructed images with values in [0, 1].
        x: Target images with values in [0, 1], same shape as `recon_x`.
        mu: Mean of the approximate posterior q(z|x).
        logvar: Log-variance of the approximate posterior q(z|x).

    Returns:
        Scalar tensor: binary cross-entropy reconstruction term plus the
        KL divergence between q(z|x) and the standard normal prior.
    """
    # reduction='sum' replaces the deprecated size_average=False
    BCE = F.binary_cross_entropy(recon_x, x, reduction='sum')
    # Closed form of KL(N(mu, sigma^2) || N(0, I)):
    # -0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    KLD = -0.5 * torch.sum(1 + logvar - mu.pow(2) - logvar.exp())
    return BCE + KLD

In [0]:
#Define model
# Run on the GPU when one is available, otherwise fall back to the CPU
# instead of crashing on a runtime without CUDA.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
model = VAE(image_size=32, hidden_dim=128, encoding_dim=32).to(device)
optimizer = optim.Adam(model.parameters(), lr=1e-3, amsgrad=True)

#Train model
def train(epoch):
    """Train `model` for one pass over `train_images`.

    Relies on the notebook-level `model`, `optimizer`, `train_images` and
    `loss_function`. Prints the per-sample loss of every 50th batch and,
    at the end, the average per-sample loss over the whole dataset.

    Args:
        epoch: Epoch number; used only in the progress messages.
    """
    # Explicitly select training mode so BatchNorm uses batch statistics even
    # if the model was previously switched to evaluation mode.
    model.train()
    # Follow whatever device the model lives on rather than hard-coding CUDA.
    device = next(model.parameters()).device

    train_loss = 0
    for batch_idx, (data, _) in enumerate(train_images):
        # Plain tensors carry autograd state; the Variable wrapper is obsolete.
        data = data.to(device)
        optimizer.zero_grad()
        recon_batch, mu, logvar = model(data)
        loss = loss_function(recon_batch, data, mu, logvar)
        loss.backward()
        train_loss += loss.item()
        optimizer.step()
        if batch_idx % 50 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch, batch_idx * len(data), len(train_images.dataset),
                100. * batch_idx / len(train_images),
                loss.item() / len(data)))

    print('====> Epoch: {} Average loss: {:.4f}'.format(
          epoch, train_loss / len(train_images.dataset)))

In [8]:
# Train for exactly `num_epochs` epochs. Epochs are numbered from 1, so the
# (exclusive) upper bound of range() has to be num_epochs + 1.
num_epochs = 100
for epoch in range(1, num_epochs + 1):
    train(epoch)

====> Epoch: 1 Average loss: 1979.8773


====> Epoch: 2 Average loss: 1939.1848
====> Epoch: 3 Average loss: 1926.0714


====> Epoch: 4 Average loss: 1916.4158
====> Epoch: 5 Average loss: 1907.4472


====> Epoch: 6 Average loss: 1904.7381
====> Epoch: 7 Average loss: 1902.5505


====> Epoch: 8 Average loss: 1901.4407
====> Epoch: 9 Average loss: 1898.7230


====> Epoch: 10 Average loss: 1893.1173
====> Epoch: 11 Average loss: 1886.6467


====> Epoch: 12 Average loss: 1883.5094
====> Epoch: 13 Average loss: 1880.2917


====> Epoch: 14 Average loss: 1875.5095


====> Epoch: 15 Average loss: 1874.3139
====> Epoch: 16 Average loss: 1872.3293


====> Epoch: 17 Average loss: 1868.8188
====> Epoch: 18 Average loss: 1867.1256


====> Epoch: 19 Average loss: 1866.3001
====> Epoch: 20 Average loss: 1865.5692


====> Epoch: 21 Average loss: 1864.9439
====> Epoch: 22 Average loss: 1864.6087


====> Epoch: 23 Average loss: 1863.8588
====> Epoch: 24 Average loss: 1863.5809


====> Epoch: 25 Average loss: 1863.0628
====> Epoch: 26 Average loss: 1862.7750


====> Epoch: 27 Average loss: 1862.5389


====> Epoch: 28 Average loss: 1862.0314
====> Epoch: 29 Average loss: 1861.7043


====> Epoch: 30 Average loss: 1861.4146
====> Epoch: 31 Average loss: 1861.1078


====> Epoch: 32 Average loss: 1861.1230
====> Epoch: 33 Average loss: 1860.4253


====> Epoch: 34 Average loss: 1860.1817
====> Epoch: 35 Average loss: 1860.1901


====> Epoch: 36 Average loss: 1859.8369
====> Epoch: 37 Average loss: 1859.4492


====> Epoch: 38 Average loss: 1859.2117
====> Epoch: 39 Average loss: 1858.6202


====> Epoch: 40 Average loss: 1857.6059


====> Epoch: 41 Average loss: 1856.6367
====> Epoch: 42 Average loss: 1855.9021


====> Epoch: 43 Average loss: 1855.4570
====> Epoch: 44 Average loss: 1855.3299


====> Epoch: 45 Average loss: 1854.9080
====> Epoch: 46 Average loss: 1854.6858


====> Epoch: 47 Average loss: 1854.3482
====> Epoch: 48 Average loss: 1854.1255


====> Epoch: 49 Average loss: 1853.8851
====> Epoch: 50 Average loss: 1853.5070


====> Epoch: 51 Average loss: 1853.5375


====> Epoch: 52 Average loss: 1853.3414
====> Epoch: 53 Average loss: 1853.2820


====> Epoch: 54 Average loss: 1852.7286
====> Epoch: 55 Average loss: 1852.6119


====> Epoch: 56 Average loss: 1852.4871
====> Epoch: 57 Average loss: 1852.3144


====> Epoch: 58 Average loss: 1852.0653
====> Epoch: 59 Average loss: 1851.8642


====> Epoch: 60 Average loss: 1851.8117
====> Epoch: 61 Average loss: 1851.4941


====> Epoch: 62 Average loss: 1851.4741
====> Epoch: 63 Average loss: 1851.2986


====> Epoch: 64 Average loss: 1851.2293


====> Epoch: 65 Average loss: 1851.1225
====> Epoch: 66 Average loss: 1850.8125


====> Epoch: 67 Average loss: 1850.5914
====> Epoch: 68 Average loss: 1850.5599


====> Epoch: 69 Average loss: 1850.3218
====> Epoch: 70 Average loss: 1850.2064


====> Epoch: 71 Average loss: 1850.0402
====> Epoch: 72 Average loss: 1849.8462


====> Epoch: 73 Average loss: 1849.7625
====> Epoch: 74 Average loss: 1849.4475


====> Epoch: 75 Average loss: 1849.2341
====> Epoch: 76 Average loss: 1849.2898


====> Epoch: 77 Average loss: 1849.0215


====> Epoch: 78 Average loss: 1849.0222
====> Epoch: 79 Average loss: 1848.9138


====> Epoch: 80 Average loss: 1848.6917
====> Epoch: 81 Average loss: 1848.6570


====> Epoch: 82 Average loss: 1848.5170
====> Epoch: 83 Average loss: 1848.1289


====> Epoch: 84 Average loss: 1848.0176
====> Epoch: 85 Average loss: 1847.9381


====> Epoch: 86 Average loss: 1847.8430
====> Epoch: 87 Average loss: 1847.6514


====> Epoch: 88 Average loss: 1847.4889
====> Epoch: 89 Average loss: 1847.3716


====> Epoch: 90 Average loss: 1847.3229


====> Epoch: 91 Average loss: 1847.2044
====> Epoch: 92 Average loss: 1846.9648


====> Epoch: 93 Average loss: 1846.9187
====> Epoch: 94 Average loss: 1846.7674


====> Epoch: 95 Average loss: 1846.5767
====> Epoch: 96 Average loss: 1846.5511


====> Epoch: 97 Average loss: 1846.4192
====> Epoch: 98 Average loss: 1846.1208


====> Epoch: 99 Average loss: 1846.1730


In [0]:
# Decode 64 latent codes drawn from the N(0, I) prior, then save and download
# both the model weights and the generated image grid. `epoch` is the value
# left over from the training loop and is only used to name the files.
device = next(model.parameters()).device
was_training = model.training

# Evaluation mode: BatchNorm uses its running statistics rather than the
# statistics of this particular batch of samples, and does not update them.
model.eval()
with torch.no_grad():
    sample = torch.randn(64, model.encoding_dim).to(device)
    sample = model.decode(sample)

checkpoint_path = "./save_checkpoint_epoch_"+str(epoch)+".pth"
sample_path = './sample_' + str(epoch) + '.png'

# model.cpu() moves the parameters in place; put the model back on its
# original device and mode afterwards so later cells keep working.
torch.save(model.cpu().state_dict(), checkpoint_path)
model.to(device)
model.train(was_training)
files.download(checkpoint_path)

torchvision.utils.save_image(sample.view(64, 3, 32, 32), sample_path)
files.download(sample_path)