## Import libraries

In [17]:
import torch
import torchvision
from torch import nn
from torch import optim
import torch.nn.functional as F
from torch.autograd import Variable
from torch.utils.data import DataLoader
from torchvision import transforms
from torchvision.utils import save_image
from torchvision.datasets import MNIST
from torchvision import datasets
import os

## Train Autoencoder

In [2]:
if not os.path.exists('./vae_img'):
    os.mkdir('./vae_img')


def to_img(x):
    x = x.clamp(0, 1)
    x = x.view(x.size(0), 1, 28, 28)
    return x


num_epochs = 100
batch_size = 128
learning_rate = 1e-3

img_transform = transforms.Compose([
    transforms.ToTensor()
    # transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
])

dataset = MNIST('./data', transform=img_transform, download=True)
dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=True)


class VAE(nn.Module):
    def __init__(self):
        super(VAE, self).__init__()

        self.fc1 = nn.Linear(784, 400)
        self.fc21 = nn.Linear(400, 20)
        self.fc22 = nn.Linear(400, 20)
        self.fc3 = nn.Linear(20, 400)
        self.fc4 = nn.Linear(400, 784)

    def encode(self, x):
        h1 = F.relu(self.fc1(x))
        return self.fc21(h1), self.fc22(h1)

    def reparametrize(self, mu, logvar):
        std = logvar.mul(0.5).exp_()
        if torch.cuda.is_available():
            eps = torch.cuda.FloatTensor(std.size()).normal_()
        else:
            eps = torch.FloatTensor(std.size()).normal_()
        eps = Variable(eps)
        return eps.mul(std).add_(mu)

    def decode(self, z):
        h3 = F.relu(self.fc3(z))
        return F.sigmoid(self.fc4(h3))

    def forward(self, x):
        mu, logvar = self.encode(x)
        z = self.reparametrize(mu, logvar)
        return self.decode(z), mu, logvar


model = VAE()
if torch.cuda.is_available():
    model.cuda()

reconstruction_function = nn.MSELoss(size_average=False)


def loss_function(recon_x, x, mu, logvar):
    """
    recon_x: generating images
    x: origin images
    mu: latent mean
    logvar: latent log variance
    """
    BCE = reconstruction_function(recon_x, x)  # mse loss
    # loss = 0.5 * sum(1 + log(sigma^2) - mu^2 - sigma^2)
    KLD_element = mu.pow(2).add_(logvar.exp()).mul_(-1).add_(1).add_(logvar)
    KLD = torch.sum(KLD_element).mul_(-0.5)
    # KL divergence
    return BCE + KLD


optimizer = optim.Adam(model.parameters(), lr=1e-3)

for epoch in range(num_epochs):
    model.train()
    train_loss = 0
    for batch_idx, data in enumerate(dataloader):
        img, _ = data
        img = img.view(img.size(0), -1)
        img = Variable(img)
        if torch.cuda.is_available():
            img = img.cuda()
        optimizer.zero_grad()
        recon_batch, mu, logvar = model(img)
        loss = loss_function(recon_batch, img, mu, logvar)
        loss.backward()
        train_loss += loss.data
        optimizer.step()
        if batch_idx % 100 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch,
                batch_idx * len(img),
                len(dataloader.dataset), 100. * batch_idx / len(dataloader),
                loss.data / len(img)))

    print('====> Epoch: {} Average loss: {:.4f}'.format(
        epoch, train_loss / len(dataloader.dataset)))
    if epoch % 10 == 0:
        save = to_img(recon_batch.cpu().data)
        save_image(save, './vae_img/image_{}.png'.format(epoch))

torch.save(model.state_dict(), './vae.pth')

====> Epoch: 0 Average loss: 45.2671
====> Epoch: 1 Average loss: 34.8616
====> Epoch: 2 Average loss: 33.0455
====> Epoch: 3 Average loss: 32.1883
====> Epoch: 4 Average loss: 31.6254
====> Epoch: 5 Average loss: 31.3139
====> Epoch: 6 Average loss: 31.0403
====> Epoch: 7 Average loss: 30.8684
====> Epoch: 8 Average loss: 30.7118
====> Epoch: 9 Average loss: 30.5351
====> Epoch: 10 Average loss: 30.4183
====> Epoch: 11 Average loss: 30.2947
====> Epoch: 12 Average loss: 30.1977
====> Epoch: 13 Average loss: 30.0987
====> Epoch: 14 Average loss: 30.0371
====> Epoch: 15 Average loss: 29.9561
====> Epoch: 16 Average loss: 29.8661
====> Epoch: 17 Average loss: 29.7951
====> Epoch: 18 Average loss: 29.7478
====> Epoch: 19 Average loss: 29.6725
====> Epoch: 20 Average loss: 29.6160
====> Epoch: 21 Average loss: 29.5557
====> Epoch: 22 Average loss: 29.5342
====> Epoch: 23 Average loss: 29.4679
====> Epoch: 24 Average loss: 29.4263
====> Epoch: 25 Average loss: 29.4014
====> Epoch: 26 Averag

====> Epoch: 28 Average loss: 29.2502
====> Epoch: 29 Average loss: 29.2216
====> Epoch: 30 Average loss: 29.1814
====> Epoch: 31 Average loss: 29.1533
====> Epoch: 32 Average loss: 29.1453
====> Epoch: 33 Average loss: 29.0944
====> Epoch: 34 Average loss: 29.0724
====> Epoch: 35 Average loss: 29.0402
====> Epoch: 36 Average loss: 29.0023
====> Epoch: 37 Average loss: 28.9985
====> Epoch: 38 Average loss: 28.9716
====> Epoch: 39 Average loss: 28.9763
====> Epoch: 40 Average loss: 28.9288
====> Epoch: 41 Average loss: 28.9136
====> Epoch: 42 Average loss: 28.9082
====> Epoch: 43 Average loss: 28.8729
====> Epoch: 44 Average loss: 28.8369
====> Epoch: 45 Average loss: 28.8165
====> Epoch: 46 Average loss: 28.8083
====> Epoch: 47 Average loss: 28.8130
====> Epoch: 48 Average loss: 28.7491
====> Epoch: 49 Average loss: 28.7578
====> Epoch: 50 Average loss: 28.7250
====> Epoch: 51 Average loss: 28.7317
====> Epoch: 52 Average loss: 28.7316
====> Epoch: 53 Average loss: 28.6864
====> Epoch:

====> Epoch: 56 Average loss: 28.6577
====> Epoch: 57 Average loss: 28.6252
====> Epoch: 58 Average loss: 28.6294
====> Epoch: 59 Average loss: 28.6291
====> Epoch: 60 Average loss: 28.5834
====> Epoch: 61 Average loss: 28.5803
====> Epoch: 62 Average loss: 28.5684
====> Epoch: 63 Average loss: 28.5605
====> Epoch: 64 Average loss: 28.5305
====> Epoch: 65 Average loss: 28.5173
====> Epoch: 66 Average loss: 28.5280
====> Epoch: 67 Average loss: 28.4794
====> Epoch: 68 Average loss: 28.5116
====> Epoch: 69 Average loss: 28.4760
====> Epoch: 70 Average loss: 28.4794
====> Epoch: 71 Average loss: 28.4662
====> Epoch: 72 Average loss: 28.4597
====> Epoch: 73 Average loss: 28.4325
====> Epoch: 74 Average loss: 28.4311
====> Epoch: 75 Average loss: 28.3988
====> Epoch: 76 Average loss: 28.4251
====> Epoch: 77 Average loss: 28.4052
====> Epoch: 78 Average loss: 28.3748
====> Epoch: 79 Average loss: 28.3682
====> Epoch: 80 Average loss: 28.3640
====> Epoch: 81 Average loss: 28.3632
====> Epoch:

====> Epoch: 84 Average loss: 28.3363
====> Epoch: 85 Average loss: 28.3272
====> Epoch: 86 Average loss: 28.3298
====> Epoch: 87 Average loss: 28.3312
====> Epoch: 88 Average loss: 28.3174
====> Epoch: 89 Average loss: 28.2838
====> Epoch: 90 Average loss: 28.2924
====> Epoch: 91 Average loss: 28.2624
====> Epoch: 92 Average loss: 28.2747
====> Epoch: 93 Average loss: 28.2730
====> Epoch: 94 Average loss: 28.2507
====> Epoch: 95 Average loss: 28.2504
====> Epoch: 96 Average loss: 28.2772
====> Epoch: 97 Average loss: 28.2549
====> Epoch: 98 Average loss: 28.2410
====> Epoch: 99 Average loss: 28.2443


## Use trained model to predict images

In [28]:
IMG_PATH = "D:\\University-Work\CPS040\Main\CPS040-Thesis\Main\Autoencoder\Simple Autoencoder 2\\vae_img\\"
min_img_size = 32
trans = transforms.Compose([transforms.Resize(min_img_size),
                                         transforms.CenterCrop(32),
                                         transforms.ToTensor(),
                                         transforms.Normalize(mean=[0.485, 0.456, 0.406],
                                                              std=[0.229, 0.224, 0.225])])

# # Picture dataset.
# classify_dataset = datasets.ImageFolder(root=IMG_PATH, transform=trans)
# # Create custom random sampler class to iter over dataloader.
# classify_loader = DataLoader(dataset=classify_dataset, batch_size=1, shuffle=True, num_workers=5)

model = torch.load('./vae.pth')

# if cuda is available, move the model to the GPU
# if torch.cuda.is_available():
#     model.cuda()


In [33]:
def to_img(x):
    x = x.clamp(0, 1)
    x = x.view(x.size(0), 1, 28, 28)
    return x
img_transform = transforms.Compose([
    transforms.ToTensor()
    # transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))
])

dataset = MNIST('./data', transform=img_transform, download=True)
dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=True)

# for batch_idx, data in enumerate(dataloader):
#     data

img, _ = data
img = img.view(img.size(0), -1)
img = Variable(img)
if torch.cuda.is_available():
    img = img.cuda()
    
model = torch.load('./vae.pth')
model(data)

TypeError: 'collections.OrderedDict' object is not callable