In [None]:
import torch
import torchvision

from torch import nn, optim
from torchvision import transforms
from torch.autograd import Variable
from torchvision.utils import save_image
from torch.utils.data import DataLoader, Dataset

import os
import pylab
import numpy as np
import matplotlib.pyplot as plt

In [None]:
# Mount Google Drive into the Colab runtime at /content/drive.
from google.colab import drive
drive.mount('/content/drive')

# Switch the working directory to the project folder on Drive (relative paths
# used afterwards resolve against it), then list what is in that folder.
%cd /content/drive/My Drive/Colab Notebooks/Poatek/GAN
%ls -lah

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).
/content/drive/My Drive/Colab Notebooks/Poatek/GAN
total 36K
-rw------- 1 root root  28K Sep 11 12:59 DCGAN_train.ipynb
drwx------ 2 root root 4.0K Sep 11 12:40 [0m[01;34msamples[0m/
drwx------ 2 root root 4.0K Sep 11 12:40 [01;34msave[0m/


In [None]:
# Hyper-parameters
latent_size = 64        # length of the noise vector fed to the generator
hidden_size = 256       # width of the hidden linear layers
image_size = 28 * 28    # one flattened 28x28 image (784 values)
num_epochs = 300
batch_size = 32

# Output folders (relative to the current working directory)
sample_dir = 'samples'
save_dir = 'save'

In [None]:
# Discriminator: flattened image -> single sigmoid score in (0, 1)
discriminator_layers = [
    nn.Linear(image_size, hidden_size),
    nn.LeakyReLU(0.2),
    nn.Linear(hidden_size, hidden_size),
    nn.LeakyReLU(0.2),
    nn.Linear(hidden_size, 1),
    nn.Sigmoid(),
]
D = nn.Sequential(*discriminator_layers)

# Generator: latent vector -> flattened image with values in (-1, 1) via Tanh
generator_layers = [
    nn.Linear(latent_size, hidden_size),
    nn.ReLU(),
    nn.Linear(hidden_size, hidden_size),
    nn.ReLU(),
    nn.Linear(hidden_size, image_size),
    nn.Tanh(),
]
G = nn.Sequential(*generator_layers)

In [None]:
# Create the output directories.
# exist_ok=True turns the call into a no-op when the directory is already
# there, which removes the separate (and racy) os.path.exists check.
for output_dir in (sample_dir, save_dir):
    os.makedirs(output_dir, exist_ok=True)

In [None]:
# Image processing: ToTensor yields values in [0, 1]; normalising with
# mean=0.5 / std=0.5 rescales them to [-1, 1], the range of the generator's
# Tanh output. MNIST images have one channel, so the per-channel statistics
# are one-element tuples -- note the trailing comma: `(0.5)` is just a float.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=(0.5,), std=(0.5,)),
])

# MNIST dataset (training split, downloaded into `root` when missing)
mnist = torchvision.datasets.MNIST(root='/content/drive/My Drive/Datasets/mnist_pytorch',
                                   train=True,
                                   transform=transform,
                                   download=True)

# Data loader: reshuffled mini-batches of `batch_size` images
train_loader = DataLoader(dataset=mnist,
                          batch_size=batch_size,
                          shuffle=True)

# Number of mini-batches per epoch
print(len(train_loader))

1875


In [None]:
# Pick the GPU when one is usable, otherwise fall back to the CPU.
# torch.cuda.is_available has to be *called*: the bare function object is
# always truthy, which would select "cuda" even on a machine without a GPU.
device = "cuda" if torch.cuda.is_available() else "cpu"
print(f"We're about to train it on {device.upper()}")

# Device setting: move both networks to the selected device
D = D.to(device)
G = G.to(device)

We're about to train it on CUDA


In [None]:
# Loss and optimizers: binary cross-entropy on the discriminator's output,
# and a separate Adam optimizer (learning rate 2e-4) for each network
criterion = nn.BCELoss()
d_optimizer = optim.Adam(D.parameters(), lr=2e-4)
g_optimizer = optim.Adam(G.parameters(), lr=2e-4)

In [None]:
def denorm(x):
    """Undo the [-1, 1] normalisation.

    Computes (x + 1) / 2 and clamps the result to the [0, 1] interval.
    The input is not modified.
    """
    return ((x + 1) / 2).clamp(min=0, max=1)

def reset_grad():
    """Zero the gradients held by both optimizers (discriminator first, then generator)."""
    for optimizer in (d_optimizer, g_optimizer):
        optimizer.zero_grad()

In [None]:
# Statistics to be saved: one running mean per epoch (entries of epochs that
# have not run yet stay at zero)
d_losses = np.zeros(num_epochs)
g_losses = np.zeros(num_epochs)
real_scores = np.zeros(num_epochs)
fake_scores = np.zeros(num_epochs)


def _save_curves(path, curves, ylim=None):
    """Plot per-epoch curves and write the figure to `path`.

    `curves` is an iterable of (values, label) pairs; every `values` array has
    `num_epochs` entries and is drawn against the 1-based epoch index.
    `ylim`, when given, is a (low, high) pair for the y axis.
    """
    plt.figure()
    plt.xlim(0, num_epochs + 1)
    if ylim is not None:
        plt.ylim(*ylim)
    epoch_axis = range(1, num_epochs + 1)
    for values, label in curves:
        plt.plot(epoch_axis, values, label=label)
    plt.legend()
    plt.savefig(path)
    plt.close()  # figures are created every epoch; close them to free memory


# Start training
total_step = len(train_loader)
for epoch in range(num_epochs):
    for i, (images, _) in enumerate(train_loader):
        # Use the size of *this* batch rather than the configured batch_size:
        # the last batch of an epoch is smaller whenever the dataset size is
        # not a multiple of batch_size, and a fixed-size view would fail.
        current_batch = images.size(0)
        images = images.view(current_batch, -1).to(device)

        # Create the labels which are later used as input for the BCE loss
        real_labels = torch.ones(current_batch, 1, device=device)
        fake_labels = torch.zeros(current_batch, 1, device=device)

        # ================================================================== #
        #                      Train the discriminator                       #
        # ================================================================== #

        # Compute BCE_Loss using real images where BCE_Loss(x, y): - y * log(D(x)) - (1-y) * log(1 - D(x))
        # Second term of the loss is always zero since real_labels == 1
        outputs = D(images)
        d_loss_real = criterion(outputs, real_labels)
        real_score = outputs

        # Compute BCELoss using fake images
        # First term of the loss is always zero since fake_labels == 0
        z = torch.randn(current_batch, latent_size, device=device)
        # detach(): only D is updated in this step, so there is no need to
        # backpropagate the discriminator loss through the generator.
        fake_images = G(z).detach()
        outputs = D(fake_images)
        d_loss_fake = criterion(outputs, fake_labels)
        fake_score = outputs

        # Backprop and optimize
        d_loss = d_loss_real + d_loss_fake
        reset_grad()
        d_loss.backward()
        d_optimizer.step()

        # ================================================================== #
        #                        Train the generator                         #
        # ================================================================== #

        # Compute loss with fake images
        z = torch.randn(current_batch, latent_size, device=device)
        fake_images = G(z)
        outputs = D(fake_images)

        # We train G to maximize log(D(G(z)) instead of minimizing log(1-D(G(z)))
        # For the reason, see the last paragraph of section 3. https://arxiv.org/pdf/1406.2661.pdf
        g_loss = criterion(outputs, real_labels)

        # Backprop and optimize
        reset_grad()
        g_loss.backward()
        g_optimizer.step()

        # =================================================================== #
        #                          Update Statistics                          #
        # =================================================================== #
        d_loss_value = d_loss.item()
        g_loss_value = g_loss.item()
        real_score_value = real_score.mean().item()
        fake_score_value = fake_score.mean().item()

        # Incremental mean over the batches seen so far in this epoch:
        # new_mean = old_mean * i/(i+1) + value * 1/(i+1)
        keep, add = i / (i + 1.), 1. / (i + 1.)
        d_losses[epoch] = d_losses[epoch] * keep + d_loss_value * add
        g_losses[epoch] = g_losses[epoch] * keep + g_loss_value * add
        real_scores[epoch] = real_scores[epoch] * keep + real_score_value * add
        fake_scores[epoch] = fake_scores[epoch] * keep + fake_score_value * add

        if (i + 1) % 200 == 0:
            # Epoch is reported 1-based, consistent with the step counter and
            # with the file names written below.
            print('Epoch [{}/{}], Step [{}/{}], d_loss: {:.4f}, g_loss: {:.4f}, D(x): {:.2f}, D(G(z)): {:.2f}'
                  .format(epoch + 1, num_epochs, i + 1, total_step, d_loss_value, g_loss_value,
                          real_score_value, fake_score_value))

    # Save real images (last batch of the first epoch only, as a reference)
    if epoch == 0:
        images = images.view(images.size(0), 1, 28, 28)
        save_image(denorm(images.detach()), os.path.join(sample_dir, 'real_images.png'))

    # Save sampled images (the last generated batch of this epoch)
    fake_images = fake_images.view(fake_images.size(0), 1, 28, 28)
    save_image(denorm(fake_images.detach()), os.path.join(sample_dir, 'fake_images-{}.png'.format(epoch + 1)))

    # Save and plot Statistics
    np.save(os.path.join(save_dir, 'd_losses.npy'), d_losses)
    np.save(os.path.join(save_dir, 'g_losses.npy'), g_losses)
    np.save(os.path.join(save_dir, 'fake_scores.npy'), fake_scores)
    np.save(os.path.join(save_dir, 'real_scores.npy'), real_scores)

    _save_curves(os.path.join(save_dir, 'loss.pdf'),
                 [(d_losses, 'd loss'), (g_losses, 'g loss')])
    _save_curves(os.path.join(save_dir, 'accuracy.pdf'),
                 [(fake_scores, 'fake score'), (real_scores, 'real score')],
                 ylim=(0, 1))

    # Save model at checkpoints
    if (epoch + 1) % 50 == 0:
        torch.save(G.state_dict(), os.path.join(save_dir, 'G--{}.pth'.format(epoch + 1)))
        torch.save(D.state_dict(), os.path.join(save_dir, 'D--{}.pth'.format(epoch + 1)))

Epoch [0/300], Step [200/1875], d_loss: 0.0531, g_loss: 4.2382, D(x): 1.00, D(G(z)): 0.05
Epoch [0/300], Step [400/1875], d_loss: 0.1349, g_loss: 5.0713, D(x): 0.95, D(G(z)): 0.05
Epoch [0/300], Step [600/1875], d_loss: 0.0389, g_loss: 5.8919, D(x): 0.98, D(G(z)): 0.02
Epoch [0/300], Step [800/1875], d_loss: 0.1266, g_loss: 5.0103, D(x): 0.98, D(G(z)): 0.09
Epoch [0/300], Step [1000/1875], d_loss: 0.0420, g_loss: 4.7659, D(x): 0.99, D(G(z)): 0.03
Epoch [0/300], Step [1200/1875], d_loss: 0.1394, g_loss: 3.3578, D(x): 0.95, D(G(z)): 0.07
Epoch [0/300], Step [1400/1875], d_loss: 0.3783, g_loss: 3.1944, D(x): 0.83, D(G(z)): 0.09
Epoch [0/300], Step [1600/1875], d_loss: 0.3116, g_loss: 5.0521, D(x): 0.84, D(G(z)): 0.03
Epoch [0/300], Step [1800/1875], d_loss: 0.2187, g_loss: 4.0490, D(x): 0.88, D(G(z)): 0.06
Epoch [1/300], Step [200/1875], d_loss: 0.4172, g_loss: 3.3916, D(x): 0.86, D(G(z)): 0.16
Epoch [1/300], Step [400/1875], d_loss: 0.6948, g_loss: 3.1121, D(x): 0.76, D(G(z)): 0.10
Epoch

In [None]:
# Write the final weights of both networks to the current working directory
for network, weights_path in ((G, 'G.pth'), (D, 'D.pth')):
    torch.save(network.state_dict(), weights_path)