## Loading the data

In [1]:
"""
!wget https://s3-us-west-1.amazonaws.com/udacity-dlnfd/datasets/celeba.zip
import zipfile, os
with zipfile.ZipFile(os.getcwd() + '/celeba.zip', 'r') as zip_ref:
  zip_ref.extractall(os.getcwd()+'/data_faces')
"""

"\n!wget https://s3-us-west-1.amazonaws.com/udacity-dlnfd/datasets/celeba.zip\nimport zipfile, os\nwith zipfile.ZipFile(os.getcwd() + '/celeba.zip', 'r') as zip_ref:\n  zip_ref.extractall(os.getcwd()+'/data_faces')\n"

# Importing the libraries

In [2]:
import keras
import numpy as np
import matplotlib.pyplot as plt
import os

Using TensorFlow backend.


## Defining the GAN

In [3]:
def define_GAN(g_model, d_model):
    d_model.trainable = False
    model = keras.models.Sequential()
    model.add(g_model)
    model.add(d_model)
    opt = keras.optimizers.adam(learning_rate= 0.0002,
                                beta_1= 0.5)
    model.compile(loss= 'binary_crossentropy', optimizer= opt)
    return model

## Defining the Discriminator

In [4]:
def define_discriminator(input_shape= (96,80,3)):
    model = keras.models.Sequential()
    
    model.add(keras.layers.Conv2D(filters= 128,
                                  kernel_size= (3,3),
                                  padding= 'same',
                                  input_shape= input_shape))
    model.add(keras.layers.LeakyReLU(0.2))
    model.add(keras.layers.Dropout(0.4))

    # 96 * 80 * 3
    model.add(keras.layers.Conv2D(filters= 128,
                                  kernel_size= (3,3),
                                  strides= (2,2),
                                  padding= 'same'))
    model.add(keras.layers.LeakyReLU(0.2))
    model.add(keras.layers.Dropout(0.4))
    
    # 48 * 40 * 3
    model.add(keras.layers.Conv2D(filters= 128,
                                  kernel_size= (4,4),
                                  strides= (2,2),
                                  padding= 'same'))
    model.add(keras.layers.LeakyReLU(0.2))
    model.add(keras.layers.Dropout(0.4))
    
    # 24 * 20 * 3
    model.add(keras.layers.Conv2D(filters= 128,
                                  kernel_size= (4,4),
                                  strides= (2,2),
                                  padding= 'same'))
    model.add(keras.layers.LeakyReLU(0.2))
    model.add(keras.layers.Dropout(0.4))
    
    # 12 * 10 * 3

    model.add(keras.layers.Flatten())
    model.add(keras.layers.Dropout(0.4))
    model.add(keras.layers.Dense(units= 1,
                                 activation= 'sigmoid'))
    opt = keras.optimizers.adam(learning_rate= 0.0002, beta_1= 0.5)
    model.compile(loss= 'binary_crossentropy', optimizer= opt, metrics= ['accuracy'])
    
    return model

## Defining the Generator

In [5]:
def define_generator(latent_dim):
    model = keras.models.Sequential()

    model.add(keras.layers.Dense(units= 1024 * 6 * 5, input_dim= latent_dim))
    model.add(keras.layers.LeakyReLU(0.2))
    model.add(keras.layers.Reshape((6, 5, 1024)))
    # 6 * 5
    model.add(keras.layers.Conv2DTranspose(filters= 512,
                                           kernel_size= (4,4),
                                           padding= 'same',
                                           strides= (2,2)))
    model.add(keras.layers.LeakyReLU(0.2))
    # 12 * 10
    model.add(keras.layers.Conv2DTranspose(filters= 256,
                                           kernel_size= (4,4),
                                           padding= 'same',
                                           strides= (2,2)))
    model.add(keras.layers.LeakyReLU(0.2))
    # 24 * 20
    model.add(keras.layers.Conv2DTranspose(filters= 128,
                                           kernel_size= (4,4),
                                           padding= 'same',
                                           strides= (2,2)))
    model.add(keras.layers.LeakyReLU(0.2))
    # 48 * 40
    model.add(keras.layers.Conv2DTranspose(filters= 128,
                                           kernel_size= (4,4),
                                           padding= 'same',
                                           strides= (2,2)))
    model.add(keras.layers.LeakyReLU(0.2))
    # 96 * 80
    
    # Ready for colorization
    model.add(keras.layers.Conv2D(filters= 3,
                                  kernel_size= (3,3),
                                  padding= 'same',
                                  activation= 'tanh'))
    
    return model

## Generating the Fake samples

In [6]:
def generate_latent_points(latent_dim, n_samples):
    X = np.random.randn(latent_dim * n_samples)
    X = X.reshape((n_samples, latent_dim))
    return X

In [7]:
def generate_fake_sample(g_model, latent_dim, n_samples):
    x_input = generate_latent_points(latent_dim= latent_dim,
                                     n_samples= n_samples)
    
    X = g_model.predict(x_input)
    y = np.zeros((n_samples, 1))
    return X, y

## Generating the Real samples

In [8]:
def generate_real_sample(train_it):
    X, _ = train_it.next()
    X = X[:, 6:102,4:84,:].astype('float32')
    X = (X - 127.5) / 127.5
    y = np.ones((X.shape[0], 1))
    # y = 0.9 * np.ones((n_samples, 1)) + 0.2 * np.random.rand(n_samples).reshape((n_samples, 1))
    return X, y

## Saving the Plot and summarizing

In [9]:
def save_plot(x_input, epoch, n=5):
    x_input = (x_input + 1.0) / 2.0
    filename = f'generated_{epoch + 1}.png'
    for i in range(n*n):
        plt.subplot(n, n, i+1)
        plt.imshow(x_input[i,:,:,:])
        plt.axis('off')
    plt.savefig(filename)
    plt.close()

In [10]:
def summarize_the_model(g_model, d_model, epoch, latent_dim, n_samples, train_iter):
    X_real, y_real = generate_real_sample(train_it= train_iter)
    X_fake, y_fake = generate_fake_sample(g_model= g_model,
                                          latent_dim= latent_dim,
                                          n_samples= n_samples)
    print(f'Accuracy on real data: {d_model.evaluate(X_real, y_real, verbose= 0)}')
    print(f'Accuracy on fake data: {d_model.evaluate(X_fake, y_fake, verbose= 0)}')
    filename = f'model_e_{epoch+1:03}.h5'
    save_plot(x_input= X_fake,
              epoch= epoch)
    
    g_model.save(filename)

# Function for training the GAN

In [11]:
def train_GAN(gan_model, g_model, d_model, dataset_len, latent_dim, train_iter, iters= 100, batch_size= 256):
    half_batch = int(batch_size / 2)
    batch_per_epoch = int(dataset_len / batch_size)
    for i in range(iters):
        for j in range(batch_per_epoch):
            X_real, y_real = generate_real_sample(train_it= train_it)
            X_fake, y_fake = generate_fake_sample(g_model= g_model,
                                                  latent_dim= latent_dim,
                                                  n_samples= half_batch)
            X, y = np.vstack((X_real, X_fake)), np.vstack((y_real, y_fake))
            dloss = d_model.train_on_batch(X, y)
            x_gan = generate_latent_points(latent_dim= latent_dim,
                                             n_samples= batch_size)
            y_gan = np.ones((batch_size, 1))
            gloss = gan_model.train_on_batch(x_gan, y_gan)
            print(f'> Epoch: {i+1}, {j+1}/{batch_per_epoch}, dloss: {dloss[0]:5f}, gloss: {gloss:5f}')
        # After each epoch
        summarize_the_model(g_model= g_model,
                            d_model= d_model,
                            epoch= i,
                            latent_dim= latent_dim,
                            n_samples= batch_size, train_iter= train_it)

## Training the Model

In [None]:
latent_dim = 200
batch_size = 128

g_model = define_generator(latent_dim= latent_dim)
d_model = define_discriminator()
gan_model = define_GAN(g_model=g_model,
                       d_model= d_model)

datagen = keras.preprocessing.image.ImageDataGenerator()
path = os.getcwd() + '/data_faces'
train_it = datagen.flow_from_directory(path,
                                       batch_size= int(batch_size/2),
                                       target_size= (218, 178))


train_GAN(gan_model= gan_model,
          g_model= g_model,
          d_model= d_model,
          dataset_len= 202599,
          latent_dim= latent_dim, train_iter= train_it)

Found 202599 images belonging to 1 classes.


  'Discrepancy between trainable weights and collected trainable'


> Epoch: 1, 1/791, dloss: 0.706158, gloss: 0.694150
> Epoch: 1, 2/791, dloss: 0.663778, gloss: 0.693971
> Epoch: 1, 3/791, dloss: 0.624622, gloss: 0.690521
> Epoch: 1, 4/791, dloss: 0.595687, gloss: 0.663707
> Epoch: 1, 5/791, dloss: 0.633580, gloss: 0.584469
Accuracy on real data: [0.2152627855539322, 1.0]
Accuracy on fake data: [1.077889010310173, 0.0]
> Epoch: 2, 1/791, dloss: 0.860998, gloss: 0.535043
> Epoch: 2, 2/791, dloss: 0.894511, gloss: 0.619994
> Epoch: 2, 3/791, dloss: 0.684165, gloss: 0.798792
> Epoch: 2, 4/791, dloss: 0.582981, gloss: 0.996834
> Epoch: 2, 5/791, dloss: 0.484403, gloss: 1.345097
Accuracy on real data: [0.5107622742652893, 0.625]
Accuracy on fake data: [0.38819436356425285, 1.0]
> Epoch: 3, 1/791, dloss: 0.435592, gloss: 1.766273
> Epoch: 3, 2/791, dloss: 0.360114, gloss: 2.193388
> Epoch: 3, 3/791, dloss: 0.533608, gloss: 1.258700
> Epoch: 3, 4/791, dloss: 0.639676, gloss: 0.791338
> Epoch: 3, 5/791, dloss: 0.613564, gloss: 0.744176
Accuracy on real data:

In [None]:
d_model.summary(), g_model.summary(), gan_model.summary()