Skip to content

Commit

Permalink
InfoGAN
Browse files Browse the repository at this point in the history
  • Loading branch information
eriklindernoren committed Jul 18, 2017
1 parent 2df4f55 commit 98ec711
Show file tree
Hide file tree
Showing 13 changed files with 283 additions and 20 deletions.
11 changes: 10 additions & 1 deletion README.md
@@ -1,7 +1,7 @@
# Keras-GAN

## About
Keras implementations of Generative Adversarial Network (GAN) models suggested in research papers. Since I'm running these models from my Macbook Pro they will be limited in their complexity (and therefore the quality of the generated images) compared to the implementations suggested in the papers. Short training sessions are prioritized.
Keras implementations of Generative Adversarial Networks (GANs) suggested in research papers. Since I'm training these models on my MacBook Pro they will be limited in their complexity (and therefore the quality of the generated images) compared to the implementations suggested in the papers. Short training sessions are prioritized.

## Table of Contents
- [Keras-GAN](#keras-gan)
Expand All @@ -15,6 +15,7 @@ Keras implementations of Generative Adversarial Network (GAN) models suggested i
+ [Context Encoder](#context-encoder)
+ [Deep Convolutional GAN](#dcgan)
+ [Generative Adversarial Network](#gan)
+ [InfoGAN](#infogan)
+ [Semi-Supervised GAN](#sgan)
+ [Wasserstein GAN](#wgan)

Expand Down Expand Up @@ -100,6 +101,14 @@ Paper: https://arxiv.org/abs/1406.2661
<img src="http://eriklindernoren.se/images/gan.png" width="640"\>
</p>

### InfoGAN
Implementation of InfoGAN: Interpretable Representation Learning by Information Maximizing Generative Adversarial Nets.

[Code](infogan/infogan.py)

Paper: https://arxiv.org/abs/1606.03657


### SGAN
Implementation of Semi-Supervised Generative Adversarial Network.

Expand Down
6 changes: 3 additions & 3 deletions aae/adversarial_autoencoder.py
Expand Up @@ -181,14 +181,14 @@ def save_imgs(self, epoch, imgs):
axs[i,j].imshow(gen_imgs[cnt, :,:,0], cmap='gray')
axs[i,j].axis('off')
cnt += 1
fig.savefig("images/mnist_%d.png" % epoch)
fig.savefig("aae/images/mnist_%d.png" % epoch)
plt.close()

def save_model(self):

def save(model, model_name):
model_path = "./saved_model/%s.json" % model_name
weights_path = "./saved_model/%s_weights.hdf5" % model_name
model_path = "aae/saved_model/%s.json" % model_name
weights_path = "aae/saved_model/%s_weights.hdf5" % model_name
options = {"file_arch": model_path,
"file_weight": weights_path}
json_string = model.to_json()
Expand Down
6 changes: 3 additions & 3 deletions acgan/acgan.py
Expand Up @@ -209,14 +209,14 @@ def save_imgs(self, epoch):
axs[i,j].set_title("Digit: %d" % sampled_labels[cnt])
axs[i,j].axis('off')
cnt += 1
fig.savefig("images/mnist_%d.png" % epoch)
fig.savefig("acgan/images/mnist_%d.png" % epoch)
plt.close()

def save_model(self):

def save(model, model_name):
model_path = "./saved_model/%s.json" % model_name
weights_path = "./saved_model/%s_weights.hdf5" % model_name
model_path = "acgan/saved_model/%s.json" % model_name
weights_path = "acgan/saved_model/%s_weights.hdf5" % model_name
options = {"file_arch": model_path,
"file_weight": weights_path}
json_string = model.to_json()
Expand Down
2 changes: 1 addition & 1 deletion bigan/bigan.py
Expand Up @@ -194,7 +194,7 @@ def save_imgs(self, epoch):
axs[i,j].imshow(gen_imgs[cnt, :,:,0], cmap='gray')
axs[i,j].axis('off')
cnt += 1
fig.savefig("images/mnist_%d.png" % epoch)
fig.savefig("bigan/images/mnist_%d.png" % epoch)
plt.close()


Expand Down
6 changes: 3 additions & 3 deletions ccgan/ccgan.py
Expand Up @@ -257,14 +257,14 @@ def save_imgs(self, epoch, imgs):
axs[1,i].axis('off')
axs[2,i].imshow(gen_imgs[i, :,:])
axs[2,i].axis('off')
fig.savefig("images/cifar_%d.png" % epoch)
fig.savefig("ccgan/images/cifar_%d.png" % epoch)
plt.close()

def save_model(self):

def save(model, model_name):
model_path = "./saved_model/%s.json" % model_name
weights_path = "./saved_model/%s_weights.hdf5" % model_name
model_path = "ccgan/saved_model/%s.json" % model_name
weights_path = "ccgan/saved_model/%s_weights.hdf5" % model_name
options = {"file_arch": model_path,
"file_weight": weights_path}
json_string = model.to_json()
Expand Down
6 changes: 3 additions & 3 deletions context_encoder/context_encoder.py
Expand Up @@ -229,14 +229,14 @@ def save_imgs(self, epoch, imgs):
filled_in[y1[i]:y2[i], x1[i]:x2[i], :] = gen_missing[i]
axs[2,i].imshow(filled_in)
axs[2,i].axis('off')
fig.savefig("images/cifar_%d.png" % epoch)
fig.savefig("context_encoder/images/cifar_%d.png" % epoch)
plt.close()

def save_model(self):

def save(model, model_name):
model_path = "./saved_model/%s.json" % model_name
weights_path = "./saved_model/%s_weights.hdf5" % model_name
model_path = "context_encoder/saved_model/%s.json" % model_name
weights_path = "context_encoder/saved_model/%s_weights.hdf5" % model_name
options = {"file_arch": model_path,
"file_weight": weights_path}
json_string = model.to_json()
Expand Down
2 changes: 1 addition & 1 deletion dcgan/dcgan.py
Expand Up @@ -168,7 +168,7 @@ def save_imgs(self, epoch):
axs[i,j].imshow(gen_imgs[cnt, :,:,0], cmap='gray')
axs[i,j].axis('off')
cnt += 1
fig.savefig("images/mnist_%d.png" % epoch)
fig.savefig("dcgan/images/mnist_%d.png" % epoch)
plt.close()


Expand Down
2 changes: 1 addition & 1 deletion gan/gan.py
Expand Up @@ -159,7 +159,7 @@ def save_imgs(self, epoch):
axs[i,j].imshow(gen_imgs[cnt, :,:,0], cmap='gray')
axs[i,j].axis('off')
cnt += 1
fig.savefig("images/mnist_%d.png" % epoch)
fig.savefig("gan/images/mnist_%d.png" % epoch)
plt.close()


Expand Down
2 changes: 2 additions & 0 deletions infogan/images/.gitignore
@@ -0,0 +1,2 @@
*
!.gitignore
250 changes: 250 additions & 0 deletions infogan/infogan.py
@@ -0,0 +1,250 @@
from __future__ import print_function

from keras.datasets import mnist
from keras.layers import Input, Dense, Reshape, Flatten, Dropout, multiply, concatenate
from keras.layers import BatchNormalization, Activation, Embedding, ZeroPadding2D, Lambda
from keras.layers.advanced_activations import LeakyReLU
from keras.layers.convolutional import UpSampling2D, Conv2D
from keras.models import Sequential, Model
from keras.optimizers import Adam
from keras.utils import to_categorical
import keras.backend as K

import matplotlib.pyplot as plt

import numpy as np

class INFOGAN():
    """InfoGAN on MNIST (Chen et al., https://arxiv.org/abs/1606.03657).

    The 74-dim generator input is the concatenation of 62 noise dims, a
    10-dim one-hot class code and 2 continuous codes (see
    sample_generator_input). The discriminator has three heads — validity,
    class code and continuous code — and the code-reconstruction losses
    stand in for the mutual-information term of the InfoGAN objective.
    """

    def __init__(self):
        # MNIST geometry: 28x28 single-channel images.
        self.img_rows = 28
        self.img_cols = 28
        self.channels = 1
        self.num_classes = 10
        self.img_shape = (self.img_rows, self.img_cols, self.channels)
        # 62 noise + 10 one-hot label + 2 continuous codes = 74.
        self.latent_dim = 74


        optimizer = Adam(0.0002, 0.5)
        # One loss per discriminator output head:
        # validity, categorical code, continuous code.
        losses = ['binary_crossentropy', 'categorical_crossentropy', self.gaussian_loss]

        # Build and compile the discriminator
        self.discriminator = self.build_discriminator()
        self.discriminator.compile(loss=losses,
            optimizer=optimizer,
            metrics=['accuracy'])

        # Build and compile the generator
        self.generator = self.build_generator()
        self.generator.compile(loss=['binary_crossentropy'],
            optimizer=optimizer)

        # The generator takes noise and the target label as input
        # and generates the corresponding digit of that label
        gen_input = Input(shape=(self.latent_dim,))
        img = self.generator(gen_input)

        # For the combined model we will only train the generator
        self.discriminator.trainable = False

        # The discriminator takes generated image as input and determines validity
        # and the label of that image
        valid, target_label, target_cont = self.discriminator(img)

        # The combined model (stacked generator and discriminator) takes
        # noise as input => generates images => determines validity
        self.combined = Model(gen_input, [valid, target_label, target_cont])
        self.combined.compile(loss=losses,
            optimizer=optimizer)

    # Reference: https://github.com/tdeboissiere/DeepLearningImplementations/blob/master/InfoGAN/
    def gaussian_loss(self, y_true, y_pred):
        """Gaussian negative log-likelihood of the continuous code
        (constant terms dropped): log_stddev + 0.5 * ((x - mean)/stddev)^2.

        NOTE(review): y_pred[0] / y_pred[1] index the *batch* axis of the
        (batch, 2) prediction tensor, not the mean / log-stddev columns —
        the columns would be y_pred[:, 0] / y_pred[:, 1]. Same for
        y_true[0]. Confirm intent against the referenced implementation.
        """

        mean = y_pred[0]
        log_stddev = y_pred[1]

        y_true = y_true[0]

        # Standardized residual; K.epsilon() guards against a zero stddev.
        epsilon = (y_true - mean) / (K.exp(log_stddev) + K.epsilon())
        loss = (log_stddev + 0.5 * K.square(epsilon))
        loss = K.mean(loss)

        return loss

    def build_generator(self):
        """Build the generator: a 74-dim latent vector is projected to a
        7x7x128 feature map and upsampled twice (7 -> 14 -> 28) to a
        tanh-activated 28x28x1 image in [-1, 1]."""

        model = Sequential()

        model.add(Dense(1024, activation='relu', input_dim=self.latent_dim))
        model.add(BatchNormalization(momentum=0.8))
        model.add(Dense(128 * 7 * 7, activation="relu"))
        model.add(BatchNormalization(momentum=0.8))
        model.add(Reshape((7, 7, 128)))
        model.add(UpSampling2D())
        model.add(Conv2D(64, kernel_size=4, padding="same"))
        model.add(Activation("relu"))
        model.add(BatchNormalization(momentum=0.8))
        model.add(UpSampling2D())
        model.add(Conv2D(self.channels, kernel_size=4, padding='same'))
        model.add(Activation("tanh"))

        model.summary()

        gen_input = Input(shape=(self.latent_dim,))
        img = model(gen_input)

        return Model(gen_input, img)

    def build_discriminator(self):
        """Build the discriminator / recognition network.

        A shared convolutional trunk feeds three heads:
        - validity: sigmoid real/fake score,
        - label: softmax over the 10 categorical-code classes,
        - cont: (mean, log_stddev) of the 2 continuous codes,
          concatenated on axis 1 and consumed by gaussian_loss.

        Returns a Model mapping img -> [validity, label, cont].
        """

        model = Sequential()

        model.add(Conv2D(64, kernel_size=4, strides=2, input_shape=self.img_shape, padding="same"))
        model.add(LeakyReLU(alpha=0.2))
        model.add(Dropout(0.25))
        model.add(Conv2D(128, kernel_size=4, strides=2, padding="same"))
        model.add(LeakyReLU(alpha=0.2))
        model.add(BatchNormalization(momentum=0.8))
        model.add(Dropout(0.25))
        model.add(Flatten())
        model.add(Dense(1024))
        model.add(LeakyReLU(alpha=0.2))
        model.add(BatchNormalization(momentum=0.8))

        model.summary()

        img = Input(shape=self.img_shape)

        features = model(img)

        validity = Dense(1, activation="sigmoid")(features)

        # Clamp log_stddev from below at -16 to keep exp(log_stddev)
        # from underflowing in gaussian_loss.
        def linmax(x):
            return K.maximum(x, -16)

        def linmax_shape(input_shape):
            return input_shape

        # Small extra branch shared by the two latent-code heads.
        label_model = Dense(128)(features)
        label_model = LeakyReLU(alpha=0.2)(label_model)
        label_model = BatchNormalization(momentum=0.8)(label_model)

        label = Dense(self.num_classes, activation="softmax")(label_model)
        mean = Dense(1, activation="linear")(label_model)
        log_stddev = Dense(1)(label_model)
        log_stddev = Lambda(linmax, output_shape=linmax_shape)(log_stddev)

        cont = concatenate([mean, log_stddev], axis=1)

        return Model(img, [validity, label, cont])

    def sample_generator_input(self, batch_size):
        """Sample one batch of generator inputs.

        Returns (sampled_noise, sampled_labels, sampled_cont):
        - sampled_noise: (batch_size, 62) standard normal,
        - sampled_labels: (batch_size, 10) one-hot random digit classes,
        - sampled_cont: (batch_size, 2) uniform in [-1, 1].
        """
        # Generator inputs
        sampled_noise = np.random.normal(0, 1, (batch_size, 62))
        sampled_labels = np.random.randint(0, 10, batch_size).reshape(-1, 1)
        sampled_labels = to_categorical(sampled_labels, num_classes=self.num_classes)
        sampled_cont = np.random.uniform(-1, 1, size=(batch_size, 2))
        return sampled_noise, sampled_labels, sampled_cont

    def train(self, epochs, batch_size=128, save_interval=50):
        """Alternate discriminator and generator updates on MNIST.

        The discriminator trains on a half batch of generated and a half
        batch of real images per epoch; the generator trains on a full
        batch through the combined model. Samples are saved every
        save_interval epochs via save_imgs.
        """

        # Load the dataset
        (X_train, y_train), (_, _) = mnist.load_data()

        # Rescale -1 to 1
        X_train = (X_train.astype(np.float32) - 127.5) / 127.5
        X_train = np.expand_dims(X_train, axis=3)
        y_train = y_train.reshape(-1, 1)

        half_batch = int(batch_size / 2)

        for epoch in range(epochs):

            # ---------------------
            #  Train Discriminator
            # ---------------------

            # Train discriminator on generator output
            sampled_noise, sampled_labels, sampled_cont = self.sample_generator_input(half_batch)
            gen_input = np.concatenate((sampled_noise, sampled_labels, sampled_cont), axis=1)
            # Generate a half batch of new images
            gen_imgs = self.generator.predict(gen_input)
            fake = np.zeros((half_batch, 1))
            d_loss_fake = self.discriminator.train_on_batch(gen_imgs, [fake, sampled_labels, sampled_cont])

            # Train discriminator on real data
            # Select a random half batch of images
            idx = np.random.randint(0, X_train.shape[0], half_batch)
            imgs = X_train[idx]
            labels = to_categorical(y_train[idx], num_classes=self.num_classes)
            valid = np.ones((half_batch, 1))
            # NOTE(review): the fake batch's sampled_cont is reused here as
            # the continuous-code target for the *real* images, whose true
            # codes are unknown — confirm this is intentional.
            d_loss_real = self.discriminator.train_on_batch(imgs, [valid, labels, sampled_cont])

            # Avg. loss
            d_loss = 0.5 * np.add(d_loss_real, d_loss_fake)

            # ---------------------
            #  Train Generator
            # ---------------------

            valid = np.ones((batch_size, 1))

            # Generator inputs (full batch; duplicates sample_generator_input)
            sampled_noise = np.random.normal(0, 1, (batch_size, 62))
            sampled_labels = np.random.randint(0, 10, batch_size).reshape(-1, 1)
            sampled_labels = to_categorical(sampled_labels, num_classes=self.num_classes)
            sampled_cont = np.random.uniform(-1, 1, size=(batch_size, 2))
            gen_input = np.concatenate((sampled_noise, sampled_labels, sampled_cont), axis=1)

            # Train the generator
            g_loss = self.combined.train_on_batch(gen_input, [valid, sampled_labels, sampled_cont])

            # Plot the progress
            print ("%d [D loss: %.2f, acc.: %.2f%%, label_acc: %.2f%%] [G loss: %.2f]" % (epoch, d_loss[0], 100*d_loss[4], 100*d_loss[5], g_loss[0]))

            # If at save interval => save generated image samples
            if epoch % save_interval == 0:
                self.save_imgs(epoch)

    def save_imgs(self, epoch):
        """Save a 10x10 grid of generated digits.

        Each row uses fresh noise; columns sweep the digit classes 0-9
        while both continuous codes sweep linspace(-1, 1) across the
        columns. Written to ./infogan/images/mnist_<epoch>.png.
        """
        r, c = 10, 10

        fig, axs = plt.subplots(r, c)
        for i in range(r):
            sampled_noise = np.random.normal(0, 1, (c, 62))
            sampled_labels = np.arange(0, 10).reshape(-1, 1)
            sampled_labels = to_categorical(sampled_labels, num_classes=self.num_classes)
            sampled_cont = np.repeat(np.expand_dims(np.linspace(-1, 1, num=c), axis=1), 2, axis=1)
            gen_input = np.concatenate((sampled_noise, sampled_labels, sampled_cont), axis=1)
            gen_imgs = self.generator.predict(gen_input)
            # Rescale from tanh range [-1, 1] to [0, 1] for display.
            gen_imgs = 0.5 * gen_imgs + 0.5
            for j in range(c):
                axs[i,j].imshow(gen_imgs[j,:,:,0], cmap='gray')
                axs[i,j].axis('off')
        fig.savefig("./infogan/images/mnist_%d.png" % epoch)
        plt.close()

    def save_model(self):
        """Serialize the generator, discriminator and combined models as
        architecture JSON + HDF5 weights under infogan/saved_model/."""

        def save(model, model_name):
            # Architecture and weights are stored in separate files.
            model_path = "infogan/saved_model/%s.json" % model_name
            weights_path = "infogan/saved_model/%s_weights.hdf5" % model_name
            options = {"file_arch": model_path,
                        "file_weight": weights_path}
            json_string = model.to_json()
            open(options['file_arch'], 'w').write(json_string)
            model.save_weights(options['file_weight'])

        save(self.generator, "generator")
        save(self.discriminator, "discriminator")
        save(self.combined, "adversarial")


if __name__ == '__main__':
    # Script entry point: build the model and run a short training session.
    model = INFOGAN()
    model.train(epochs=6000, batch_size=32, save_interval=50)






2 changes: 2 additions & 0 deletions infogan/saved_model/.gitignore
@@ -0,0 +1,2 @@
*
!.gitignore

0 comments on commit 98ec711

Please sign in to comment.