In [1]:
import matplotlib.pyplot as plt
import numpy as np
import PIL
import os
import tensorflow as tf
# Report how many GPU devices TensorFlow can see.
print(f"gpu: { len(tf.config.list_physical_devices('GPU')) }")
# Enable memory growth on every visible GPU.
# NOTE(review): presumably done so TensorFlow allocates GPU memory on demand
# instead of reserving it all at start-up — confirm against the TF docs.
gpus = tf.config.experimental.list_physical_devices('GPU')
for gpu in gpus: tf.config.experimental.set_memory_growth(gpu, True)
from tensorflow.keras.optimizers import Adam
import math
from tqdm import tqdm
from sklearn.model_selection import train_test_split
from vae_adapted import VAEAdapted

gpu: 1


In [2]:
def load_data_for_model(model_name, batch_size=64, seed=None):
    """Load the saved LFSD arrays for one backbone and split them into batches.

    The samples are shuffled, cut into consecutive batches of ``batch_size``
    and the resulting list of batches is split 70/30 into train and test.

    Args:
        model_name: One of 'efficientnet', 'inception', 'resnet', 'mobilenet',
            'vgg'. Selects which ``./data/LFSD_*_<model_name>_feat.npy`` files
            are read.
        batch_size: Number of samples per batch. The last batch holds fewer
            samples when the sample count is not a multiple of ``batch_size``.
        seed: Optional integer. When given, both the shuffle and the
            train/test split are reproducible. ``None`` (default) keeps the
            original behaviour of drawing from the global NumPy random state.

    Returns:
        ``(train_dataset, test_dataset)``: two lists of
        ``(img_batch, depth_batch, mask_batch)`` tuples.

    Raises:
        AssertionError: if ``model_name`` is not a supported backbone.
    """
    assert model_name in ['efficientnet', 'inception', 'resnet', 'mobilenet', 'vgg'], \
        "unsupported model_name: %r" % (model_name,)
    # The labels array is only used for the number of samples.
    labels = np.load('./data/LFSD_labels.npy')
    depths = np.load('./data/LFSD_depths_repeated_%s_feat.npy' % model_name)
    imgs = np.load('./data/LFSD_imgs_%s_feat.npy' % model_name)
    masks = np.load('./data/LFSD_masks_single.npy')

    num_samples = len(labels)
    if seed is None:
        shuffled = np.random.permutation(num_samples)
    else:
        # A private generator keeps the global NumPy random state untouched.
        shuffled = np.random.RandomState(seed).permutation(num_samples)

    dataset = []
    for start in range(0, num_samples, batch_size):
        batch_idx = shuffled[start:start + batch_size]
        dataset.append((imgs[batch_idx], depths[batch_idx], masks[batch_idx]))

    # The split is over whole batches, not over individual samples.
    train_dataset, test_dataset = train_test_split(dataset, test_size=0.3, random_state=seed)
    print("Train dataset contains %d batches of %d samples each" % (len(train_dataset), batch_size))
    print("Test dataset contains %d batches of %d samples each" % (len(test_dataset), batch_size))
    return train_dataset, test_dataset

In [3]:
def merge_images(image_batch, size):
    """Tile a batch of single-channel images into one 2-D grid image.

    Images are placed row by row: image ``k`` lands in grid row
    ``k // size[1]`` and grid column ``k % size[1]``. Cells without an image
    stay zero.

    Args:
        image_batch: Array of shape ``(N, H, W, 1)`` or ``(N, H, W)``.
        size: ``(rows, cols)`` of the grid.

    Returns:
        A float array of shape ``(int(H * rows), int(W * cols))``.

    Raises:
        ValueError: if the batch holds more images than the grid has cells,
            or if an image has a trailing axis whose length is not 1.
    """
    h, w = image_batch.shape[1], image_batch.shape[2]
    cols = int(size[1])
    grid_h, grid_w = int(h * size[0]), int(w * size[1])
    canvas = np.zeros((grid_h, grid_w))
    for idx, im in enumerate(image_batch):
        row, col = divmod(idx, cols)
        if row * h + h > grid_h:
            raise ValueError(
                "image_batch holds %d images but the grid %r has too few cells"
                % (len(image_batch), tuple(size))
            )
        if np.ndim(im) == 3:
            # Drop the channel axis; raises ValueError if it is not length 1.
            im = np.squeeze(im, axis=2)
        canvas[row * h:row * h + h, col * w:col * w + w] = im
    return canvas

In [4]:
def train_round(train_dataset, test_dataset, learning_rate, model_name, epochs):
    """Train a ``VAEAdapted`` model for one backbone and evaluate it on the test batches.

    Side effects (all paths are relative to the working directory):
      * ``./images/vae_adapted/<epoch>.png``: grid of images sampled from the
        last training batch of each epoch.
      * ``./images/vae_adapted/test_batch_<i>.png``: grid of images sampled
        from each test batch.
      * ``./results/vae_adapted/<model_name>_<loss name>.npy``: per-epoch
        mean of each tracked training loss.
      * ``./results/vae_adapted/<model_name>_test_loss.npy``: mean test
        reconstruction loss.

    Args:
        train_dataset: Sequence of batches; each batch is passed unchanged to
            ``vae.train_step`` and ``vae.sample``.
        test_dataset: Sequence of 3-tuples whose last element is the mask
            batch that the sampled images are compared against.
        learning_rate: Learning rate handed to the Adam optimizer.
        model_name: Key selecting the latent dimension ('inception', 'vgg',
            'efficientnet', 'mobilenet' or 'resnet').
        epochs: Number of passes over ``train_dataset``.

    Returns:
        The trained ``VAEAdapted`` instance.

    Raises:
        KeyError: if ``model_name`` has no latent-dimension entry.
        ValueError: if ``test_dataset`` is empty, or ``train_dataset`` is
            empty while ``epochs`` is positive.
    """
    latent_lookup = {
        'inception': 2048,
        'vgg': 512,
        'efficientnet': 1280,
        'mobilenet': 1280,
        'resnet': 2048,
    }
    latent_dim = latent_lookup[model_name]

    # Fail before training rather than with a NameError / ZeroDivisionError afterwards.
    batch_num = len(train_dataset)
    if epochs > 0 and batch_num == 0:
        raise ValueError("train_dataset must contain at least one batch")
    if len(test_dataset) == 0:
        raise ValueError("test_dataset must contain at least one batch")

    image_dir = './images/vae_adapted'
    result_dir = './results/vae_adapted'
    os.makedirs(image_dir, exist_ok=True)
    os.makedirs(result_dir, exist_ok=True)

    vae = VAEAdapted(latent_dim)
    vae.compile(optimizer=Adam(learning_rate))

    # Training Step
    losses_across_epochs = {
        "loss": [],
        "reconstruction_loss": [],
        "kl_loss": [],
    }
    for epoch in range(epochs):
        # Open a fresh accumulator slot for this epoch.
        for history in losses_across_epochs.values():
            history.append(0)
        for batch in train_dataset:
            step_losses = vae.train_step(batch)
            # Dividing each batch loss by the batch count yields the epoch mean.
            for name, value in step_losses.items():
                losses_across_epochs[name][-1] += value.numpy() / batch_num
        print(f"Epoch {epoch} Total loss: { losses_across_epochs['loss'][-1]}")
        # Only the sample from the last batch is saved, so sample once per
        # epoch instead of after every training step.
        # NOTE(review): assumes vae.sample does not change model state — confirm.
        generated_image = vae.sample(batch)
        im_merged = merge_images(generated_image.numpy(), [8,8])
        plt.imsave('%s/%d.png' % (image_dir, epoch), im_merged, cmap='gray')
    for name, history in losses_across_epochs.items():
        np.save('%s/%s_%s' % (result_dir, model_name, name), np.array(history))

    # Testing Step
    test_loss = 0
    for i, data in enumerate(test_dataset):
        _, _, mask_batch = data
        generated_image = vae.sample(data)
        # Sum the cross-entropy over axes 1 and 2, then average over the batch.
        reconstruction_loss = tf.reduce_sum(
            tf.keras.losses.binary_crossentropy(mask_batch, generated_image), [1,2]
        )
        test_loss += tf.reduce_mean(reconstruction_loss).numpy()
        im_merged = merge_images(generated_image.numpy(), [8,8])
        plt.imsave('%s/test_batch_%d.png' % (image_dir, i), im_merged, cmap='gray')

    test_loss = test_loss / len(test_dataset)
    np.save('%s/%s_test_loss' % (result_dir, model_name), np.array([test_loss]))
    return vae

In [5]:
def _encode_in_batches(vae, feats, batch_size=128):
    """Run ``vae.encode`` over ``feats`` in chunks and stack the first output of each call."""
    encoded = []
    # max(..., 1) still issues one encode call when ``feats`` is empty.
    for start in range(0, max(len(feats), 1), batch_size):
        chunk = feats[start:start + batch_size]
        # The second argument is standard-normal noise with the chunk's shape.
        activation, _, _ = vae.encode(chunk, tf.random.normal(chunk.shape))
        encoded.append(activation)
    # Concatenate once at the end instead of growing a tensor inside the loop.
    return np.array(tf.concat(encoded, axis=0))


def get_encoding_for_model(vae, model_name):
    """Encode the saved CIFAR100 features of one backbone with a trained VAE.

    Reads ``./data/CIFAR100_<model_name>_{train,test}_feat.npy``, encodes each
    array in chunks of 128 samples and writes the first output of
    ``vae.encode`` to
    ``./data/CIFAR100_vae_adapted_<model_name>_encoding_{train,test}.npy``.

    Args:
        vae: Model exposing ``encode(features, noise)`` that returns a
            3-tuple; only the first element is kept.
        model_name: Backbone name used to build the input and output paths.

    Returns:
        None. The encodings are written to disk.
    """
    train_feats = np.load('./data/CIFAR100_%s_train_feat.npy' % model_name)
    test_feats = np.load('./data/CIFAR100_%s_test_feat.npy' % model_name)

    train_result = _encode_in_batches(vae, train_feats)
    np.save('./data/CIFAR100_vae_adapted_%s_encoding_train.npy' % model_name, train_result)

    test_result = _encode_in_batches(vae, test_feats)
    np.save('./data/CIFAR100_vae_adapted_%s_encoding_test.npy' % model_name, test_result)



In [6]:
%%time

# Driver cell: for every supported backbone, load its LFSD batches, train a
# VAE on them, then use the trained model to encode that backbone's CIFAR100
# features. All outputs are written to disk by the called functions.
learning_rate = 1e-4
epochs = 100
for model_name in ['efficientnet','inception', 'resnet', 'mobilenet', 'vgg']:
    # Each backbone gets a fresh shuffle and a fresh train/test split.
    train_dataset, test_dataset = load_data_for_model(model_name)
    trained_model = train_round(train_dataset, test_dataset, learning_rate, model_name, epochs)
    print("Gen encoding...")
    get_encoding_for_model(trained_model, model_name)

Train dataset contains 9 batches of 64 samples each
Test dataset contains 5 batches of 64 samples each
Epoch 0 Total loss: 9664419356.444445
Epoch 1 Total loss: 2548685311.9999995
Epoch 2 Total loss: 1520894919.1111112
Epoch 3 Total loss: 1087149077.3333335
Epoch 4 Total loss: 846926293.3333333
Epoch 5 Total loss: 694060928.0
Epoch 6 Total loss: 588156088.8888888
Epoch 7 Total loss: 510426140.4444445
Epoch 8 Total loss: 450935960.8888889
Epoch 9 Total loss: 403933340.4444444
Epoch 10 Total loss: 365854933.3333334
Epoch 11 Total loss: 334374193.77777773
Epoch 12 Total loss: 307908064.0
Epoch 13 Total loss: 285343264.0
Epoch 14 Total loss: 265872622.2222222
Epoch 15 Total loss: 248898551.11111107
Epoch 16 Total loss: 233970714.66666663
Epoch 17 Total loss: 220740881.77777776
Epoch 18 Total loss: 208935900.44444442
Epoch 19 Total loss: 198337692.44444442
Epoch 20 Total loss: 188770540.44444445
Epoch 21 Total loss: 180090620.44444445
Epoch 22 Total loss: 172180289.77777776
Epoch 23 Total l

Epoch 3 Total loss: 3197148.583333333
Epoch 4 Total loss: 2972662.055555556
Epoch 5 Total loss: 2746482.972222223
Epoch 6 Total loss: 2529458.5555555555
Epoch 7 Total loss: 2336879.9166666665
Epoch 8 Total loss: 2172561.8055555555
Epoch 9 Total loss: 2031269.541666667
Epoch 10 Total loss: 1908737.8749999998
Epoch 11 Total loss: 1800606.1527777775
Epoch 12 Total loss: 1705552.7083333335
Epoch 13 Total loss: 1621303.3055555557
Epoch 14 Total loss: 1545741.902777778
Epoch 15 Total loss: 1477585.847222222
Epoch 16 Total loss: 1415447.5277777778
Epoch 17 Total loss: 1359146.0833333333
Epoch 18 Total loss: 1308511.0694444445
Epoch 19 Total loss: 1263105.722222222
Epoch 20 Total loss: 1221251.25
Epoch 21 Total loss: 1182369.0833333333
Epoch 22 Total loss: 1146372.375
Epoch 23 Total loss: 1113312.0416666667
Epoch 24 Total loss: 1082745.513888889
Epoch 25 Total loss: 1054734.034722222
Epoch 26 Total loss: 1028664.75
Epoch 27 Total loss: 1003783.8402777778
Epoch 28 Total loss: 979933.9027777778


AssertionError: 