In [1]:
import tensorflow as tf
import tensorflow_datasets as tfds
import matplotlib.pyplot as plt
import numpy as np
import os
import tensorflow_datasets as tfds
import matplotlib.pyplot as plt
import pandas as pd
from keras_preprocessing.image import ImageDataGenerator
import tensorflow_addons as tfa
import torch

In [2]:
# Folder that holds the CelebA aligned face images.
# Raw string: the backslashes are literal path separators, not escape sequences
# ('\d' and '\i' are invalid escapes and trigger a warning in a normal string).
directory = r'C:\datasets\img_align_celeba\img_align_celeba'

In [3]:
# Load the per-image attribute table from CSV into a DataFrame.
tag = pd.read_csv(filepath_or_buffer='C:/datasets/list_attr_celeba.csv')

In [4]:
# Columns to keep: the image file name followed by the five attribute labels.
col = ['image_id', 'Male', 'Mustache', 'Bald', 'Smiling', 'Young']

# Restrict the table to those columns and turn every -1 entry into 0,
# so the attribute columns hold 0/1 values.
tag = tag.loc[:, col].replace(to_replace=-1, value=0)

# From here on `col` lists only the label columns (everything after 'image_id').
col = col[1:]
tag

Unnamed: 0,image_id,Male,Mustache,Bald,Smiling,Young
0,000001.jpg,0,0,0,1,1
1,000002.jpg,0,0,0,1,1
2,000003.jpg,1,0,0,0,1
3,000004.jpg,0,0,0,0,1
4,000005.jpg,0,0,0,0,1
...,...,...,...,...,...,...
202594,202595.jpg,0,0,0,0,1
202595,202596.jpg,1,0,0,1,1
202596,202597.jpg,1,0,0,1,1
202597,202598.jpg,0,0,0,1,1


In [5]:
# Seeded random 80% sample of the rows becomes the training frame ...
train = tag.sample(frac=0.8, random_state=42)
# ... and the rows whose index was not sampled form the test frame.
test = tag.drop(index=train.index)
train

Unnamed: 0,image_id,Male,Mustache,Bald,Smiling,Young
93241,093242.jpg,1,0,0,0,1
121413,121414.jpg,0,0,0,0,1
10624,010625.jpg,1,0,0,0,1
82523,082524.jpg,0,0,0,1,1
73192,073193.jpg,0,0,0,1,0
...,...,...,...,...,...,...
36890,036891.jpg,1,0,0,0,1
1992,001993.jpg,0,0,0,0,1
47852,047853.jpg,0,0,0,1,1
79821,079822.jpg,0,0,0,1,1


In [6]:
# Generator config for train/validation data: pixel values are multiplied by 1/255
# and 25% of the rows are reserved for the "validation" subset.
datagen = ImageDataGenerator(
    validation_split=0.25,
    rescale=1./255.,
)

In [7]:
# Settings shared by all three generators. Keeping them in one place guarantees
# that train / validation / test batches are produced with identical image
# size, batch size, label columns and label mode.
flow_kwargs = dict(
    directory=directory,
    x_col="image_id",
    y_col=col,
    batch_size=16,
    seed=42,
    class_mode="raw",        # labels are taken directly from the `y_col` columns
    target_size=(256, 256),
)

# `datagen` was created with a validation split, so the same `train` frame is
# divided into a "training" and a "validation" subset.
train_generator = datagen.flow_from_dataframe(
    dataframe=train,
    subset="training",
    shuffle=True,
    **flow_kwargs,
)

valid_generator = datagen.flow_from_dataframe(
    dataframe=train,
    subset="validation",
    shuffle=True,
    **flow_kwargs,
)

# The held-out test frame gets its own generator without a validation split and
# without shuffling, so batches follow the row order of `test`.
test_datagen = ImageDataGenerator(rescale=1./255.)
test_generator = test_datagen.flow_from_dataframe(
    dataframe=test,
    shuffle=False,
    **flow_kwargs,
)

Found 121560 validated image filenames.
Found 40519 validated image filenames.
Found 40520 validated image filenames.


In [21]:
class MLP(tf.keras.layers.Layer):
    """Feed-forward sub-network: Dense (GELU) -> Dropout -> Dense.

    The first Dense layer produces ``hidden_channel`` units, the second one
    produces ``in_channel`` units. Both kernels use LeCun-normal initialisation.

    Args:
        in_channel: Number of units of the second (output) Dense layer.
        hidden_channel: Number of units of the first (hidden) Dense layer.
        dropout: Rate of the Dropout layer placed between the two Dense layers.
    """

    def __init__(self, in_channel:int, hidden_channel:int, dropout:float = 0.):
        super().__init__()
        self.in_channel = in_channel
        self.hidden_channel = hidden_channel
        self.dropout = dropout

        # Hidden projection with GELU non-linearity.
        self.fc1 = tf.keras.layers.Dense(
            self.hidden_channel,
            activation = tf.keras.activations.gelu,
            kernel_initializer = tf.keras.initializers.lecun_normal(),
        )
        self.d = tf.keras.layers.Dropout(self.dropout)
        # Linear projection back to `in_channel` units.
        self.fc2 = tf.keras.layers.Dense(
            self.in_channel,
            kernel_initializer = tf.keras.initializers.lecun_normal(),
        )

    def call(self, X):
        """Apply hidden projection, dropout and output projection to ``X``."""
        hidden = self.d(self.fc1(X))
        return self.fc2(hidden)
        
class MLP_block(tf.keras.layers.Layer):
    """Residual block that mixes along the last axis, then along axis 1.

    The input is expected to have two non-batch axes (``Permute((2, 1))`` swaps
    them); the constructor arguments suggest the layout
    ``(batch, n_patches, n_channels)``.

    Args:
        n_patches: Width handled by the second MLP (size of axis 1 of the input).
        n_channels: Width handled by the first MLP (size of the last input axis).
        mlp_ratio: Multiplier giving each MLP's hidden width from its input width.
    """

    def __init__(self, n_patches:int, n_channels:int, mlp_ratio:int):
        super().__init__()
        self.n_patches = n_patches
        self.n_channels = n_channels
        self.mlp_ratio = mlp_ratio

        # MLP1 acts on the channel axis, MLP2 on the (transposed) patch axis.
        self.MLP1 = MLP(self.n_channels, self.n_channels*self.mlp_ratio)
        self.MLP2 = MLP(self.n_patches, self.n_patches*self.mlp_ratio)
        self.ln1 = tf.keras.layers.LayerNormalization()
        self.ln2 = tf.keras.layers.LayerNormalization()
        # Swaps the two non-batch axes.
        self.T = tf.keras.layers.Permute((2,1))

    def call(self, X):
        """Run channel mixing followed by token mixing, each with a skip connection."""
        # Channel mixing: normalise, apply MLP1, add the input back.
        channel_out = self.MLP1(self.ln1(X)) + X

        # Token (spatial) mixing on the transposed tensor.
        # NOTE(review): ln2 runs after the transpose, so it normalises over the
        # last axis of the transposed tensor (the token axis) - confirm intended.
        swapped = self.T(channel_out)
        swapped = self.MLP2(self.ln2(swapped))

        # Transpose back and add the channel-mixing result as the residual.
        return self.T(swapped) + channel_out
    

class LVT(tf.keras.models.Model):
    """Patch-based image classifier built from a stack of ``MLP_block`` layers.

    Pipeline implemented in ``call``:
      1. a strided ``Conv2D`` turns each ``patch_size`` x ``patch_size`` patch
         into an ``n_channels``-dimensional token,
      2. a learnable CLS token is prepended and a learnable positional
         embedding is added,
      3. ``n_blocks`` ``MLP_block`` layers are applied in sequence,
      4. the tokens are layer-normalised and the CLS token is fed to a Dense head.

    Args:
        n_channels: Embedding width of every token.
        image_size: Side length of the input images; must be a multiple of
            ``patch_size``. Inputs are presumably square,
            ``(batch, image_size, image_size, C)`` - TODO confirm.
        patch_size: Side length of one patch.
        n_blocks: Number of ``MLP_block`` layers.
        mlp_ratio: Hidden-width multiplier passed to every ``MLP_block``.
        batch_size: Stored on the instance only; the layers do not use it.
        n_labels: Number of target labels.
        mode: Activation of the output head, ``'sigmoid'`` or ``'softmax'``.

    Raises:
        ValueError: If ``image_size`` is not divisible by ``patch_size`` or
            ``mode`` is not one of the two supported values.
    """

    def __init__(self, n_channels:int, image_size:int, patch_size:int, n_blocks:int, mlp_ratio:int, batch_size:int, n_labels:int, mode:str = 'softmax'):
        super(LVT, self).__init__()
        self.n_channels = n_channels
        self.image_size = image_size
        self.patch_size = patch_size
        if (self.image_size % self.patch_size) != 0:
            raise ValueError('size error')
        # Patches per image; plain integer arithmetic (divisibility checked above).
        self.n_patches = (self.image_size // self.patch_size) ** 2
        self.n_blocks = n_blocks
        self.mlp_ratio = mlp_ratio
        self.batch_size = batch_size

        self.n_labels = n_labels
        if mode not in ['sigmoid','softmax']:
            raise ValueError('mode must be sigmoid or softmax')
        self.mode = mode

        # Non-overlapping patch embedding: kernel size == stride == patch size.
        self.patchConv = tf.keras.layers.Conv2D(self.n_channels, (self.patch_size, self.patch_size), strides = (self.patch_size, self.patch_size))
        self.CLS = tf.Variable(tf.random.truncated_normal([1, self.n_channels], stddev=.02))
        self.PE = tf.Variable(tf.random.truncated_normal([self.n_patches + 1, self.n_channels], stddev=.02))
        # Each block sees n_patches + 1 tokens (patches plus the CLS token).
        self.MLP_Blocks = [MLP_block(self.n_patches + 1, self.n_channels, self.mlp_ratio) for _ in range(self.n_blocks)]
        self.ln = tf.keras.layers.LayerNormalization()

        # A softmax over a single unit always outputs 1.0, so softmax mode always
        # gets one unit per label. Sigmoid mode keeps the original sizing: a
        # single unit for up to two labels, otherwise one unit per label.
        if self.mode == 'softmax':
            head_units = self.n_labels
        else:
            head_units = self.n_labels if self.n_labels > 2 else 1
        self.head = tf.keras.layers.Dense(head_units, activation = mode, kernel_initializer = tf.keras.initializers.glorot_normal(seed = 42))

    def call(self, X):
        """Map a batch of images to the head's activations.

        Returns a tensor of shape ``(batch, head_units)``.
        """
        # Patch embedding, flattened to (batch, n_patches, n_channels).
        X = self.patchConv(X)
        X = tf.reshape(X, [-1, self.n_patches, self.n_channels])

        # Prepend one copy of the CLS token per sample -> n_patches + 1 tokens.
        cls_tokens = tf.broadcast_to(self.CLS, [tf.shape(X)[0], 1, self.n_channels])
        X = tf.concat([cls_tokens, X], 1)

        # Positional embedding has shape (n_patches + 1, n_channels) and
        # broadcasts over the batch axis.
        X = X + self.PE

        for block in self.MLP_Blocks:
            X = block(X)
        X = self.ln(X)

        # Select the CLS token: it was concatenated at index 0 of the token axis
        # (axis 1). Indexing the last axis instead would pick channel 0 of every
        # token rather than the CLS embedding.
        X = X[:, 0, :]
        return self.head(X)

In [22]:
# Build the model for 256x256 inputs split into 16x16 patches, with one sigmoid
# output per attribute column (multi-label classification).
lvt = LVT(
    n_channels=192,
    image_size=256,
    patch_size=16,
    n_blocks=12,
    mlp_ratio=4,
    batch_size=16,
    n_labels=len(col),
    mode='sigmoid',
)
opt = tf.keras.optimizers.Adam(.00005)

# The targets are independent 0/1 labels, so accuracy has to be computed
# per label with a threshold. The bare string 'acc' would be resolved by Keras
# from the output shape and, for a multi-unit output, compares argmax positions.
# The metric keeps the name 'acc' so the logged keys stay 'acc' / 'val_acc'.
lvt.compile(
    optimizer=opt,
    loss=tfa.losses.focal_loss.sigmoid_focal_crossentropy,
    metrics=[tf.keras.metrics.BinaryAccuracy(name='acc')],
)

In [23]:
# Number of full batches per pass over each generator (a trailing partial
# batch is dropped by the integer division).
STEP_SIZE_TRAIN = train_generator.n // train_generator.batch_size
STEP_SIZE_VALID = valid_generator.n // valid_generator.batch_size
STEP_SIZE_TEST = test_generator.n // test_generator.batch_size

# `Model.fit` accepts generators directly; `fit_generator` is deprecated.
lvt.fit(
    train_generator,
    steps_per_epoch=STEP_SIZE_TRAIN,
    validation_data=valid_generator,
    validation_steps=STEP_SIZE_VALID,
    epochs=10,
)

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


<tensorflow.python.keras.callbacks.History at 0x1d6cd3eb730>