1. Load weights of DeepFace
2. Add classification layer (2)
3. For each syn in syn_list calculate the stats


In [1]:
import keras
import numpy as np
from os import path
from os import listdir
from os.path import isfile, join
from PIL import Image 
from keras.models import Model
import tensorflow as tf
import csv
import pandas as pd
from tqdm import tqdm
import keras.initializers

from sklearn.model_selection import LeaveOneOut
import cv2
from sklearn.metrics import roc_auc_score, confusion_matrix
from sklearn.preprocessing import Normalizer

Using TensorFlow backend.


In [2]:
IMAGE_SIZE = (152, 152) # set by the model 
CHANNELS = 3 # RGB image
NUM_CLASSES = 8631 # classification layer will be removed 
LEARN_RATE = 0.01
MOMENTUM = 0.9

DOWNLOAD_PATH = 'https://github.com/swghosh/DeepFace/releases/download/weights-vggface2-2d-aligned/VGGFace2_DeepFace_weights_val-0.9034.h5.zip'
MD5_HASH = '0b21fb70cd6901c96c19ac14c9ea8b89'

In [3]:
wt_init = keras.initializers.RandomNormal(mean=0, stddev=0.01)
bias_init = keras.initializers.Constant(value=0.5)

def conv2d_layer(**args):
    return keras.layers.Conv2D(**args, 
        kernel_initializer=wt_init, 
        bias_initializer=bias_init,
        activation=keras.activations.relu)
def lc2d_layer(**args):
    return keras.layers.LocallyConnected2D(**args, 
        kernel_initializer=wt_init, 
        bias_initializer=bias_init,
        activation=keras.activations.relu)
def dense_layer(**args):
    return keras.layers.Dense(**args, 
        kernel_initializer=wt_init, 
        bias_initializer=bias_init)

In [4]:
def create_classifying_deepface(image_size=IMAGE_SIZE, channels=CHANNELS, num_classes=NUM_CLASSES, learn_rate=LEARN_RATE, momentum=MOMENTUM):
    deepface = keras.models.Sequential([
        keras.layers.InputLayer(input_shape=(*image_size, channels), name='I0'),
        conv2d_layer(filters=32, kernel_size=11, name='C1'),
        keras.layers.MaxPooling2D(pool_size=3, strides=2, padding='same',  name='M2'),
        conv2d_layer(filters=16, kernel_size=9, name='C3'),
        lc2d_layer(filters=16, kernel_size=9, name='L4'),
        lc2d_layer(filters=16, kernel_size=7, strides=2, name='L5'),
        lc2d_layer(filters=16, kernel_size=5, name='L6'),
        keras.layers.Flatten(name='F0'),
        dense_layer(units=4096, activation=keras.activations.relu, name='F7'),
        keras.layers.Dropout(rate=0.5, name='D0'),
        dense_layer(units=num_classes, activation=keras.activations.softmax, name='F8')
    ], name='DeepFace')
    # deepface.summary()

    sgd_opt = keras.optimizers.SGD(lr=learn_rate, momentum=momentum)
    cce_loss = keras.losses.categorical_crossentropy

    deepface.compile(optimizer=sgd_opt, loss=cce_loss, metrics=['accuracy'])
    
    return deepface

In [5]:
def get_weights():
    filename = 'deepface.zip'
    downloaded_file_path = keras.utils.get_file(filename, DOWNLOAD_PATH, 
        md5_hash=MD5_HASH, extract=True)
    downloaded_h5_file = path.join(path.dirname(downloaded_file_path), 
        path.basename(DOWNLOAD_PATH).rstrip('.zip'))
    return downloaded_h5_file


def create_deepface():
    model = create_classifying_deepface()
    weights = get_weights()
    model.load_weights(weights)
    
    num_classes = 2
    x = model.layers[-2].output
    x = dense_layer(units=num_classes, activation=keras.activations.softmax, name='preds')(x)
    #x = Dense(2, activation='softmax', name='predictions')(x)
    model2 = Model(model.input, x)
    
    sgd_opt = keras.optimizers.SGD(lr=LEARN_RATE, momentum=MOMENTUM)
    cce_loss = keras.losses.categorical_crossentropy
    #model2.compile(optimizer=sgd_opt, loss=cce_loss, metrics=['accuracy'])
 

    model2.compile(
        loss="sparse_categorical_crossentropy",
        optimizer=keras.optimizers.Adam(lr=0.001),
        metrics=["sparse_categorical_accuracy"])
    
    #model2.summary()
    
    return model2

In [6]:
def load_data(syn, GENERAL_DIR):
    
    data, labels = [], [] 
    
    syn_dir = GENERAL_DIR + "\\{}\{}-patients".format(syn, syn)
    ID_dir = GENERAL_DIR + "\\{}\{}-selected-ID-controls".format(syn, syn)

    # get list of filenames
    files_syn = [f for f in listdir(syn_dir) if (isfile(join(syn_dir, f)))and ".jpg" in f]
    files_ID = [f for f in listdir(ID_dir) if (isfile(join(ID_dir, f))) and ".jpg" in f]
    
    print("Syn_list: {}, ID_list: {}".format(len(files_syn), len(files_ID)))

    for filename in files_syn:
        im = Image.open(join(syn_dir, filename))
        im = im.resize(IMAGE_SIZE)
        data.append(np.array(im))
        labels.append(1)

    for filename in files_ID:
        im = Image.open(join(ID_dir, filename))
        im = im.resize(IMAGE_SIZE)
        data.append(np.array(im))
        labels.append(0)    
    
    return np.array(data), np.array(labels)

In [7]:
from tensorflow.keras import preprocessing
from tensorflow.keras import backend as K

model  = create_deepface()

im = Image.open(r"H:\Genetica Projecten\Facial Recognition\Studenten en Onderzoekers\Fien\test\YY1_1.jpg")
im = np.array(im.resize(IMAGE_SIZE))

#im = preprocessing.image.img_to_array(im)
im = np.expand_dims(im, axis=0)
im = tf.convert_to_tensor(im, dtype=np.float32)
print(im.shape)

conv_layer = model.get_layer("L6")
heatmap_model = Model([model.input], [conv_layer.output, model.output])

with tf.GradientTape() as gtape:
    conv_output, predictions = heatmap_model(im)
    
    i = tf.math.argmax(predictions[0], -1).eval(session=tf.compat.v1.Session()) #.numpy()
    
    loss = predictions[:, i] #np.argmax(predictions[0])]
    grads = gtape.gradient(loss, conv_output)
    pooled_grads = K.mean(grads, axis=(0,1,2))

heatmap = tf.reduce_mean(tf.multiply(pooled_grads, conv_output), axis=-1)
heatmap = np.maximum(heatmap, 0)
max_heat = np.max(heatmap)
if max_heat == 0:
    max_heat = 1e-10
heatmap /= max_heat

print(heatmap.shape)


(1, 152, 152, 3)


ValueError: Cannot use the given session to evaluate tensor: the tensor's graph is different from the session's graph.

In [None]:
plt.figure()
plt.plot(heatmap)
plt.show()

In [7]:
BATCH_SIZE = 32
GENERAL_DIR = r"H:\Genetica Projecten\Facial Recognition\Studenten en Onderzoekers\Fien" 

# load img data
syn_list = ['ADNP', 'ANKRD11', 'CDK13', 'DEAF1', 'DYRK1A', 'EHMT1', 'FBXO11', 'SON', 'WAC', 'YY1', 'KDVS']
results_file = open("results/deepface_classification.txt", "w")

for syn in ['YY1']:
    data, labels = load_data(syn, GENERAL_DIR)

    results_file.write("Syndrome {} with {} patients and {} controls\n".format(syn, labels.tolist().count(1), labels.tolist().count(0)))
    all_y, all_probs, all_preds = [], [], [] 

    loo = LeaveOneOut()
    for train_index, test_index in tqdm(loo.split(data)):
        X_train, X_test = np.array(data[train_index]), data[test_index]
        y_train, y_test = np.array(labels[train_index]), labels[test_index]

        model = create_deepface()
        model.fit(x=X_train, y=y_train, batch_size=BATCH_SIZE, epochs=1, shuffle=True)

        y_pred_array = model.predict(X_test)
        y_pred = tf.math.argmax(y_pred_array, -1).numpy()

        all_y.append(y_test[0])
        all_probs.append(y_pred_array[0][1])
        all_preds.append(y_pred)  
        
        
        
    aroc = roc_auc_score(all_y, all_probs, labels=[0,1])
    tn, fp, fn, tp = confusion_matrix(all_y, all_preds, labels=[0,1]).ravel()
    spec = tn / (tn+fp)  
    sens = tp / (tp+fn)

    results_file.write("AROC: {:.4f}, spec: {:.4f}, sens: {:.4f}\n\n".format(aroc, spec, sens))
    
    break
    
results_file.close()




Syn_list: 10, ID_list: 10


0it [00:00, ?it/s]

Epoch 1/1


1it [05:52, 352.72s/it]

Epoch 1/1


2it [13:12, 378.88s/it]

Epoch 1/1


3it [20:37, 398.56s/it]

Epoch 1/1


4it [28:52, 427.68s/it]

Epoch 1/1


5it [37:15, 450.27s/it]

Epoch 1/1


6it [46:22, 479.08s/it]

Epoch 1/1


7it [54:58, 490.31s/it]

Epoch 1/1


8it [1:04:00, 505.68s/it]

Epoch 1/1


9it [1:13:07, 518.18s/it]

Epoch 1/1


9it [1:17:54, 519.38s/it]


ResourceExhaustedError:  OOM when allocating tensor with shape[19,63,63,16] and type float on /job:localhost/replica:0/task:0/device:CPU:0 by allocator cpu
	 [[node gradients_9/L4_9/strided_slice_1831_grad/StridedSliceGrad (defined at C:\MyPrograms\Anaconda3\envs\ai-thesis2\lib\site-packages\keras\backend\tensorflow_backend.py:3009) ]]
Hint: If you want to see a list of allocated tensors when OOM happens, add report_tensor_allocations_upon_oom to RunOptions for current allocation info.
 [Op:__inference_keras_scratch_graph_1471148]

Function call stack:
keras_scratch_graph
