In [1]:
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dropout
from tensorflow.keras.models import Model
from tensorflow.keras.layers import Input
from tensorflow.keras.layers import Dense
from tensorflow.keras.layers import Activation
from tensorflow.keras.layers import Flatten
from tensorflow.keras.layers import Dropout
from tensorflow.keras.layers import Conv2D, Conv3D
from tensorflow.keras.layers import MaxPooling2D, MaxPooling3D
from tensorflow.keras.layers import GlobalAveragePooling2D
from tensorflow.keras.layers import BatchNormalization
from tensorflow.keras.applications.vgg16 import VGG16
from tensorflow.keras.optimizers import Adam
from tensorflow.keras import regularizers
from tensorflow.keras.losses import categorical_crossentropy
from tensorflow.keras.losses import binary_crossentropy
from sklearn.metrics import f1_score
from keras.wrappers.scikit_learn import KerasClassifier
from sklearn.model_selection import cross_val_score
from tensorflow.keras.applications.vgg16 import preprocess_input

from keras.callbacks import EarlyStopping
from keras.preprocessing.image import ImageDataGenerator
from sklearn.model_selection import train_test_split
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
from PIL import Image 
import seaborn as sns
import os
import re
import glob
import cv2
from sklearn.metrics import classification_report
from sklearn.metrics import confusion_matrix
from sklearn.utils.multiclass import unique_labels
from sklearn.model_selection import StratifiedKFold
from sklearn import preprocessing
import tqdm
from numpy import loadtxt
from os import *
from sklearn.utils import class_weight


Using TensorFlow backend.


In [2]:
def atoi(text):
    return int(text) if text.isdigit() else text
def natural_keys(text):
    return [atoi(c) for c in re.split('(\d+)', text)]

In [3]:
def draw_confusion_matrix(true,preds):
    conf_matx = confusion_matrix(true, preds)
    sns.heatmap(conf_matx, annot=True,annot_kws={"size": 12},fmt='g', cbar=False, cmap=plt.cm.Blues) #'viridis'
    #plt.savefig('/home/jovyan/conf_matrix.png')
    plt.show()
    
    return conf_matx

In [4]:
def plot_history(model_history, model_name):
    fig = plt.figure(figsize=(15,5), facecolor='w')
    ax = fig.add_subplot(121)
    ax.plot(model_history.history['loss'])
    ax.plot(model_history.history['val_loss'])
    ax.set(title=model_name + ': Model loss', ylabel='Loss', xlabel='Epoch')
    ax.legend(['Train', 'Val'], loc='upper left')
    ax = fig.add_subplot(122)
    ax.plot(model_history.history['accuracy'])
    ax.plot(model_history.history['val_accuracy'])
    ax.set(title=model_name + ': Model Accuracy; test='+ str(np.round(model_history.history['val_accuracy'][-1], 3)),
           ylabel='Accuracy', xlabel='Epoch')
    ax.legend(['Train', 'Val'], loc='upper left')
    #plt.savefig('/home/jovyan/curve.png')
    plt.show()
    
    return fig

In [5]:
def resize(x):
    rescaled = []

    for i in x:

        scale_percent = 140 # percent of original size
        width = int(i.shape[1] / (scale_percent / 100))
        height = int(i.shape[0] / (scale_percent / 100))
        dim = (width, height)
        resized = cv2.resize(i, dim, interpolation = cv2.INTER_LANCZOS4)
        rescaled.append(resized)

    x_orig = np.reshape( rescaled, (len( rescaled), resized.shape[1], resized.shape[1], 3))

    return x_orig

In [6]:
def loadImages(path_data):
    
    p = '/home/jovyan/DATA_MASTER_PROJECT/Check_DIFF_T0_T97/'
    
    
    
    pa_adr = p + 'ADR_cropped/'
    
    pa_control = p + 'CONTROL_cropped/'
    
    pa_hrh = p + 'HRH_cropped/'
    
    image_list = []
    
    
       


    for filename in tqdm.tqdm(sorted(path_data, key=natural_keys)): 
        
        if 'adr' in filename:
            
            im=cv2.imread(pa_adr + filename)

            imarray = np.array(im)
            

            image_list.append(imarray)
            
        if 'control' in filename:
            
            im=cv2.imread(pa_control + filename)

            imarray = np.array(im)
            

            image_list.append(imarray)
            
        if 'hrh' in filename:
            
            im=cv2.imread(pa_hrh + filename)

            imarray = np.array(im)
            

            image_list.append(imarray)



    x_orig = np.reshape(image_list, (len(image_list), 90, 90, 3))

    return x_orig

In [7]:
def return_count(x):
    name_wel = []
    for i in sorted(x, key = natural_keys):
        name_wel.append(i.split('_')[0])

    z = sorted(list(set(name_wel)))
    r = list(range(len(z)))

    num = []
    for iz in range(len(z)):
        count = 0
        for i in sorted(x, key=natural_keys):
            if z[iz] in i:
                count += 1
        num.append(count)
    return list(zip(z, r, num))

In [8]:
def creat_label(y):
    labels = []
    for ix, _ in enumerate(y):
        
        if y[ix][0] == 'adr':
        
            labels.append([[y[ix][0],0]] * y[ix][2])
        
        if y[ix][0] == 'hrh' or y[ix][0] == 'control':
            
            labels.append([[y[ix][0],1]] * y[ix][2])
    
    ler = [i for sub in labels for i in sub ]
    
    _, lab= zip(*ler)

    
    return lab

In [9]:
def make_labels(data_set):
    fe = return_count(data_set)
    leb = creat_label(fe)
    y = np.array(list(leb))
    return y
    

In [10]:
def time_step_acc(tes_data):

    results = []            

    x_test = loadImages(tes_data)
    y_test = make_labels(tes_data)
    x_test = resize(x_test)
    x_test = preprocess_input(x_test)

    scores = m4.evaluate(x_test, y_test, verbose = 1)
    results.append(scores[1]*100)

    return results

# TEST SET

In [11]:
midorine = ['C6', 'F11']
lebetalol = ['D11', 'G4']
mephenteremine = ['F2', 'G10']
methoaxamine = ['G5', 'B10']
ocymetazoline = ['G3', 'B8']

In [12]:
time_points = list(map(str, range(1,97,3)))

new_time = []
for i in time_points:
    r = '_' + i + '.'
    new_time.append(r)


path_test = '/home/jovyan/DATA_MASTER_PROJECT/Check_DIFF_T0_T97/ADR_cropped/'

# NAME OF THE WELLS CORRESPONDING TO THE FRUG THAT YOU WANT IN THE TEST SET 

wells_drug = ['D11', 'G4'] 

test = []

for _,_, filenames in os.walk(path_test):
    
    for filename in sorted(filenames, key = natural_keys):
    
        for w in wells_drug:
            for t in new_time:
                if '{}'.format(w) in filename and '{}tiff'.format(t) in filename:
                    test.append(filename)

# TRAIN & VALIDATION

In [13]:
groups_list = ['ADR', 'HRH']#, 'CONTROL']

fileds_of_view = ['1','2','3','4']

field_train, field_val = train_test_split(fileds_of_view, test_size=0.2, random_state=int(np.random.randint(1,1000,1)))


In [14]:
train = []

validation = []

group_compounds = []

In [15]:
for group in tqdm.tqdm(groups_list):
    
    pa = '/home/jovyan/DATA_MASTER_PROJECT/Check_DIFF_T0_T97/{}_cropped/'.format(group)
    
    for _,_, filenames in os.walk(pa):
    
        for filename in sorted(filenames, key = natural_keys):

            for t in new_time:

                if '_{}-'.format(wells_drug[0]) not in filename and '_{}-'.format(wells_drug[1]) not in filename and '{}tiff'.format(t) in filename:

                    group_compounds.append(filename)
        
        
            
            
    

100%|██████████| 2/2 [00:11<00:00,  5.54s/it]


In [16]:
for i in group_compounds:
    
    for f in field_train:
        if '-{}_'.format(f) in i:
            train.append(i)
            
            
    for v in field_val:
        if '-{}_'.format(v) in i:
            validation.append(i)
            

In [17]:
x_train = loadImages(train)
y_train = make_labels(train)

x_train.shape, y_train.shape

100%|██████████| 63199/63199 [00:57<00:00, 1093.36it/s]


((63199, 90, 90, 3), (63199,))

In [18]:
x_val = loadImages(validation)
y_val = make_labels(validation)

x_val.shape, y_val.shape

100%|██████████| 19906/19906 [00:18<00:00, 1057.19it/s]


((19906, 90, 90, 3), (19906,))

In [19]:
x_train = resize(x_train)
x_train.shape

(63199, 64, 64, 3)

In [20]:
x_val = resize(x_val)
x_val.shape

(19906, 64, 64, 3)

In [21]:
weights = class_weight.compute_class_weight('balanced', np.unique(y_train),y_train)
print('weights = ' + str(weights))

weights = [1.13000644 0.89682134]


In [22]:
x_train = preprocess_input(x_train)

x_val = preprocess_input(x_val)


#y_train = keras.utils.to_categorical(y_train ,num_classes=2)
#y_test_1 = keras.utils.to_categorical(y_test, num_classes=2)
#y_val = keras.utils.to_categorical(y_val, num_classes=2)

In [23]:
es = EarlyStopping(monitor='val_loss', mode='min', verbose=2, patience=3)

In [24]:
pretrained_model = VGG16(weights='imagenet',include_top=False, input_shape=(64, 64, 3))

base_model = Model(inputs=pretrained_model.input, outputs=pretrained_model.get_layer('block3_pool').output)

In [25]:
batch_size = 128

In [26]:
datagen = ImageDataGenerator()

datagen.fit(x_train)

train_gen = datagen.flow(x_train, y_train,batch_size=batch_size )

dat_val = ImageDataGenerator()

dat_val.fit(x_val)

val_gen = dat_val.flow(x_val, y_val,batch_size=batch_size)

m4 = Sequential()
m4.add(base_model)


m4.add(BatchNormalization())
m4.add(GlobalAveragePooling2D())
m4.add(BatchNormalization())
m4.add(Activation('PReLU'))
m4.add(Dense(64, activation='PReLU'))
m4.add(Dense(1,activation='sigmoid'))


base_model.trainable = False

opt = keras.optimizers.Adam(lr=1e-3)

m4.compile(loss= keras.losses.binary_crossentropy, optimizer=opt, metrics = ['accuracy'])



epochs = 300

m4_h = m4.fit(train_gen,
                steps_per_epoch=(len(x_train)/batch_size),
                callbacks = [es],
                epochs=epochs,
                validation_data = (val_gen), 
                validation_steps = (len(x_val)/batch_size),
                class_weight = weights,
                 verbose = 1)

ValueError: Unknown activation function:PReLU

In [None]:
base_model.trainable = True

opt = keras.optimizers.Adam(lr=1e-5)

m4.compile(loss= keras.losses.binary_crossentropy, optimizer=opt, metrics = ['accuracy'])

epochs = 300

m4_h = m4.fit(train_gen,
                steps_per_epoch=(len(x_train)/batch_size),
                callbacks = [es],
                epochs=epochs,
                validation_data = val_gen, 
                validation_steps = (len(x_val)/batch_size),
                class_weight = weights,
                verbose = 1)

In [None]:
plot_history(m4_h, 'first')

In [None]:
l = []
for t in new_time:
    for i in test:
        if t in i:
            l.append((i))
            

In [None]:
grouped = {}
for elem in l:
    key = elem.split('.tiff')[0].split('_')[5]
    grouped.setdefault(key, []).append(elem)
grouped = grouped.values()

In [None]:
test_data = list(grouped)

In [None]:
r = []

for ix ,_ in enumerate(test_data):
    r.append(time_step_acc(test_data[ix]))

In [None]:
plt.plot(time_points,r)

In [None]:
len(r), len(time_points)

In [None]:
test_/home/jovyan/save_model_final/t(x_test)

t= []
for i in (test_preds):
    if i > 0.5:
        t.append(1)
    else:
        t.append(0)

draw_confusion_matrix(y_test, t)

In [None]:
p = '/home/jovyan/save_model_final/'
m4.save(p + "LEBATALOL.h5")