1. going to fix image preprocessing
2. going to use pretrained features with k-fold cross-validation
3. going to re-ensemble

this should produce a better leaderboard score

In [1]:
# List the compute devices TensorFlow can see (e.g. to check whether a GPU is present).
from tensorflow.python.client import device_lib
device_lib.list_local_devices()

[name: "/cpu:0"
 device_type: "CPU"
 memory_limit: 268435456
 locality {
 }
 incarnation: 11987689039894707743, name: "/gpu:0"
 device_type: "GPU"
 memory_limit: 11332668621
 locality {
   bus_id: 2
 }
 incarnation: 15775065129179825909
 physical_device_desc: "device: 0, name: Tesla K80, pci bus id: 0000:85:00.0"]

In [2]:
import os, glob, bcolz

import numpy as np
import pandas as pd

from tqdm import tqdm
from scipy import ndimage, misc

from sklearn.model_selection import train_test_split, KFold
from sklearn.metrics import roc_auc_score

from keras import backend as K
from keras import optimizers
from keras.models import Model
from keras.callbacks import ModelCheckpoint
from keras.preprocessing.image import ImageDataGenerator

from keras.layers.normalization import BatchNormalization
from keras.layers import Dense, Dropout, Flatten, Activation, Input
from keras.layers.convolutional import MaxPooling2D, Convolution2D
from keras.layers.advanced_activations import PReLU, LeakyReLU

from keras.applications.vgg19 import VGG19
from keras.applications.resnet50 import ResNet50
from keras.applications.inception_v3 import InceptionV3
from keras.applications.xception import Xception
from keras.applications.inception_v3 import preprocess_input as preprocess_input_incep_xcep
from keras.applications.imagenet_utils import preprocess_input as preprocess_input_vgg_resnet

import matplotlib.image as mpimg
import matplotlib.pyplot as plt

Using TensorFlow backend.


In [3]:
def read_img(img_path, img_shape):
    """Load the image at `img_path` and resize it to `img_shape`.

    Reading and resizing are delegated to `misc.imread` and `misc.imresize`;
    the resized image is returned.
    """
    return misc.imresize(misc.imread(img_path), img_shape)

def read_imgs(img_height, img_width):
    """Read every train and test image, resized to (img_height, img_width).

    Image names come from the 'name' column of the module-level `train_set`
    and `test_set` frames; each file is looked up as '<name>.jpg' under the
    'train' / 'test' sub-directory of the module-level `path`.

    Returns a `(train_images, test_images)` pair of numpy arrays.
    """
    target_shape = (img_height, img_width)

    def _load_split(names, subdir):
        # One resized image per name, kept in the order the names are listed.
        return [
            read_img(os.path.join(path, subdir, str(name) + '.jpg'), target_shape)
            for name in tqdm(names)
        ]

    train_images = _load_split(train_set['name'].iloc[:], 'train')
    test_images = _load_split(test_set['name'].iloc[:], 'test')
    return np.array(train_images), np.array(test_images)

def save_array(fname, arr):
    """Persist `arr` as a bcolz carray rooted at `fname`.

    The carray is created in write mode ('w') and flushed before returning.
    """
    bcolz.carray(arr, rootdir=fname, mode='w').flush()

def load_array(fname):
    """Open the bcolz array stored at `fname` and return its full contents."""
    stored = bcolz.open(fname)
    return stored[:]

def freeze_model(model):
    """Mark every layer of `model` as non-trainable.

    The layers are modified in place and the same `model` object is
    returned, so the call can be chained.
    """
    for lyr in model.layers:
        lyr.trainable = False

    return model

def grab_optimizer(opt, lr):
    """Build a Keras optimizer from its short name.

    Args:
        opt: One of 'sgd', 'adam', 'adagrad' or 'rmsprop'.
        lr: Learning rate handed to the optimizer.

    Returns:
        The configured optimizer instance. 'sgd' is additionally set up with
        decay=1e-6, momentum=0.8 and Nesterov momentum.

    Raises:
        ValueError: If `opt` is not one of the supported names. (Previously
            an unknown name silently returned None.)
    """
    # Builders are wrapped in lambdas so nothing is constructed until the
    # requested name has been validated.
    builders = {
        'sgd': lambda: optimizers.SGD(lr=lr, decay=1e-6, momentum=0.8, nesterov=True),
        'adam': lambda: optimizers.Adam(lr=lr),
        'adagrad': lambda: optimizers.Adagrad(lr=lr),
        'rmsprop': lambda: optimizers.RMSprop(lr=lr),
    }
    if opt not in builders:
        raise ValueError(
            'unknown optimizer {!r}; expected one of {}'.format(opt, sorted(builders))
        )
    return builders[opt]()
    
def dense_block(units, activation, drop_prob, inputs):
    """Apply Dense -> BatchNormalization -> Activation -> Dropout to `inputs`.

    The Dense layer is created without an activation so that `activation`
    is applied after batch normalization. Returns the output of the final
    Dropout layer.
    """
    stages = (
        Dense(units, activation=None),
        BatchNormalization(),
        Activation(activation),
        Dropout(drop_prob),
    )
    out = inputs
    for stage in stages:
        out = stage(out)
    return out

def make_conv_model(input_shape, optimizer):
    """Build and compile a small convolutional binary classifier.

    Five `conv_block` stages (16, 32, 64, 128, 256 filters) are followed by
    a flatten, two dense blocks (2048 and 512 units) and a single-unit
    sigmoid dense block. The model is compiled with binary cross-entropy
    loss, the given `optimizer`, and an accuracy metric.

    NOTE(review): `conv_block` is not defined in the visible source; it has
    to be provided elsewhere before this function can be called.
    """
    inputs = Input(shape=input_shape)

    m = inputs
    for n_filters in (16, 32, 64, 128, 256):
        m = conv_block(n_filters, (3,3), (2,2), 'relu', inputs=m)

    m = Flatten()(m)
    for n_units, drop_prob in ((2048, 0.25), (512, 0.5)):
        m = dense_block(n_units, 'relu', drop_prob, inputs=m)
    outputs = dense_block(1, 'sigmoid', 0, inputs=m)

    model = Model(inputs=inputs, outputs=outputs)
    model.compile(loss='binary_crossentropy', optimizer=optimizer, metrics=['accuracy'])
    return model

def make_vgg19_conv(input_shape):
    """Return VGG19 (ImageNet weights, no top layers) with every layer frozen."""
    return freeze_model(
        VGG19(input_shape=input_shape, weights='imagenet', include_top=False)
    )

def make_incepv3_conv(input_shape):
    """Return InceptionV3 (ImageNet weights, no top layers) with every layer frozen."""
    return freeze_model(
        InceptionV3(input_shape=input_shape, weights='imagenet', include_top=False)
    )

def make_resnet50_conv(input_shape):
    """Return ResNet50 (ImageNet weights, no top layers) with every layer frozen."""
    return freeze_model(
        ResNet50(input_shape=input_shape, weights='imagenet', include_top=False)
    )

def make_xception_conv(input_shape):
    """Return Xception (ImageNet weights, no top layers) with every layer frozen."""
    return freeze_model(
        Xception(input_shape=input_shape, weights='imagenet', include_top=False)
    )

def make_ft_dense(input_shape, optimizer):
    """Build and compile the dense classifier head.

    The input of shape `input_shape` is flattened, passed through two
    1024-unit ReLU dense blocks (dropout 0.25, then 0.5) and a single-unit
    sigmoid dense block. The model is compiled with binary cross-entropy
    loss, the given `optimizer`, and an accuracy metric.
    """
    inputs = Input(shape=input_shape)

    hidden = Flatten()(inputs)
    for drop_prob in (0.25, 0.5):
        hidden = dense_block(1024, 'relu', drop_prob, inputs=hidden)
    outputs = dense_block(1, 'sigmoid', 0, inputs=hidden)

    model = Model(inputs=inputs, outputs=outputs)
    model.compile(loss='binary_crossentropy', optimizer=optimizer, metrics=['accuracy'])
    return model

def train_model_k_folds_ft(model, base_model, train_data, train_label, model_out, model_init_weights, epochs, kfolds, batch_size):
    """Train `model` on features from `base_model`, once per K-fold split.

    For each of `kfolds` shuffled folds, `model` is reset to the weights in
    `model_init_weights` and fitted on the training part of the fold. The
    checkpoint with the lowest validation loss is then reloaded and scored
    (loss, accuracy, ROC AUC) on both the training and validation parts.

    Args:
        model: Compiled model trained on the extracted features. Assumes it
            was compiled with a single accuracy metric, so `evaluate`
            returns [loss, accuracy].
        base_model: Model used only through `predict` to turn `train_data`
            into features.
        train_data: Array of inputs for `base_model`, indexable by fold
            index arrays.
        train_label: Array of labels aligned with `train_data`.
        model_out: Prefix for the per-fold checkpoint files and the history
            file.
        model_init_weights: Weights file loaded at the start of every fold.
        epochs: Number of epochs per fold.
        kfolds: Number of folds.
        batch_size: Batch size passed to `fit`.

    Returns:
        Dict mapping each fold's checkpoint file name to a dict with keys
        'score_tr_va' ([train AUC, valid AUC]), 'train_acc_loss' and
        'val_acc_loss' ([accuracy, loss]).

    Side effects:
        Writes '<model_out>_<fold>.model' checkpoints relative to the
        current working directory, and appends a per-fold report to
        '<model_out>_history.out' under the module-level `models_path`.
    """
    kf = KFold(n_splits=kfolds, shuffle=True)

    # The base model is only used for inference and no augmentation is
    # applied, so its features are the same whichever fold a sample lands in.
    # Computing them once avoids repeating the expensive forward pass (and
    # copying the image array) on every fold.
    # NOTE(review): assumes base_model.predict is deterministic per sample.
    features = base_model.predict(train_data)

    models_stats = {}
    for i, (train_ixs, valid_ixs) in enumerate(kf.split(train_data)):
        x_train = features[train_ixs]
        x_valid = features[valid_ixs]
        y_train = train_label[train_ixs]
        y_valid = train_label[valid_ixs]

        # Re-initialize the weights of the model on each run.
        # NOTE(review): this resets layer weights only; optimizer state
        # presumably carries over between folds - confirm that is acceptable.
        model.load_weights(model_init_weights)
        model_out_file = '{}_{}.model'.format(model_out, str(i))
        model_checkpoint = ModelCheckpoint(model_out_file,
                                           monitor='val_loss',
                                           save_best_only=True)

        print('training dense layers:')
        model.fit(x=x_train, y=y_train,
                  batch_size=batch_size,
                  validation_data=(x_valid, y_valid),
                  epochs=epochs,
                  verbose=1,
                  callbacks=[model_checkpoint])

        # Score the best checkpoint of this fold, not the last epoch.
        model.load_weights(model_out_file)

        eval_tr = model.evaluate(x_train, y_train)
        eval_va = model.evaluate(x_valid, y_valid)

        tr_score = roc_auc_score(y_train, model.predict(x_train)[:, 0])
        va_score = roc_auc_score(y_valid, model.predict(x_valid)[:, 0])

        report = [
            'kfold: {}'.format(str(i)),
            'best model train acc: {}, loss: {}'.format(eval_tr[1], eval_tr[0]),
            'best model valid acc: {}, loss: {}'.format(eval_va[1], eval_va[0]),
            'best model train aroc score: {}, valid aroc score: {}'.format(tr_score, va_score),
        ]

        print('\n')
        for line in report:
            print(line)
        print('\n')
        models_stats[model_out_file] = {'score_tr_va':[tr_score, va_score], 'train_acc_loss':[eval_tr[1], eval_tr[0]], 'val_acc_loss':[eval_va[1], eval_va[0]]}

        # One report line per row, with a blank line between folds; the
        # original wrote the entries back to back on a single line.
        with open(os.path.join(models_path,'{}_{}.out'.format(model_out,'history')), 'a') as f:
            f.write('\n'.join(report) + '\n\n')

    return models_stats

Set up the data directories and read in the images:

In [4]:
# Root of the dataset; every other location is a sub-directory of it.
DATA_DIR = os.path.join('/scratch', 'yns207', 'data_invasive')
path = DATA_DIR

# Sub-directories for the image splits and for saved models/results.
test_path, models_path, train_path, valid_path = (
    os.path.join(path, sub) for sub in ('test', 'results', 'train', 'valid')
)
print('DATA_PATH: ' + path)

DATA_PATH: /scratch/yns207/data_invasive


# loading data

In [None]:
# Training table; its 'name' and 'invasive' columns are used later in the notebook.
train_set = pd.read_csv(os.path.join(path, 'train_labels.csv'))
# Sample submission; read_imgs uses its 'name' column to locate the test images.
test_set = pd.read_csv(os.path.join(path, 'sample_submission.csv'))

In [None]:
# Load all train/test images, resized to height 300 and width 400.
train_img, test_img = read_imgs(300,400)
# Labels as a numpy array, in the same row order as the images read above.
train_label = np.array(train_set['invasive'].iloc[:])

create a holdout set of 10%:

In [None]:
# 90/10 train/holdout split. No random_state is passed, so the split is not
# reproducible between runs.
train_img, hold_img, train_labels, hold_labels = train_test_split(train_img, train_label, test_size=0.10)

In [None]:
# Display the shapes of the train/holdout arrays as a sanity check.
train_img.shape, hold_img.shape, train_labels.shape, hold_labels.shape

save the datasets unaltered so they can be loaded again at a later point:

In [None]:
# Switch to the results directory so the relative file names below land there.
%cd $models_path
# Persist the images and labels of both splits with bcolz (see save_array).
save_array('aug_3_train_img.dat', train_img)
save_array('aug_3_hold_img.dat', hold_img)
save_array('aug_3_train_labels.dat', train_labels)
save_array('aug_3_hold_labels.dat', hold_labels)

# checkpoint

read the datasets with bcolz:

In [5]:
# Switch to the results directory, where the arrays were saved.
%cd $models_path
# Reload the saved train/holdout images and labels (see load_array).
train_img = load_array('aug_3_train_img.dat')
hold_img = load_array('aug_3_hold_img.dat')
train_labels = load_array('aug_3_train_labels.dat')
hold_labels = load_array('aug_3_hold_labels.dat')

/scratch/yns207/data_invasive/results


In [6]:
# Display the shapes of the reloaded arrays as a sanity check.
train_img.shape, hold_img.shape, train_labels.shape, hold_labels.shape

((2065, 300, 400, 3), (230, 300, 400, 3), (2065,), (230,))

In [7]:
# Hyper-parameters passed to the k-fold training runs.
kfolds = 5        # number of cross-validation folds
epochs = 100      # epochs per fold
batch_size = 32   # mini-batch size used when fitting
lr = 2.5e-4       # learning rate for the optimizer

In [None]:
# VGG19: switch to the results directory so checkpoints are written there.
%cd $models_path
model_name = 'invasive_vgg19_aug3'
init_weights_model = '{}_base.model'.format(model_name)

# Frozen VGG19 convolutional base, sized for one training image.
base_model = make_vgg19_conv(train_img[0].shape)

# Dense head on top of the conv features; output[0] drops the batch dimension,
# leaving the per-sample feature shape. Its initial weights are saved so that
# every fold can start from the same state.
dense_model = make_ft_dense(input_shape=tuple(base_model.output[0].shape.as_list()), optimizer=grab_optimizer('adam', lr))
dense_model.save_weights(init_weights_model)

# Apply the VGG/ResNet input preprocessing to a float32 copy of the images.
vgg19_train_img = preprocess_input_vgg_resnet(train_img.astype(np.float32))

# Train and evaluate the dense head across the folds.
performance1 = train_model_k_folds_ft(dense_model, base_model, vgg19_train_img, train_labels, model_name, init_weights_model, epochs, kfolds, batch_size)

/scratch/yns207/data_invasive/results
training dense layers:
Train on 1652 samples, validate on 413 samples
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoc

In [None]:
# ResNet50: same pipeline as the VGG19 cell, with a ResNet50 base.
%cd $models_path
model_name = 'invasive_resnet50_aug3'
init_weights_model = '{}_base.model'.format(model_name)

# Frozen conv base plus a fresh dense head; the head's initial weights are
# saved so every fold can be reset to them.
base_model = make_resnet50_conv(train_img[0].shape)
dense_model = make_ft_dense(input_shape=tuple(base_model.output[0].shape.as_list()), optimizer=grab_optimizer('adam', lr))
dense_model.save_weights(init_weights_model)

# Apply the VGG/ResNet input preprocessing to a float32 copy of the images,
# then train and evaluate across the folds.
resnet50_train_img = preprocess_input_vgg_resnet(train_img.astype(np.float32))
performance2 = train_model_k_folds_ft(dense_model, base_model, resnet50_train_img, train_labels, model_name, init_weights_model, epochs, kfolds, batch_size)

In [None]:
# InceptionV3: same pipeline, with an InceptionV3 base.
%cd $models_path
model_name = 'invasive_inceptionv3_aug3'
init_weights_model = '{}_base.model'.format(model_name)

# Frozen conv base plus a fresh dense head; the head's initial weights are
# saved so every fold can be reset to them.
base_model = make_incepv3_conv(train_img[0].shape)
dense_model = make_ft_dense(input_shape=tuple(base_model.output[0].shape.as_list()), optimizer=grab_optimizer('adam', lr))
dense_model.save_weights(init_weights_model)

# Apply the Inception preprocessing to a float32 copy of the images, then
# train and evaluate across the folds.
inceptionv3_train_img = preprocess_input_incep_xcep(train_img.astype(np.float32))
performance3 = train_model_k_folds_ft(dense_model, base_model, inceptionv3_train_img, train_labels, model_name, init_weights_model, epochs, kfolds, batch_size)

In [8]:
# Xception: same pipeline, with an Xception base.
%cd $models_path
model_name = 'invasive_xception_aug3'
init_weights_model = '{}_base.model'.format(model_name)

# Frozen conv base plus a fresh dense head; the head's initial weights are
# saved so every fold can be reset to them.
base_model = make_xception_conv(train_img[0].shape)
dense_model = make_ft_dense(input_shape=tuple(base_model.output[0].shape.as_list()), optimizer=grab_optimizer('adam', lr))
dense_model.save_weights(init_weights_model)

# Xception reuses the preprocessing function imported from inception_v3;
# apply it to a float32 copy of the images, then train across the folds.
xception_train_img = preprocess_input_incep_xcep(train_img.astype(np.float32))
performance4 = train_model_k_folds_ft(dense_model, base_model, xception_train_img, train_labels, model_name, init_weights_model, epochs, kfolds, batch_size)

/scratch/yns207/data_invasive/results
training dense layers:
Train on 1652 samples, validate on 413 samples
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoc

In [12]:
# Per-fold metrics returned by the VGG19 run.
performance1

{'invasive_vgg19_aug3_0.model': {'score_tr_va': [1.0, 0.97520912547528527],
  'train_acc_loss': [1.0, 0.10456592546320423],
  'val_acc_loss': [0.91525423497899683, 0.24978774785995483]},
 'invasive_vgg19_aug3_1.model': {'score_tr_va': [1.0, 0.98594247611464969],
  'train_acc_loss': [1.0, 0.096260497360050531],
  'val_acc_loss': [0.93220338882026021, 0.21518026916513142]},
 'invasive_vgg19_aug3_2.model': {'score_tr_va': [1.0, 0.97967873533911265],
  'train_acc_loss': [1.0, 0.094112012093350045],
  'val_acc_loss': [0.92978208131420703, 0.21770779994151782]},
 'invasive_vgg19_aug3_3.model': {'score_tr_va': [1.0, 0.98369592398099515],
  'train_acc_loss': [1.0, 0.089576962604649701],
  'val_acc_loss': [0.93220338723272733, 0.21327042990966225]},
 'invasive_vgg19_aug3_4.model': {'score_tr_va': [1.0, 0.98041823112223614],
  'train_acc_loss': [1.0, 0.10280938749596225],
  'val_acc_loss': [0.93220339011915088, 0.22696813370933255]}}

In [13]:
# Per-fold metrics returned by the ResNet50 run.
performance2

{'invasive_resnet50_aug3_0.model': {'score_tr_va': [1.0, 0.98118838262723163],
  'train_acc_loss': [1.0, 0.097477986650951837],
  'val_acc_loss': [0.94430992476299369, 0.21711079852055695]},
 'invasive_resnet50_aug3_1.model': {'score_tr_va': [1.0, 0.97967479674796754],
  'train_acc_loss': [1.0, 0.090678999033591931],
  'val_acc_loss': [0.92736077380815374, 0.2284473896603896]},
 'invasive_resnet50_aug3_2.model': {'score_tr_va': [1.0, 0.97648202137998052],
  'train_acc_loss': [1.0, 0.088843455867386331],
  'val_acc_loss': [0.92251815720851427, 0.22848029380560497]},
 'invasive_resnet50_aug3_3.model': {'score_tr_va': [1.0, 0.98030908606448164],
  'train_acc_loss': [1.0, 0.089160008937769888],
  'val_acc_loss': [0.92493946601345811, 0.22133081978227556]},
 'invasive_resnet50_aug3_4.model': {'score_tr_va': [1.0, 0.98322302601200562],
  'train_acc_loss': [1.0, 0.091530842909512744],
  'val_acc_loss': [0.92493946659074278, 0.22031529835869557]}}

In [14]:
# Per-fold metrics returned by the InceptionV3 run.
performance3

{'invasive_inceptionv3_aug3_0.model': {'score_tr_va': [1.0,
   0.98376432559506322],
  'train_acc_loss': [1.0, 0.10009470794882093],
  'val_acc_loss': [0.93220338752136966, 0.21509663987967928]},
 'invasive_inceptionv3_aug3_1.model': {'score_tr_va': [1.0,
   0.98466815654072037],
  'train_acc_loss': [1.0, 0.09467029169237931],
  'val_acc_loss': [0.93220338723272733, 0.21086167545930526]},
 'invasive_inceptionv3_aug3_2.model': {'score_tr_va': [1.0,
   0.98026517083120857],
  'train_acc_loss': [1.0, 0.08919046808385965],
  'val_acc_loss': [0.9418886172569404, 0.20869693196137362]},
 'invasive_inceptionv3_aug3_3.model': {'score_tr_va': [1.0,
   0.99089103996028793],
  'train_acc_loss': [1.0, 0.09285220925946501],
  'val_acc_loss': [0.9564164635921506, 0.18566454806281638]},
 'invasive_inceptionv3_aug3_4.model': {'score_tr_va': [1.0,
   0.9834322323163367],
  'train_acc_loss': [1.0, 0.094340892449995509],
  'val_acc_loss': [0.93462469603767118, 0.2113053193248213]}}

In [9]:
# Per-fold metrics returned by the Xception run.
performance4

{'invasive_xception_aug3_0.model': {'score_tr_va': [1.0, 0.98988928770031848],
  'train_acc_loss': [1.0, 0.10268585916076388],
  'val_acc_loss': [0.95157384987893467, 0.19207329283182037]},
 'invasive_xception_aug3_1.model': {'score_tr_va': [1.0, 0.99205646549604054],
  'train_acc_loss': [1.0, 0.091459043955398819],
  'val_acc_loss': [0.95641646517968348, 0.18050229971547394]},
 'invasive_xception_aug3_2.model': {'score_tr_va': [1.0, 0.98883952184491686],
  'train_acc_loss': [1.0, 0.091712733356340739],
  'val_acc_loss': [0.94673123284633165, 0.18840859458752462]},
 'invasive_xception_aug3_3.model': {'score_tr_va': [1.0, 0.99085576259489305],
  'train_acc_loss': [1.0, 0.089450628792113893],
  'val_acc_loss': [0.95399515738498786, 0.18167023739572299]},
 'invasive_xception_aug3_4.model': {'score_tr_va': [1.0, 0.98349031920460495],
  'train_acc_loss': [1.0, 0.091769100786987287],
  'val_acc_loss': [0.93946731263731065, 0.20025796340395116]}}

With proper normalization, data augmentation, and some retraining of the convolutional layers, this should yield very good results.