In [1]:
import os
os.environ["CUDA_VISIBLE_DEVICES"]="1" 
import ast
import datetime as dt
import matplotlib.pyplot as plt
import seaborn as sns
import cv2
import pandas as pd
import numpy as np
import tensorflow as tf
import keras
from keras import backend as K
from keras import Model
from keras import optimizers
from keras.legacy import interfaces
from keras.utils.generic_utils import get_custom_objects
from keras.layers import Conv2D, MaxPooling2D
from keras.layers import Dense, Dropout, Flatten, Activation, GlobalAveragePooling2D, BatchNormalization
from keras.metrics import categorical_accuracy, top_k_categorical_accuracy, categorical_crossentropy
from keras.models import Sequential
from keras.callbacks import EarlyStopping, ReduceLROnPlateau, ModelCheckpoint, TensorBoard
from keras.optimizers import Adam

from keras.optimizers import SGD
from keras import callbacks
from data import *
from keras_helper import *

from keras.applications import MobileNetV2
from keras.applications.mobilenetv2 import preprocess_input

Using TensorFlow backend.


In [2]:
TOT = 35534421
EPOCHS = 150
size = 64
batchsize = 640
lw = 6
channel = 3
STEPS = TOT / EPOCHS / batchsize
NCATS = 340
mixup = 0
center = False
optimizer = 'adam'
cb = 'raw'

In [3]:
valid_df = pd.read_csv('../input/valid.csv')
x_valid = df_to_image_array_xd(valid_df, size, lw=lw, preprocess_input=preprocess_input, 
                               channel=channel, center = center)
y_valid = keras.utils.to_categorical(valid_df.word, num_classes=NCATS)

print(x_valid.shape, y_valid.shape)
print('Validation array memory {:.2f} GB'.format(x_valid.nbytes / 1024.**3 ))

x shape (34000, 64, 64, 3) x max 255
(34000, 64, 64, 3) (34000, 340)
Validation array memory 1.56 GB


In [4]:
K.clear_session()
# model = Xception(input_shape=(size, size, channel), weights=None, classes=NCATS)
model = MobileNetV2(input_shape=(size,size,channel), weights=None, classes=NCATS)

if optimizer == 'sgd':
    opt = SGD(0.002, momentum=0.9, nesterov=True)
    opt = NormalizedOptimizer(opt, normalization='l2')
elif optimizer == 'adam':
    opt = Adam(lr=0.002)

model.compile(optimizer=opt, loss='categorical_crossentropy',
              metrics=[categorical_crossentropy, categorical_accuracy, top_3_accuracy])
print(model.summary())

__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input_1 (InputLayer)            (None, 64, 64, 3)    0                                            
__________________________________________________________________________________________________
Conv1_pad (ZeroPadding2D)       (None, 65, 65, 3)    0           input_1[0][0]                    
__________________________________________________________________________________________________
Conv1 (Conv2D)                  (None, 32, 32, 32)   864         Conv1_pad[0][0]                  
__________________________________________________________________________________________________
bn_Conv1 (BatchNormalization)   (None, 32, 32, 32)   128         Conv1[0][0]                      
__________________________________________________________________________________________________
Conv1_relu

In [5]:
train_datagen = image_generator_xd(df_path = '../input/train_all_balance.csv', 
                                   size=size, batchsize=batchsize, lw=lw, 
                                   preprocess_input=preprocess_input,
                                  channel=channel, mixup=mixup, center=center)

In [6]:
model_prefix = 'mobile{}_linelength_lw{}_balance_{}_{}'.format(size, lw, mixup, optimizer, cb)
if center:
    model_prefix += '_center'
if channel == 3:
    model_prefix += '_parts'
print(model_prefix)
check_path = "./models/{}.model".format(model_prefix)
fold = 9
if cb == 'raw':
    callbks = [
        ReduceLROnPlateau(monitor='val_top_3_accuracy', factor=0.5, patience=5,
                          min_delta=0.005, mode='max', cooldown=3, verbose=1),
        callbacks.ModelCheckpoint(check_path,
                                    monitor='val_top_3_accuracy', 
                                    mode = 'max', save_best_only=True, verbose=1),
        callbacks.TensorBoard(log_dir='./log/{}'.format(model_prefix)),
        EarlyStopping(monitor='val_top_3_accuracy', mode='max',patience=20, verbose=1)
    ]
elif cb == 'snap':
    snapshot = SnapshotCallbackBuilder(nb_epochs=EPOCHS,
                                       nb_snapshots=1,
                                       size = size,
                                       init_lr=1e-3, 
                                       fold=fold)

    callbks = snapshot.get_callbacks(model_prefix = model_prefix)

mobile64_linelength_lw6_balance_0_adam_parts


In [None]:
hists = []
hist = model.fit_generator(
    train_datagen, steps_per_epoch=STEPS, epochs=EPOCHS, verbose=1,
    validation_data=(x_valid, y_valid),
    callbacks = callbks
)

Epoch 1/150

Epoch 00001: val_top_3_accuracy improved from -inf to 0.02924, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 2/150

Epoch 00002: val_top_3_accuracy improved from 0.02924 to 0.07721, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 3/150

Epoch 00003: val_top_3_accuracy did not improve from 0.07721
Epoch 4/150

Epoch 00004: val_top_3_accuracy did not improve from 0.07721
Epoch 5/150

Epoch 00005: val_top_3_accuracy did not improve from 0.07721
Epoch 6/150

Epoch 00006: val_top_3_accuracy improved from 0.07721 to 0.09438, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 7/150

Epoch 00007: val_top_3_accuracy improved from 0.09438 to 0.13976, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 8/150

Epoch 00008: val_top_3_accuracy improved from 0.13976 to 0.14026, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 


Epoch 00021: val_top_3_accuracy did not improve from 0.49397
Epoch 22/150

Epoch 00022: val_top_3_accuracy improved from 0.49397 to 0.52665, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 23/150

Epoch 00023: val_top_3_accuracy did not improve from 0.52665
Epoch 24/150

Epoch 00024: val_top_3_accuracy did not improve from 0.52665
Epoch 25/150

Epoch 00025: val_top_3_accuracy improved from 0.52665 to 0.60274, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 26/150

Epoch 00026: val_top_3_accuracy did not improve from 0.60274
Epoch 27/150

Epoch 00027: val_top_3_accuracy did not improve from 0.60274
Epoch 28/150

Epoch 00028: val_top_3_accuracy improved from 0.60274 to 0.62538, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 29/150

Epoch 00029: val_top_3_accuracy improved from 0.62538 to 0.63691, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 30/150




Epoch 00042: val_top_3_accuracy improved from 0.80544 to 0.85376, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 43/150

Epoch 00043: val_top_3_accuracy improved from 0.85376 to 0.86721, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 44/150

Epoch 00044: val_top_3_accuracy improved from 0.86721 to 0.88385, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 45/150

Epoch 00045: val_top_3_accuracy improved from 0.88385 to 0.88500, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 46/150

Epoch 00046: val_top_3_accuracy improved from 0.88500 to 0.88771, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 47/150

Epoch 00047: val_top_3_accuracy improved from 0.88771 to 0.88856, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 48/150

Epoch 00048: val_top_3_accuracy improved from 0.88856 to 0.8914


Epoch 00061: val_top_3_accuracy improved from 0.90724 to 0.90768, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 62/150

Epoch 00062: val_top_3_accuracy did not improve from 0.90768
Epoch 63/150

Epoch 00063: val_top_3_accuracy did not improve from 0.90768
Epoch 64/150

Epoch 00064: val_top_3_accuracy improved from 0.90768 to 0.90774, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 65/150

Epoch 00065: ReduceLROnPlateau reducing learning rate to 0.0002500000118743628.

Epoch 00065: val_top_3_accuracy improved from 0.90774 to 0.90879, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 66/150

Epoch 00066: val_top_3_accuracy improved from 0.90879 to 0.91147, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 67/150

Epoch 00067: val_top_3_accuracy did not improve from 0.91147
Epoch 68/150

Epoch 00068: val_top_3_accuracy did not improve from 0.91147
Epoch 69


Epoch 00081: val_top_3_accuracy improved from 0.91376 to 0.91382, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 82/150

Epoch 00082: val_top_3_accuracy did not improve from 0.91382
Epoch 83/150

Epoch 00083: val_top_3_accuracy improved from 0.91382 to 0.91421, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 84/150

Epoch 00084: val_top_3_accuracy did not improve from 0.91421
Epoch 85/150

Epoch 00085: val_top_3_accuracy improved from 0.91421 to 0.91444, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 86/150

Epoch 00086: ReduceLROnPlateau reducing learning rate to 3.125000148429535e-05.

Epoch 00086: val_top_3_accuracy did not improve from 0.91444
Epoch 87/150

Epoch 00087: val_top_3_accuracy did not improve from 0.91444
Epoch 88/150

Epoch 00088: val_top_3_accuracy did not improve from 0.91444
Epoch 89/150

Epoch 00089: val_top_3_accuracy did not improve from 0.91444
Epoch 90/150




Epoch 00101: val_top_3_accuracy did not improve from 0.91512
Epoch 102/150

Epoch 00102: val_top_3_accuracy did not improve from 0.91512
Epoch 103/150

Epoch 00103: val_top_3_accuracy did not improve from 0.91512
Epoch 104/150

Epoch 00104: val_top_3_accuracy improved from 0.91512 to 0.91515, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 105/150

Epoch 00105: val_top_3_accuracy improved from 0.91515 to 0.91524, saving model to ./models/mobile64_linelength_lw6_balance_0_adam_parts.model
Epoch 106/150

Epoch 00106: val_top_3_accuracy did not improve from 0.91524
Epoch 107/150

Epoch 00107: ReduceLROnPlateau reducing learning rate to 3.906250185536919e-06.

Epoch 00107: val_top_3_accuracy did not improve from 0.91524
Epoch 108/150

In [None]:
test = pd.read_csv('../input/test_simplified.csv')
test.head()
x_test = df_to_image_array_xd(test, size, lw=lw, 
                              preprocess_input=preprocess_input,
                             channel=channel, center = center)
print(test.shape, x_test.shape)
print('Test array memory {:.2f} GB'.format(x_test.nbytes / 1024.**3 ))

np_classes = np.load('../input/classes.npy')
id2cat = {k: cat.replace(' ', '_') for k, cat in enumerate(np_classes)}


In [None]:
def doodle_predict(model, model_path, x_test):
    model.load_weights(model_path)

    test_predictions = model.predict(x_test, batch_size=128, verbose=1)
    top3 = preds2catids(test_predictions)
    top3cats = top3.replace(id2cat)
    test['word'] = top3cats['a'] + ' ' + top3cats['b'] + ' ' + top3cats['c']
    submission = test[['key_id', 'word']]

    import kaggle_util
    kaggle_util.save_result(submission,  
                            '../result/{}.csv'.format(model_prefix), 
                            'quickdraw-doodle-recognition', 
                            send=True, index=False)

In [None]:
# doodle_predict(model, check_path, x_test)