In [1]:
from __future__ import division, print_function, absolute_import

import tflearn
from tflearn.layers.core import input_data, dropout, fully_connected,reshape
from tflearn.layers.conv import conv_2d, max_pool_2d,highway_conv_2d
from tflearn.layers.normalization import local_response_normalization,batch_normalization
from tflearn.layers.estimator import regression
from tflearn.layers.merge_ops import merge
# Data loading and preprocessing
import tflearn.datasets.mnist as mnist
import tflearn.data_utils as du

import tensorflow as tf
import numpy as np
import pickle, random, copy, platform, os, time

def convnet(img_aug=None, drop_out = 0.5):
    Input = tflearn.input_data(shape=[None, 75, 75, 2], dtype='float', name ='input', data_augmentation=img_aug)
    network = conv_2d(Input, 32, 5, activation='elu', regularizer="L2")
    network = max_pool_2d(network, 2)
    network = batch_normalization(network) #try with batch norm
    network = conv_2d(network, 64, 5, activation='elu', regularizer="L2")
    network = max_pool_2d(network, 2)
    network = batch_normalization(network)
    network = conv_2d(network, 128, 5, activation='elu', regularizer="L2")
    network = batch_normalization(network)
    network = fully_connected(network, 512, activation='elu')
    network = dropout(network, drop_out)
    network = fully_connected(network, 2048, activation='elu')
    network = dropout(network, drop_out)
    network = fully_connected(network, 2, activation='softmax')
    network = regression(network, optimizer='adam',loss='categorical_crossentropy', name='target')
    return network


def highnet(img_aug = None, drop_out = 0.5):
    highnet = tflearn.input_data(shape=[None, 75, 75, 2], dtype='float', name ='input', data_augmentation=img_aug)

    for i in range(3):
        for j in [3, 2, 1]:
            highnet = highway_conv_2d(highnet, 16, j, activation='elu')
        highnet = max_pool_2d(highnet, 2)
        highnet = batch_normalization(highnet)

    highnet = fully_connected(highnet, 128, activation='elu')
    highnet = dropout(highnet,drop_out);
    highnet = fully_connected(highnet, 256, activation='elu')
    highnet = dropout(highnet,drop_out);
    highnet = fully_connected(highnet, 2, activation='softmax')
    highnet = regression(highnet, optimizer='adam', learning_rate=0.01,
                         loss='categorical_crossentropy', name='target')
    return highnet

def resnet(img_aug=None, drop_out=0.5):
    # Building Residual Network
    net = input_data(shape=[None, 75, 75, 2], name='input', data_augmentation=img_aug)
    net = tflearn.conv_2d(net, 64, 3, activation='elu', bias=False)
    # Residual blocks
    net = tflearn.residual_bottleneck(net, 3, 16, 64)
    net = tflearn.residual_bottleneck(net, 1, 32, 128, downsample=True)
    net = tflearn.residual_bottleneck(net, 2, 32, 128)
    net = tflearn.residual_bottleneck(net, 1, 64, 256, downsample=True)
    net = tflearn.residual_bottleneck(net, 2, 64, 256)
    net = tflearn.batch_normalization(net)
    net = tflearn.activation(net, 'elu')
    net = tflearn.global_avg_pool(net)
    # Regression
    net = tflearn.fully_connected(net, 2, activation='softmax')
    net = tflearn.regression(net, optimizer='adam',
                             loss='categorical_crossentropy',
                             learning_rate=0.001, name='target')
    return net

def vgg(img_aug=None, drop_out=0.5):    
    Input = tflearn.input_data(shape=[None, 75, 75, 2], dtype='float', name ='input', data_augmentation=img_aug)
    network = conv_2d(Input, 64, 3, activation='relu')
    network = conv_2d(network, 64, 3, activation='relu')
    network = max_pool_2d(network, 2, strides=2)

    network = conv_2d(network, 128, 3, activation='relu')
    network = conv_2d(network, 128, 3, activation='relu')
    network = max_pool_2d(network, 2, strides=2)

    network = conv_2d(network, 256, 3, activation='relu')
    network = conv_2d(network, 256, 3, activation='relu')
    network = conv_2d(network, 256, 3, activation='relu')
    network = max_pool_2d(network, 2, strides=2)

    network = conv_2d(network, 512, 3, activation='relu')
    network = conv_2d(network, 512, 3, activation='relu')
    network = conv_2d(network, 512, 3, activation='relu')
    network = max_pool_2d(network, 2, strides=2)

    network = conv_2d(network, 512, 3, activation='relu')
    network = conv_2d(network, 512, 3, activation='relu')
    network = conv_2d(network, 512, 3, activation='relu')
    network = max_pool_2d(network, 2, strides=2)

    network = fully_connected(network, 4096, activation='relu')
    network = dropout(network, drop_out)
    network = fully_connected(network, 4096, activation='relu')
    network = dropout(network, drop_out)
    network = fully_connected(network, 2, activation='softmax')
    network = tflearn.regression(network, optimizer='adam',loss='categorical_crossentropy',learning_rate=0.001, name='target')
    
    return network

def alexnet(img_aug=None, drop_out=0.5): 
    Input = tflearn.input_data(shape=[None, 75, 75, 2], dtype='float', name ='input', data_augmentation=img_aug)
    network = conv_2d(x, 96, 11, strides=4, activation='relu')
    network = max_pool_2d(network, 3, strides=2)
    network = local_response_normalization(network)
    network = conv_2d(network, 256, 5, activation='relu')
    network = max_pool_2d(network, 3, strides=2)
    network = local_response_normalization(network)
    network = conv_2d(network, 384, 3, activation='relu')
    network = conv_2d(network, 384, 3, activation='relu')
    network = conv_2d(network, 256, 3, activation='relu')
    network = max_pool_2d(network, 3, strides=2)
    network = local_response_normalization(network)
    network = fully_connected(network, 4096, activation='tanh')
    network = dropout(network, drop_out)
    network = fully_connected(network, 4096, activation='tanh')
    network = dropout(network, drop_out)
    network = fully_connected(network, 2, activation='softmax')
    network = tflearn.regression(network, optimizer='adam',loss='categorical_crossentropy',learning_rate=0.001, name='target')
    return network

curses is not supported on this machine (please install/reinstall curses for an optimal experience)


In [2]:
def onehot_encoding (Y, y_class):
    Y_onehot = np.zeros((Y.size, int(y_class)))
    for i in range(Y.size):
        Y_onehot[i][Y[i]] = 1
    return Y_onehot

with open('resnet_data', 'rb') as f:
    data = pickle.load(f)
    Xtr = data[0]
    Xtr = np.reshape(Xtr, (-1,75,75,2))
    Ytr = data[1]
    Xte =data[2]
    Xte = np.reshape(Xte, (-1,75,75,2))
    rf = data[3]

Ytr = onehot_encoding(Ytr, 2) 
Xtr, Ytr = tflearn.data_utils.shuffle(Xtr, Ytr)

X, Y = Xtr[:1200], Ytr[:1200]
validX, validY =Xtr[1200:1500], Ytr[1200:1500]
testX, testY = Xtr[1500:],Ytr[1500:]

X, mean = du.featurewise_zero_center(X)
testX = du.featurewise_zero_center(testX, mean)
validX = du.featurewise_zero_center(validX, mean)

ensemble=10   #Total no of ensemble models : 10
n_ensemble=0   #n_semble counter
n_sample=300 #Number of validation set from training set
validX = np.concatenate((validX,X[0:n_sample]),axis=0)
validY = np.concatenate((validY,Y[0:n_sample]),axis=0)
hypotheses = np.zeros((ensemble,testY.shape[0],2))
hypotheses_valid = np.zeros((ensemble,validY.shape[0],2))

#img_prep.add_custom_preprocessing (func) <-함수 적용가능: 추가사항

img_aug = tflearn.ImageAugmentation()
img_aug.add_random_flip_leftright()
img_aug.add_random_90degrees_rotation(rotations=[0, 1, 2, 3])
img_aug.add_random_crop([75,75,2], padding=4)

In [3]:
# Training graphs
convnet1 = tf.Graph()
convnet2 = tf.Graph()
highnet1 = tf.Graph()
highnet2 = tf.Graph()
resnet1 = tf.Graph()
resnet2 = tf.Graph()
vgg1 = tf.Graph()
vgg2 = tf.Graph()
alexnet1 = tf.Graph()
alexnet2 = tf.Graph()

n_epoch=1
batch_size =20
#ensemble trial
with convnet1.as_default():
    tf.set_random_seed(777) #no reproducibility...T.T
    tflearn.init_graph(seed=777)
    network1 = convnet(img_aug=img_aug, drop_out=0.7)
    model = tflearn.DNN(network1, tensorboard_verbose=0)
    model.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,
               validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               snapshot_step=1000, show_metric=True, run_id='conv1', batch_size=batch_size)
    model.save('convnet1')
    hypotheses[n_ensemble]=model.predict(testX)
    hypotheses_valid[n_ensemble]=model.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()

with convnet2.as_default():
    tf.set_random_seed(777) 
    tflearn.init_graph(seed=777)
    network2 = convnet(img_aug=img_aug, drop_out=0.6)
    model2 = tflearn.DNN(network2, tensorboard_verbose=0)
    model2.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,
               validation_set=({'input': validX[:300]}, {'target': validY[:300]}),show_metric=True, run_id='conv2', batch_size=batch_size)
    model2.save('convnet2')
    hypotheses[n_ensemble]=model2.predict(testX)
    hypotheses_valid[n_ensemble]=model2.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()

with highnet1.as_default():
    tf.set_random_seed(779)
    tflearn.init_graph(seed=779)
    network3 = highnet(img_aug=img_aug,drop_out=0.6)
    model3 = tflearn.DNN(network3, tensorboard_verbose=0)
    model3.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               show_metric=True, run_id='high1', batch_size=batch_size)
    model3.save('high1')
    hypotheses[n_ensemble]=model3.predict(testX)
    hypotheses_valid[n_ensemble]=model3.predict(validX)
    n_ensemble+=1
    
tf.reset_default_graph()
with highnet2.as_default():
    tf.set_random_seed(780)
    tflearn.init_graph(seed=780)
    network4 = highnet(img_aug=img_aug,drop_out=0.5)
    model4 = tflearn.DNN(network4, tensorboard_verbose=0)
    model4.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               show_metric=True, run_id='high2', batch_size=batch_size)
    model4.save('high2')
    hypotheses[n_ensemble]=model4.predict(testX)
    hypotheses_valid[n_ensemble]=model4.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()

with resnet1.as_default():
    tf.set_random_seed(781)
    tflearn.init_graph(seed=781)

    network5 = resnet(img_aug=img_aug,drop_out=0.7)
    model5 = tflearn.DNN(network5, tensorboard_verbose=0)

    model5.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               show_metric=True, run_id='resnet1', batch_size=batch_size)
    model5.save('resnet1')
    hypotheses[n_ensemble]=model5.predict(testX)
    hypotheses_valid[n_ensemble]=model5.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()


with resnet2.as_default():
    tf.set_random_seed(782)
    tflearn.init_graph(seed=782)

    network6 = resnet(img_aug=img_aug,drop_out=0.6)
    model6 = tflearn.DNN(network6, tensorboard_verbose=0)
    model6.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               show_metric=True, run_id='resnet2',batch_size=batch_size)
    model6.save('resnet2')
    hypotheses[n_ensemble]=model6.predict(testX)
    hypotheses_valid[n_ensemble]=model6.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()

with vgg1.as_default():
    tf.set_random_seed(783)
    tflearn.init_graph(seed=783)

    network7 = vgg(img_aug=img_aug,drop_out=0.6)
    model7 = tflearn.DNN(network7, tensorboard_verbose=0)
    model7.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               show_metric=True, run_id='vgg1',batch_size=batch_size)
    model7.save('vgg1')
    hypotheses[n_ensemble]=model7.predict(testX)
    hypotheses_valid[n_ensemble]=model7.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()

with vgg2.as_default():
    tf.set_random_seed(784)
    tflearn.init_graph(seed=784)

    network8 = vgg(img_aug=img_aug,drop_out=0.7)
    model8= tflearn.DNN(network8, tensorboard_verbose=0)
    model8.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               show_metric=True, run_id='vgg2',batch_size=batch_size)
    model8.save('vgg2')
    hypotheses[n_ensemble]=model8.predict(testX)
    hypotheses_valid[n_ensemble]=model8.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()


with alexnet1.as_default():
    tf.set_random_seed(785)
    tflearn.init_graph(seed=785)
    
    network9= alexnet(img_aug=img_aug, drop_out=0.7)
    model9 = tflearn.DNN(network9, tensorboard_verbose=0)
    model9.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
               show_metric=True, run_id='alex1',batch_size=batch_size)
    model9.save('alex1')
    hypotheses[n_ensemble]=model9.predict(testX)
    hypotheses_valid[n_ensemble]=model9.predict(validX)
    n_ensemble+=1
tf.reset_default_graph()

with alexnet2.as_default():
    tf.set_random_seed(786)
    tflearn.init_graph(seed=786)

    network10= alexnet(img_aug=img_aug,drop_out=0.6)
    model10 = tflearn.DNN(network10, tensorboard_verbose=0)
    model10.fit({'input': X}, {'target': Y}, n_epoch=n_epoch,validation_set=({'input': validX[:300]}, {'target': validY[:300]}),
                show_metric=True, run_id='alex2',batch_size=batch_size)
    model10.save('alex2')
    hypotheses[n_ensemble]=model10.predict(testX)
    hypotheses_valid[n_ensemble]=model10.predict(validX)

    n_ensemble+=1
tf.reset_default_graph()

#End of training

print("Optimization finished")

hypotheses_valid = hypotheses_valid.transpose([1,0,2])
hypotheses = hypotheses.transpose([1,0,2])
hypothesis = np.zeros((testY.shape[0],2))

#Ensemble weight training : using Validation set
ens=tf.Graph()
with ens.as_default():
    ensemble_net = input_data(shape=[None,n_ensemble, 2], name='input')
    ensemble_net = fully_connected(ensemble_net, 2, activation='softplus')
    ensemble_net = regression(ensemble_net, optimizer='adam', learning_rate=0.01,
                         loss='categorical_crossentropy', name='target')

    ens_model = tflearn.DNN(ensemble_net, tensorboard_verbose=0)
    ens_model.fit({'input': hypotheses_valid}, {'target': validY}, n_epoch=20, show_metric=False, run_id='ensemble',batch_size=100)

    hypothesis = ens_model.predict(hypotheses)
    ens_model.save('ens_model')


correct_prediction = np.equal(np.argmax(hypothesis,1), np.argmax(testY, 1))
accuracy_ens = np.mean(correct_prediction)

print("Final Accuracy :", accuracy_ens)


Training Step: 59  | total loss: [1m[32m0.53473[0m[0m | time: 24.252s
| Adam | epoch: 001 | loss: 0.53473 - acc: 0.7494 -- iter: 1180/1200
Training Step: 60  | total loss: [1m[32m0.53650[0m[0m | time: 25.816s
| Adam | epoch: 001 | loss: 0.53650 - acc: 0.7429 | val_loss: 0.52473 - val_acc: 0.7267 -- iter: 1200/1200
--
INFO:tensorflow:C:\Users\User\Desktop\kaggle\resnet1 is not in all_model_checkpoint_paths. Manually adding it.


ResourceExhaustedError: OOM when allocating tensor with shape[600,64,75,75]
	 [[Node: ResidualBottleneck_1/Conv2D/Conv2D = Conv2D[T=DT_FLOAT, data_format="NHWC", padding="VALID", strides=[1, 2, 2, 1], use_cudnn_on_gpu=true, _device="/job:localhost/replica:0/task:0/device:GPU:0"](ResidualBottleneck_1/Relu, ResidualBottleneck_1/Conv2D/W/read/_2183)]]
	 [[Node: FullyConnected/BiasAdd/_2219 = _Recv[client_terminated=false, recv_device="/job:localhost/replica:0/task:0/device:CPU:0", send_device="/job:localhost/replica:0/task:0/device:GPU:0", send_device_incarnation=1, tensor_name="edge_1342_FullyConnected/BiasAdd", tensor_type=DT_FLOAT, _device="/job:localhost/replica:0/task:0/device:CPU:0"]()]]

Caused by op 'ResidualBottleneck_1/Conv2D/Conv2D', defined at:
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\runpy.py", line 193, in _run_module_as_main
    "__main__", mod_spec)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\runpy.py", line 85, in _run_code
    exec(code, run_globals)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\ipykernel_launcher.py", line 16, in <module>
    app.launch_new_instance()
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\traitlets\config\application.py", line 658, in launch_instance
    app.start()
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\ipykernel\kernelapp.py", line 477, in start
    ioloop.IOLoop.instance().start()
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\zmq\eventloop\ioloop.py", line 177, in start
    super(ZMQIOLoop, self).start()
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tornado\ioloop.py", line 888, in start
    handler_func(fd_obj, events)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tornado\stack_context.py", line 277, in null_wrapper
    return fn(*args, **kwargs)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\zmq\eventloop\zmqstream.py", line 440, in _handle_events
    self._handle_recv()
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\zmq\eventloop\zmqstream.py", line 472, in _handle_recv
    self._run_callback(callback, msg)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\zmq\eventloop\zmqstream.py", line 414, in _run_callback
    callback(*args, **kwargs)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tornado\stack_context.py", line 277, in null_wrapper
    return fn(*args, **kwargs)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\ipykernel\kernelbase.py", line 283, in dispatcher
    return self.dispatch_shell(stream, msg)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\ipykernel\kernelbase.py", line 235, in dispatch_shell
    handler(stream, idents, msg)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\ipykernel\kernelbase.py", line 399, in execute_request
    user_expressions, allow_stdin)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\ipykernel\ipkernel.py", line 196, in do_execute
    res = shell.run_cell(code, store_history=store_history, silent=silent)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\ipykernel\zmqshell.py", line 533, in run_cell
    return super(ZMQInteractiveShell, self).run_cell(*args, **kwargs)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\IPython\core\interactiveshell.py", line 2698, in run_cell
    interactivity=interactivity, compiler=compiler, result=result)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\IPython\core\interactiveshell.py", line 2802, in run_ast_nodes
    if self.run_code(code, result):
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\IPython\core\interactiveshell.py", line 2862, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "<ipython-input-3-f7cba7a7cd8d>", line 73, in <module>
    network5 = resnet(img_aug=img_aug,drop_out=0.7)
  File "<ipython-input-1-b7619e0b8b96>", line 60, in resnet
    net = tflearn.residual_bottleneck(net, 1, 32, 128, downsample=True)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tflearn\layers\conv.py", line 1542, in residual_bottleneck
    trainable, restore)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tflearn\layers\conv.py", line 99, in conv_2d
    inference = tf.nn.conv2d(incoming, W, strides, padding)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tensorflow\python\ops\gen_nn_ops.py", line 630, in conv2d
    data_format=data_format, name=name)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tensorflow\python\framework\op_def_library.py", line 787, in _apply_op_helper
    op_def=op_def)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tensorflow\python\framework\ops.py", line 2956, in create_op
    op_def=op_def)
  File "C:\Users\User\Anaconda3\envs\tensorflow\lib\site-packages\tensorflow\python\framework\ops.py", line 1470, in __init__
    self._traceback = self._graph._extract_stack()  # pylint: disable=protected-access

ResourceExhaustedError (see above for traceback): OOM when allocating tensor with shape[600,64,75,75]
	 [[Node: ResidualBottleneck_1/Conv2D/Conv2D = Conv2D[T=DT_FLOAT, data_format="NHWC", padding="VALID", strides=[1, 2, 2, 1], use_cudnn_on_gpu=true, _device="/job:localhost/replica:0/task:0/device:GPU:0"](ResidualBottleneck_1/Relu, ResidualBottleneck_1/Conv2D/W/read/_2183)]]
	 [[Node: FullyConnected/BiasAdd/_2219 = _Recv[client_terminated=false, recv_device="/job:localhost/replica:0/task:0/device:CPU:0", send_device="/job:localhost/replica:0/task:0/device:GPU:0", send_device_incarnation=1, tensor_name="edge_1342_FullyConnected/BiasAdd", tensor_type=DT_FLOAT, _device="/job:localhost/replica:0/task:0/device:CPU:0"]()]]
