In [1]:
import keras
import cv2
import os
import sys
import numpy as np
from keras.datasets import cifar10
from keras.preprocessing.image import ImageDataGenerator
from keras.models import Sequential

Using TensorFlow backend.


In [2]:
# Load the CIFAR-10 training and test splits through Keras, then unpack each
# split into its image array and its label array.
train_split, test_split = cifar10.load_data()
x_train, y_train = train_split
x_test, y_test = test_split

In [3]:
# --- Experiment configuration -------------------------------------------------
# When True, every image gets two extra channels holding the x and y pixel
# coordinates (see xy_pos_add), so the network input has 5 channels instead of 3.
IS_POSITION_BASED = True
# IS_POSITION_BASED = int(sys.argv[1])  # override used when run as a script

# Input / output geometry.
image_size = 32
image_channels = 5 if IS_POSITION_BASED else 3
num_classes = 10

# Training schedule.
batch_size = 10
epochs = 1
data_augmentation = False

In [4]:
# Coordinate grids shared by every image: xpos varies along the columns and
# ypos along the rows, both running linearly from 0 to 1. Shape is (ny, nx).
nx, ny = (32, 32)
xt = np.linspace(0, 1, nx)
yt = np.linspace(0, 1, ny)
xpos, ypos = np.meshgrid(xt, yt)


def xy_pos_add(images, position_based=None):
    """Optionally append x/y coordinate channels to a batch of RGB images.

    Parameters
    ----------
    images : array-like
        Batch of images that can be reshaped to (n, ny, nx, 3), channels last.
    position_based : bool or None, optional
        Whether to append the coordinate channels. ``None`` (the default)
        falls back to the notebook-level ``IS_POSITION_BASED`` flag, which is
        what callers that pass only ``images`` get.

    Returns
    -------
    numpy.ndarray
        Shape (n, ny, nx, 5) with channels ``[R, G, B, xpos, ypos]`` when the
        position channels are requested (the dtype is promoted to that of the
        float coordinate grids); otherwise the images reshaped to
        (n, ny, nx, 3) with their dtype unchanged.

    Notes
    -----
    The previous per-image loop built every output from ``x_train[0]`` instead
    of the image being iterated, so all rows (including those for the test
    set) contained the same picture. Each output row now carries its own
    image's pixels.
    """
    if position_based is None:
        # Resolved at call time so changing the global flag is still honoured.
        position_based = IS_POSITION_BASED

    batch = np.reshape(images, (-1, ny, nx, 3))
    if not position_based:
        return batch

    # (ny, nx, 2) grid viewed as (n, ny, nx, 2) without copying it n times.
    grid = np.stack([xpos, ypos], axis=-1)
    grid = np.broadcast_to(grid, (batch.shape[0],) + grid.shape)
    return np.concatenate([batch, grid], axis=-1)

In [5]:
# Per-image shape of the raw training data (the leading sample axis is dropped).
sample_shape = x_train.shape[1:]
print('x_train shape:', sample_shape)

('x_train shape:', (32, 32, 3))


In [6]:
# Build the network inputs for both splits with the same preprocessing, then
# report the resulting per-image shape.
new_x_train, new_x_test = [xy_pos_add(split) for split in (x_train, x_test)]
print(new_x_train.shape[1:])

(32, 32, 5)


# LABELS = {0:'airplane', 1:'automobile', 2:'bird', 3:'cat', 4:'deer', 5:'dog',

# 6:'frog', 7:'horse', 8:'ship', 9:'truck'}

In [7]:
# One-hot encode the class labels of both splits into num_classes columns,
# as required by the categorical cross-entropy loss used for training.
to_one_hot = keras.utils.to_categorical
new_y_train = to_one_hot(y_train, num_classes)
new_y_test = to_one_hot(y_test, num_classes)

In [8]:
# data check
# Show one test image together with its one-hot label as a quick sanity check.
# (cv2 is already imported in the first cell, so it is not re-imported here.)
SAMPLE_INDEX = 420
print(new_y_test[SAMPLE_INDEX])

# The Keras CIFAR-10 arrays are RGB, whereas cv2.imshow interprets the channel
# axis as BGR; convert first so red and blue are not swapped in the preview.
cv2.imshow("test", cv2.cvtColor(x_test[SAMPLE_INDEX], cv2.COLOR_RGB2BGR))
pressed_key = cv2.waitKey(3000)  # wait up to 3 s; -1 means no key was pressed

# Close the native preview window instead of leaving it open after the timeout.
cv2.destroyAllWindows()
pressed_key

[ 0.  0.  0.  0.  1.  0.  0.  0.  0.  0.]


-1

In [19]:
# normalize data
# Only the first three (RGB) channels hold 0-255 pixel intensities. When the
# x/y position channels are present they come from np.linspace(0, 1, ...) and
# are already in [0, 1]; dividing them by 255 as well would squash them to
# roughly [0, 0.004]. Slicing [..., :3] handles both the 3- and the 5-channel
# layout.
new_x_train = new_x_train.astype('float32')
new_x_test = new_x_test.astype('float32')
new_x_train[..., :3] /= 255
new_x_test[..., :3] /= 255

In [22]:
# model definition
from keras.applications.vgg16 import VGG16
from keras.preprocessing import image
from keras.applications.vgg16 import preprocess_input
from keras.layers import Input, Flatten, Dense, GlobalAveragePooling2D
from keras.models import Model
from keras import optimizers
from keras.callbacks import EarlyStopping
from keras.callbacks import ModelCheckpoint
from keras.callbacks import TensorBoard
from keras.callbacks import CSVLogger
from keras.callbacks import ReduceLROnPlateau
from keras.layers import Dropout, Activation
from keras.layers import Conv2D, MaxPooling2D

In [23]:
# Small CNN: two convolutional stages followed by a dense classifier head.
# Shape notes assume the 32x32 inputs produced earlier in the notebook.
model = Sequential([
    # Stage 1: two 32-filter 3x3 convolutions, then 2x2 max-pooling.
    Conv2D(32, (3, 3), padding='same', input_shape=new_x_train.shape[1:]),
    Activation('relu'),
    Conv2D(32, (3, 3)),  # default 'valid' padding: 32x32 -> 30x30
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),  # 30x30 -> 15x15
    Dropout(0.25),

    # Stage 2: same layout with 64 filters.
    Conv2D(64, (3, 3), padding='same'),
    Activation('relu'),
    Conv2D(64, (3, 3)),  # 15x15 -> 13x13
    Activation('relu'),
    MaxPooling2D(pool_size=(2, 2)),  # 13x13 -> 6x6
    Dropout(0.25),

    # Classifier head: 512 hidden units, then a softmax over the classes.
    Flatten(),
    Dense(512),
    Activation('relu'),
    Dropout(0.5),
    Dense(num_classes),
    Activation('softmax'),
])

# Optimiser: Adam with Keras defaults. An RMSprop alternative that was tried
# earlier is kept here for reference:
# opt = keras.optimizers.rmsprop(lr=0.0001, decay=1e-6)
model.compile(optimizer='adam',
              loss='categorical_crossentropy',
              metrics=['accuracy'])

In [24]:
# Create the output directory tree used by the checkpoint and logging callbacks.
# Each leaf directory is checked on its own, so a partially existing tree
# (for example "../results" present but its sub-folders missing) is completed
# rather than skipped. os.makedirs also creates the intermediate directories
# "../results", "../results/position" and "../results/normal".
for result_dir in ("../results/position/best_models",
                   "../results/normal/best_models"):
    if not os.path.isdir(result_dir):
        os.makedirs(result_dir)

In [25]:
# checkpoints and logs

# Choose the output locations for the active experiment variant; the callbacks
# themselves are configured identically for both variants.
if IS_POSITION_BASED:
    checkpoint_path = "../results/position/best_models/fn_model.{epoch:02d}-{val_acc:.6f}.hdf5"
    tensorboard_dir = '../results/position/logs'
    csv_log_path = '../results/position/training.log'
else:
    checkpoint_path = "../results/normal/best_models/fn_model.{epoch:02d}-{val_acc:.6f}.hdf5"
    tensorboard_dir = '../results/normal/logs'
    csv_log_path = '../results/normal/training.log'

# Save the full model (not just weights) whenever validation accuracy improves.
checkpointer = ModelCheckpoint(
    filepath=checkpoint_path,
    verbose=1,
    monitor='val_acc',
    save_best_only=True,
    save_weights_only=False,
    mode='max',
    period=1)
tf_board = TensorBoard(
    log_dir=tensorboard_dir,
    histogram_freq=0,
    write_graph=True,
    write_images=True)
csv_logger = CSVLogger(csv_log_path)

# Both of these watch the validation loss.
early_stopping = EarlyStopping(monitor='val_loss', patience=10)
reduce_lr = ReduceLROnPlateau(monitor='val_loss', factor=0.1, patience=5, min_lr=0.0001)

In [28]:
# model fitting
# Both branches hold out the same tail fraction of the training arrays for
# validation, so their validation metrics are comparable.
validation_split = 0.05
training_callbacks = [early_stopping, checkpointer, tf_board, csv_logger]
# NOTE(review): reduce_lr is constructed with the other callbacks but is not
# passed to training here - confirm whether that is intentional.

if not data_augmentation:
    print('Not using data augmentation.')
    model.fit(new_x_train, new_y_train,
              batch_size=batch_size,
              epochs=epochs,
              validation_split=validation_split,
              callbacks=training_callbacks,
              shuffle=True)
else:
    print('Using real-time data augmentation.')

    # Mirror validation_split: train on the leading part of the arrays and
    # validate on the tail. Previously this branch trained on only the first
    # 5000 samples and validated on the remaining 45000.
    split_at = int(new_x_train.shape[0] * (1. - validation_split))
    fit_x, fit_y = new_x_train[:split_at], new_y_train[:split_at]
    val_x, val_y = new_x_train[split_at:], new_y_train[split_at:]

    # NOTE(review): with IS_POSITION_BASED the flips/shifts below are applied
    # to the x/y position channels too - confirm that this is desired.
    datagen = ImageDataGenerator(
        featurewise_center=False,  # set input mean to 0 over the dataset
        samplewise_center=False,  # set each sample mean to 0
        featurewise_std_normalization=False,  # divide inputs by std of the dataset
        samplewise_std_normalization=False,  # divide each input by its std
        zca_whitening=False,  # apply ZCA whitening
        rotation_range=0,  # randomly rotate images in the range (degrees, 0 to 180)
        width_shift_range=0.1,  # randomly shift images horizontally (fraction of total width)
        height_shift_range=0.1,  # randomly shift images vertically (fraction of total height)
        horizontal_flip=True,  # randomly flip images
        vertical_flip=False)  # randomly flip images

    # Compute quantities required for feature-wise normalization
    # (std, mean, and principal components if ZCA whitening is applied).
    datagen.fit(fit_x)

    # Fit the model on the batches generated by datagen.flow().
    # steps_per_epoch is derived from the data the generator actually iterates
    # over, so one epoch is one pass over the training portion (it used to be
    # computed from the full, unsplit x_train).
    model.fit_generator(datagen.flow(fit_x, fit_y, batch_size=batch_size),
                        epochs=epochs,
                        steps_per_epoch=fit_x.shape[0] // batch_size,
                        validation_data=(val_x, val_y),
                        callbacks=training_callbacks)
                        

Not using data augmentation.
Train on 47500 samples, validate on 2500 samples
Epoch 1/1

KeyboardInterrupt: 

In [None]:
# testing network
# Save the trained model and record the test-set metrics next to the other
# artefacts of the active variant. The directories and checkpoints are created
# under "../results", so the same root is used here; the previous "./results"
# paths pointed at a directory this notebook never creates.
results_dir = "../results/position" if IS_POSITION_BASED else "../results/normal"

# NOTE(review): the file name says "vgg16" although the model defined in this
# notebook is a small custom CNN; the name is kept so existing tooling that
# looks for it keeps working.
model.save(results_dir + "/best_models/final_model_vgg16.hdf5")

# With metrics=['accuracy'] at compile time, evaluate returns [loss, accuracy].
score, acc = model.evaluate(new_x_test, new_y_test, batch_size=batch_size)

# The context manager closes the file even if a write fails.
with open(results_dir + "/results.txt", 'w') as resultsfile:
    resultsfile.write("test_acc: " + str(acc) + "\n")
    resultsfile.write("test_score: " + str(score))
