In [3]:
import cv2  # for resizing image
import numpy as np  # for arrays
import os  # to play with directories
from random import shuffle
from tqdm import tqdm  # for professional looping with progress bar

# Dataset locations. The defaults are the original author's local folders;
# set DOGSVSCATS_TRAIN_DIR / DOGSVSCATS_TEST_DIR in the environment to point
# the notebook at your own copy of the data without editing this cell.
TRAIN_DIR = os.environ.get('DOGSVSCATS_TRAIN_DIR', '/Users/jacquesthibodeau/Downloads/train/')
TEST_DIR = os.environ.get('DOGSVSCATS_TEST_DIR', '/Users/jacquesthibodeau/Downloads/test/')
IMG_SIZE = 50  # every image is resized to IMG_SIZE x IMG_SIZE pixels
LR = 1e-3  # learning rate handed to the optimizer

# File name for the saved model; embeds the learning rate and an architecture tag.
MODEL_NAME = 'dogsvscats-{}-{}.model'.format(LR, '2conv-basic')

In [4]:
def label_img(img):
    """Return the one-hot class label encoded in a training image filename.

    Filenames look like ``cat.9.png``: the class word is the third
    dot-separated field counted from the end of the name.

    Args:
        img: File name of the image (not its pixel data).

    Returns:
        ``[1, 0]`` for ``'cat'``, ``[0, 1]`` for ``'dog'``, and ``None`` for
        any other class word.

    Raises:
        IndexError: If the name has fewer than three dot-separated fields.
    """
    # Built per call so every caller receives its own fresh list.
    one_hot_by_class = {'cat': [1, 0], 'dog': [0, 1]}
    class_word = img.split('.')[-3]
    return one_hot_by_class.get(class_word)

In [5]:
def create_train_data():
    """Build, shuffle and cache the labelled training set from ``TRAIN_DIR``.

    Each file in ``TRAIN_DIR`` is read as a grayscale image (a 2D array of
    pixel intensities) and resized to ``IMG_SIZE`` x ``IMG_SIZE``. Files that
    OpenCV cannot decode, and files whose name carries no cat/dog label, are
    skipped instead of aborting the whole run.

    Side effects:
        Writes the shuffled pairs to ``training_data.npy`` in the current
        working directory as an object array of shape ``(n, 2)``; reload it
        with ``np.load('training_data.npy', allow_pickle=True)``.

    Returns:
        list: Shuffled ``[image_array, label_array]`` pairs.
    """
    training_data = []
    skipped = 0
    for filename in tqdm(os.listdir(TRAIN_DIR)):
        path = os.path.join(TRAIN_DIR, filename)
        # cv2.imread reports failure by returning None rather than raising,
        # so check before resizing (stray non-image files would crash resize).
        image = cv2.imread(path, cv2.IMREAD_GRAYSCALE)
        if image is None:
            skipped += 1
            continue
        label = label_img(filename)
        if label is None:
            # Readable image, but the filename is neither cat nor dog.
            skipped += 1
            continue
        image = cv2.resize(image, (IMG_SIZE, IMG_SIZE))
        training_data.append([np.array(image), np.array(label)])
    if skipped:
        print('Skipped {} unreadable or unlabelled file(s) in {}'.format(skipped, TRAIN_DIR))
    shuffle(training_data)

    # Image and label arrays have different shapes, so the pairs cannot form a
    # regular numeric array; fill an explicit object array so np.save does not
    # fail on the ragged nested list.
    packed = np.empty((len(training_data), 2), dtype=object)
    for row, (image, label) in enumerate(training_data):
        packed[row, 0] = image
        packed[row, 1] = label
    np.save('training_data.npy', packed)
    return training_data

In [6]:
def process_test_data():
    """Load and cache the unlabelled test images from ``TEST_DIR``.

    Each file in ``TEST_DIR`` is read as a grayscale image and resized to
    ``IMG_SIZE`` x ``IMG_SIZE``. The identifier stored next to each image is
    the part of the file name before its first dot. Files that OpenCV cannot
    decode are skipped instead of aborting the whole run.

    Side effects:
        Writes the pairs to ``test_data.npy`` in the current working directory
        as an object array of shape ``(n, 2)``; reload it with
        ``np.load('test_data.npy', allow_pickle=True)``.

    Returns:
        list: ``[image_array, img_num]`` pairs in directory-listing order.
    """
    testing_data = []
    skipped = 0
    for filename in tqdm(os.listdir(TEST_DIR)):
        path = os.path.join(TEST_DIR, filename)
        img_num = filename.split('.')[0]
        # cv2.imread reports failure by returning None rather than raising,
        # so check before resizing (stray non-image files would crash resize).
        image = cv2.imread(path, cv2.IMREAD_GRAYSCALE)
        if image is None:
            skipped += 1
            continue
        image = cv2.resize(image, (IMG_SIZE, IMG_SIZE))
        testing_data.append([np.array(image), img_num])
    if skipped:
        print('Skipped {} unreadable file(s) in {}'.format(skipped, TEST_DIR))

    # Each pair mixes an image array with a string id, so fill an explicit
    # object array; np.save cannot build a regular array from the ragged list.
    packed = np.empty((len(testing_data), 2), dtype=object)
    for row, (image, img_num) in enumerate(testing_data):
        packed[row, 0] = image
        packed[row, 1] = img_num
    np.save('test_data.npy', packed)
    return testing_data

In [7]:
# Build the training set from the raw images (also writes training_data.npy).
train_data = create_train_data()
# or, if you already ran the line above once, reload the cached file instead
# (allow_pickle is needed because the file stores an object array):
# train_data = np.load('training_data.npy', allow_pickle=True)

100%|██████████| 25000/25000 [00:32<00:00, 763.56it/s]


In [10]:
from keras import optimizers
from keras.layers.convolutional import Conv2D, MaxPooling2D
from keras.layers.core import Dense, Dropout, Activation, Flatten
from keras.models import Sequential
from keras.utils import np_utils

In [None]:
# LeNet-style CNN: three convolution stages followed by two dense layers.
NUM_CLASSES = 2  # label_img produces one-hot vectors of length 2: [cat, dog]
# The input is declared as (channels, rows, cols), so every spatial layer must
# use the same layout; mixing layouts makes Keras read the 1x50x50 image as a
# 1x50 image with 50 channels.
DATA_FORMAT = "channels_first"

model = Sequential()

# Conv2D(number_filters, (kernel_rows, kernel_cols), input_shape=(number_channels, img_row, img_col))

model.add(Conv2D(6, (5, 5), input_shape=(1, IMG_SIZE, IMG_SIZE), padding='same',
                 data_format=DATA_FORMAT))  # convolution layer
model.add(Activation('relu'))  # ReLU = Rectified Linear Unit / non-linearity layer
model.add(MaxPooling2D(pool_size=(2, 2), data_format=DATA_FORMAT))
model.add(Conv2D(16, (5, 5), padding='same', data_format=DATA_FORMAT))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size=(2, 2), data_format=DATA_FORMAT))
model.add(Conv2D(120, (5, 5), data_format=DATA_FORMAT))
model.add(Activation('relu'))
model.add(Dropout(0.25))
model.add(Flatten())  # flatten the feature maps into one vector per image

# add fully-connected layers

model.add(Dense(84))
model.add(Activation('relu'))
model.add(Dropout(0.5))
# The output width must equal the label length, otherwise
# categorical_crossentropy cannot compare predictions with the targets.
model.add(Dense(NUM_CLASSES))
model.add(Activation('softmax'))

# NOTE(review): `lr`/`decay` are the legacy Keras 2 argument names, kept to
# match the legacy keras.layers.core imports this notebook uses; newer Keras
# releases spell the first one `learning_rate` - confirm against the installed version.
sgd = optimizers.SGD(lr=LR, decay=1e-6, momentum=0.9, nesterov=True)
model.compile(loss='categorical_crossentropy', optimizer=sgd, metrics=['accuracy'])