In [5]:
import cv2                 # working with, mainly resizing, images
import numpy as np         # dealing with arrays
import os                  # dealing with directories
from random import shuffle # mixing up or currently ordered data that might lead our network astray in training.
from tqdm.auto import tqdm      # a nice pretty percentage bar for tasks. Thanks to viewer Daniel BA1/4hler for this suggestion

TRAIN_DIR = 'C:/Dataset/train'
TEST_DIR = 'C:/Dataset/test'
IMG_SIZE = 50
LR = 0.001

MODEL_NAME = 'dogsvscats-{}-{}.model'.format(LR, '2conv-basic (50,50)')

In [2]:
def label_img(img):
    word_label = img.split('.')[-3]
    # conversion to one-hot array [cat,dog]
    #                            [much cat, no dog]
    if word_label == 'cat': return [1,0]
    #                             [no cat, very doggo]
    elif word_label == 'dog': return [0,1]

In [3]:
def create_train_data():
    training_data = []
    for img in tqdm(os.listdir(TRAIN_DIR)):
        label = label_img(img)
        path = os.path.join(TRAIN_DIR,img)
        img = cv2.imread(path,cv2.IMREAD_GRAYSCALE)
        img = cv2.resize(img, (IMG_SIZE,IMG_SIZE))
        training_data.append([np.array(img),np.array(label)])
    shuffle(training_data)
    np.save('train_data.npy', training_data)
    return training_data




In [4]:
def process_test_data():
    testing_data = []
    for img in tqdm(os.listdir(TEST_DIR)):
        path = os.path.join(TEST_DIR,img)
        img_num = img.split('.')[0]
        img = cv2.imread(path,cv2.IMREAD_GRAYSCALE)
        img = cv2.resize(img, (IMG_SIZE,IMG_SIZE))
        testing_data.append([np.array(img), img_num])
        
    shuffle(testing_data)
    np.save('test_data.npy', testing_data)

In [6]:
#train_data = create_train_data()
#train_data = np.load('CatDog-50x50.npy')
train_data = np.load('train_data.npy')


HBox(children=(IntProgress(value=0, max=25000), HTML(value='')))




In [8]:
import tflearn
from tflearn.layers.conv import conv_2d, max_pool_2d
from tflearn.layers.core import input_data, dropout, fully_connected
from tflearn.layers.estimator import regression

convnet = input_data(shape=[None, IMG_SIZE, IMG_SIZE, 1], name='input')

convnet = conv_2d(convnet, 32, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = conv_2d(convnet, 64, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = conv_2d(convnet, 128, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = conv_2d(convnet, 64, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = conv_2d(convnet, 32, 5, activation='relu')
convnet = max_pool_2d(convnet, 5)

convnet = fully_connected(convnet, 1024, activation='relu')
convnet = dropout(convnet, 0.8)

convnet = fully_connected(convnet, 2, activation='softmax')
convnet = regression(convnet, optimizer='adam', learning_rate=LR, loss='categorical_crossentropy', name='targets')

model = tflearn.DNN(convnet, tensorboard_dir='../AlexandreDataset/logs')


curses is not supported on this machine (please install/reinstall curses for an optimal experience)
Instructions for updating:
Colocations handled automatically by placer.
Instructions for updating:
Use tf.initializers.variance_scaling instead with distribution=uniform to get equivalent behavior.
Instructions for updating:
Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.
Instructions for updating:
keep_dims is deprecated, use keepdims instead
Instructions for updating:
Use tf.cast instead.


In [6]:
if os.path.exists('{}.meta'.format(MODEL_NAME)):
    model.load(MODEL_NAME)
    print('model loaded!')

In [11]:
train = train_data[:-5000]
test = train_data[-5000:]

In [12]:
X = np.array([i[0] for i in train]).reshape(-1,IMG_SIZE,IMG_SIZE,1)
Y = [i[1] for i in train]

test_x = np.array([i[0] for i in test]).reshape(-1,IMG_SIZE,IMG_SIZE,1)
test_y = [i[1] for i in test]

In [13]:
model.fit({'input': X}, {'targets': Y}, n_epoch=10, validation_set=({'input': test_x}, {'targets': test_y}), show_metric=True, run_id=MODEL_NAME)

Training Step: 3129  | total loss: 0.34577 | time: 63.336s
| Adam | epoch: 010 | loss: 0.34577 - acc: 0.8426 -- iter: 19968/20000
Training Step: 3130  | total loss: 0.34955 | time: 69.112s
| Adam | epoch: 010 | loss: 0.34955 - acc: 0.8396 | val_loss: 0.52837 - val_acc: 0.7588 -- iter: 20000/20000
--


In [18]:
model.save(MODEL_NAME)


INFO:tensorflow:C:\Users\skzt\PycharmProjects\tcc\test\Own Dataset\dogsvscats-0.001-2conv-basic.model is not in all_model_checkpoint_paths. Manually adding it.


In [15]:
process_test_data()

HBox(children=(IntProgress(value=0, max=12500), HTML(value='')))




[[array([[142, 142, 147, ..., 182, 170, 136],
         [157, 152, 156, ..., 169, 159, 115],
         [161, 158, 163, ..., 161, 148, 100],
         ...,
         [142, 181, 231, ..., 230, 242, 235],
         [115, 225, 228, ..., 236, 231, 246],
         [179, 218, 224, ..., 237, 230, 239]], dtype=uint8), '11040'],
 [array([[ 33,  33,  31, ...,  43,  53,  47],
         [ 27,  33,  37, ...,  41,  39,  56],
         [ 39,  41,  39, ...,  45,  52,  42],
         ...,
         [ 29,  27,  31, ...,  82, 107, 108],
         [ 32,  27,  21, ...,  93,  99,  97],
         [ 33,  24,  26, ...,  97,  86,  92]], dtype=uint8), '1088'],
 [array([[158, 164, 160, ..., 167, 147, 153],
         [184, 190, 159, ..., 165, 135, 151],
         [164, 179, 152, ..., 161, 133, 176],
         ...,
         [123, 166, 151, ..., 163, 130, 124],
         [150, 144, 128, ..., 146, 127, 157],
         [136, 132, 145, ..., 142, 121, 128]], dtype=uint8), '4656'],
 [array([[54,  2, 73, ..., 18, 15, 10],
         [58, 12,

In [14]:
import matplotlib.pyplot as plt

# if you need to create the data:
#test_data = process_test_data()
# if you already have some saved:
test_data = np.load('test_data.npy')

fig=plt.figure()

for num,data in enumerate(test_data[:12]):
    # cat: [1,0]
    # dog: [0,1]
    
    img_num = data[1]
    img_data = data[0]
    
    y = fig.add_subplot(3,4,num+1)
    orig = img_data
    data = img_data.reshape(IMG_SIZE,IMG_SIZE,1)
    #model_out = model.predict([data])[0]
    model_out = model.predict([data])[0]
    
    if np.argmax(model_out) == 1: str_label='Dog'
    else: str_label='Cat'
        
    y.imshow(orig,cmap='gray')
    plt.title(str_label)
    y.axes.get_xaxis().set_visible(False)
    y.axes.get_yaxis().set_visible(False)
plt.show()

FileNotFoundError: [Errno 2] No such file or directory: 'test_data.npy'

In [22]:
img = cv2.imread("03.jpg", cv2.IMREAD_GRAYSCALE)
img = cv2.resize(img, (50,50))
img = img.reshape(50,50,1)

In [23]:
mdl = model.predict([img])[0]

In [25]:
mdl

array([0.47631863, 0.5236814 ], dtype=float32)