In [9]:
import os
import cv2
import numpy as np
from tqdm import tqdm

# Set to True to re-read the raw images and regenerate training_data.npy.
# When False the rebuild step is skipped and the existing file is loaded as-is.
REBUILD_DATA = False

class DogsVSCats():
    """Builds a shuffled, labelled training set from the cat and dog image folders.

    Every file whose name contains "jpg" inside the ``CATS`` and ``DOGS``
    directories is read as grayscale, resized to ``IMG_SIZE`` x ``IMG_SIZE`` and
    paired with a one-hot label (index taken from ``LABELS``).
    """

    IMG_SIZE = 50
    CATS = "PetImages/Cat"
    DOGS = "PetImages/Dog"
    TESTING = "PetImages/Testing"
    LABELS = {CATS: 0, DOGS: 1}
    # Class-level default only; make_training_data() rebinds a fresh per-instance
    # list so this shared list is never mutated.
    training_data = []

    catcount = 0
    dogcount = 0
    # Number of "jpg" files that could not be read or resized in the last run.
    skipped = 0

    def make_training_data(self):
        """Read all images, then shuffle and save them to ``training_data.npy``.

        Results are stored on the instance (``training_data``, ``catcount``,
        ``dogcount``, ``skipped``) and reset at the start of every call, so
        re-running the method does not accumulate duplicates.

        Unreadable or corrupt images are skipped (best effort) but counted in
        ``skipped`` and reported instead of being silently ignored.

        Raises:
            OSError: if one of the label directories cannot be listed.
        """
        self.training_data = []
        self.catcount = 0
        self.dogcount = 0
        self.skipped = 0

        for label in self.LABELS:
            print(label)
            for f in tqdm(os.listdir(label)):
                if "jpg" not in f:
                    continue

                path = os.path.join(label, f)
                try:
                    img = cv2.imread(path, cv2.IMREAD_GRAYSCALE)
                    if img is None:
                        # cv2.imread signals an unreadable file by returning None.
                        self.skipped += 1
                        continue
                    img = cv2.resize(img, (self.IMG_SIZE, self.IMG_SIZE))
                except Exception:
                    # Corrupt image data: keep going, but remember that we dropped it.
                    self.skipped += 1
                    continue

                one_hot = np.eye(len(self.LABELS))[self.LABELS[label]]
                self.training_data.append([np.array(img), one_hot])

                if label == self.CATS:
                    self.catcount += 1
                elif label == self.DOGS:
                    self.dogcount += 1

        np.random.shuffle(self.training_data)

        # Each sample pairs an image with a differently shaped label vector, so the
        # data must be stored as an explicit (N, 2) object array; recent NumPy
        # versions refuse to build such a ragged array implicitly.
        packed = np.empty((len(self.training_data), 2), dtype=object)
        for row, (image, one_hot) in enumerate(self.training_data):
            packed[row, 0] = image
            packed[row, 1] = one_hot
        np.save("training_data.npy", packed)

        # Report through self, not through a module-level instance name.
        print('Cats:', self.catcount)
        print('Dogs:', self.dogcount)
        if self.skipped:
            print('Skipped unreadable files:', self.skipped)

# Regenerate training_data.npy from the raw images only when explicitly requested.
if REBUILD_DATA:
    dogsvcats = DogsVSCats()
    dogsvcats.make_training_data()

# The saved samples are [image, label] pairs of differently shaped arrays, so the
# file contains pickled objects and needs allow_pickle=True to be read back.
# NOTE(review): unpickling can execute arbitrary code — only load a file that was
# produced locally by make_training_data().
training_data = np.load('training_data.npy', allow_pickle=True)

import torch
import torch.nn as nn
import torch.nn.functional as F

class Net(nn.Module):
    """Small convolutional classifier for single-channel square images.

    Three 5x5 convolutions (32, 64, 128 channels), each followed by ReLU and
    2x2 max-pooling, feed a 512-unit hidden layer and a 2-way softmax output.

    Args:
        img_size: height/width of the input images. Defaults to 50, the size
            used by the rest of this notebook.
    """

    def __init__(self, img_size=50):
        super().__init__()
        self.conv1 = nn.Conv2d(1, 32, 5)
        self.conv2 = nn.Conv2d(32, 64, 5)
        self.conv3 = nn.Conv2d(64, 128, 5)

        # Push one dummy image through the conv stack to discover how many
        # features reach the first linear layer. No gradients are needed here.
        self._to_linear = None
        probe = torch.randn(img_size, img_size).view(-1, 1, img_size, img_size)
        with torch.no_grad():
            self.convs(probe)

        self.fc1 = nn.Linear(self._to_linear, 512)
        self.fc2 = nn.Linear(512, 2)

    def convs(self, x):
        """Run the convolutional feature extractor.

        On the first call this also records the flattened per-sample feature
        count in ``self._to_linear``.
        """
        x = F.max_pool2d(F.relu(self.conv1(x)), (2,2))
        x = F.max_pool2d(F.relu(self.conv2(x)), (2,2))
        x = F.max_pool2d(F.relu(self.conv3(x)), (2,2))

        if self._to_linear is None:
            # channels * height * width of a single sample
            self._to_linear = x[0].shape[0]*x[0].shape[1]*x[0].shape[2]
        return x

    def forward(self, x):
        """Return class probabilities; each output row sums to 1 (softmax over dim 1)."""
        x = self.convs(x)
        x = x.view(-1, self._to_linear)
        x = F.relu(self.fc1(x))
        x = self.fc2(x)
        return F.softmax(x, dim = 1)

# Instantiate the network and move its parameters to the GPU (requires a CUDA device).
net = Net().cuda()

import torch.optim as optim

# Stack the samples into one float32 ndarray before handing them to torch:
# converting a Python list of ndarrays element by element is extremely slow.
X = torch.from_numpy(np.array([i[0] for i in training_data], dtype=np.float32)).view(-1, 50, 50).cuda()
X = X/255.0  # scale pixel values from [0, 255] to [0, 1]
y = torch.from_numpy(np.array([i[1] for i in training_data], dtype=np.float32)).cuda()

# Hold out the last VAL_PCT of the (already shuffled) samples for evaluation.
VAL_PCT = 0.1
val_size = int(len(X)*VAL_PCT)
# Slice from an explicit boundary: with val_size == 0, X[:-val_size] would be
# X[:0], i.e. an empty training set, and X[-val_size:] would be everything.
split = len(X) - val_size

train_X = X[:split]
train_y = y[:split]

test_X = X[split:]
test_y = y[split:]

def train(net, EPOCHS = 4, BATCH_SIZE = 100, inputs = None, targets = None):
    """Train ``net`` with Adam (lr=0.001) and mean-squared-error loss.

    Args:
        net: the model to optimise; it is trained on whatever device its
            parameters already live on.
        EPOCHS: number of full passes over the training data.
        BATCH_SIZE: number of samples per optimisation step.
        inputs: images reshaped to (-1, 1, 50, 50) per batch. Defaults to the
            notebook-level ``train_X``.
        targets: one-hot labels aligned with ``inputs``. Defaults to the
            notebook-level ``train_y``.

    Raises:
        ValueError: if there are no training samples.

    Prints the loss of the last batch after every epoch.
    """
    if inputs is None:
        inputs = train_X
    if targets is None:
        targets = train_y
    if len(inputs) == 0:
        raise ValueError("train() needs at least one training sample")

    optimizer = optim.Adam(net.parameters(), lr=0.001)
    loss_function = nn.MSELoss()
    # Follow the model's device instead of assuming CUDA is available.
    device = next(net.parameters()).device

    net.train()
    for epoch in range(EPOCHS):
        for i in tqdm(range(0, len(inputs), BATCH_SIZE)):
            batch_X = inputs[i:i+BATCH_SIZE].view(-1, 1, 50, 50).to(device)
            batch_y = targets[i:i+BATCH_SIZE].to(device)

            # Gradients accumulate by default, so clear them before each step.
            net.zero_grad()
            outputs = net(batch_X)
            loss = loss_function(outputs, batch_y)
            loss.backward()
            optimizer.step()    # Does the update

        # .item() prints a plain number regardless of the torch version.
        print(f"\nEpoch: {epoch}. Loss: {loss.item()}")

def test(net):
    correct = 0
    total = 0
    with torch.no_grad():
        for i in tqdm(range(len(test_X))):
            real_class = torch.argmax(test_y[i]).cuda()
            net_out = net(test_X[i].view(-1, 1, 50, 50))[0]  # returns a list, 
            predicted_class = torch.argmax(net_out)

            if predicted_class == real_class:
                correct += 1
            total += 1

    print("\nAccuracy: ", round(correct/total, 3))

In [12]:
train(net, 10, 500)

100%|██████████| 45/45 [00:01<00:00, 43.14it/s]
 24%|██▍       | 11/45 [00:00<00:00, 98.48it/s]
Epoch: 0. Loss: 0.096854068338871
100%|██████████| 45/45 [00:00<00:00, 45.76it/s]
 24%|██▍       | 11/45 [00:00<00:00, 96.75it/s]
Epoch: 1. Loss: 0.09046080708503723
100%|██████████| 45/45 [00:00<00:00, 45.81it/s]
 24%|██▍       | 11/45 [00:00<00:00, 98.48it/s]
Epoch: 2. Loss: 0.07703021168708801
100%|██████████| 45/45 [00:00<00:00, 45.76it/s]
 24%|██▍       | 11/45 [00:00<00:00, 100.27it/s]
Epoch: 3. Loss: 0.07135042548179626
100%|██████████| 45/45 [00:00<00:00, 45.99it/s]
 24%|██▍       | 11/45 [00:00<00:00, 98.48it/s]
Epoch: 4. Loss: 0.07021471858024597
100%|██████████| 45/45 [00:00<00:00, 45.48it/s]
 24%|██▍       | 11/45 [00:00<00:00, 100.27it/s]
Epoch: 5. Loss: 0.0837930291891098
100%|██████████| 45/45 [00:00<00:00, 45.30it/s]
 24%|██▍       | 11/45 [00:00<00:00, 99.36it/s]
Epoch: 6. Loss: 0.08759430795907974
100%|██████████| 45/45 [00:00<00:00, 45.48it/s]
 24%|██▍       | 11/45 [00:00

In [13]:
test(net)

100%|██████████| 2494/2494 [00:02<00:00, 866.48it/s]
Accuracy:  0.749

