In [30]:
# import packages

import numpy as np
import tensorflow as tf
from keras.preprocessing import image
from keras.preprocessing.image import ImageDataGenerator

### Data Preprocessing

In [31]:
# Preprocessing Trainset
# these transformations are applied only on trainset
# purpose: to avoid overfitting (more accuracy on trainset, less on test set)
# transformations include some simple geometrical transformations, or zoom, or some rotations/ flips on the images.
# the technical term for applying these transorfations on images is Image Augmentation.

train_datagen = ImageDataGenerator(rescale = 1./255,
                                   shear_range = 0.2,
                                   zoom_range = 0.2,
                                   horizontal_flip = True) 
 
training_set = train_datagen.flow_from_directory('dataset/training_set',
                                                target_size = (64, 64),
                                                batch_size = 32,
                                                class_mode = 'binary')



Found 8000 images belonging to 2 classes.


In [32]:
# Preprocessing Testset

test_datagen = ImageDataGenerator(rescale = 1./255)
test_set = train_datagen.flow_from_directory('dataset/test_set',
                                             target_size = (64, 64),
                                             batch_size = 32,
                                             class_mode = 'binary')

Found 2000 images belonging to 2 classes.


### Building a CNN

In [33]:
# Initialize a CNN
cnn = tf.keras.models.Sequential()

In [34]:
# Adding convolution layer
# input_shape must be same as shape transformed using ImageDataGenerator
# if images and b&w then input_shape = [64, 64, 1]
cnn.add(tf.keras.layers.Conv2D(filters = 32, 
                               kernel_size = 3, 
                               activation = 'relu', 
                               input_shape = [64, 64, 3]))

In [35]:
# Applying Max Pooling
cnn.add(tf.keras.layers.MaxPool2D(pool_size=(3, 3),
                                  strides=2))

In [36]:
# Adding second convolutional layer along with pooling
# remove input_shape parameter, as it is required only for the first layer
cnn.add(tf.keras.layers.Conv2D(filters = 32, 
                               kernel_size = 3, 
                               activation = 'relu'))
cnn.add(tf.keras.layers.MaxPool2D(pool_size=(3, 3),
                                  strides=2))

In [37]:
# Add flattenning layer
cnn.add(tf.keras.layers.Flatten())

In [38]:
# Full Connection
cnn.add(tf.keras.layers.Dense(units = 128, 
                              activation = 'relu'))

In [39]:
# Add an output layer
cnn.add(tf.keras.layers.Dense(units = 1, 
                             activation = 'sigmoid'))

### Training a CNN

In [40]:
# Compile CNN
cnn.compile(optimizer = 'adam', loss = 'binary_crossentropy', metrics = ['accuracy'])

In [41]:
# training on train set and eevaluating on test set
cnn.fit(x = training_set, validation_data = test_set, epochs = 30)

Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 21/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


<keras.src.callbacks.History at 0x15c2af1c0>

### Make a single Prediction

In [42]:
# step1: load the image using load_img function, it generates a PIL image format
# step2: convert PIL format to numpy array using img_to_array()
# step3: add an extra dimension, as during training phase we did add batch as an extra dimension, the predict 
# method expects the single input image to have that batch dimension as well. For that we use expand_dims().
# As thebatch dimension comes first and then images, we make axis = 0.
test_image = image.load_img('dataset/single_prediction/cat_img.jpeg',
                           target_size = (64, 64))
test_image = image.img_to_array(test_image)
test_image = np.expand_dims(test_image, axis = 0)
result = cnn.predict(test_image)



In [47]:
result

array([[0.]], dtype=float32)

In [44]:
# from this we get class indices- dog: 1, cat: 0
training_set.class_indices
if result[0][0] == 1:
    prediction = 'Dog'
else:
    prediction = 'Cat'
print(prediction)

Cat


In [48]:
test_image = image.load_img('dataset/single_prediction/dog.jpeg',
                           target_size = (64, 64))
test_image = image.img_to_array(test_image)
test_image = np.expand_dims(test_image, axis = 0)
result = cnn.predict(test_image)
if result[0][0] == 1:
    prediction = 'Dog'
else:
    prediction = 'Cat'
print(prediction)

Dog


In [49]:
test_image = image.load_img('dataset/single_prediction/dog1.jpeg',
                           target_size = (64, 64))
test_image = image.img_to_array(test_image)
test_image = np.expand_dims(test_image, axis = 0)
result = cnn.predict(test_image)
if result[0][0] == 1:
    prediction = 'Dog'
else:
    prediction = 'Cat'
print(prediction)

Cat


In [50]:
test_image = image.load_img('dataset/single_prediction/dog2.jpeg',
                           target_size = (64, 64))
test_image = image.img_to_array(test_image)
test_image = np.expand_dims(test_image, axis = 0)
result = cnn.predict(test_image)
if result[0][0] == 1:
    prediction = 'Dog'
else:
    prediction = 'Cat'
print(prediction)

Dog
