# Convolutional Neural Network

### Importing the libraries

In [1]:
import tensorflow as tf
from keras.preprocessing.image import ImageDataGenerator

In [2]:
# Display the installed TensorFlow version so the run can be reproduced later
tf.version.VERSION

'2.7.0'

## Part 1 - Data Preprocessing

### Preprocessing the Training set

In [3]:
# ImageDataGenerator produces batches of image tensors with real-time augmentation.
# The random shear / zoom / horizontal-flip transformations are applied to the training
# images to reduce overfitting, so that performance on the test set does not suffer.
# rescale = 1./255 is the feature-scaling step, which is compulsory for neural networks.
augmentation_options = dict(
    rescale = 1./255,
    shear_range = 0.2,
    zoom_range = 0.2,
    horizontal_flip = True,
)
train_datagen = ImageDataGenerator(**augmentation_options)

# Read the training images from disk in batches of 32, resized to 64x64,
# with binary (two-class) labels.
training_set = train_datagen.flow_from_directory(
    'dataset/training_set',
    target_size = (64, 64),
    batch_size = 32,
    class_mode = 'binary',
)

Found 8000 images belonging to 2 classes.


### Preprocessing the Test set

In [4]:
# No augmentation is applied to the test data; only the same feature scaling
# (rescale = 1./255) that the training generator uses.
test_datagen = ImageDataGenerator(rescale = 1./255)

# Same image size, batch size and label mode as the training generator.
test_set = test_datagen.flow_from_directory(
    'dataset/test_set',
    target_size = (64, 64),
    batch_size = 32,
    class_mode = 'binary',
)

Found 2000 images belonging to 2 classes.


## Part 2 - Building the CNN

### Initialising the CNN

In [5]:
# Create the CNN as a Sequential model: an empty container to which the layers
# are appended one after another by the cells that follow.
cnn = tf.keras.Sequential()

### Step 1 - Convolution

In [6]:
# First convolutional layer:
#   filters=32           - a classic number of feature detectors
#   kernel_size=3        - each filter is a 3 by 3 square matrix
#   activation='relu'    - the rectifier is the usual choice for hidden layers of a CNN
#   input_shape=[64,64,3] - 64 by 64 images with 3 colour channels (RGB)
first_conv_layer = tf.keras.layers.Conv2D(
    filters=32,
    kernel_size=3,
    activation='relu',
    input_shape=[64, 64, 3],
)
cnn.add(first_conv_layer)

### Step 2 - Pooling

In [7]:
# Max pooling: pool_size is the side of the frame the maximum is taken over,
# strides is the number of pixels the frame is slid by at each step.
first_pool_layer = tf.keras.layers.MaxPool2D(pool_size=2, strides=2)
cnn.add(first_pool_layer)

### Adding a second convolutional layer

In [8]:
# Second convolution + pooling stage. input_shape is not repeated here:
# it only has to be given for the first layer of the model.
second_stage_layers = [
    tf.keras.layers.Conv2D(filters=32, kernel_size=3, activation='relu'),
    tf.keras.layers.MaxPool2D(pool_size=2, strides=2),
]
for stage_layer in second_stage_layers:
    cnn.add(stage_layer)

### Step 3 - Flattening

In [9]:
# Flatten the pooled feature maps into a single vector for the dense layers
flatten_layer = tf.keras.layers.Flatten()
cnn.add(flatten_layer)

### Step 4 - Full Connection

In [10]:
# Fully connected hidden layer: the Dense class with 128 units (neurons)
hidden_dense_layer = tf.keras.layers.Dense(
    units=128,
    activation='relu',
)
cnn.add(hidden_dense_layer)

### Step 5 - Output Layer

In [11]:
# Output layer: a single unit is enough for binary classification, and sigmoid
# is the usual output activation for a binary classifier.
output_layer = tf.keras.layers.Dense(
    units=1,
    activation='sigmoid',
)
cnn.add(output_layer)

## Part 3 - Training the CNN

### Compiling the CNN

In [12]:
# Configure training: Adam optimizer, binary cross-entropy loss (matches the
# single sigmoid output unit), and accuracy reported as the metric.
cnn.compile(
    optimizer = 'adam',
    loss = 'binary_crossentropy',
    metrics = ['accuracy'],
)

### Training the CNN on the Training set and evaluating it on the Test set

In [13]:
# Train for 25 epochs on the augmented training batches, evaluating on the test
# set after every epoch. fit() returns a History object; keep it so the per-epoch
# loss/metric values (history.history) stay available for inspection or plotting
# instead of being discarded and shown only as a bare object repr.
history = cnn.fit(x = training_set, validation_data = test_set, epochs = 25)

Epoch 1/25
Epoch 2/25
Epoch 3/25
Epoch 4/25
Epoch 5/25
Epoch 6/25
Epoch 7/25
Epoch 8/25
Epoch 9/25
Epoch 10/25
Epoch 11/25
Epoch 12/25
Epoch 13/25
Epoch 14/25
Epoch 15/25
Epoch 16/25
Epoch 17/25
Epoch 18/25
Epoch 19/25
Epoch 20/25
Epoch 21/25
Epoch 22/25
Epoch 23/25
Epoch 24/25
Epoch 25/25


<keras.callbacks.History at 0x24758ad3670>

## Part 4 - Making a single prediction

In [14]:
import numpy as np
from keras.preprocessing import image

# Load the image at the same size as the training images (64 by 64)
single_image = image.load_img('dataset/single_prediction/cat_or_dog_1.jpg', target_size = (64, 64))

# The predict method expects an array, so convert the PIL image to a NumPy array,
# then add a leading axis (axis = 0) for the batch the image belongs to.
test_image = np.expand_dims(image.img_to_array(single_image), axis = 0)

# Normalize the image the same way the generators do (rescale = 1./255)
result = cnn.predict(test_image/255.0)

# The label encoding is given by training_set.class_indices.
# NOTE(review): the mapping below assumes dog is 1 and cat is 0 - inspect
# training_set.class_indices in its own cell to confirm.
# result has a batch dimension like test_image, hence result[0][0].
prediction = 'dog' if result[0][0] > 0.5 else 'cat'

In [15]:
# Show the label chosen for the single test image
print(prediction)

dog
