# Convolutional Neural Network

CNN Steps:

1. Convolution


2. Max Pooling


3. Flattening


4. Full Connection




### Importing the libraries

In [None]:
import tensorflow as tf
from tensorflow.keras.preprocessing.image import ImageDataGenerator

In [None]:
# Display the installed TensorFlow version string.
tf.version.VERSION

'2.17.0'

## Part 1 - Data Preprocessing

### Preprocessing the Training set

In [None]:
# Generator for the training images: pixel values are scaled to [0, 1] and
# random transformations are applied to reduce overfitting.
train_datagen = ImageDataGenerator(
    rescale=1./255,        # Feature scaling for images
    # Augmentation steps to prevent overfitting
    shear_range=0.2,
    zoom_range=0.2,
    horizontal_flip=True,
)

# Stream batches of labelled images from the training directory.
# NOTE: the closing parenthesis must stay outside the trailing comment,
# otherwise the call is never terminated and the cell fails to parse.
training_set = train_datagen.flow_from_directory(
    'dataset/training_set',  # Path leading to the training set
    target_size=(64, 64),    # Final size of the images fed to the CNN
    batch_size=32,           # How many images will be in each batch
    class_mode='binary',     # 'binary' or 'categorical' (cat vs. dog here, so binary)
)

FileNotFoundError: [Errno 2] No such file or directory: 'dataset/training_set'

### Preprocessing the Test set

In [None]:
# The test images only get the same 1/255 rescaling as the training images;
# no shear/zoom/flip transformations are configured for this generator.
test_datagen = ImageDataGenerator(rescale=1./255)

# Stream batches of labelled test images, resized to the 64x64 CNN input size.
test_set = test_datagen.flow_from_directory(
    directory='dataset/test_set',
    target_size=(64, 64),
    batch_size=32,
    class_mode='binary',
)

## Part 2 - Building the CNN

### Initialising the CNN

In [None]:
# Start from an empty sequential model; layers are appended one at a time below.
cnn = tf.keras.Sequential()

### Step 1 - Convolution

In [None]:
# filters (or kernels) -> Number of feature detectors to use for convolutions
# kernel_size -> The size of the convolutional window, often a 3x3 grid
# activation -> Activation function applied after the convolution, ReLU is commonly used to introduce non-linearity
#
# The input shape (64x64 pixels, 3 channels for RGB images; 1 for black and white)
# is declared with an explicit Input object. Passing `input_shape` directly to the
# first layer of a Sequential model is discouraged by recent Keras versions and
# emits a UserWarning.
cnn.add(tf.keras.Input(shape=(64, 64, 3)))
cnn.add(tf.keras.layers.Conv2D(filters=32, kernel_size=3, activation='relu'))

  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


### Step 2 - Pooling

In [None]:
# pool_size -> height and width of the pooling window (2x2 here)
# strides   -> how far the window moves between pooling operations; (2, 2)
#              shifts it by 2 pixels horizontally and 2 pixels vertically
cnn.add(tf.keras.layers.MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))

### Adding a second convolutional layer

In [None]:
# Second convolution + pooling stage, configured like the first one
# (32 filters, 3x3 window, ReLU, then 2x2 max pooling with stride 2).
# No input shape is given here: it is inferred from the previous layer.
cnn.add(tf.keras.layers.Conv2D(32, (3, 3), activation='relu'))
cnn.add(tf.keras.layers.MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))

### Step 3 - Flattening

In [None]:
# Flatten the pooled feature maps into a one-dimensional vector per image
# so they can be fed to the fully connected (Dense) layers that follow.
cnn.add(tf.keras.layers.Flatten())

### Step 4 - Full Connection

In [None]:
# Fully connected hidden layer.
# units      -> number of neurons; 128 is a common choice for an intermediate
#               fully connected layer
# activation -> ReLU, to introduce non-linearity
cnn.add(tf.keras.layers.Dense(128, activation='relu'))

### Step 5 - Output Layer

In [None]:
# Output layer for the binary decision.
# units      -> a single neuron is enough: it emits one value between 0 and 1,
#               read as the probability that the input belongs to a specific class
# activation -> sigmoid, which maps the neuron's output into the (0, 1)
#               probability range
cnn.add(tf.keras.layers.Dense(1, activation='sigmoid'))

## Part 3 - Training the CNN

### Compiling the CNN

In [None]:
# optimizer -> Adam, an optimization algorithm with an adaptive learning rate
#              that speeds up the convergence of the model
# loss      -> binary cross-entropy, the loss for binary classification problems:
#              it compares the predicted value with the actual class label
#              (0 or 1) and calculates the error
# metrics   -> accuracy is reported during training and evaluation
cnn.compile(
    optimizer='adam',
    loss='binary_crossentropy',
    metrics=['accuracy'],
)

### Training the CNN on the Training set and evaluating it on the Test set

In [None]:
# Train for 25 epochs on the training batches; the test set is passed as
# validation data so it is evaluated at the end of every epoch.
cnn.fit(training_set, validation_data=test_set, epochs=25)

## Part 4 - Making a single prediction

In [None]:
import numpy as np
from tensorflow.keras.preprocessing import image

# Loading the image with a 64x64 pixels size (same size the CNN was trained on)
test_image = image.load_img('dataset/single_prediction/cat_or_dog_1.jpg', target_size=(64, 64))
# Converting the image into an array
test_image = image.img_to_array(test_image)
# Apply the same 1/255 feature scaling used by the training and test generators;
# without it the network receives inputs on a different scale than it was trained on.
test_image = test_image / 255.0
# Adding an extra dimension to make it compatible for CNN input
# (i.e. turning a 3D array into a 4D array, a batch holding one image)
test_image = np.expand_dims(test_image, axis=0)

result = cnn.predict(test_image)
# Class labels are mapped as {'cat': 0, 'dog': 1}; the actual mapping can be
# inspected with training_set.class_indices.
# result[0] gives the prediction array for the first (and only) image and
# result[0][0] is its single element: the sigmoid probability of class 1.
# A sigmoid output is almost never exactly 1, so compare against a 0.5
# threshold instead of testing for equality.
if result[0][0] > 0.5:
    prediction = 'dog'
else:
    prediction = 'cat'

NameError: name 'test_image' is not defined

In [None]:
# Show the label assigned to `prediction` by the single-prediction cell.
print(prediction)

https://www.superdatascience.com/blogs/the-ultimate-guide-to-convolutional-neural-networks-cnn