# Convolutional Neural Network

### Importing the libraries

In [13]:
import tensorflow as tf
from keras.preprocessing.image import ImageDataGenerator

In [14]:
tf.__version__

'2.3.0'

## Part 1 - Data Preprocessing

### Preprocessing the Training set

In [15]:
# we want to apply a transformation only on the images in the training set, in order to avoid overfitting.
# the transofrmations are: Zooms, Rotations,

In [16]:
train_datagen = ImageDataGenerator(
        rescale=1./255,
        shear_range=0.2,
        zoom_range=0.2,
        horizontal_flip=True)

In [23]:
#now we want to resize the images in order to decrease the computations of the machines. 
# train_datagen is an OBJECT, flow_from_directory is a METHOD from the CLASS ImageDataGenerator.
training_set = train_datagen.flow_from_directory(
        r'dataset\training_set',
        target_size=(64, 64),
        batch_size=32,
        class_mode='binary')



Found 8000 images belonging to 2 classes.


### Preprocessing the Test set

In [24]:
# we don't want to change anything in the test set, to us these are new images.
test_datagen = ImageDataGenerator(rescale=1./255)

test_set = test_datagen.flow_from_directory(
        r'dataset/test_set',
        target_size=(64, 64),
        batch_size=32,
        class_mode='binary')


Found 2000 images belonging to 2 classes.


## Part 2 - Building the CNN

### Initialising the CNN

In [25]:

# we want to create an ANN as a sequence of layers.
cnn = tf.keras.models.Sequential()

### Step 1 - Convolution

In [27]:
cnn.add(tf.keras.layers.Conv2D(filters=32, kernel_size=3, activation='relu', input_shape=[64, 64, 3]))
#  input_shape=[64, 64, 3]) is added only when we add our first layer.

### Step 2 - Pooling

In [28]:
cnn.add(tf.keras.layers.MaxPool2D(pool_size=2, strides=2))

### Adding a second convolutional layer

In [29]:
# Question: Wht do we add a second Convolutional Layer?

In [30]:
# In order to learn hierarchical representations of your input data. For example first layers
# will learn edges and second layers will combine these edges in order to form more abstract representations (e.g. circular and/or rectangular shapes). 
# Fifth layer builds later on top of this and creates even more abstract representations (for example this could be something like dog faces).
# There is no consensus on what is the best number of layers. Most of the time people experiment with different depth and choose whatever works the best.
# Below is an example how the filters in first, third and fifth layer might look like in some arbitrary chosen Convolutional Neural Net.



In [32]:
cnn.add(tf.keras.layers.Conv2D(filters=32, kernel_size=3, activation='relu', input_shape=[64, 64, 3]))
cnn.add(tf.keras.layers.MaxPool2D(pool_size=2, strides=2))


### Step 3 - Flattening

In [33]:
cnn.add(tf.keras.layers.Flatten())

### Step 4 - Full Connection

In [34]:
cnn.add(tf.keras.layers.Dense(units=128, activation='relu')) #relu = rectifier activation func

### Step 5 - Output Layer

In [35]:
cnn.add(tf.keras.layers.Dense(units=1, activation='sigmoid'))
# we need only one neuron to encode the binary class 0/1.
# for binary classificaiton we use sigmoid.
# for multi-class classification we use softmax activation function.

## Part 3 - Training the CNN

### Compiling the CNN

In [36]:
cnn.compile(optimizer='adam', loss = 'binary_crossentropy', metrics = ['accuracy'])

### Training the CNN on the Training set and evaluating it on the Test set

In [None]:
cnn.fit(x = training_set, validation_data=test_set, epochs = 25)

Epoch 1/25
Epoch 2/25
Epoch 3/25
Epoch 4/25
Epoch 5/25
Epoch 6/25
Epoch 7/25
Epoch 8/25
Epoch 9/25
Epoch 10/25
Epoch 11/25
Epoch 12/25
Epoch 13/25
Epoch 14/25
Epoch 15/25
 37/250 [===>..........................] - ETA: 38s - loss: 0.3235 - accuracy: 0.8522- ETA: 40s - loss: 0.3178 - accurac

In [None]:
# 32*250 = 8000 images, the batch-size is 32, and we have 8000 images, we have 250 steps in each epoch.
# the number of epochs is not related to the batch-size or images number.
# accuary - is the accuracy of the training set.
# val_accuracy - is the accuracy on the test set. 
# if we didn't do data augmentation at the beginning we will get something close to 98% or 99% in the test set accuracy
# which clearly indicates overfitting, and lower accuracy in the training set. 

## Part 4 - Making a single prediction

In [None]:
import numpy as np
from keras.preprocessing import image
test_image = image.load_img('dataset\single_prediction\cat_or_dog_2.jpg', target_size = (64,64))
#the predict method expects at it's input a 2D array
test_image = image.img_to_array(test_image)
# the predict method has to be used as it was used in the TRAINING.
# the cnn was trained on batches (not signle image), where batch #1 contained 32 imgs, batch #2 contained 32 imgs.
# so we have an extra dimention for the batch.


In [1]:
# the expand_dims adds a dimention corresponding to the batch.
test_image = np.expand_dims(test_image, axis = 0)
result = cnn.predict(test_image)
training_set.class_indices  

# how do we know for ex if cat corresponds to 1 or 0?
training_set.class_indices
if result[0][0] == 1 # the first index 0 represent the only batch we have, and the second 0 represents the only 
                     # image we want to predict. 
prediction = 'dog'
else:
  prediction = 'cat'                    
print(prediction)

SyntaxError: invalid syntax (<ipython-input-1-281534f53205>, line 8)