In [None]:
import tensorflow as tf
from tensorflow.keras.layers import Input, Lambda, Dense, Flatten,Dropout
from tensorflow.keras.models import Model
from tensorflow.keras.applications.vgg16 import VGG16
from tensorflow.keras.applications.vgg16 import preprocess_input
from tensorflow.keras.preprocessing import image
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.models import Sequential
import numpy as np
from glob import glob
import matplotlib.pyplot as plt
%matplotlib inline
import os
import random





In [None]:
# Input resolution (height, width) fed to the VGG16 backbone.
IMAGE_SIZE = [224, 224]

# Seed every random number generator in play, not only Python's own:
# the Keras directory iterators shuffle with NumPy, and the weights of the
# newly added Dense layers are drawn by TensorFlow.
SEED = 42
random.seed(SEED)
np.random.seed(SEED)
tf.random.set_seed(SEED)

In [None]:
# Load VGG16 with its pretrained ImageNet weights.
# include_top=False drops VGG's original dense classifier, so that new
# layers can be added on top and trained on our own data.
vgg = VGG16(
    weights='imagenet',
    include_top=False,
    input_shape=IMAGE_SIZE + [3],  # trailing 3 = colour channels (RGB)
)


In [None]:
# Freeze every VGG layer: the pretrained convolutional features are reused
# as-is and only the layers added on top of them will be trained.
for vgg_layer in vgg.layers:
    vgg_layer.trainable = False

In [None]:
# First model: no hidden dense layers. The flattened VGG features go
# straight into the softmax classifier.
flatten_layer = Flatten()
softmax_head = Dense(26, activation='softmax')  # 26 output classes -> 26 units

x = flatten_layer(vgg.output)
prediction = softmax_head(x)


In [None]:
# Assemble the end-to-end network: VGG16 input -> softmax predictions.
model = Model(vgg.input, prediction)

In [None]:
# Print the layer-by-layer architecture with output shapes and parameter counts.
model.summary()


Model: "model_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_3 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0   

In [None]:

# Configure training: RMSprop with default settings, categorical
# cross-entropy loss, and accuracy reported as the metric.
model.compile(
    optimizer=tf.keras.optimizers.RMSprop(),
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)


In [None]:
# The network input must be 224x224, so every image is resized to that.
#
# The frozen VGG16 ImageNet weights expect inputs prepared with
# `vgg16.preprocess_input` rather than a plain 1/255 rescale, so that
# function is applied to every image in both generators.
#
# No augmentation is enabled. shear_range, zoom_range and horizontal_flip
# can be passed to the training generator to add it.
train_datagen = ImageDataGenerator(preprocessing_function=preprocess_input)
test_datagen = ImageDataGenerator(preprocessing_function=preprocess_input)

# One sub-directory per class; labels are one-hot encoded ('categorical')
# to match the categorical cross-entropy loss.
training_set = train_datagen.flow_from_directory(
    '/content/drive/MyDrive/Project_Data/Train',
    target_size=(224, 224),
    batch_size=128,
    class_mode='categorical',
)

test_set = test_datagen.flow_from_directory(
    '/content/drive/MyDrive/Project_Data/Test',
    target_size=(224, 224),
    batch_size=128,
    class_mode='categorical',
)

Found 2366 images belonging to 26 classes.
Found 811 images belonging to 26 classes.


In [None]:
# Train for 5 epochs, using the test generator as validation data.
# Step counts are left at their defaults.
r = model.fit(training_set, epochs=5, validation_data=test_set)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


In [None]:
# This did not work very well with the VGG architecture.
# Transfer learning may not always work; we need to tweak some parameters
# and try again.
score = model.evaluate(test_set)
test_loss, test_accuracy = score
print('Test Loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test Loss: 3.271759033203125
Test accuracy: 0.24907521903514862


In [None]:
# Second attempt: start again from a fresh pretrained VGG16 backbone.
vgg = VGG16(
    weights='imagenet',
    include_top=False,
    input_shape=IMAGE_SIZE + [3],
)


In [None]:
# Keep the pretrained VGG weights fixed during training.
for vgg_layer in vgg.layers:
    vgg_layer.trainable = False

In [None]:
# Custom classifier head on top of the frozen VGG features:
# Flatten -> Dense(100) -> Dropout(0.5) -> Dense(100) -> softmax over 26 classes.
x = Flatten()(vgg.output)
x = Dense(100, activation='relu')(x)
# The Dropout output must be assigned back to `x`; calling the layer without
# keeping its result leaves dropout out of the model graph entirely.
x = Dropout(0.5)(x)
x = Dense(100, activation='relu')(x)
prediction = Dense(26, activation='softmax')(x)


In [None]:
# Wire the VGG input to the new classifier output to form the full model.
model = Model(vgg.input, prediction)

In [None]:
# Print the layer-by-layer architecture with output shapes and parameter counts.
model.summary()


Model: "model_3"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_4 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0   

In [None]:
from tensorflow.keras.callbacks import EarlyStopping

# Stop training once validation loss has failed to improve for 5 epochs in a row.
# NOTE(review): with patience=5 this cannot trigger in a 5-epoch run - confirm
# the intended patience/epochs combination.
earlystop = EarlyStopping(monitor='val_loss', mode='auto', patience=5, verbose=1)
callback = [earlystop]

# RMSprop with default settings, categorical cross-entropy, accuracy metric.
model.compile(
    optimizer=tf.keras.optimizers.RMSprop(),
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)


In [None]:
# Train for up to 5 epochs with early stopping, validating on the test generator.
# `batch_size` is deliberately not passed: Keras documents that it must not be
# specified for generator inputs, which produce their own batches (the
# generator was created with batch_size=128).
r = model.fit(
    training_set,
    validation_data=test_set,
    epochs=5,
    callbacks=callback,
)


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


In [None]:
# Report loss and accuracy of the second model on the test generator.
score = model.evaluate(test_set)
test_loss, test_accuracy = score
print('Test Loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test Loss: 3.0759243965148926
Test accuracy: 0.10234278440475464


In [None]:
# Third model - now I will use only one hidden dense layer plus the output layer.


In [None]:
# Fresh pretrained VGG16 backbone for the third model, with all of its
# layers frozen so only the new head is trained.
vgg = VGG16(
    weights='imagenet',
    include_top=False,
    input_shape=IMAGE_SIZE + [3],
)
for vgg_layer in vgg.layers:
    vgg_layer.trainable = False

In [None]:
# Third model head: a single 50-unit hidden layer followed by the
# 26-class softmax output.
x = Flatten()(vgg.output)
x = Dense(50, activation='relu')(x)
prediction = Dense(26, activation='softmax')(x)

# Build the model for this new head. Without this, the compile/fit/evaluate
# cells that follow would keep operating on the previously built `model`
# (the two-dense-layer network) instead of this architecture.
model = Model(inputs=vgg.input, outputs=prediction)


In [None]:
from tensorflow.keras.callbacks import EarlyStopping

# Stop training once validation loss has failed to improve for 5 epochs in a row.
earlystop = EarlyStopping(monitor='val_loss', mode='auto', patience=5, verbose=1)
callback = [earlystop]

# This run uses Adam (default settings) instead of RMSprop.
model.compile(
    optimizer=tf.keras.optimizers.Adam(),
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)


In [None]:
# Train for up to 8 epochs; each epoch runs through every batch of the
# training generator and validates on every batch of the test generator.
train_steps = len(training_set)
val_steps = len(test_set)
r = model.fit(
    training_set,
    epochs=8,
    steps_per_epoch=train_steps,
    validation_data=test_set,
    validation_steps=val_steps,
    callbacks=callback,
)


Epoch 1/8
Epoch 2/8
Epoch 3/8
Epoch 4/8
Epoch 5/8
Epoch 6/8
Epoch 7/8
Epoch 8/8


In [None]:
# Report loss and accuracy on the test generator.
score = model.evaluate(test_set)
test_loss, test_accuracy = score
print('Test Loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test Loss: 2.034989356994629
Test accuracy: 0.3612823784351349


In [None]:
from tensorflow.keras.callbacks import EarlyStopping

# Stop training once validation loss has failed to improve for 5 epochs in a row.
earlystop = EarlyStopping(monitor='val_loss', mode='auto', patience=5, verbose=1)
callback = [earlystop]

# Recompile the existing `model` with RMSprop.
# NOTE(review): no new Model is built here, so the next fit presumably continues
# from the weights already trained above rather than starting over - confirm
# that this is intended.
model.compile(
    optimizer=tf.keras.optimizers.RMSprop(),
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [None]:
# Train for up to 8 epochs with early stopping; step counts are left at
# their defaults.
r = model.fit(
    training_set,
    epochs=8,
    validation_data=test_set,
    callbacks=callback,
)

Epoch 1/8
Epoch 2/8
Epoch 3/8
Epoch 4/8
Epoch 5/8
Epoch 6/8
Epoch 00006: early stopping


In [None]:
# This model fitted best compared to the model that predicts directly from the VGG features;
# it also worked better than the one with two dense layers.

In [None]:
# It's better to use simple models than complex models with more features.

In [None]:
# Here we explored the power of transfer learning: by using existing features from VGG
# and adding only one dense layer besides the output layer, we saved a lot of compute power and time
# and achieved great accuracy.

In [None]:
# Fresh pretrained VGG16 backbone for the truncated-network experiment.
vgg = VGG16(
    weights='imagenet',
    include_top=False,
    input_shape=IMAGE_SIZE + [3],
)


In [None]:
# Keep the pretrained VGG weights fixed during training.
for vgg_layer in vgg.layers:
    vgg_layer.trainable = False

In [None]:

# Cut the backbone at 'block4_pool' and build the classifier head on that
# intermediate output instead of on the final VGG output.
last_layer = vgg.get_layer('block4_pool')
print('last layer output shape: ', last_layer.output_shape)
last_output = last_layer.output

# Head: Flatten -> Dense(100) -> Dropout(0.5) -> softmax over 26 classes.
x = Flatten()(last_output)
x = Dense(100, activation='relu')(x)
# The Dropout output must be assigned back to `x`; calling the layer without
# keeping its result leaves dropout out of the model graph entirely.
x = Dropout(0.5)(x)
prediction = Dense(26, activation='softmax')(x)


last layer output shape:  (None, 14, 14, 512)


In [None]:
from tensorflow.keras.callbacks import EarlyStopping

# Build the truncated-VGG model and show its architecture.
model = Model(vgg.input, prediction)
model.summary()

# RMSprop with default settings, categorical cross-entropy, accuracy metric.
model.compile(
    optimizer=tf.keras.optimizers.RMSprop(),
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

# Stop training once validation loss has failed to improve for 5 epochs in a row.
earlystop = EarlyStopping(monitor='val_loss', mode='auto', patience=5, verbose=1)
callback = [earlystop]

Model: "model_4"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_6 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 block1_conv1 (Conv2D)       (None, 224, 224, 64)      1792      
                                                                 
 block1_conv2 (Conv2D)       (None, 224, 224, 64)      36928     
                                                                 
 block1_pool (MaxPooling2D)  (None, 112, 112, 64)      0         
                                                                 
 block2_conv1 (Conv2D)       (None, 112, 112, 128)     73856     
                                                                 
 block2_conv2 (Conv2D)       (None, 112, 112, 128)     147584    
                                                                 
 block2_pool (MaxPooling2D)  (None, 56, 56, 128)       0   

In [None]:
# Train for up to 5 epochs with early stopping, validating on the test generator.
# `batch_size` is deliberately not passed: Keras documents that it must not be
# specified for generator inputs, which produce their own batches (the
# generator was created with batch_size=128).
r = model.fit(
    training_set,
    validation_data=test_set,
    epochs=5,
    callbacks=callback,
)


Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


In [None]:
# We can see that ImageNet is not a great fit for our dataset, even after training and removing some layers.