In [1]:
import tensorflow as tf
from keras import layers, Model
from tensorflow.keras.preprocessing.image import ImageDataGenerator

In [2]:
# Define custom VGG16 model
def custom_vgg16(input_shape=(224, 224, 3), num_classes=2):
    input_tensor = layers.Input(shape=input_shape)

    # Block 1
    x = layers.Conv2D(64, (3, 3), activation='relu', padding='same')(input_tensor)
    x = layers.Conv2D(64, (3, 3), activation='relu', padding='same')(x)
    x = layers.MaxPooling2D((2, 2), strides=(2, 2))(x)

    # Block 2
    x = layers.Conv2D(128, (3, 3), activation='relu', padding='same')(x)
    x = layers.Conv2D(128, (3, 3), activation='relu', padding='same')(x)
    x = layers.MaxPooling2D((2, 2), strides=(2, 2))(x)

    # Block 3
    x = layers.Conv2D(256, (3, 3), activation='relu', padding='same')(x)
    x = layers.Conv2D(256, (3, 3), activation='relu', padding='same')(x)
    x = layers.Conv2D(256, (3, 3), activation='relu', padding='same')(x)
    x = layers.MaxPooling2D((2, 2), strides=(2, 2))(x)

    # Block 4
    x = layers.Conv2D(512, (3, 3), activation='relu', padding='same')(x)
    x = layers.Conv2D(512, (3, 3), activation='relu', padding='same')(x)
    x = layers.Conv2D(512, (3, 3), activation='relu', padding='same')(x)
    x = layers.MaxPooling2D((2, 2), strides=(2, 2))(x)

    # Block 5
    x = layers.Conv2D(512, (3, 3), activation='relu', padding='same')(x)
    x = layers.Conv2D(512, (3, 3), activation='relu', padding='same')(x)
    x = layers.Conv2D(512, (3, 3), activation='relu', padding='same')(x)
    x = layers.MaxPooling2D((2, 2), strides=(2, 2))(x)

    # Flatten
    x = layers.Flatten()(x)

    # Fully connected layers
    x = layers.Dense(4096, activation='relu')(x)
    x = layers.Dense(4096, activation='relu')(x)
    output = layers.Dense(num_classes, activation='softmax')(x)

    # Create model
    model = Model(input_tensor, output, name='custom_vgg16')
    return model

In [3]:
# Instantiate the custom VGG16 model
model = custom_vgg16(num_classes = 5)

# Compile the model
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

# Display model architecture
# model.summary()

# Paths to your train and test directories
train_dir = '/Users/vishnuvardhanvankayalapati/Desktop/FinalProject_Bird_Image_Classification/Project_Data_Set/train'
test_dir = '/Users/vishnuvardhanvankayalapati/Desktop/FinalProject_Bird_Image_Classification/Project_Data_Set/test'

# Image dimensions
img_height, img_width = 224, 224
batch_size = 32

# Create data generators
train_datagen = ImageDataGenerator(
    rescale=1./255)

test_datagen = ImageDataGenerator(rescale=1./255)

train_generator = train_datagen.flow_from_directory(
    train_dir,
    target_size=(img_height, img_width),
    batch_size=batch_size,
    class_mode='categorical')

validation_generator = test_datagen.flow_from_directory(
    test_dir,
    target_size=(img_height, img_width),
    batch_size=batch_size,
    class_mode='categorical')


Found 200 images belonging to 5 classes.
Found 88 images belonging to 5 classes.


In [4]:
# Train the model
history = model.fit(train_generator,
                    steps_per_epoch=len(train_generator),
                    epochs=5,
                    validation_data=validation_generator,
                    validation_steps=len(validation_generator))

Epoch 1/5


  self._warn_if_super_not_called()


[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m188s[0m 27s/step - accuracy: 0.1512 - loss: 2.1143 - val_accuracy: 0.2045 - val_loss: 1.6112
Epoch 2/5
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 12ms/step - accuracy: 0.0000e+00 - loss: 0.0000e+00 - val_accuracy: 0.0000e+00 - val_loss: 0.0000e+00
Epoch 3/5


2024-03-15 10:54:25.947121: W tensorflow/core/framework/local_rendezvous.cc:404] Local rendezvous is aborting with status: OUT_OF_RANGE: End of sequence
	 [[{{node IteratorGetNext}}]]
  self.gen.throw(typ, value, traceback)
2024-03-15 10:54:26.014310: W tensorflow/core/framework/local_rendezvous.cc:404] Local rendezvous is aborting with status: OUT_OF_RANGE: End of sequence
	 [[{{node IteratorGetNext}}]]


[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m174s[0m 25s/step - accuracy: 0.2137 - loss: 1.6155 - val_accuracy: 0.2045 - val_loss: 1.6098
Epoch 4/5
[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 3ms/step - accuracy: 0.0000e+00 - loss: 0.0000e+00 - val_accuracy: 0.0000e+00 - val_loss: 0.0000e+00
Epoch 5/5


2024-03-15 10:57:19.813455: W tensorflow/core/framework/local_rendezvous.cc:404] Local rendezvous is aborting with status: OUT_OF_RANGE: End of sequence
	 [[{{node IteratorGetNext}}]]
2024-03-15 10:57:19.819833: W tensorflow/core/framework/local_rendezvous.cc:404] Local rendezvous is aborting with status: OUT_OF_RANGE: End of sequence
	 [[{{node IteratorGetNext}}]]


[1m7/7[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m167s[0m 24s/step - accuracy: 0.2018 - loss: 1.6089 - val_accuracy: 0.2045 - val_loss: 1.6099


In [5]:
# Extract training and validation accuracy from history
training_accuracy = (history.history['accuracy'][-1] * 100)
validation_accuracy = (history.history['val_accuracy'][-1] * 100)

print(f"Training Accuracy: {training_accuracy}")
print(f"Validation Accuracy: {validation_accuracy}")

Training Accuracy: 20.499999821186066
Validation Accuracy: 20.454545319080353


In [19]:
# import numpy as np
# from keras.preprocessing import image

# # Load the image
# img_path = '/Users/vishnuvardhanvankayalapati/Desktop/FinalProject_Bird_Image_Classification/Project_Data_Set/test/Red_faced_Cormorant/Red_Faced_Cormorant_0007_796280.jpg'
# img = image.load_img(img_path, target_size=(img_height, img_width))

# # Preprocess the image
# img_array = image.img_to_array(img)
# img_array = np.expand_dims(img_array, axis=0)
# img_array /= 255.  # Normalize the image

# # Make predictions
# predictions = model.predict(img_array)

# # Get the predicted class
# predicted_class = np.argmax(predictions[0])

# # If you have ground truth labels, compare with the ground truth to compute accuracy
# ground_truth =[0,1,2,3,4]# Provide the ground truth label here
# accuracy = (predicted_class == ground_truth)

# # Print the predicted class and probability
# print("Predicted Class:", predicted_class)
# print("Predicted Probability:", predictions[0][predicted_class])

# # If you have ground truth labels, print accuracy
# print("Prediction Accuracy:", accuracy)


[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 165ms/step
Predicted Class: 3
Predicted Probability: 0.22075781
Prediction Accuracy: [False False False  True False]
