In [None]:
from google.colab import drive

# Attach Google Drive so the dataset archive stored there is readable from the runtime.
drive_mount_point = '/content/drive'
drive.mount(drive_mount_point)


Mounted at /content/drive


In [None]:
!unzip /content/drive/MyDrive/FYP/chest_xray_VGG16_Augmentation>.zip -d /content/extracted_files

In [None]:
import os
import tensorflow as tf
from tensorflow.keras.applications import VGG16
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Flatten, Dense, Dropout
from sklearn.metrics import classification_report, confusion_matrix


In [None]:
# Define dataset paths
base_dir = '/content/extracted_files/chest_xray_VGG16_Augmentation'  # Adjust this path as needed
# Join relative sub-folder names: an absolute second argument would make
# os.path.join discard base_dir, so changing base_dir would have no effect.
train_dir = os.path.join(base_dir, 'train')
test_dir = os.path.join(base_dir, 'test')


In [None]:
# Training-time image generator: rescales pixels to [0, 1] and applies random
# geometric augmentation; 20% of the images are reserved for validation.
augmentation_options = dict(
    rotation_range=30,
    width_shift_range=0.2,
    height_shift_range=0.2,
    shear_range=0.2,
    zoom_range=0.2,
    horizontal_flip=True,
    fill_mode='nearest',
)
train_datagen = ImageDataGenerator(
    rescale=1.0/255,
    validation_split=0.2,  # 20% for validation
    **augmentation_options
)


In [None]:
# Stream the 'training' subset of train_dir in batches of 32 with binary labels.
train_flow_options = {
    'target_size': (224, 224),  # VGG16 input size
    'batch_size': 32,
    'class_mode': 'binary',
    'subset': 'training',
}
train_generator = train_datagen.flow_from_directory(train_dir, **train_flow_options)

Found 4187 images belonging to 2 classes.


In [None]:
# Validation images must not be augmented, otherwise val_loss/val_accuracy are
# measured on randomly distorted inputs. Use a rescale-only generator here.
# validation_split must match the value given to train_datagen (0.2) so that
# both generators partition train_dir at the same boundary.
val_datagen = ImageDataGenerator(rescale=1.0/255, validation_split=0.2)

validation_generator = val_datagen.flow_from_directory(
    train_dir,
    target_size=(224, 224),
    batch_size=32,
    class_mode='binary',
    subset='validation'
)


Found 1045 images belonging to 2 classes.


In [None]:
# Test-time generator: rescaling only, no augmentation.
test_datagen = ImageDataGenerator(rescale=1.0/255)

# shuffle=False keeps batch order aligned with test_generator.classes,
# which the later confusion-matrix / report cells compare against.
test_flow_options = {
    'target_size': (224, 224),
    'batch_size': 32,
    'class_mode': 'binary',
    'shuffle': False,
}
test_generator = test_datagen.flow_from_directory(test_dir, **test_flow_options)

Found 624 images belonging to 2 classes.


In [None]:
# Convolutional part of VGG16 with ImageNet weights; the original
# classification head is dropped (include_top=False).
vgg_base = VGG16(
    include_top=False,
    weights='imagenet',
    input_shape=(224, 224, 3),
)


Downloading data from https://storage.googleapis.com/tensorflow/keras-applications/vgg16/vgg16_weights_tf_dim_ordering_tf_kernels_notop.h5
[1m58889256/58889256[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 0us/step


In [None]:
# Freeze the convolutional base.
# Setting trainable on the base model propagates to every layer inside it,
# so only the new classification head is updated during training.
vgg_base.trainable = False


In [None]:
# Assemble the classifier: VGG16 feature extractor followed by a small dense head.
model = Sequential()
model.add(vgg_base)
model.add(Flatten())
model.add(Dense(128, activation='relu'))
model.add(Dropout(0.5))
model.add(Dense(1, activation='sigmoid'))  # single sigmoid unit -> binary classification


In [None]:
# Configure training (Adam optimizer, binary cross-entropy loss, accuracy metric)
# and print the layer/parameter summary.
model.compile(
    loss='binary_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)
model.summary()

In [None]:
# Train the model, evaluating on the validation generator after each epoch.
# The returned History object is kept in `history`.
fit_options = {
    'validation_data': validation_generator,
    'epochs': 10,  # Adjust epochs as needed
    'verbose': 1,
}
history = model.fit(train_generator, **fit_options)


Epoch 1/10


  self._warn_if_super_not_called()


[1m131/131[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3159s[0m 24s/step - accuracy: 0.7916 - loss: 0.5959 - val_accuracy: 0.9100 - val_loss: 0.1913
Epoch 2/10
[1m131/131[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3212s[0m 25s/step - accuracy: 0.9030 - loss: 0.2413 - val_accuracy: 0.9368 - val_loss: 0.1727
Epoch 3/10
[1m131/131[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3202s[0m 24s/step - accuracy: 0.9066 - loss: 0.2147 - val_accuracy: 0.9378 - val_loss: 0.1572
Epoch 4/10
[1m131/131[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3141s[0m 24s/step - accuracy: 0.9172 - loss: 0.2049 - val_accuracy: 0.9435 - val_loss: 0.1539
Epoch 5/10
[1m131/131[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3126s[0m 24s/step - accuracy: 0.9188 - loss: 0.2030 - val_accuracy: 0.9378 - val_loss: 0.1493
Epoch 6/10
[1m131/131[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3113s[0m 24s/step - accuracy: 0.9191 - loss: 0.1906 - val_accuracy: 0.9206 - val_loss: 0.1822
Epoch 7/10
[1m131/13

In [None]:
# Score the trained model on the held-out test generator.
# evaluate() yields the loss followed by the compiled metric (accuracy).
test_metrics = model.evaluate(test_generator)
test_loss, test_accuracy = test_metrics
print(f"Test Accuracy: {test_accuracy * 100:.2f}%")


[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m361s[0m 18s/step - accuracy: 0.8839 - loss: 0.3397
Test Accuracy: 90.38%


In [None]:
# Turn the sigmoid outputs for the test set into hard 0/1 labels
# by thresholding at 0.5.
test_probabilities = model.predict(test_generator)
predictions = (test_probabilities > 0.5).astype("int32")


[1m20/20[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m360s[0m 18s/step


In [None]:
# Confusion matrix of true test labels (rows) against predicted labels (columns).
print("Confusion Matrix")
test_confusion = confusion_matrix(test_generator.classes, predictions)
print(test_confusion)


Confusion Matrix
[[196  38]
 [ 22 368]]


In [None]:
# Per-class precision / recall / F1 on the test set, labelled with the
# class names taken from the generator's class_indices mapping.
print("Classification Report")
class_names = test_generator.class_indices.keys()
report_text = classification_report(
    test_generator.classes,
    predictions,
    target_names=class_names,
)
print(report_text)


Classification Report
              precision    recall  f1-score   support

      NORMAL       0.90      0.84      0.87       234
   PNEUMONIA       0.91      0.94      0.92       390

    accuracy                           0.90       624
   macro avg       0.90      0.89      0.90       624
weighted avg       0.90      0.90      0.90       624

