In [1]:
import os
import numpy as np
import pandas as pd
import tensorflow as tf
from tensorflow.keras.applications import Xception
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, GlobalAveragePooling2D
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from sklearn.model_selection import StratifiedKFold
from tensorflow.keras.callbacks import ModelCheckpoint
from sklearn.metrics import classification_report, confusion_matrix



In [2]:
image_path = '/kaggle/input/k-fold-images/images'

In [3]:
input_shape = (299, 299) 
batch_size = 32
num_epochs = 31
num_folds = 4 

In [4]:
data_gen = ImageDataGenerator(
                    rescale=1./255,
                    width_shift_range=0.2,
                    height_shift_range=0.2,
                    zoom_range=0.2,
                    horizontal_flip=True,
                    vertical_flip=False,
                    rotation_range=10,  
                    shear_range=0.2,
                    brightness_range=[0.8, 1.2])

In [5]:
classes = os.listdir(image_path)

all_image_paths = []
all_labels = []

for class_name in classes:
    class_path = os.path.join(image_path, class_name)
    class_images = os.listdir(class_path)
    class_image_paths = [os.path.join(class_path, image) for image in class_images]
    all_image_paths.extend(class_image_paths)
    all_labels.extend([class_name] * len(class_image_paths))

all_image_paths = np.array(all_image_paths)
all_labels = np.array(all_labels)

stratified_kfold = StratifiedKFold(n_splits=num_folds, shuffle=True, random_state=42)

In [6]:
len(classes)

5

In [7]:
base_model = Xception(weights='imagenet', include_top=False, input_shape=(*input_shape, 3))
model = Sequential([
    base_model,
    GlobalAveragePooling2D(),
    Dense(256, activation='relu'),
    Dense(len(classes), activation='softmax')
])


Downloading data from https://storage.googleapis.com/tensorflow/keras-applications/xception/xception_weights_tf_dim_ordering_tf_kernels_notop.h5


In [8]:
model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])

In [None]:
for fold, (train_indices, val_indices) in enumerate(stratified_kfold.split(all_image_paths, all_labels)):
    train_data = all_image_paths[train_indices]
    train_labels = all_labels[train_indices]
    val_data = all_image_paths[val_indices]
    val_labels = all_labels[val_indices]
    print("################# Results for fold:-", fold+1, "###################")
    train_generator = data_gen.flow_from_dataframe(
        dataframe=pd.DataFrame({'filepath': train_data, 'class': train_labels}),
        x_col='filepath',
        y_col='class',
        target_size=input_shape,
        batch_size=batch_size,
        class_mode='categorical',
        shuffle=True,
    )

    val_generator = data_gen.flow_from_dataframe(
        dataframe=pd.DataFrame({'filepath': val_data, 'class': val_labels}),
        x_col='filepath',
        y_col='class',
        target_size=input_shape,
        batch_size=batch_size,
        class_mode='categorical',
        shuffle=False,
    )
    

    Checkpoint = ModelCheckpoint("K-Xception.hdf5", monitor="val_accuracy", save_best_only=True, mode="max")
    model.fit(
        train_generator,
        epochs=num_epochs,
        validation_data=val_generator,
        callbacks=[Checkpoint]
    )
    
    new_model=tf.keras.models.load_model("/kaggle/working/K-Xception.hdf5")
    
    predictions = new_model.predict(val_generator)
    predicted_labels = np.argmax(predictions, axis=1)
    true_labels = val_generator.classes

    class_names = list(val_generator.class_indices.keys())
    report = classification_report(true_labels, predicted_labels, target_names=class_names)
    
    print(f"Fold {fold + 1}:")
    print("Classification Report:")
    print(report)

    # Calculate and display the confusion matrix
    confusion_mat = confusion_matrix(true_labels, predicted_labels)
    print("Confusion Matrix:")
    print(confusion_mat)

model.save('xception_model.h5')


################# Results for fold:- 1 ###################
Found 8076 validated image filenames belonging to 5 classes.
Found 2019 validated image filenames belonging to 5 classes.
Epoch 1/31
Epoch 2/31
Epoch 3/31
Epoch 4/31
Epoch 5/31
Epoch 6/31
Epoch 7/31
Epoch 8/31
Epoch 9/31
Epoch 10/31
Epoch 11/31
Epoch 12/31
Epoch 13/31
Epoch 14/31
Epoch 15/31
Epoch 16/31
Epoch 17/31
Epoch 18/31
Epoch 19/31
Epoch 20/31
Epoch 21/31
Epoch 22/31
Epoch 23/31
Epoch 24/31
Epoch 25/31
Epoch 26/31
Epoch 27/31
Epoch 28/31
Epoch 29/31
Epoch 30/31
Epoch 31/31
Fold 1:
Classification Report:
                      precision    recall  f1-score   support

 Bacterial Pneumonia       0.84      0.79      0.81       402
Corona Virus Disease       0.99      0.98      0.99       406
              Normal       0.90      0.99      0.94       403
        Tuberculosis       0.99      1.00      1.00       407
     Viral Pneumonia       0.80      0.77      0.78       401

            accuracy                           0.90