# convolutional neural network (CNN) to classify medical X-ray images and detect pneumonia


### Importing the libraries


In [4]:
import tensorflow as tf
from tensorflow.keras.preprocessing.image import ImageDataGenerator

## Part 1 - Data Preprocessing


In [5]:
TRAINING_SET_DIR = "/Users/sivaram/Developer/SDS/SuperDataScience-Community-Projects/datasets/chest_xray/train"
TEST_SET_DIR = "/Users/sivaram/Developer/SDS/SuperDataScience-Community-Projects/datasets/chest_xray/test"
VALIDATION_SET_DIR = "/Users/sivaram/Developer/SDS/SuperDataScience-Community-Projects/datasets/chest_xray/val"


### Preprocessing the Training set

In [7]:
# Image augmentation gives variety and diversity of training set to avoid overfitting
train_datagen = ImageDataGenerator(rescale = 1./255,
                                   shear_range = 0.2,
                                   zoom_range = 0.2,
                                   horizontal_flip = True)
training_set = train_datagen.flow_from_directory(TRAINING_SET_DIR,
                                                 target_size = (64, 64),
                                                 batch_size = 32,
                                                 class_mode = 'binary')

Found 5216 images belonging to 2 classes.


In [8]:
labels = (training_set.class_indices)
print(labels)

{'NORMAL': 0, 'PNEUMONIA': 1}


### Preprocessing the test set


In [9]:
test_datagen = ImageDataGenerator(rescale = 1./255)
test_set = train_datagen.flow_from_directory(TEST_SET_DIR,
                                                 target_size = (64, 64),
                                                 batch_size = 32,
                                                 class_mode = 'binary')

Found 624 images belonging to 2 classes.


In [10]:
labels = (test_set.class_indices)
print(labels)

{'NORMAL': 0, 'PNEUMONIA': 1}


### Preprocessing the validation set


In [11]:
val_datagen = ImageDataGenerator(rescale = 1./255)
val_set = train_datagen.flow_from_directory(VALIDATION_SET_DIR,
                                                 target_size = (64, 64),
                                                 batch_size = 32,
                                                 class_mode = 'binary')

Found 16 images belonging to 2 classes.


In [12]:
labels = (val_set.class_indices)
print(labels)

{'NORMAL': 0, 'PNEUMONIA': 1}


## Part 2 - Building the CNN


### Initialising the CNN

In [13]:
cnn = tf.keras.models.Sequential()


### Step 1 - Convolution

In [14]:
cnn.add(tf.keras.layers.Conv2D(filters=32, kernel_size=3, activation='relu', input_shape=[64, 64, 3]))


  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


### Step 2 - Pooling

In [15]:
cnn.add(tf.keras.layers.MaxPool2D(pool_size=2, strides=2))


### Adding a second convolutional layer


In [16]:
cnn.add(tf.keras.layers.Conv2D(filters=32, kernel_size=3, activation='relu'))
cnn.add(tf.keras.layers.MaxPool2D(pool_size=2, strides=2))

### Step 3 - Flattening

In [17]:
cnn.add(tf.keras.layers.Flatten())


### Step 4 - Full Connection

In [18]:
cnn.add(tf.keras.layers.Dense(units=128, activation='relu'))


### Step 5 - Output Layer

In [19]:
cnn.add(tf.keras.layers.Dense(units=1, activation='sigmoid'))


## Part 3 - Training the CNN


### Compiling the CNN

In [20]:
cnn.compile(optimizer = 'adam', loss = 'binary_crossentropy', metrics = ['accuracy'])


### Training the CNN on the Training set and evaluating it on the Test set


In [21]:
cnn.fit(x = training_set, validation_data = test_set, epochs = 25)


  self._warn_if_super_not_called()


Epoch 1/25
[1m163/163[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 146ms/step - accuracy: 0.7501 - loss: 0.5198

  self._warn_if_super_not_called()


[1m163/163[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m27s[0m 163ms/step - accuracy: 0.7506 - loss: 0.5191 - val_accuracy: 0.7548 - val_loss: 0.5254
Epoch 2/25
[1m163/163[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m28s[0m 170ms/step - accuracy: 0.9021 - loss: 0.2329 - val_accuracy: 0.8221 - val_loss: 0.4193
Epoch 3/25
[1m163/163[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m29s[0m 178ms/step - accuracy: 0.8995 - loss: 0.2330 - val_accuracy: 0.8237 - val_loss: 0.3983
Epoch 4/25
[1m163/163[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m29s[0m 178ms/step - accuracy: 0.9232 - loss: 0.1955 - val_accuracy: 0.7404 - val_loss: 0.8041
Epoch 5/25
[1m163/163[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m30s[0m 184ms/step - accuracy: 0.9245 - loss: 0.1848 - val_accuracy: 0.8478 - val_loss: 0.3675
Epoch 6/25
[1m163/163[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m30s[0m 185ms/step - accuracy: 0.9195 - loss: 0.1878 - val_accuracy: 0.8542 - val_loss: 0.3498
Epoch 7/25
[1m163/16

<keras.src.callbacks.history.History at 0x1486820f0>

In [23]:
cnn.save('pneumonia_detection-CNN.keras')

## Part 4 - Making a single prediction


In [36]:
import numpy as np
from tensorflow.keras.preprocessing import image

test_image = image.load_img(
    VALIDATION_SET_DIR + "/PNEUMONIA/person1946_bacteria_4874.jpeg",
    target_size=(64, 64))
test_image = image.img_to_array(test_image)
test_image = np.expand_dims(test_image, axis=0)
result = cnn.predict(test_image)
training_set.class_indices
if result[0][0] == 1:
    prediction = 'PNEUMONIA'
else:
    prediction = 'NORMAL'

[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 15ms/step


In [37]:
print(prediction)

PNEUMONIA


In [29]:
CATEGORIES = ["NORMAL", "PNEUMONIA"]
from tensorflow.keras.preprocessing import image
import numpy as np

def prepare(filepath):
    test_image = image.load_img(filepath, target_size=(64, 64))
    test_image = image.img_to_array(test_image)
    test_image = np.expand_dims(test_image, axis=0)
    return  test_image


model = tf.keras.models.load_model('pneumonia_detection-CNN.keras')

prediction = model.predict(prepare(TEST_SET_DIR + "/NORMAL/IM-0015-0001.jpeg"))
print(prediction)  # will be a list in a list.
print(CATEGORIES[int(prediction[0][0])])

[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 30ms/step
[[0.]]
NORMAL
