In [1]:
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.losses import SparseCategoricalCrossentropy
from tensorflow.keras.applications import VGG16
from keras.applications.vgg16 import preprocess_input
from tensorflow.keras.layers import Activation, Dense, Dropout, Flatten, BatchNormalization, Conv2D, MaxPooling2D, Lambda, Input, AveragePooling2D
from tensorflow.keras.models import Sequential, Model
from tensorflow.keras.layers import Input
from tensorflow.keras import layers
from tensorflow.keras.utils import to_categorical
from sklearn.preprocessing import LabelBinarizer
from sklearn.model_selection import train_test_split
from tensorflow.keras.preprocessing import image
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.optimizers import SGD
from tensorflow.keras.preprocessing import image
from tensorflow.keras import backend as K
import tensorflow as tf 
import matplotlib.pyplot as plt 
import numpy as np 
import pandas as pd
import random
#import cv2
import os

In [2]:
covid_dir=os.path.join("Database/COVID19")
norm_dir=os.path.join("Database/NORMAL")
pneu_dir=os.path.join("Database/Viral_Pneumonia")


print('total Covid images:', len(os.listdir(covid_dir)))
print('total Normal images:', len(os.listdir(norm_dir)))
print('total Viral_Pneumonia:', len(os.listdir(pneu_dir)))


total Covid images: 1327
total Normal images: 1341
total Viral_Pneumonia: 1463


In [3]:
# Settings
batch_size = 128
img_height, img_width = 200,200
data_dir = "Database/"

# Rescale images 
datagen= ImageDataGenerator(rescale=1/255,validation_split=.3,rotation_range=20,
                           shear_range=.2,width_shift_range=0.1,height_shift_range=0.1,zoom_range=0.2,
                           horizontal_flip=True)

# Flow training images in batches of batch_size using train_data 
train_generator= datagen.flow_from_directory(
                data_dir,
                target_size=(img_width,img_height),
                batch_size=batch_size,
                subset="training",
                class_mode="categorical", 
                classes= ["COVID19", "NORMAL","Viral_Pneumonia"],
                shuffle=True, 
                seed=30)


datagen2=ImageDataGenerator(rescale=1/255,validation_split=.3)

test_generator=datagen2.flow_from_directory(
                data_dir,
                target_size=(img_width,img_height),
                batch_size=batch_size,
                classes= ["COVID19", "NORMAL","Viral_Pneumonia"],
                class_mode="categorical", 
                subset="validation", 
                shuffle=True, 
                seed=30)

## For evaluation
eval_train_generator= datagen.flow_from_directory(
                data_dir,
                target_size=(img_width,img_height),
                batch_size=batch_size,
                subset="training",
                class_mode="categorical", 
                classes= ["COVID19", "NORMAL","Viral_Pneumonia"],
                shuffle=False, 
                seed=30)

eval_test_generator=datagen2.flow_from_directory(
                data_dir,
                target_size=(img_width,img_height),
                batch_size=batch_size,
                classes= ["COVID19", "NORMAL","Viral_Pneumonia"],
                class_mode="categorical", 
                subset="validation", 
                shuffle=False, 
                seed=30)

Found 2893 images belonging to 3 classes.
Found 1238 images belonging to 3 classes.
Found 2893 images belonging to 3 classes.
Found 1238 images belonging to 3 classes.


In [4]:
classifier=VGG16(weights="imagenet", include_top=False, input_shape=(img_height,img_width,3))

for layer in classifier.layers:
    layer.trainable=False

VGG16_model = tf.keras.Sequential([

classifier,
MaxPooling2D(),
Dense(128, activation='relu'),
Flatten(),
Dense(3, activation='softmax')
])

In [5]:
VGG16_model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
vgg16 (Functional)           (None, 6, 6, 512)         14714688  
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 3, 3, 512)         0         
_________________________________________________________________
dense (Dense)                (None, 3, 3, 128)         65664     
_________________________________________________________________
flatten (Flatten)            (None, 1152)              0         
_________________________________________________________________
dense_1 (Dense)              (None, 3)                 3459      
Total params: 14,783,811
Trainable params: 69,123
Non-trainable params: 14,714,688
_________________________________________________________________


In [6]:
VGG16_model.compile(
      optimizer='adam',
      loss=tf.losses.CategoricalCrossentropy(from_logits=True),
      metrics=['accuracy']
      )
VGG16_model_history = VGG16_model.fit(
      train_generator,
      validation_data=test_generator,
      epochs=50,
      verbose=1
      )

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


In [None]:
#Plot Model
plt.plot(VGG16_model2_history.history['accuracy'])
plt.plot(VGG16_model2_history.history['val_accuracy'])
plt.title('VGG16 model 2 accuracy')
plt.ylabel('accuracy')
plt.xlabel('epoch')
plt.legend(['train', 'test'], loc='upper left')
plt.show()

In [None]:
VGG16_model_history_df = pd.DataFrame(VGG16_model2_history.history) 
VGG16_model_history_df.to_csv('VGG16_model.csv')

tf.keras.utils.plot_model(
    VGG16_model2, to_file='VGG16_model.png', show_shapes=False,
    show_layer_names=True, rankdir='TB', expand_nested=False, dpi=96
)

VGG16_model2.save('VGG16_model.h5')

In [7]:
Y_pred = VGG16_model.predict_generator(test_generatorgenerator_ds, 1238 // batch_size+1)
y_pred = np.argmax(Y_pred, axis=1)

print('VGG16_model Confusion Matrix')
conf_matrix = pd.DataFrame(
    confusion_matrix(test_ds.classes, y_pred), 
    index=['true: COVID19', 'true: NORMAL','true: Viral_Pneumonia'], 
    columns=['pred: COVID19', 'pred: NORMAL','pred: Viral_Pneumonia']
)



conf_matrix.to_csv("VGG16_model/confusion_matrix.csv")
print(conf_matrix)
print('\n')
print('Classification Report')
target_names = list(test_ds.class_indices.keys())
print(classification_report(test_ds.classes, y_pred, target_names=target_names))

NameError: name 'test_ds' is not defined

In [11]:
# Test Loss/ Test Accuracy
test_loss, test_acc= VGG16_model.evaluate(test_generator)
print("\n Test Accuracy:", test_acc)
print("\n Test Loss:", test_loss)0


 Test Accuracy: 0.8473343849182129

 Test Loss: 0.6990122199058533
