# Welcome to the Pneumonia Image Classifier
## In this notebook we're going to train a Neural Network to detect pneumonia in images.

### Let's get started by importing our libraries

In [1]:
from __future__ import print_function
import keras

from keras.preprocessing.image import ImageDataGenerator, load_img
from keras.models import Sequential
from keras.layers import Dense, Dropout, Flatten, Activation
from keras.layers import Conv2D, MaxPooling2D
from keras.optimizers import SGD
from keras.datasets import mnist
from keras import backend as K
import numpy as np
import math


  from ._conv import register_converters as _register_converters
Using TensorFlow backend.


### Let's create a reference to our data directories

In [2]:
train_data_dir = './input/train'
test_data_dir = './input/test'
val_data_dir = './input/val'

### Define some variables that we're going to use in training and testing

In [3]:
nb_train_samples = 5217
nb_validation_samples = 17
epochs = 20
batch_size = 16

### Shape our input

In [4]:
# dimensions of our images.
img_width, img_height = 150, 150

input_shape = (img_width, img_height, 3)
if K.image_data_format() == 'channels_first':
    input_shape = (3, img_width, img_height)

### Given the size of our dataset, we'll need to use generators in order to feed the data to our model bit-by-bit
### Let's create our generators

In [5]:
train_gen = ImageDataGenerator(
    rescale=1. / 255,
    shear_range=0.2,
    zoom_range=0.2,
    horizontal_flip=True)

In [6]:
test_gen = ImageDataGenerator(rescale=1. / 255)

In [7]:
train_generator = train_gen.flow_from_directory(
    train_data_dir,
    target_size=(img_width, img_height),
    batch_size=batch_size,
    class_mode='binary')

Found 5216 images belonging to 2 classes.


In [8]:
test_generator = test_gen.flow_from_directory(
    test_data_dir,
    target_size=(img_width, img_height),
    batch_size=batch_size,
    class_mode='binary')

Found 624 images belonging to 2 classes.


In [9]:
validation_generator = test_gen.flow_from_directory(
    val_data_dir,
    target_size=(img_width, img_height),
    batch_size=batch_size,
    class_mode='binary')

Found 16 images belonging to 2 classes.


### Now let's initialize our model

In [10]:
model = Sequential()
model.add(Conv2D(64, (3, 3), input_shape=input_shape))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))

model.add(Conv2D(48, (3, 3)))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))

model.add(Conv2D(32, (3, 3)))
model.add(Activation('relu'))
model.add(MaxPooling2D(pool_size=(2, 2)))

model.add(Flatten())
model.add(Dense(32))
model.add(Activation('relu'))
model.add(Dropout(0.5))
model.add(Dense(1))
model.add(Activation('sigmoid'))

### Compile it

In [11]:
model.compile(loss='binary_crossentropy',
              optimizer='rmsprop',
              metrics=['accuracy'])

### Fit it using our training generator... it's going to take a while

In [12]:
model.fit_generator(
    train_generator,
    steps_per_epoch=nb_train_samples // batch_size,
    epochs=epochs,
    validation_data=validation_generator,
    validation_steps=nb_validation_samples // batch_size)

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


<keras.callbacks.History at 0xb1e6bdba8>

### Now let's evaluate it using our test generator

In [13]:
score = model.evaluate_generator(test_generator, math.ceil(5217 / batch_size), verbose=1)



In [14]:
score

[0.47056583494376264, 0.9030963302752294]