In [1]:
# This demo draws heavily from the handwritten digit example in
# Chapter 2 of Francois Chollet's "Deep Learning with Python" book.
# I've added a simpler single-layer example first before moving to
# the 2-layer example. -George Chen (CMU Fall 2017)

%matplotlib inline
import matplotlib.pyplot as plt
import numpy as np

from tensorflow.python import keras
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense

(train_images, train_labels), (test_images, test_labels) = mnist.load_data()

flattened_train_images = train_images.reshape(len(train_images), -1)  # flattens out each training image
flattened_train_images = flattened_train_images.astype(np.float32) / 255  # rescale to be between 0 and 1
flattened_test_images = test_images.reshape(len(test_images), -1)  # flattens out each test image
flattened_test_images = flattened_test_images.astype(np.float32) / 255  # rescale to be between 0 and 1

from keras.utils import to_categorical
train_labels_categorical = to_categorical(train_labels)
test_labels_categorical = to_categorical(test_labels)

Using TensorFlow backend.


In [2]:
# Integer class label of the first training image, as loaded from MNIST
train_labels[0]

5

In [3]:
# The same first label after to_categorical: a one-hot float vector
train_labels_categorical[0]

array([0., 0., 0., 0., 0., 1., 0., 0., 0., 0.], dtype=float32)

In [4]:
# Shallowest possible network: a single dense softmax layer that maps the
# 784 flattened inputs directly to 10 output units.
# Sequential is Keras's container for a model that is one straight sequence
# of layers; it accepts that sequence as a list.
single_layer_model = Sequential([
    Dense(10, activation='softmax', input_shape=(784,)),
])
single_layer_model.summary()

AttributeError: module 'tensorflow' has no attribute 'get_default_graph'

In [None]:
# Configure training: Adam optimizer, cross-entropy loss against the one-hot
# labels, and accuracy reported as an additional metric.
single_layer_model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

In [None]:
# Train the single-layer model for 5 epochs in mini-batches of 128,
# with validation_split=0.2 reserving a fraction of the training data for validation.
single_layer_model.fit(
    x=flattened_train_images,
    y=train_labels_categorical,
    batch_size=128,
    epochs=5,
    validation_split=0.2,
)

In [None]:
# Two-layer model: a 512-unit ReLU hidden layer on the 784 flattened inputs,
# followed by a 10-unit softmax output layer.
# Sequential is Keras's container for a model that is one straight sequence
# of layers; it accepts that sequence as a list.
two_layer_model = Sequential([
    Dense(512, activation='relu', input_shape=(784,)),
    Dense(10, activation='softmax'),
])
# Same training configuration as the single-layer model.
two_layer_model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)
two_layer_model.summary()

In [None]:
# Train the two-layer model for 5 epochs in mini-batches of 128,
# with validation_split=0.2 reserving a fraction of the training data for validation.
two_layer_model.fit(
    x=flattened_train_images,
    y=train_labels_categorical,
    batch_size=128,
    epochs=5,
    validation_split=0.2,
)

## Finally, evaluate both models on the test data

In [None]:
# Score the single-layer model on the held-out test set; evaluate() returns
# the loss followed by the accuracy metric requested at compile time.
test_loss, test_acc = single_layer_model.evaluate(
    x=flattened_test_images,
    y=test_labels_categorical,
)
print('Test accuracy:', test_acc)

In [None]:
# Score the two-layer model on the held-out test set; evaluate() returns
# the loss followed by the accuracy metric requested at compile time.
test_loss, test_acc = two_layer_model.evaluate(
    x=flattened_test_images,
    y=test_labels_categorical,
)
print('Test accuracy:', test_acc)