In [None]:
%matplotlib inline
import numpy as np
np.random.seed(3) # seed NumPy's global random generator for reproducibility

from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten
from keras.layers import Convolution2D, MaxPooling2D
from keras import utils
from keras.datasets import mnist # the "hello world" data set for deep learning

In [None]:
# Plotting imports used by this cell and by the later preview cell
import matplotlib as mpl
from matplotlib import pyplot as plt

# Fetch MNIST, already split into (images, labels) pairs for train and test
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Report the layout of the training images, then preview one sample digit
print(X_train.shape)
plt.imshow(X_train[11])

In [None]:
# Give every 28x28 image an explicit trailing channel axis and switch to
# float32 so the pixel values can be rescaled in the next cell.
X_train = X_train.reshape(-1, 28, 28, 1).astype('float32')
X_test = X_test.reshape(-1, 28, 28, 1).astype('float32')

# Confirm the new layout: (samples, height, width, channels)
print(X_train.shape)


In [None]:
# Normalize pixel values (experiment with the scaling!)
# NOTE: `/=` rescales the arrays in place, so re-running this cell without
# first re-running the reshape/astype cell divides the data a second time.

# Scale to the range 0 to 1 (assumes raw pixel values span 0-255 — confirm)
X_train /= 255
X_test /= 255

# Alternative: scale to the range -1 to 1 (use INSTEAD of the block above).
# Written as a plain assignment on purpose: `X /= 127.5 - 1` would divide by
# 126.5, because the right-hand side is evaluated before the division.
#X_train = X_train / 127.5 - 1
#X_test = X_test / 127.5 - 1

In [None]:
# One-hot encode the labels
# -----------------------------------------------------------------------------
# Each integer class label becomes a 10-element indicator row, matching the
# 10-unit softmax output and the categorical cross-entropy loss.
Y_train = utils.to_categorical(y_train, num_classes=10)
Y_test = utils.to_categorical(y_test, num_classes=10)

In [None]:
# Small CNN for 28x28 single-channel images, declared as one ordered layer
# list: two convolution + max-pooling stages followed by a dense classifier.
model = Sequential([
    # Feature extractor
    Convolution2D(filters=32, kernel_size=(3, 3), activation='relu',
                  input_shape=(28, 28, 1)),
    MaxPooling2D(pool_size=(2, 2)),
    Convolution2D(filters=32, kernel_size=(3, 3), activation='relu'),
    MaxPooling2D(pool_size=(2, 2)),
    Dropout(0.25),

    # Classifier head
    Flatten(),
    Dense(128, activation='relu'),
    Dropout(0.5),
    Dense(10, activation='softmax'),  # one probability per digit class
])

# Configure training: Adam optimizer, cross-entropy on one-hot targets,
# and accuracy reported alongside the loss.
model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [None]:
# Print a layer-by-layer overview of the compiled model as a sanity check
# before training.
model.summary()

In [None]:
# Use only part of the training data to keep training time short for the
# lab session (TP).
number_of_training_samples = 4000

# Slice from the start of the arrays: Python indexing is 0-based, so
# `[:n]` yields exactly `n` samples. (A `[1:n]` slice would silently drop
# sample 0 and return only n - 1 samples.)
X_train_small = X_train[:number_of_training_samples]
Y_train_small = Y_train[:number_of_training_samples]

In [None]:
# Fit the network on the reduced training subset
model.fit(
    x=X_train_small,
    y=Y_train_small,
    batch_size=32,
    epochs=10,
    verbose=1,
)

In [None]:
# Measure performance on the held-out test set. With the compile settings
# used above, `score` holds the loss followed by the accuracy metric.
score = model.evaluate(x=X_test, y=Y_test, verbose=1)
print(score)

In [None]:
# First of five consecutive test images to inspect (reused by the next cell)
index = 888

# Collapse the five (28, 28, 1) images into one tall 2-D array of 28-pixel
# rows so they are drawn stacked vertically in a single picture.
plt.imshow(X_test[index:index + 5].reshape(-1, 28))

In [None]:
# Predicted digit for each of the five previewed images: the class with the
# highest softmax probability in every output row.
model.predict(X_test[index:index + 5]).argmax(axis=1)