In [1]:
import numpy
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.utils import np_utils

Using Theano backend.


In [2]:
# Seed NumPy's global random number generator with a fixed value.
seed = 7
numpy.random.seed(seed)

# MNIST is returned as (train images, train labels), (test images, test labels).
(X_train, y_train), (X_test, y_test) = mnist.load_data()

# Collapse every 2-D image into one row vector. num_pixels is the product of
# the two image dimensions and is reused later as the network's input size.
num_pixels = X_train.shape[1] * X_train.shape[2]
X_train = X_train.reshape((len(X_train), num_pixels)).astype('float32')
X_test = X_test.reshape((len(X_test), num_pixels)).astype('float32')

In [3]:
# Rescale pixel intensities from the 0-255 range down to 0-1.
# NOTE: the assignments in this cell overwrite their own inputs, so the cell is
# not idempotent -- running it a second time rescales / re-encodes the data again.
X_train, X_test = X_train / 255, X_test / 255

# Convert the integer class labels into one-hot rows; the column count of the
# encoded matrix is the number of classes.
y_train, y_test = np_utils.to_categorical(y_train), np_utils.to_categorical(y_test)
num_classes = y_test.shape[1]

In [4]:
# define baseline model
def baseline_model():
    """Return a compiled fully connected classifier.

    The network is one ReLU hidden layer with ``num_pixels`` units fed by
    ``num_pixels`` inputs, followed by a softmax layer with ``num_classes``
    units. Both sizes are read from the notebook's module-level variables,
    so the data-preparation cells must have been run first.
    """
    hidden_layer = Dense(num_pixels, input_dim=num_pixels, init='normal', activation='relu')
    output_layer = Dense(num_classes, init='normal', activation='softmax')
    # Passing the layers to the constructor adds them in list order.
    model = Sequential([hidden_layer, output_layer])
    # Categorical cross-entropy loss, Adam optimizer, accuracy as the reported metric.
    model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

In [13]:
# Instantiate the fully connected baseline network.
model = baseline_model()
# Train for 10 epochs in batches of 200, scoring the test split after each
# epoch; verbose=2 logs one summary line per epoch.
model.fit(
    X_train,
    y_train,
    validation_data=(X_test, y_test),
    nb_epoch=10,
    batch_size=200,
    verbose=2
)
# Score the trained model on the test split; index 1 of the result is the
# accuracy metric requested at compile time, reported here as an error rate.
scores = model.evaluate(X_test, y_test, verbose=0)
print("Baseline Error: %.2f%%" % (100 - scores[1] * 100))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
4s - loss: 0.2791 - acc: 0.9203 - val_loss: 0.1421 - val_acc: 0.9577
Epoch 2/10
4s - loss: 0.1122 - acc: 0.9678 - val_loss: 0.0996 - val_acc: 0.9696
Epoch 3/10
4s - loss: 0.0724 - acc: 0.9790 - val_loss: 0.0784 - val_acc: 0.9749
Epoch 4/10
5s - loss: 0.0511 - acc: 0.9853 - val_loss: 0.0777 - val_acc: 0.9771
Epoch 5/10
4s - loss: 0.0366 - acc: 0.9894 - val_loss: 0.0630 - val_acc: 0.9795
Epoch 6/10
4s - loss: 0.0264 - acc: 0.9931 - val_loss: 0.0635 - val_acc: 0.9795
Epoch 7/10
5s - loss: 0.0186 - acc: 0.9957 - val_loss: 0.0600 - val_acc: 0.9812
Epoch 8/10
5s - loss: 0.0149 - acc: 0.9968 - val_loss: 0.0623 - val_acc: 0.9820
Epoch 9/10
5s - loss: 0.0107 - acc: 0.9980 - val_loss: 0.0593 - val_acc: 0.9817
Epoch 10/10
5s - loss: 0.0072 - acc: 0.9988 - val_loss: 0.0599 - val_acc: 0.9821
Baseline Error: 1.79%


In [5]:
import numpy
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import Dropout
from keras.layers import Flatten
from keras.layers.convolutional import Convolution2D
from keras.layers.convolutional import MaxPooling2D
from keras.utils import np_utils
from keras import backend as K
# Use Theano-style "channels first" image tensors.
K.set_image_dim_ordering('th')


# Seed NumPy's global random number generator with a fixed value.
seed = 7
numpy.random.seed(seed)

# Reload MNIST so this section starts again from the raw image arrays.
(X_train, y_train), (X_test, y_test) = mnist.load_data()
# Reshape to [samples][channels][rows][cols]; a single channel is used.
X_train = X_train.reshape((len(X_train), 1, 28, 28)).astype('float32')
X_test = X_test.reshape((len(X_test), 1, 28, 28)).astype('float32')

# Rescale pixel intensities from the 0-255 range down to 0-1.
X_train, X_test = X_train / 255, X_test / 255
# Convert the integer class labels into one-hot rows; the column count of the
# encoded matrix is the number of classes.
y_train, y_test = np_utils.to_categorical(y_train), np_utils.to_categorical(y_test)
num_classes = y_test.shape[1]

In [6]:
def CNN_model():
    """Return a compiled convolutional classifier for 1x28x28 inputs.

    Layers, in order: 32 ReLU convolution filters of size 5x5 with 'valid'
    border mode, 2x2 max pooling, dropout with rate 0.2, flatten, a 128-unit
    ReLU dense layer, and a softmax layer with ``num_classes`` units (read
    from the notebook's module-level variable).
    """
    # Passing the layers to the constructor adds them in list order.
    model = Sequential([
        Convolution2D(32, 5, 5, border_mode='valid', input_shape=(1, 28, 28), activation='relu'),
        MaxPooling2D(pool_size=(2, 2)),
        Dropout(0.2),
        Flatten(),
        Dense(128, activation='relu'),
        Dense(num_classes, activation='softmax'),
    ])
    # Categorical cross-entropy loss, Adam optimizer, accuracy as the reported metric.
    model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
    return model

In [7]:
# Instantiate the convolutional network.
model = CNN_model()
# Train for 10 epochs in batches of 200, scoring the test split after each
# epoch; verbose=2 logs one summary line per epoch.
model.fit(X_train, y_train, validation_data=(X_test, y_test), nb_epoch=10, batch_size=200, verbose=2)
# Score the trained model on the test split; index 1 of the result is the
# accuracy metric requested at compile time, reported here as an error rate.
scores = model.evaluate(X_test, y_test, verbose=0)
# This cell evaluates the CNN, so the figure is labelled as such rather than
# reusing the baseline's label. (Saved output that still reads "Baseline Error"
# predates this label; re-run the cell to refresh it.)
print("CNN Error: %.2f%%" % (100-scores[1]*100))

Train on 60000 samples, validate on 10000 samples
Epoch 1/10
53s - loss: 0.2412 - acc: 0.9317 - val_loss: 0.0752 - val_acc: 0.9769
Epoch 2/10
47s - loss: 0.0728 - acc: 0.9781 - val_loss: 0.0526 - val_acc: 0.9830
Epoch 3/10
44s - loss: 0.0496 - acc: 0.9851 - val_loss: 0.0389 - val_acc: 0.9858
Epoch 4/10
43s - loss: 0.0412 - acc: 0.9869 - val_loss: 0.0430 - val_acc: 0.9858
Epoch 5/10
43s - loss: 0.0323 - acc: 0.9897 - val_loss: 0.0390 - val_acc: 0.9867
Epoch 6/10
51s - loss: 0.0283 - acc: 0.9910 - val_loss: 0.0413 - val_acc: 0.9864
Epoch 7/10
48s - loss: 0.0222 - acc: 0.9928 - val_loss: 0.0329 - val_acc: 0.9893
Epoch 8/10
46s - loss: 0.0196 - acc: 0.9939 - val_loss: 0.0380 - val_acc: 0.9883
Epoch 9/10
46s - loss: 0.0159 - acc: 0.9951 - val_loss: 0.0343 - val_acc: 0.9883
Epoch 10/10
46s - loss: 0.0143 - acc: 0.9955 - val_loss: 0.0321 - val_acc: 0.9896
Baseline Error: 1.04%


In [16]:
import pickle
# Open the destination file for the pickled convolution weights in binary
# write mode. The handle is deliberately left open here: the cell that dumps
# the weights writes through it and then closes it.
pkl_handle = open('trained_conv_weights.pkl', 'wb')

In [17]:
#import matplotlib as pl

# Visualize weights
# Read the first layer's kernel out of its Theano shared variable.
# borrow=True lets Theano hand back its internal buffer instead of a copy;
# that is acceptable here because W is only read, never modified.
W = model.layers[0].W.get_value(borrow=True)
# Drop the length-1 axes so the filters form a plain stack of 2-D kernels.
W = numpy.squeeze(W)
print("W shape : ", W.shape)
# Function-call form of print: same output as the old `print W` statement on
# Python 2, and still valid syntax on Python 3.
print(W)
# Persist the filters, and always release the file handle -- even when
# pickling fails -- so the file is never left open.
try:
    pickle.dump(W, pkl_handle)
finally:
    pkl_handle.close()

# TODO: mosaic plot of the filters. Left disabled: nice_imshow, make_mosaic and
# cm are not defined in the cells shown in this notebook.
#pl.figure(figsize=(15, 15))
#pl.title('conv1 weights')
#nice_imshow(pl.gca(), make_mosaic(W, 6, 6), cmap=cm.binary)

('W shape : ', (32, 5, 5))
[[[ -1.09866314e-01   1.29987381e-03  -1.14111891e-02   1.94709495e-01
     2.49121100e-01]
  [  9.72325448e-03  -4.05195653e-02  -2.00826406e-01  -1.16524361e-01
     3.09393518e-02]
  [  5.59176765e-02   3.99214290e-02  -1.68650612e-01  -3.16331923e-01
    -1.89539954e-01]
  [  4.97269444e-02   1.99614037e-02   3.59363258e-02   6.29092827e-02
    -1.55112520e-01]
  [ -4.53055538e-02   1.70500815e-01   9.18523595e-02   1.32131830e-01
     1.14934318e-01]]

 [[ -2.15603366e-01   9.13213938e-02   1.60746083e-01   1.34934662e-02
    -1.98026374e-01]
  [ -9.87272337e-02   1.42041266e-01   8.46384391e-02  -6.89426661e-02
    -2.64167935e-01]
  [  6.42976165e-02   1.40637368e-01  -2.90168263e-02  -8.74014124e-02
    -2.18808293e-01]
  [  3.05259414e-02   5.12211807e-02   1.97997540e-02  -1.46216571e-01
    -1.54691309e-01]
  [  3.10066398e-02   4.78953496e-02   9.38038230e-02  -1.39081866e-01
    -6.90522715e-02]]

 [[ -6.60526529e-02  -9.77553874e-02  -3.30118798