In [None]:
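'''Trains a simple NN on the MNIST dataset through the syft Keras interface.

The original Keras demo (a deep NN) gets to 98.40% test accuracy after
20 epochs (there is *a lot* of margin for parameter tuning), at
2 seconds per epoch on a K520 GPU.

This notebook trains only a single softmax layer for 5 epochs, so expect a
lower score: about 88.7% test accuracy in the run recorded at the end.
'''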

# Original Demo: https://github.com/keras-team/keras/blob/master/examples/mnist_mlp.py

from __future__ import print_function

# import keras
# from keras.datasets import mnist
# from keras.models import Sequential
# from keras.layers import Dense, Dropout
# from keras.optimizers import SGD

import syft.interfaces.keras as keras
from syft.interfaces.keras.datasets import mnist
from syft.interfaces.keras.models import Sequential
from syft.interfaces.keras.layers import Dense, Dropout
from syft.interfaces.keras.optimizers import SGD

# Training configuration shared by the cells below.
batch_size = 128
num_classes = 10
epochs = 5

# the data, shuffled and split between train and test sets
(x_train, y_train), (x_test, y_test) = mnist.load_data()

# Flatten every sample into a single feature vector, convert to float32 and
# divide by 255. The number of rows is read from the array itself (and the
# feature width inferred with -1) instead of being hard-coded, so a loader
# that returns a different split size does not break the reshape.
x_train = x_train.reshape(x_train.shape[0], -1).astype('float32') / 255
x_test = x_test.reshape(x_test.shape[0], -1).astype('float32') / 255
print(x_train.shape[0], 'train samples')
print(x_test.shape[0], 'test samples')

# convert class vectors to binary class matrices
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)

model = Sequential()
# The hidden Dense/Dropout layers below are commented out, so the network is
# a single softmax Dense layer applied directly to the 784 input features.
# model.add(Dense(512, activation='relu', input_shape=(784,)))
# model.add(Dropout(0.2))
# model.add(Dense(512, activation='relu'))
# model.add(Dropout(0.2))
model.add(Dense(num_classes, activation='softmax',input_shape=(784,)))

In [None]:
# Configure training: categorical cross-entropy as the loss, an SGD optimizer
# built with its default arguments, and accuracy as the reported metric.
model.compile(
    loss='categorical_crossentropy',
    optimizer=SGD(),
    metrics=['accuracy'],
)

In [None]:
# Presumably prints an overview of the model's layers, as Keras'
# Model.summary does -- confirm for the syft implementation.
model.summary()

In [None]:
# Train on the prepared training split. The batch size comes from the shared
# `batch_size` setting (declared next to `epochs`) rather than a repeated
# literal, so changing it in one place changes it for training as well.
history = model.fit(
    x_train, y_train,
    batch_size=batch_size,
    epochs=epochs,
    verbose=1,
    log_interval=5,
)

# Model.evaluate()
`Model.evaluate()` evaluates the model on the test/evaluation data. Metrics can be passed by name, in which case they refer to functions in **metrics.py**. You can also define your own metrics by writing a function that takes **y_true** and **y_pred** and passing the function itself. For example:

In [None]:
import syft.metrics
import numpy as np
def precision_digit_3(y_true, y_pred):
    """Categorical accuracy restricted to the samples whose true class is 3.

    Rows are selected where the argmax of ``y_true`` along axis 1 equals 3;
    the matching rows of ``y_true`` and ``y_pred`` are then scored with
    ``syft.metrics.categorical_accuracy``.

    NOTE(review): the selection conditions on the true label, not on the
    predicted one, which looks closer to recall for digit 3 than to
    precision -- confirm the intended metric before relying on the name.
    """
    true_classes = np.argmax(y_true, axis=1)
    digit_3_rows = np.where(true_classes == 3)
    return syft.metrics.categorical_accuracy(y_true[digit_3_rows], y_pred[digit_3_rows])
    
def top_2_acc(y_true, y_pred):
    """Score ``y_pred`` against ``y_true`` with syft's top-k categorical accuracy, k = 2."""
    top_k = 2
    return syft.metrics.top_k_categorical_accuracy(y_true, y_pred, top_k)

def top_3_acc(y_true, y_pred):
    """Score ``y_pred`` against ``y_true`` with syft's top-k categorical accuracy, k = 3."""
    top_k = 3
    return syft.metrics.top_k_categorical_accuracy(y_true, y_pred, top_k)

In [None]:
# Score the model on the test split with one metric referenced by name and the
# custom metric functions precision_digit_3, top_2_acc and top_3_acc. The
# batch size comes from the shared `batch_size` setting rather than a
# repeated literal, keeping evaluation in step with the configuration.
loss, metrics = model.evaluate(
    x_test, y_test,
    batch_size=batch_size,
    verbose=True,
    metrics=['categorical_accuracy', precision_digit_3, top_2_acc, top_3_acc],
)


**Result after 5 epochs:**<br>
Test loss = 0.4483006<br>
precision_digit_3 = 0.875<br>
categorical_accuracy = 0.8866185897435898<br>
top_3_acc = 0.9729567307692307<br>
top_2_acc = 0.9509214743589743<br>