Fetching and preprocessing the MNIST dataset

In [None]:
from sklearn.datasets import fetch_openml

# Fetch version 1 of the 'mnist_784' dataset from OpenML as arrays
# (as_frame=False) rather than a pandas DataFrame.
X, y = fetch_openml(
    'mnist_784',
    version=1,
    return_X_y=True,
    as_frame=False,
)

# Divide by 255 so pixel values (presumably in 0-255 -- confirm) land in [0, 1].
X = X / 255.
# Cast labels to integers so they can be compared with integer predictions later.
y = y.astype(int)

# Sanity check: one shape per line, features first, then labels.
print(X.shape, y.shape, sep='\n')

Split into training and test sets:

In [None]:
from sklearn.model_selection import train_test_split

# Hold out 70% of the samples for testing and train on the remaining 30%;
# the fixed random_state keeps the shuffle reproducible across runs.
# NOTE(review): a 70% test share is unusually large -- confirm this is
# intended (e.g. to keep training fast) rather than a typo for test_size=0.3.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.7,
    random_state=123,
)

In [None]:
from sklearn.neural_network import MLPClassifier

# Multi-layer perceptron with a single hidden layer of 50 logistic (sigmoid)
# units, optimised with the SGD solver. `alpha` is not passed, so the library
# default applies.
# NOTE(review): per the scikit-learn documentation, `validation_fraction` is
# only used when `early_stopping=True`, which is not set here -- confirm
# whether early stopping was intended.
mlp = MLPClassifier(
    # Architecture
    hidden_layer_sizes=(50,),
    activation='logistic',
    # Optimisation
    solver="sgd",
    learning_rate_init=0.2,
    max_iter=100,
    validation_fraction=0.1,
    # Reproducibility and progress logging
    random_state=123,
    verbose=10,
)

In [None]:
# Train the network on the training split. The trailing semicolon keeps the
# returned estimator's repr out of the cell output.
mlp.fit(X=X_train, y=y_train);

In [None]:
# Evaluate on both splits first, then report; a large gap between the two
# numbers would indicate overfitting.
train_score = mlp.score(X_train, y_train)
test_score = mlp.score(X_test, y_test)

print("Training set score: %f" % train_score)
print("Test set score: %f" % test_score)

In [None]:
import matplotlib.pyplot as plt

# Plot the loss values recorded in `mlp.loss_curve_` during fitting,
# using the explicit Figure/Axes interface.
loss_fig, loss_ax = plt.subplots()
loss_ax.plot(mlp.loss_curve_)
loss_ax.set_xlabel('Epoch')
loss_ax.set_ylabel('Loss')
plt.show()

Failure cases:

In [None]:
# Restrict the failure-case inspection to the first 1000 test samples.
n_inspected = 1000
X_test_subset = X_test[:n_inspected]
y_test_subset = y_test[:n_inspected]

In [None]:
import numpy as np

# Per-class probabilities for every sample in the inspected test subset.
probas = mlp.predict_proba(X_test_subset)

# argmax yields a *column index* into `mlp.classes_`, not a label. Map it back
# through `classes_` so the predictions are genuine labels even if the label
# set is not exactly 0..K-1 (for the integer digit labels used here the result
# is unchanged).
test_pred = mlp.classes_[np.argmax(probas, axis=1)]

# Compute the error mask once and reuse it for all three selections so they
# are guaranteed to stay aligned.
is_misclassified = y_test_subset != test_pred
max_examples = 25  # the plot grid below has 5 x 5 panels

misclassified_images = X_test_subset[is_misclassified][:max_examples]
misclassified_labels = test_pred[is_misclassified][:max_examples]
correct_labels = y_test_subset[is_misclassified][:max_examples]

In [None]:
# 5 x 5 grid of misclassified digits, each titled with its true and predicted
# label. Axes are shared, so clearing the ticks on one panel clears them all.
_, ax = plt.subplots(nrows=5, ncols=5,
                     sharex=True, sharey=True, figsize=(8, 8))
ax = ax.flatten()

# There may be fewer misclassified samples than panels; never index past the
# end of the selection (the original fixed range(25) raised IndexError then).
n_shown = min(len(misclassified_images), len(ax))
for i in range(n_shown):
    # Each sample is a flat 784-vector; restore the 28 x 28 image layout.
    img = misclassified_images[i].reshape(28, 28)
    ax[i].imshow(img, cmap='Greys', interpolation='nearest')
    ax[i].set_title(f'{i + 1}) '
                    f'True: {correct_labels[i]}\n'
                    f' Predicted: {misclassified_labels[i]}')

# Hide any panels that received no image so the figure has no empty frames.
for unused_panel in ax[n_shown:]:
    unused_panel.set_visible(False)

ax[0].set_xticks([])
ax[0].set_yticks([])
plt.tight_layout()
plt.show()