## Shallow artificial neural network with Keras

### Import libraries

In [6]:
import tensorflow as tf
import keras
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense
from keras.optimizers import SGD
from keras.utils import to_categorical
import matplotlib.pyplot as plt

### Define the functions

In [2]:
def get_mnist(dataset="mnist"):
    """Load the raw train/test splits of MNIST or Fashion-MNIST.

    Args:
        dataset: ``"fashion"`` selects Fashion-MNIST; every other value
            (including the default ``"mnist"``) selects the handwritten-digit
            MNIST set.

    Returns:
        ``((X_train, y_train), (X_test, y_test))`` as produced by the Keras
        ``load_data()`` call of the chosen dataset.
    """
    # Both dataset modules expose the same load_data() interface, so pick the
    # module first and load once.
    # NOTE(review): Keras documents each dataset as 60 000 training images and
    # 10 000 test images of 28 x 28 pixels (numpy.ndarray); not verified here.
    source = tf.keras.datasets.fashion_mnist if dataset == "fashion" else mnist
    train_split, test_split = source.load_data()

    features_train, labels_train = train_split
    features_test, labels_test = test_split
    return (features_train, labels_train), (features_test, labels_test)

        
def preprocess_mnist(X_train, y_train, X_test, y_test, num_classes=10):
    """Flatten and rescale the images and one-hot encode the labels.

    Args:
        X_train: Training images; each image must hold 784 values
            (e.g. shape ``(n_train, 28, 28)``).
        y_train: Integer class labels for ``X_train``.
        X_test: Test images, same per-image layout as ``X_train``.
        y_test: Integer class labels for ``X_test``.
        num_classes: Width of the one-hot label vectors. Defaults to 10.

    Returns:
        ``((X_train, y_train), (X_test, y_test))`` where each ``X`` is a
        float32 array of shape ``(n_samples, 784)`` scaled by 1/255 and each
        ``y`` is the ``to_categorical`` encoding of the labels.

    Raises:
        ValueError: Raised by ``reshape`` when an image array cannot be
            viewed as 784 values per sample.
    """
    pixels_per_image = 28 * 28  # each 28 x 28 image becomes a 784-long vector

    # Take the number of rows from the arrays themselves instead of assuming
    # the full 60 000 / 10 000 split, so subsets of the data also work.
    # astype() copies, so the caller's arrays are left untouched.
    X_train = X_train.reshape(X_train.shape[0], pixels_per_image).astype('float32')
    X_test = X_test.reshape(X_test.shape[0], pixels_per_image).astype('float32')

    # Divide by 255 so that 8-bit pixel values land between 0 and 1.
    X_train /= 255
    X_test /= 255

    # Change labels to one-hot encoding.
    y_train = to_categorical(y_train, num_classes)
    y_test = to_categorical(y_test, num_classes)

    return (X_train, y_train), (X_test, y_test)
    
    
def train_predict_mnist(X_train, y_train, X_test, y_test,
                        epochs=200, batch_size=128, verbose=1):
    """Train a shallow dense network and predict on both data splits.

    The network is one 64-unit sigmoid hidden layer followed by a 10-unit
    softmax output layer, trained with SGD on a mean-squared-error loss.

    Args:
        X_train: Training inputs with 784 features per sample.
        y_train: One-hot training labels with 10 classes.
        X_test: Test inputs, same layout as ``X_train``.
        y_test: One-hot test labels, same layout as ``y_train``.
        epochs: Number of passes over the training data. Defaults to 200.
        batch_size: Samples per gradient update. Defaults to 128.
        verbose: Keras progress verbosity passed to ``fit``. Defaults to 1.

    Returns:
        ``(predictions_train, predictions_test)``: the outputs of
        ``model.predict`` on ``X_train`` and ``X_test``.
    """
    # Define the neural network.
    model = Sequential()
    model.add(Dense(64, activation="sigmoid", input_shape=(784,)))
    model.add(Dense(10, activation="softmax"))

    # The learning rate is passed positionally: the keyword was renamed from
    # `lr` to `learning_rate` between Keras releases, while the first
    # positional argument of SGD is the learning rate in both spellings.
    # NOTE(review): mean squared error is kept as in the original notebook;
    # categorical cross-entropy is the more common pairing with softmax.
    model.compile(loss='mean_squared_error', optimizer=SGD(0.01), metrics=['accuracy'])

    # The test split doubles as validation data, so the per-epoch "val_"
    # metrics reported by fit() are computed on the test set.
    model.fit(
        X_train,
        y_train,
        batch_size=batch_size,
        epochs=epochs,
        verbose=verbose,
        validation_data=(X_test, y_test),
    )

    # Predict on training set and test set, and hand the results back to the
    # caller instead of discarding them.
    predictions_train = model.predict(X_train)
    predictions_test = model.predict(X_test)
    return predictions_train, predictions_test
    



### Use the functions 

### Example 1 - use MNIST

In [4]:
# Step 1 - load the handwritten-digit MNIST splits ("mnist" is get_mnist's default)
raw_train, raw_test = get_mnist()

# Step 2 - preprocess the raw splits so they are suitable as neural-network input
(X_train, y_train), (X_test, y_test) = preprocess_mnist(*raw_train, *raw_test)

# Step 3 - train the network on MNIST and predict on both splits
train_predict_mnist(X_train, y_train, X_test, y_test)



Train on 60000 samples, validate on 10000 samples
Epoch 1/200
Epoch 2/200
Epoch 3/200
Epoch 4/200
Epoch 5/200
Epoch 6/200
Epoch 7/200
Epoch 8/200
Epoch 9/200
Epoch 10/200
Epoch 11/200
Epoch 12/200
Epoch 13/200
Epoch 14/200
Epoch 15/200
Epoch 16/200
Epoch 17/200
Epoch 18/200
Epoch 19/200
Epoch 20/200
Epoch 21/200
Epoch 22/200
Epoch 23/200
Epoch 24/200
Epoch 25/200
Epoch 26/200
Epoch 27/200
Epoch 28/200
Epoch 29/200
Epoch 30/200
Epoch 31/200
Epoch 32/200
Epoch 33/200
Epoch 34/200
Epoch 35/200
Epoch 36/200
Epoch 37/200
Epoch 38/200
Epoch 39/200
Epoch 40/200
Epoch 41/200
Epoch 42/200
Epoch 43/200
Epoch 44/200
Epoch 45/200
Epoch 46/200
Epoch 47/200
Epoch 48/200
Epoch 49/200
Epoch 50/200
Epoch 51/200
Epoch 52/200
Epoch 53/200
Epoch 54/200
Epoch 55/200


Epoch 56/200
Epoch 57/200
Epoch 58/200
Epoch 59/200
Epoch 60/200
Epoch 61/200
Epoch 62/200
Epoch 63/200
Epoch 64/200
Epoch 65/200
Epoch 66/200
Epoch 67/200
Epoch 68/200
Epoch 69/200
Epoch 70/200
Epoch 71/200
Epoch 72/200
Epoch 73/200
Epoch 74/200
Epoch 75/200
Epoch 76/200
Epoch 77/200
Epoch 78/200
Epoch 79/200
Epoch 80/200
Epoch 81/200
Epoch 82/200
Epoch 83/200
Epoch 84/200
Epoch 85/200
Epoch 86/200
Epoch 87/200
Epoch 88/200
Epoch 89/200
Epoch 90/200
Epoch 91/200
Epoch 92/200
Epoch 93/200
Epoch 94/200
Epoch 95/200
Epoch 96/200
Epoch 97/200
Epoch 98/200
Epoch 99/200
Epoch 100/200
Epoch 101/200
Epoch 102/200
Epoch 103/200
Epoch 104/200
Epoch 105/200
Epoch 106/200
Epoch 107/200
Epoch 108/200
Epoch 109/200
Epoch 110/200


Epoch 111/200
Epoch 112/200
Epoch 113/200
Epoch 114/200
Epoch 115/200
Epoch 116/200
Epoch 117/200
Epoch 118/200
Epoch 119/200
Epoch 120/200
Epoch 121/200
Epoch 122/200
Epoch 123/200
Epoch 124/200
Epoch 125/200
Epoch 126/200
Epoch 127/200
Epoch 128/200
Epoch 129/200
Epoch 130/200
Epoch 131/200
Epoch 132/200
Epoch 133/200
Epoch 134/200
Epoch 135/200
Epoch 136/200
Epoch 137/200
Epoch 138/200
Epoch 139/200
Epoch 140/200
Epoch 141/200
Epoch 142/200
Epoch 143/200
Epoch 144/200
Epoch 145/200
Epoch 146/200
Epoch 147/200
Epoch 148/200
Epoch 149/200
Epoch 150/200
Epoch 151/200
Epoch 152/200
Epoch 153/200
Epoch 154/200
Epoch 155/200
Epoch 156/200
Epoch 157/200
Epoch 158/200
Epoch 159/200
Epoch 160/200
Epoch 161/200
Epoch 162/200
Epoch 163/200
Epoch 164/200
Epoch 165/200


Epoch 166/200
Epoch 167/200
Epoch 168/200
Epoch 169/200
Epoch 170/200
Epoch 171/200
Epoch 172/200
Epoch 173/200
Epoch 174/200
Epoch 175/200
Epoch 176/200
Epoch 177/200
Epoch 178/200
Epoch 179/200
Epoch 180/200
Epoch 181/200
Epoch 182/200
Epoch 183/200
Epoch 184/200
Epoch 185/200
Epoch 186/200
Epoch 187/200
Epoch 188/200
Epoch 189/200
Epoch 190/200
Epoch 191/200
Epoch 192/200
Epoch 193/200
Epoch 194/200
Epoch 195/200
Epoch 196/200
Epoch 197/200
Epoch 198/200
Epoch 199/200
Epoch 200/200


### Example 2 - use Fashion MNIST

In [7]:
# Step 1 - load the Fashion-MNIST splits (selected by passing "fashion")
raw_train, raw_test = get_mnist("fashion")

# Step 2 - preprocess the raw splits so they are suitable as neural-network input
(X_train, y_train), (X_test, y_test) = preprocess_mnist(*raw_train, *raw_test)

# Step 3 - train the network on Fashion-MNIST and predict on both splits
train_predict_mnist(X_train, y_train, X_test, y_test)

NameError: name 'train_mnist' is not defined