# Exclusive OR with Keras

In [1]:
# Python 2/3 compatibility imports (these are no-ops on Python 3).
# NOTE: Training results can differ from run to run because no random seed is set.
from __future__ import absolute_import, division, print_function, unicode_literals

import numpy as np
import tensorflow as tf

from tensorflow.keras import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.optimizers import SGD

In [2]:
# Record the TensorFlow release this notebook was executed with.
print(tf.__version__)

2.0.0-beta1


In [3]:
# Every combination of two binary inputs, one pair per row.
x_train = np.array([[0, 0], [0, 1], [1, 0], [1, 1]])

# XOR truth table: the label is 1 exactly when the two inputs differ.
# Indexing with a list keeps each column 2-D, so the result is a (4, 1) column vector.
y_train = x_train[:, [0]] ^ x_train[:, [1]]

In [4]:
def create_model(num_neurons=10, learning_rate=0.1):
    """Build and compile a small feed-forward network for the XOR problem.

    The network has one fully connected ReLU hidden layer followed by a
    single sigmoid output neuron, and is compiled with binary cross-entropy
    loss, an SGD optimizer and the accuracy metric.

    Args:
        num_neurons: Number of neurons in the hidden layer (default 10).
        learning_rate: Learning rate passed to the SGD optimizer (default 0.1).

    Returns:
        The compiled (but untrained) Sequential model.
    """
    model = Sequential([
        # Fully connected hidden layer; input_dim=2 matches the two XOR inputs.
        Dense(num_neurons, activation='relu', input_dim=2),
        # The output layer has one neuron to output a single binary classification value (0 or 1).
        Dense(1, activation='sigmoid')
    ])
    model.compile(loss='binary_crossentropy',
                  optimizer=SGD(learning_rate),
                  metrics=['accuracy'])
    return model

# Alternatively, we can build the model by adding each layer individually:
# model = Sequential()
# model.add(Dense(num_neurons, activation='relu', input_dim=2))
# model.add(Dense(1, activation='sigmoid'))

In [5]:
# Build the compiled, still untrained, network.
model = create_model()
# Print an overview of the layers and the number of trainable weights in each.
# Hidden layer: 10 neurons, each with two input weights (one per value in the
# input vector) plus one bias weight, gives 10 * (2 + 1) = 30 weights to learn.
# Output layer: one weight for each of the 10 hidden neurons plus one bias
# weight, for a total of 11 in that layer.
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense (Dense)                (None, 10)                30        
_________________________________________________________________
dense_1 (Dense)              (None, 1)                 11        
Total params: 41
Trainable params: 41
Non-trainable params: 0
_________________________________________________________________


In [6]:
# Baseline: predictions from the model before fit() has been called,
# for comparison with the predictions made after training.
model.predict(x_train)

array([[0.5       ],
       [0.28757626],
       [0.5413843 ],
       [0.25403112]], dtype=float32)

In [7]:
# Train for 100 epochs on the four XOR samples. fit() returns a History
# object, which is what the notebook displays as this cell's result.
# NOTE(review): the per-epoch log is long; consider verbose=0 if it is not needed.
model.fit(x_train, y_train, epochs=100)

W1221 14:46:44.952793 4450168256 deprecation.py:323] From /usr/local/lib/python3.7/site-packages/tensorflow/python/ops/math_grad.py:1250: add_dispatch_support.<locals>.wrapper (from tensorflow.python.ops.array_ops) is deprecated and will be removed in a future version.
Instructions for updating:
Use tf.where in 2.0, which has the same broadcast rule as np.where


Train on 4 samples
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 75/100
Epoch 76/100
Ep

Epoch 82/100
Epoch 83/100
Epoch 84/100
Epoch 85/100
Epoch 86/100
Epoch 87/100
Epoch 88/100
Epoch 89/100
Epoch 90/100
Epoch 91/100
Epoch 92/100
Epoch 93/100
Epoch 94/100
Epoch 95/100
Epoch 96/100
Epoch 97/100
Epoch 98/100
Epoch 99/100
Epoch 100/100


<tensorflow.python.keras.callbacks.History at 0x127530b10>

In [8]:
# Turn the sigmoid outputs into hard 0/1 class labels by thresholding at 0.5.
# This replaces Sequential.predict_classes(), which is deprecated and no longer
# available in newer TensorFlow releases; for a single sigmoid output it
# produces the same int32 column vector.
(model.predict(x_train) > 0.5).astype('int32')

array([[0],
       [1],
       [1],
       [0]], dtype=int32)

In [9]:
# Raw sigmoid outputs of the trained model for each XOR input; compare these
# with the class labels shown in the previous cell.
model.predict(x_train)

array([[0.49407762],
       [0.5063816 ],
       [0.79505247],
       [0.26788902]], dtype=float32)

# Saving the trained model

In [13]:
# Save the model.
model.save('model.h5')

!ls -a 

# Recreate the exact same model purely from the file.
new_model = tf.keras.models.load_model('model.h5')
new_model.predict(x_train)

[36m.[m[m                  01_neuron.ipynb    04_mnist.ipynb     model.h5
[36m..[m[m                 02_or_gate.ipynb   basic_model.json
[36m.ipynb_checkpoints[m[m 03-xor-keras.ipynb basic_weights.h5


array([[0.49407762],
       [0.5063816 ],
       [0.79505247],
       [0.26788902]], dtype=float32)

# References

https://blog.thoughtram.io/machine-learning/2016/11/02/understanding-XOR-with-keras-and-tensorlow.html