In [2]:
import os

# Set before TensorFlow is imported so the native runtime sees it at load
# time. NOTE(review): level "2" is expected to hide INFO and WARNING lines
# from TensorFlow's C++ logging — confirm against the TensorFlow docs.
os.environ["TF_CPP_MIN_LOG_LEVEL"] = "2"

import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras.datasets import mnist

In [3]:
# Ask TensorFlow to grow GPU memory on demand instead of reserving it all
# up front. Iterating over the detected devices (rather than indexing [0])
# keeps this cell from raising IndexError on a CPU-only machine and applies
# the same setting to every visible GPU.
physical_devices = tf.config.list_physical_devices("GPU")
for gpu_device in physical_devices:
    tf.config.experimental.set_memory_growth(gpu_device, True)

In [4]:
# Load MNIST and rescale pixel values by 1/255. Each image stays a 28x28
# grid so the recurrent layers can consume it as a sequence of 28 rows with
# 28 features each (reshape to (-1, 784) instead when feeding a dense net).
(x_train, y_train), (x_test, y_test) = mnist.load_data()
x_train, x_test = (
    images.reshape([-1, 28, 28]).astype("float32") / 255.0
    for images in (x_train, x_test)
)

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz


In [9]:
# SimpleRNN with ReLU: two stacked 512-unit recurrent layers and a 10-unit
# output layer with no activation (raw logits).
# Note: this rebinds the shared `model` name; whichever architecture cell
# was executed last is the one the compile/fit cells operate on.
model = keras.Sequential(
    [
        keras.Input(shape=(None, 28)),
        # return_sequences=True hands the full sequence to the next RNN layer.
        layers.SimpleRNN(512, return_sequences=True, activation="relu"),
        layers.SimpleRNN(512, activation="relu"),
        layers.Dense(10),
    ]
)

In [None]:
# SimpleRNN with tanh: two stacked 256-unit recurrent layers and a 10-unit
# logits layer. The second layer is left at the layer's default activation.
# Note: this rebinds the shared `model` name; whichever architecture cell
# was executed last is the one the compile/fit cells operate on.
model = keras.Sequential(
    [
        keras.Input(shape=(None, 28)),
        # return_sequences=True hands the full sequence to the next RNN layer.
        layers.SimpleRNN(256, return_sequences=True, activation="tanh"),
        layers.SimpleRNN(256),
        layers.Dense(10),
    ]
)

In [None]:
# GRU cells: two stacked 256-unit GRU layers (ReLU on the first, default
# activation on the second) and a 10-unit logits layer.
# NOTE(review): a non-default activation may prevent Keras from using its
# fused cuDNN kernel on GPU — confirm against the Keras GRU documentation.
# Note: this rebinds the shared `model` name; whichever architecture cell
# was executed last is the one the compile/fit cells operate on.
model = keras.Sequential(
    [
        keras.Input(shape=(None, 28)),
        # return_sequences=True hands the full sequence to the next GRU layer.
        layers.GRU(256, return_sequences=True, activation="relu"),
        layers.GRU(256),
        layers.Dense(10),
    ]
)

In [None]:
# LSTM cells: a bidirectional 256-unit LSTM (ReLU) feeding a plain
# 256-unit LSTM, then a 10-unit logits layer.
# NOTE(review): the first layer is wrapped in Bidirectional even though this
# cell is labelled as the plain-LSTM variant — confirm whether that wrapper
# is intended here or was carried over from the bidirectional cell.
# Note: this rebinds the shared `model` name; whichever architecture cell
# was executed last is the one the compile/fit cells operate on.
model = keras.Sequential(
    [
        keras.Input(shape=(None, 28)),
        layers.Bidirectional(
            layers.LSTM(256, return_sequences=True, activation="relu")
        ),
        layers.LSTM(256, name="lstm_layer2"),
        layers.Dense(10),
    ]
)

In [6]:
# Bidirectional LSTM: both 256-unit LSTM layers are wrapped in
# Bidirectional (ReLU on the first, default activation on the second),
# followed by a 10-unit logits layer.
# Note: this rebinds the shared `model` name; whichever architecture cell
# was executed last is the one the compile/fit cells operate on.
model = keras.Sequential(
    [
        keras.Input(shape=(None, 28)),
        layers.Bidirectional(
            layers.LSTM(256, return_sequences=True, activation="relu")
        ),
        layers.Bidirectional(layers.LSTM(256, name="lstm_layer2")),
        layers.Dense(10),
    ]
)



In [11]:
# Show the architecture, then configure training.
# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the cell output.
model.summary()
model.compile(
    # The final Dense layer has no activation, so the loss is told to expect
    # raw logits; the "sparse" variant takes integer class labels.
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=["accuracy"],
)

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 simple_rnn_2 (SimpleRNN)    (None, None, 512)         276992    
                                                                 
 simple_rnn_3 (SimpleRNN)    (None, 512)               524800    
                                                                 
 dense_2 (Dense)             (None, 10)                5130      
                                                                 
Total params: 806,922
Trainable params: 806,922
Non-trainable params: 0
_________________________________________________________________
None


In [12]:
# Train for 10 epochs on the training split, then score the held-out test
# split. The evaluate() call is kept as the cell's last expression so its
# [loss, accuracy] result is displayed as the cell output.
model.fit(
    x=x_train,
    y=y_train,
    batch_size=64,
    epochs=10,
    verbose=2,
)
model.evaluate(
    x=x_test,
    y=y_test,
    batch_size=64,
    verbose=2,
)

Epoch 1/10
938/938 - 67s - loss: 0.3127 - accuracy: 0.9040 - 67s/epoch - 72ms/step
Epoch 2/10
938/938 - 66s - loss: 0.1377 - accuracy: 0.9615 - 66s/epoch - 70ms/step
Epoch 3/10
938/938 - 66s - loss: 0.1163 - accuracy: 0.9693 - 66s/epoch - 70ms/step
Epoch 4/10
938/938 - 66s - loss: 0.1022 - accuracy: 0.9725 - 66s/epoch - 70ms/step
Epoch 5/10
938/938 - 66s - loss: 0.0958 - accuracy: 0.9745 - 66s/epoch - 70ms/step
Epoch 6/10
938/938 - 66s - loss: 0.1000 - accuracy: 0.9731 - 66s/epoch - 70ms/step
Epoch 7/10
938/938 - 66s - loss: 0.0771 - accuracy: 0.9790 - 66s/epoch - 70ms/step
Epoch 8/10
938/938 - 65s - loss: 0.0706 - accuracy: 0.9808 - 65s/epoch - 70ms/step
Epoch 9/10
938/938 - 65s - loss: 0.0735 - accuracy: 0.9799 - 65s/epoch - 69ms/step
Epoch 10/10
938/938 - 65s - loss: 0.0647 - accuracy: 0.9830 - 65s/epoch - 69ms/step
157/157 - 2s - loss: 0.0805 - accuracy: 0.9762 - 2s/epoch - 15ms/step


[0.0805467739701271, 0.9761999845504761]