# *RNNs*, *GRUs*, *LSTMs* and *Bidirectionality*🛵

In [1]:
import tensorflow as tf
from tensorflow import keras
from keras import layers
from keras.datasets import mnist

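# Optional: uncomment the two lines below to turn on memory growth for the
# first GPU (assumes at least one GPU is visible to TensorFlow).
# physical_devices = tf.config.list_physical_devices('GPU')
# tf.config.experimental.set_memory_growth(physical_devices[0], True)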

In [2]:
# Fetch the MNIST train/test split through the Keras dataset helper.
(x_train, y_train), (x_test, y_test) = mnist.load_data()

# Show the raw training array shapes (images first, then labels), one per line.
print(x_train.shape, y_train.shape, sep="\n")

# Cast the images to float32 and divide by 255 before training.
x_train, x_test = (
    x_train.astype("float32") / 255.0,
    x_test.astype("float32") / 255.0,
)

(60000, 28, 28)
(60000,)


### RNNs🚧

In [3]:
# Two stacked SimpleRNN layers followed by a 10-way linear classifier.
# Each image is consumed as a sequence with 28 features per timestep; the
# time dimension is left as None so the sequence length is not fixed.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# return_sequences=True emits an output at every timestep so the next
# recurrent layer receives a full sequence instead of only the final output.
model.add(
    layers.SimpleRNN(512, return_sequences=True, activation='relu')
)
# The last recurrent layer keeps only its final output (one vector per sample).
model.add(layers.SimpleRNN(512, activation='relu'))
# Ten raw logits, one per class; no softmax here (the loss uses from_logits=True).
model.add(layers.Dense(10))
# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the cell output.
model.summary()

model.compile(
    # Labels are integer class ids and the model outputs logits.
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=["accuracy"]
)

model.fit(x_train, y_train, batch_size=64, epochs=10, verbose=2)
# Last expression of the cell: its return value is shown as the cell output.
model.evaluate(x_test, y_test, batch_size=64, verbose=2)

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 simple_rnn (SimpleRNN)      (None, None, 512)         276992    
                                                                 
 simple_rnn_1 (SimpleRNN)    (None, 512)               524800    
                                                                 
 dense (Dense)               (None, 10)                5130      
                                                                 
Total params: 806,922
Trainable params: 806,922
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
938/938 - 306s - loss: 0.3180 - accuracy: 0.9007 - 306s/epoch - 326ms/step
Epoch 2/10
938/938 - 294s - loss: 0.1458 - accuracy: 0.9602 - 294s/epoch - 313ms/step
Epoch 3/10
938/938 - 305s - loss: 0.1203 - accuracy: 0.9672 - 305s/epoch - 325ms/step
Epoch 4/10
938/938 - 296s - loss: 0.1069 - accuracy

[0.07115627825260162, 0.9799000024795532]

### GRUs🧪

In [4]:
# Two stacked GRU layers followed by a 10-way linear classifier.
# Each image is consumed as a sequence with 28 features per timestep; the
# time dimension is left as None so the sequence length is not fixed.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# return_sequences=True emits an output at every timestep so the next
# recurrent layer receives a full sequence instead of only the final output.
model.add(
    layers.GRU(256, return_sequences=True, activation='tanh')
)
# The last recurrent layer keeps only its final output (one vector per sample).
model.add(layers.GRU(256, activation='tanh'))
# Ten raw logits, one per class; no softmax here (the loss uses from_logits=True).
model.add(layers.Dense(10))
# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the cell output.
model.summary()

model.compile(
    # Labels are integer class ids and the model outputs logits.
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=["accuracy"]
)

model.fit(x_train, y_train, batch_size=64, epochs=10, verbose=2)
# Last expression of the cell: its return value is shown as the cell output.
model.evaluate(x_test, y_test, batch_size=64, verbose=2)

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 gru (GRU)                   (None, None, 256)         219648    
                                                                 
 gru_1 (GRU)                 (None, 256)               394752    
                                                                 
 dense_1 (Dense)             (None, 10)                2570      
                                                                 
Total params: 616,970
Trainable params: 616,970
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
938/938 - 177s - loss: 0.2675 - accuracy: 0.9115 - 177s/epoch - 188ms/step
Epoch 2/10
938/938 - 171s - loss: 0.0693 - accuracy: 0.9789 - 171s/epoch - 182ms/step
Epoch 3/10
938/938 - 169s - loss: 0.0468 - accuracy: 0.9851 - 169s/epoch - 180ms/step
Epoch 4/10
938/938 - 171s - loss: 0.0362 - accura

[0.03414703533053398, 0.9901000261306763]

### LSTMs💉

In [5]:
# Two stacked LSTM layers followed by a 10-way linear classifier.
# Each image is consumed as a sequence with 28 features per timestep; the
# time dimension is left as None so the sequence length is not fixed.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# return_sequences=True emits an output at every timestep so the next
# recurrent layer receives a full sequence instead of only the final output.
model.add(
    layers.LSTM(256, return_sequences=True, activation='tanh')
)
# The last recurrent layer keeps only its final output (one vector per sample).
model.add(layers.LSTM(256, activation='tanh'))
# Ten raw logits, one per class; no softmax here (the loss uses from_logits=True).
model.add(layers.Dense(10))
# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the cell output.
model.summary()

model.compile(
    # Labels are integer class ids and the model outputs logits.
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=["accuracy"]
)

model.fit(x_train, y_train, batch_size=64, epochs=10, verbose=2)
# Last expression of the cell: its return value is shown as the cell output.
model.evaluate(x_test, y_test, batch_size=64, verbose=2)

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 lstm (LSTM)                 (None, None, 256)         291840    
                                                                 
 lstm_1 (LSTM)               (None, 256)               525312    
                                                                 
 dense_2 (Dense)             (None, 10)                2570      
                                                                 
Total params: 819,722
Trainable params: 819,722
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
938/938 - 378s - loss: 0.3076 - accuracy: 0.9010 - 378s/epoch - 403ms/step
Epoch 2/10
938/938 - 375s - loss: 0.0868 - accuracy: 0.9728 - 375s/epoch - 399ms/step
Epoch 3/10
938/938 - 320s - loss: 0.0581 - accuracy: 0.9827 - 320s/epoch - 342ms/step
Epoch 4/10
938/938 - 204s - loss: 0.0452 - accura

[0.037348292768001556, 0.9898999929428101]

### Bidirectionality🧼

In [6]:
# Two stacked bidirectional LSTM layers followed by a 10-way linear classifier.
# Each image is consumed as a sequence with 28 features per timestep; the
# time dimension is left as None so the sequence length is not fixed.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# Bidirectional wraps the LSTM so the sequence is processed in both
# directions; the summary reports a 512-wide output for the 256-unit LSTM.
# return_sequences=True keeps an output at every timestep for the next layer.
model.add(
    layers.Bidirectional(
        layers.LSTM(256, return_sequences=True, activation='tanh')
    )
)
# The last recurrent layer keeps only its final output (one vector per sample).
model.add(
    layers.Bidirectional(
        layers.LSTM(256, activation='tanh')
    )
)
# Ten raw logits, one per class; no softmax here (the loss uses from_logits=True).
model.add(layers.Dense(10))
# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the cell output.
model.summary()

model.compile(
    # Labels are integer class ids and the model outputs logits.
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=["accuracy"]
)

model.fit(x_train, y_train, batch_size=64, epochs=10, verbose=2)
# Last expression of the cell: its return value is shown as the cell output.
model.evaluate(x_test, y_test, batch_size=64, verbose=2)

Model: "sequential_3"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 bidirectional (Bidirectiona  (None, None, 512)        583680    
 l)                                                              
                                                                 
 bidirectional_1 (Bidirectio  (None, 512)              1574912   
 nal)                                                            
                                                                 
 dense_3 (Dense)             (None, 10)                5130      
                                                                 
Total params: 2,163,722
Trainable params: 2,163,722
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
938/938 - 741s - loss: 0.2588 - accuracy: 0.9145 - 741s/epoch - 790ms/step
Epoch 2/10
938/938 - 688s - loss: 0.0728 - accuracy: 0.9779 - 688s/epoch - 734ms/step

[0.03244110941886902, 0.9908000230789185]