In [1]:
# Silence TensorFlow's native (C++) INFO and WARNING log messages.
# TensorFlow reads the variable named TF_CPP_MIN_LOG_LEVEL, so it has to be
# spelled exactly like this and set before `import tensorflow` runs.
import os
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'

In [2]:
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras.datasets import mnist

In [13]:
# Load MNIST: `load_data()` yields a (train, test) pair, and each of those is
# itself an (inputs, labels) pair.
train_split, test_split = mnist.load_data()
x_train, y_train = train_split
x_test, y_test = test_split

In [4]:
# Normalize data: convert the raw integer pixel arrays to float32 and divide by
# 255 (assumes 8-bit pixel values, giving inputs in [0, 1]).
# The integer-dtype check keeps this cell idempotent: re-running it without
# re-loading the data will not divide an already-scaled float array again.
# Run this cell after the data-loading cell whenever the data is (re)loaded.
if x_train.dtype.kind in "iu":
    x_train = x_train.astype("float32") / 255.0
if x_test.dtype.kind in "iu":
    x_test = x_test.astype("float32") / 255.0

In [14]:
# Baseline architecture: two stacked SimpleRNN layers and a 10-unit Dense head.
# The input is a sequence of 28-feature vectors with unspecified length (None).
model = keras.Sequential(
    [
        keras.Input(shape=(None, 28)),
        # Emit the output at every time step so the next RNN receives a sequence.
        layers.SimpleRNN(512, return_sequences=True, activation="relu"),
        # Only the final output is passed on to the Dense layer.
        layers.SimpleRNN(512, activation="relu"),
        # No activation here: the layer outputs raw scores (logits).
        layers.Dense(10),
    ]
)

### Using GRU

In [None]:
# Alternative architecture using GRU layers.
# Not executed in this notebook because training takes too long.
# NOTE: running this cell rebinds `model`, replacing any model built earlier.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# The keyword is `return_sequences` (plural); it makes the first GRU emit its
# output at every time step so the second GRU receives a sequence.
model.add(layers.GRU(256, return_sequences=True, activation='tanh'))
model.add(layers.GRU(256, activation='tanh'))
# No activation: the Dense layer outputs raw scores (logits).
model.add(layers.Dense(10))

### Using LSTM

In [None]:
# Alternative architecture using bidirectional LSTM layers.
# Not executed in this notebook because training takes too long.
# NOTE: running this cell rebinds `model`, replacing any model built earlier.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# The keyword is `return_sequences` (plural); it makes the first LSTM emit its
# output at every time step so the second recurrent layer receives a sequence.
model.add(layers.Bidirectional(layers.LSTM(256, return_sequences=True, activation='tanh')))
model.add(layers.Bidirectional(layers.LSTM(256, activation='tanh')))
# No activation: the Dense layer outputs raw scores (logits).
model.add(layers.Dense(10))

In [15]:
# Print a per-layer table (layer type, output shape, parameter count) for
# whichever model is currently bound to `model`.
model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
simple_rnn_2 (SimpleRNN)     (None, None, 512)         276992    
_________________________________________________________________
simple_rnn_3 (SimpleRNN)     (None, 512)               524800    
_________________________________________________________________
dense_1 (Dense)              (None, 10)                5130      
Total params: 806,922
Trainable params: 806,922
Non-trainable params: 0
_________________________________________________________________


In [16]:
# Configure training for the model currently bound to `model`.
model.compile(
    # Adam optimizer with a learning rate of 0.001.
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    # Labels are passed as integer class ids (sparse), and `from_logits=True`
    # matches the final Dense(10) layer, which has no activation.
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    metrics=["accuracy"],
)

In [17]:
# Train for 10 epochs in mini-batches of 64; verbose=2 prints one summary line
# per epoch. The call's return value (a History object) is the cell's output.
model.fit(
    x=x_train,
    y=y_train,
    batch_size=64,
    epochs=10,
    verbose=2,
)

Epoch 1/10
938/938 - 518s - loss: 0.9549 - accuracy: 0.7105
Epoch 2/10
938/938 - 522s - loss: 0.2914 - accuracy: 0.9180
Epoch 3/10
938/938 - 520s - loss: 0.2149 - accuracy: 0.9442
Epoch 4/10
938/938 - 519s - loss: 0.1832 - accuracy: 0.9523
Epoch 5/10
938/938 - 542s - loss: 0.1716 - accuracy: 0.9564
Epoch 6/10
938/938 - 518s - loss: 0.1756 - accuracy: 0.9567
Epoch 7/10
938/938 - 519s - loss: 0.1435 - accuracy: 0.9633
Epoch 8/10
938/938 - 522s - loss: 0.1481 - accuracy: 0.9634
Epoch 9/10
938/938 - 520s - loss: 0.1302 - accuracy: 0.9682
Epoch 10/10
938/938 - 522s - loss: 0.1286 - accuracy: 0.9685


<keras.callbacks.History at 0x836c560948>

In [18]:
# Evaluate on the test split; the returned list holds the loss followed by the
# accuracy metric configured in `compile`.
model.evaluate(
    x=x_test,
    y=y_test,
    batch_size=64,
    verbose=2,
)

157/157 - 28s - loss: 0.1396 - accuracy: 0.9665


[0.13957415521144867, 0.9664999842643738]