<a href="https://colab.research.google.com/github/soohyunme/TensorFlow_Tutorial/blob/main/Code/05_RNN%2CGRUs%2CLSTMs%2CBidirectionality.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
import os
from threading import active_count  # NOTE(review): not referenced in the visible cells

# Set the TensorFlow C++ log filter BEFORE any `tensorflow.*` module is
# imported; the native library can emit start-up messages at import time, so
# assigning the variable after the first import may be too late to silence them.
# Level '2' filters out INFO and WARNING messages.
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'

import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers
from tensorflow.keras.datasets import mnist
# NOTE(review): private `tensorflow.python` path; `Activation` is not referenced
# in the visible cells. Kept so any hidden dependants keep working.
from tensorflow.python.keras.layers.core import Activation


# Device setting

In [2]:
# Ask TensorFlow to grow GPU memory on demand instead of reserving it all up
# front. Iterating over the list (rather than indexing [0]) makes this a no-op
# on CPU-only runtimes, where the list is empty and `[0]` would raise
# IndexError, and applies the same setting to every GPU that is present.
physical_devices = tf.config.list_physical_devices('GPU')
for gpu in physical_devices:
    tf.config.experimental.set_memory_growth(gpu, True)

# Load data

In [3]:
# mnist.load_data() yields a (train, test) pair, each an (inputs, labels) tuple.
# The archive is downloaded the first time this runs.
train_split, test_split = mnist.load_data()
x_train, y_train = train_split
x_test, y_test = test_split

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz


# Normalize

In [4]:
# Cast the image arrays to float32 and divide by 255.
# Each rescale is guarded on dtype so that re-running this cell does not divide
# already-normalized data by 255 a second time.
if x_train.dtype != 'float32':
    x_train = x_train.astype('float32') / 255.0
if x_test.dtype != 'float32':
    x_test = x_test.astype('float32') / 255.0

# Model

## SimpleRNN

In [5]:
# Two stacked SimpleRNN layers followed by a 10-unit linear output layer.
# Input shape (None, 28): any number of timesteps, 28 features per timestep.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# return_sequences=True emits the output at every timestep so the next
# recurrent layer receives a full sequence rather than only the last step.
model.add(
    layers.SimpleRNN(512, return_sequences=True, activation='relu')
)
# The second recurrent layer keeps only its final-timestep output.
model.add(layers.SimpleRNN(512, activation='relu'))
# No activation on the output layer: it produces raw scores.
model.add(layers.Dense(10))

# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the output.
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 simple_rnn (SimpleRNN)      (None, None, 512)         276992    
                                                                 
 simple_rnn_1 (SimpleRNN)    (None, 512)               524800    
                                                                 
 dense (Dense)               (None, 10)                5130      
                                                                 
Total params: 806,922
Trainable params: 806,922
Non-trainable params: 0
_________________________________________________________________
None


## GRU

In [6]:
# Two stacked GRU layers followed by a 10-unit linear output layer.
# Input shape (None, 28): any number of timesteps, 28 features per timestep.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# return_sequences=True passes the whole output sequence to the next GRU.
model.add(
    layers.GRU(256, return_sequences=True, activation='tanh')
)
# The second GRU keeps only its final-timestep output.
model.add(layers.GRU(256, activation='tanh'))
# No activation on the output layer: it produces raw scores.
model.add(layers.Dense(10))

# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the output.
model.summary()

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 gru (GRU)                   (None, None, 256)         219648    
                                                                 
 gru_1 (GRU)                 (None, 256)               394752    
                                                                 
 dense_1 (Dense)             (None, 10)                2570      
                                                                 
Total params: 616,970
Trainable params: 616,970
Non-trainable params: 0
_________________________________________________________________
None


## LSTM

In [7]:
# Two stacked LSTM layers followed by a 10-unit linear output layer.
# Input shape (None, 28): any number of timesteps, 28 features per timestep.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# return_sequences=True passes the whole output sequence to the next LSTM.
model.add(
    layers.LSTM(256, return_sequences=True, activation='tanh')
)
# The second LSTM keeps only its final-timestep output.
model.add(layers.LSTM(256, activation='tanh'))
# No activation on the output layer: it produces raw scores.
model.add(layers.Dense(10))

# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the output.
model.summary()

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 lstm (LSTM)                 (None, None, 256)         291840    
                                                                 
 lstm_1 (LSTM)               (None, 256)               525312    
                                                                 
 dense_2 (Dense)             (None, 10)                2570      
                                                                 
Total params: 819,722
Trainable params: 819,722
Non-trainable params: 0
_________________________________________________________________
None


## Bidirectional LSTM

In [8]:
# Two stacked bidirectional LSTM layers followed by a 10-unit linear output
# layer. Each Bidirectional wrapper around a 256-unit LSTM yields 512 output
# features, as the model summary shows.
# Input shape (None, 28): any number of timesteps, 28 features per timestep.
model = keras.Sequential()
model.add(keras.Input(shape=(None, 28)))
# return_sequences=True passes the whole output sequence to the next layer.
model.add(
    layers.Bidirectional(
        layers.LSTM(256, return_sequences=True, activation='tanh')
    )
)
# The second bidirectional layer keeps only the final output of each direction.
model.add(
    layers.Bidirectional(
        layers.LSTM(256, activation='tanh')
    )
)
# No activation on the output layer: it produces raw scores.
model.add(layers.Dense(10))

# summary() prints the table itself and returns None, so wrapping it in
# print() only appended a stray "None" line to the output.
model.summary()

Model: "sequential_3"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 bidirectional (Bidirectiona  (None, None, 512)        583680    
 l)                                                              
                                                                 
 bidirectional_1 (Bidirectio  (None, 512)              1574912   
 nal)                                                            
                                                                 
 dense_3 (Dense)             (None, 10)                5130      
                                                                 
Total params: 2,163,722
Trainable params: 2,163,722
Non-trainable params: 0
_________________________________________________________________
None


In [9]:
# Configure training for the most recently built `model`.
model.compile(
    # from_logits=True: the final Dense(10) layer has no softmax, so the loss
    # receives raw scores and applies the normalisation itself.
    loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
    # `learning_rate` is the supported argument name; the old `lr` alias is
    # deprecated and emits a warning when the optimizer is constructed.
    optimizer=keras.optimizers.Adam(learning_rate=0.001),
    metrics=['accuracy'],
)

  super(Adam, self).__init__(name, **kwargs)


In [10]:
# Options shared by training and evaluation: batches of 64 samples and
# verbose=2 for one log line per epoch.
run_options = dict(batch_size=64, verbose=2)

# Train on the training split for 10 epochs.
model.fit(x_train, y_train, epochs=10, **run_options)

# Evaluate on the held-out test split; as the cell's last expression, the
# returned [loss, accuracy] list is displayed.
model.evaluate(x_test, y_test, **run_options)

Epoch 1/10
938/938 - 50s - loss: 0.2711 - accuracy: 0.9112 - 50s/epoch - 53ms/step
Epoch 2/10
938/938 - 39s - loss: 0.0776 - accuracy: 0.9757 - 39s/epoch - 41ms/step
Epoch 3/10
938/938 - 39s - loss: 0.0539 - accuracy: 0.9830 - 39s/epoch - 41ms/step
Epoch 4/10
938/938 - 39s - loss: 0.0414 - accuracy: 0.9873 - 39s/epoch - 41ms/step
Epoch 5/10
938/938 - 39s - loss: 0.0347 - accuracy: 0.9890 - 39s/epoch - 41ms/step
Epoch 6/10
938/938 - 38s - loss: 0.0294 - accuracy: 0.9909 - 38s/epoch - 41ms/step
Epoch 7/10
938/938 - 38s - loss: 0.0251 - accuracy: 0.9924 - 38s/epoch - 41ms/step
Epoch 8/10
938/938 - 39s - loss: 0.0209 - accuracy: 0.9932 - 39s/epoch - 41ms/step
Epoch 9/10
938/938 - 39s - loss: 0.0186 - accuracy: 0.9939 - 39s/epoch - 41ms/step
Epoch 10/10
938/938 - 38s - loss: 0.0166 - accuracy: 0.9945 - 38s/epoch - 41ms/step
157/157 - 4s - loss: 0.0349 - accuracy: 0.9892 - 4s/epoch - 27ms/step


[0.034949783235788345, 0.9891999959945679]