# RNN for semtiment analysis

**初期設定**

In [1]:
import os
import tensorflow as tf
import numpy as np
from tensorflow import keras

In [3]:
tf.random.set_seed(22)
np.random.seed(22)
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'
assert tf.__version__.startswith('2.')

**Config Info**

In [4]:
np.random.seed(7)
# Load the dataset but only keep the top n words, zero the rest
top_words = 10000
# Trancate and pad input sequences
max_review_length = 80
(x_tr, y_tr), (x_te, y_te) = keras.datasets.imdb.load_data(num_words=top_words)
print("Pad sequences (samples x time)")
x_tr = keras.preprocessing.sequence.pad_sequences(x_tr, maxlen=max_review_length)
x_te = keras.preprocessing.sequence.pad_sequences(x_te, maxlen=max_review_length)
print('x_trian shape: ',x_tr.shape)
print('x_test shape: ',x_te.shape)

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/imdb.npz
Pad sequences (samples x time)
x_trian shape:  (25000, 80)
x_test shape:  (25000, 80)


In [9]:
class RNN(keras.Model):
    def __init__(self, units, num_class, num_layers):
        super(RNN, self).__init__()
        
        self.rnn = keras.layers.LSTM(units, return_sequences=True)
        self.rnn2 = keras.layers.LSTM(units)
        
        self.embedding = keras.layers.Embedding(top_words, 100, input_length=max_review_length)
        self.fc = keras.layers.Dense(1)
        
    def call(self, inputs, training=None, mask=None):
        x = self.embedding(inputs)
        x = self.rnn(x)
        x = self.rnn2(x)
        
        x = self.fc(x)
        print(x.shape)

        return x 

In [7]:
def main():
    units = 64
    num_classes = 2
    batch_size = 32
    epochs = 20
    
    model = RNN(units, num_classes, num_layers=2)
    
    model.compile(optimizer=keras.optimizers.Adam(0.001),
                  loss=keras.losses.BinaryCrossentropy(from_logits=True),
                  metrics=['accuracy'])
    model.fit(x_tr, y_tr, batch_size=batch_size, epochs=epochs,
              validation_data=(x_te, y_te), verbose=1)
    
    scores = model.evaluate(x_te, y_te, batch_size, verbose=1)
    
    print('Final test loss and accuracy: ', scores)

In [10]:
if __name__ == '__main__':
    main()

Epoch 1/20
(None, 1)
(None, 1)
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20
Final test loss and accuracy:  [1.1671234369277954, 0.8161600232124329]
