In [1]:
import tensorflow as tf
from tensorflow import keras 
from keras.datasets import imdb
from keras.preprocessing.sequence import pad_sequences
from keras.models import Sequential
from keras.layers import Embedding, SimpleRNN, Dense, LSTM, GRU

In [2]:
# Load the IMDB reviews, keeping only the 10,000 most frequent words in the vocabulary.
(x_train, y_train), (x_test, y_test) = imdb.load_data(num_words=10000)

# Pad or truncate every review to exactly 100 tokens so all sequences share one length.
x_train, x_test = (
    pad_sequences(reviews, maxlen=100) for reviews in (x_train, x_test)
)


## Deep RNN

In [3]:
# Deep RNN: two stacked SimpleRNN layers on top of a learned word embedding.
model_rnn = Sequential()
# 10,000-word vocabulary -> 32-dimensional vectors; each input is 100 tokens long.
model_rnn.add(Embedding(10000, 32, input_length=100))
# return_sequences=True emits the hidden state at every timestep (many-to-many),
# so the next recurrent layer receives a full sequence.
model_rnn.add(SimpleRNN(5, return_sequences=True))
# The last recurrent layer returns only its final hidden state.
model_rnn.add(SimpleRNN(5))
# Single sigmoid unit producing one value in (0, 1) per review.
model_rnn.add(Dense(1, activation='sigmoid'))
model_rnn.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 100, 32)           320000    
                                                                 
 simple_rnn (SimpleRNN)      (None, 100, 5)            190       
                                                                 
 simple_rnn_1 (SimpleRNN)    (None, 5)                 55        
                                                                 
 dense (Dense)               (None, 1)                 6         
                                                                 
Total params: 320251 (1.22 MB)
Trainable params: 320251 (1.22 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


## Deep LSTM

In [4]:
# Deep LSTM: two stacked LSTM layers on top of a learned word embedding.
model_lstm = Sequential()
# 10,000-word vocabulary -> 32-dimensional vectors; each input is 100 tokens long.
model_lstm.add(Embedding(10000, 32, input_length=100))
# return_sequences=True emits the hidden state at every timestep (many-to-many),
# so the next recurrent layer receives a full sequence.
model_lstm.add(LSTM(5, return_sequences=True))
# The last recurrent layer returns only its final hidden state.
model_lstm.add(LSTM(5))
# Single sigmoid unit producing one value in (0, 1) per review.
model_lstm.add(Dense(1, activation='sigmoid'))
model_lstm.summary()

Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding_1 (Embedding)     (None, 100, 32)           320000    
                                                                 
 lstm (LSTM)                 (None, 100, 5)            760       
                                                                 
 lstm_1 (LSTM)               (None, 5)                 220       
                                                                 
 dense_1 (Dense)             (None, 1)                 6         
                                                                 
Total params: 320986 (1.22 MB)
Trainable params: 320986 (1.22 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


## Deep GRU

In [5]:
# Deep GRU: two stacked GRU layers on top of a learned word embedding.
model_gru = Sequential()
# 10,000-word vocabulary -> 32-dimensional vectors; each input is 100 tokens long.
model_gru.add(Embedding(10000, 32, input_length=100))
# return_sequences=True emits the hidden state at every timestep (many-to-many),
# so the next recurrent layer receives a full sequence.
model_gru.add(GRU(5, return_sequences=True))
# The last recurrent layer returns only its final hidden state.
model_gru.add(GRU(5))
# Single sigmoid unit producing one value in (0, 1) per review.
model_gru.add(Dense(1, activation='sigmoid'))
model_gru.summary()

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding_2 (Embedding)     (None, 100, 32)           320000    
                                                                 
 gru (GRU)                   (None, 100, 5)            585       
                                                                 
 gru_1 (GRU)                 (None, 5)                 180       
                                                                 
 dense_2 (Dense)             (None, 1)                 6         
                                                                 
Total params: 320771 (1.22 MB)
Trainable params: 320771 (1.22 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [6]:
# Configure training: Adam optimizer, binary cross-entropy loss, accuracy as the reported metric.
model_gru.compile(
    loss='binary_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)

In [7]:
# Train for 5 epochs in mini-batches of 32, validating on the last 20% of the
# training data (Keras takes the validation slice from the end, before shuffling).
#
# This call used to pass validation_data=(x_test, y_test) together with
# validation_split=0.2. Keras lets `validation_data` override `validation_split`,
# so the split was silently ignored and the test set was used for validation.
# Only the split is kept so that (x_test, y_test) stays unseen and can be used for
# a final, unbiased model_gru.evaluate(x_test, y_test).
history = model_gru.fit(
    x_train,
    y_train,
    epochs=5,
    batch_size=32,
    validation_split=0.2,
)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


In [None]:
# There is a gap of more than 10% between accuracy and val_accuracy, which is a clear sign that the model is overfitting. Add dropout to reduce it.