## Stage 1: Installing dependencies and setting up the GPU environment

In [1]:
# Pin NumPy to 1.16.1 for this runtime.
# NOTE(review): the pip log below shows this replaces numpy 1.18.4 and conflicts with
# umap-learn (requires numpy>=1.17) — confirm the pin is still needed with the installed TensorFlow.
!pip install numpy==1.16.1

Collecting numpy==1.16.1
[?25l  Downloading https://files.pythonhosted.org/packages/f5/bf/4981bcbee43934f0adb8f764a1e70ab0ee5a448f6505bd04a87a2fda2a8b/numpy-1.16.1-cp36-cp36m-manylinux1_x86_64.whl (17.3MB)
[K     |████████████████████████████████| 17.3MB 184kB/s 
[31mERROR: umap-learn 0.4.2 has requirement numpy>=1.17, but you'll have numpy 1.16.1 which is incompatible.[0m
[31mERROR: datascience 0.10.6 has requirement folium==0.2.1, but you'll have folium 0.8.3 which is incompatible.[0m
[31mERROR: albumentations 0.1.12 has requirement imgaug<0.2.7,>=0.2.5, but you'll have imgaug 0.2.9 which is incompatible.[0m
[?25hInstalling collected packages: numpy
  Found existing installation: numpy 1.18.4
    Uninstalling numpy-1.18.4:
      Successfully uninstalled numpy-1.18.4
Successfully installed numpy-1.16.1


## Stage 2: Importing project dependencies

In [0]:
import numpy as np
import tensorflow as tf

from tensorflow.keras.datasets import imdb

In [2]:
# Show the installed TensorFlow version for reference.
tf.__version__

'2.2.0'

## Stage 3: Dataset preprocessing

### Setting up dataset parameters

In [0]:
# Length (in tokens) that every review sequence is padded/truncated to.
max_len = 100
# Vocabulary cap handed to the dataset loader; also reused as the embedding vocabulary size.
number_of_words = 20_000

### Loading the IMDB dataset

In [4]:
# Load the IMDB train and test splits as (features, labels) pairs;
# num_words receives the vocabulary cap configured in number_of_words.
(X_train, y_train), (X_test, y_test) = imdb.load_data(num_words=number_of_words)

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/imdb.npz


### Padding all sequences to be the same length 

In [0]:
# Bring every training review to a common length of max_len tokens.
X_train = tf.keras.preprocessing.sequence.pad_sequences(
    sequences=X_train,
    maxlen=max_len,
)

In [0]:
# Apply the same max_len padding to the test reviews so both splits share one input shape.
X_test = tf.keras.preprocessing.sequence.pad_sequences(
    sequences=X_test,
    maxlen=max_len,
)

### Setting up Embedding Layer parameters

In [7]:
# The embedding vocabulary size mirrors the word cap used when loading the dataset.
vocab_size = number_of_words
vocab_size

20000

In [0]:
# Size of each word-embedding vector produced by the Embedding layer.
embed_size = 128

## Stage 4: Building a Recurrent Neural Network

### Defining the model

In [0]:
# Seed TensorFlow's global random generator so random ops (e.g. weight
# initialisation and dropout) start from the same state on every
# Restart & Run All.
# NOTE(review): some GPU kernels may still be non-deterministic — confirm
# if bit-exact repeatability is required.
tf.random.set_seed(42)

# Start from an empty layer stack; layers are appended below with model.add().
model = tf.keras.Sequential()

### Adding the Embedding Layer

In [0]:
# Map each token id to an embed_size-wide vector; the input length is taken
# from the padded training matrix.
model.add(
    tf.keras.layers.Embedding(
        input_dim=vocab_size,
        output_dim=embed_size,
        input_shape=(X_train.shape[1],),
    )
)

In [0]:
# Regularise the embedded sequence before it reaches the recurrent layer.
model.add(
    tf.keras.layers.Dropout(rate=0.44)
)

### Adding the LSTM Layer

- units: 128
- activation: tanh

In [0]:
# Recurrent layer: 128 LSTM units with tanh activation.
model.add(
    tf.keras.layers.LSTM(
        units=128,
        activation='tanh',
    )
)

In [0]:
# Regularise the LSTM output before the classification layer.
model.add(
    tf.keras.layers.Dropout(rate=0.4)
)

### Adding the Dense output layer

- units: 1
- activation: sigmoid

In [0]:
# Single sigmoid unit: one output value per review for the binary label.
model.add(
    tf.keras.layers.Dense(
        units=1,
        activation='sigmoid',
    )
)

### Compiling the model

In [0]:
# Configure training: RMSprop optimizer, binary cross-entropy loss, and
# accuracy reported as the tracked metric.
model.compile(
    optimizer='rmsprop',
    loss='binary_crossentropy',
    metrics=['accuracy'],
)

In [27]:
# Print the layer-by-layer architecture with output shapes and parameter counts.
model.summary()

Model: "sequential_1"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
embedding_1 (Embedding)      (None, 100, 128)          2560000   
_________________________________________________________________
dropout_2 (Dropout)          (None, 100, 128)          0         
_________________________________________________________________
lstm_1 (LSTM)                (None, 128)               131584    
_________________________________________________________________
dropout_3 (Dropout)          (None, 128)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 1)                 129       
Total params: 2,691,713
Trainable params: 2,691,713
Non-trainable params: 0
_________________________________________________________________


### Training the model

In [28]:
# Train for 7 epochs in mini-batches of 256 reviews; the History object
# returned by fit() is this cell's displayed value.
model.fit(
    x=X_train,
    y=y_train,
    epochs=7,
    batch_size=256,
)

Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
Epoch 5/7
Epoch 6/7
Epoch 7/7


<tensorflow.python.keras.callbacks.History at 0x7fe030a73160>

### Evaluating the model

In [29]:
# Score the trained model on the held-out test split; the result unpacks
# into the loss followed by the accuracy metric.
test_loss, test_acurracy = model.evaluate(
    x=X_test,
    y=y_test,
)



In [0]:
# Report the accuracy measured on the test split by the evaluation cell.
print("Test accuracy: {}".format(test_acurracy))

Test accuracy: 0.8527600169181824
