In [20]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model

In [21]:
# Word -> integer id mapping shipped with the Keras IMDB dataset.
word_index = imdb.get_word_index()

# Inverted mapping (integer id -> word), used to turn encoded reviews back into text.
reverse_word_index = {
    token_id: token
    for token, token_id in word_index.items()
}

In [22]:
# Load the previously saved Keras model from the HDF5 file in the current
# working directory, then print its layer-by-layer summary.
model = load_model('./simple_rnn_imdb.h5')
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [23]:
# Display the model's weights as a list of NumPy arrays.
# NOTE(review): echoing the full arrays produces a very long cell output;
# consider showing only each array's shape if the values are not needed.
model.get_weights()

[array([[ 3.73476930e-02, -8.29476640e-02, -8.77428278e-02, ...,
          5.96587174e-03,  1.79825984e-02, -1.96044017e-02],
        [-4.54741269e-02, -3.04321386e-02, -6.61247373e-02, ...,
          1.08307064e-01, -2.50560828e-02, -8.33437666e-02],
        [-3.56123522e-02,  5.21735363e-02,  4.64927405e-02, ...,
          2.40305904e-02, -5.55510409e-02,  1.09966151e-01],
        ...,
        [ 1.03554472e-01,  2.84117181e-04, -1.12189889e-01, ...,
          8.57997162e-04,  1.01844974e-01, -5.64498082e-02],
        [ 1.12223394e-01, -1.69980019e-01,  6.15027361e-02, ...,
         -1.67130053e-01,  1.11854792e-01, -6.33544400e-02],
        [-2.73691207e-01,  3.60921293e-01,  3.67770374e-01, ...,
          1.64342910e-01, -2.17816621e-01,  3.36960703e-01]], dtype=float32),
 array([[ 0.16393524, -0.00962487,  0.01673398, ..., -0.23753552,
          0.17035666, -0.07905306],
        [ 0.07419618,  0.05963884,  0.11546837, ...,  0.13122627,
          0.10168235,  0.03232535],
        [ 

In [24]:
def decode_review(encoded_review):
    """Convert a sequence of integer token ids back into a readable string.

    Each id is shifted down by 3 before being looked up in the module-level
    ``reverse_word_index``; ids with no entry there are rendered as "?".
    The resulting words are joined with single spaces.
    """
    decoded_words = []
    for token_id in encoded_review:
        decoded_words.append(reverse_word_index.get(token_id - 3, "?"))
    return " ".join(decoded_words)

def preprocess_text(text, max_features=10000):
    """Encode a raw review string as a padded id sequence for the model.

    The text is lower-cased and split on whitespace. Each word is looked up
    in the module-level ``word_index`` and shifted by 3, the same offset that
    ``decode_review`` removes. A word is encoded as the out-of-vocabulary
    id 2 when it is missing from ``word_index`` or when its shifted id is
    not smaller than ``max_features``.

    Previously an unknown word became ``2 + 3 = 5`` (the id of a real word),
    and rare words produced ids beyond the embedding table.

    Args:
        text: Review text to encode.
        max_features: Number of rows in the model's embedding table. The
            default of 10000 matches the loaded model's embedding layer
            (1,280,000 parameters / 128 dimensions).
            NOTE(review): assumes the model was trained on data that used
            id 2 for out-of-vocabulary words - confirm against the training
            notebook.

    Returns:
        The array produced by ``pad_sequences`` for a single review with
        ``maxlen=500`` (one row of 500 ids).
    """
    oov_id = 2        # id reserved for out-of-vocabulary words
    index_offset = 3  # ids 0-2 are reserved, so real words start at 3

    encoded_review = []
    for word in text.lower().split():
        rank = word_index.get(word)
        token_id = oov_id if rank is None else rank + index_offset
        # Ids outside the embedding table would be invalid lookups.
        if token_id >= max_features:
            token_id = oov_id
        encoded_review.append(token_id)

    padded_review = sequence.pad_sequences([encoded_review], maxlen=500)
    return padded_review

In [38]:
## Prediction Function

def predict_sentiment(review, threshold=0.1):
    """Classify a raw review string as 'Positive' or 'Negative'.

    The review is encoded with ``preprocess_text`` and passed to the
    module-level ``model``; the first value of the first prediction row is
    used as the score.

    Args:
        review: Review text to classify.
        threshold: Score strictly above which the review is labelled
            'Positive'. The default of 0.1 preserves the value that was
            previously hard-coded.
            NOTE(review): if the model's output is a sigmoid probability,
            0.5 would be the conventional cut-off - confirm and adjust.

    Returns:
        A ``(sentiment, score)`` tuple: the label string and the raw model
        score.
    """
    model_input = preprocess_text(review)
    prediction = model.predict(model_input)
    score = prediction[0][0]
    sentiment = 'Positive' if score > threshold else 'Negative'
    return sentiment, score

In [41]:
# Try the prediction pipeline on a short hand-written review.
example_review = 'Best movie'

# predict_sentiment returns the label together with the raw model score.
sentiment, score = predict_sentiment(example_review)

# Report the input, the predicted label and the score.
print(f'Review: {example_review}')
print(f'Sentiment: {sentiment}')
print(f'Prediction Score: {score}')

Review: Best movie
Sentiment: Negative
Prediction Score: 0.08030034601688385
