In [1]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model 





In [2]:
word_index = imdb.get_word_index()
reverse_word_index = {value:key for key, value in word_index.items()}

In [3]:
model = load_model("simple_rnn_imdb.h5")
model.summary()


Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [4]:
model.get_weights()

[array([[-0.0699003 ,  0.04117377, -0.01222987, ...,  0.00943068,
         -0.0346515 , -0.04236471],
        [-0.1270641 ,  0.03504466, -0.11449436, ..., -0.06079433,
          0.0279518 , -0.0143371 ],
        [-0.10439283,  0.05825527, -0.06421027, ..., -0.10485464,
          0.07607394, -0.16163822],
        ...,
        [ 0.23242007, -0.19455819,  0.24555233, ...,  0.22927456,
          0.08872735,  0.27557948],
        [-0.11523603,  0.09345407, -0.04898502, ..., -0.09354638,
         -0.05902797, -0.11228432],
        [ 0.07366029, -0.0703059 ,  0.03199391, ..., -0.0063665 ,
          0.05761788,  0.10078231]], dtype=float32),
 array([[ 0.04909078,  0.12902519,  0.03871666, ...,  0.06055011,
         -0.08905692,  0.12785034],
        [ 0.02670014,  0.02625332, -0.02887109, ...,  0.0513947 ,
          0.09733048, -0.04278557],
        [-0.10087746, -0.0614852 ,  0.09094134, ...,  0.0356874 ,
          0.05320677,  0.04316503],
        ...,
        [-0.01395093,  0.26176712, -0.0

In [5]:
#step 2 -> Helper Functions
#Function to decode reviews
def decode_review(encoded_review):
    return ' '.join([reverse_word_index.get(i - 3, '?') for i in encoded_review])

def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word,2) + 3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review],maxlen = 500)
    return padded_review

In [6]:
#PREDICTION FUNCTION
def predict_seniment(review):
    preprocessed_input = preprocess_text(review)
    prediction = model.predict(preprocessed_input)
    sentiment = 'Positive' if prediction[0][0] > 0.5 else 'Negative'
    return sentiment, prediction[0][0]

In [11]:
#USER PREVIEW AND PREDICTION
example_statement = "This movie was very boring, i hated the movie, the acting was very bad , i hate the movie, but the critics were good and ending was quite good "

sentiment,score = predict_seniment(example_statement)

print(f'Review : {example_statement}')
print(f'Sentiment {sentiment}')
print(f'Prdiction Score {score}')

Review : This movie was very boring, i hated the movie, the acting was very bad , i hate the movie, but the critics were good and ending was quite good 
Sentiment Negative
Prdiction Score 0.031027935445308685
