In [2]:
import numpy as np
import tensorflow as tp
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model

In [3]:
# Load the IMDB dataset word index
word_index = imdb.get_word_index()
reverse_word_index = {value : key for key, value in word_index.items()}

In [4]:
model = load_model("simple_rnn_imdb.h5")
model.summary()


Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [5]:
model.get_weights()

[array([[-0.01255558,  0.01264636, -0.02549807, ..., -0.06456687,
          0.03761341, -0.00302027],
        [ 0.02272361, -0.01513299, -0.00267611, ..., -0.07089437,
          0.04309975, -0.0677562 ],
        [-0.03299938,  0.04603096,  0.03659783, ..., -0.0592237 ,
         -0.02943829, -0.02540252],
        ...,
        [ 0.03618477,  0.03412636, -0.02825801, ..., -0.02613164,
         -0.13625161, -0.04628958],
        [ 0.02244207,  0.0054781 , -0.08251512, ...,  0.05571353,
          0.01491856, -0.14893472],
        [ 0.235548  , -0.23114529, -0.02398361, ...,  0.17512897,
         -0.14846882, -0.09275907]], dtype=float32),
 array([[ 0.07751825, -0.07449485,  0.10241541, ..., -0.12586369,
          0.11866526,  0.12887222],
        [-0.00826485,  0.01755297, -0.1274952 , ..., -0.15904962,
          0.09288124,  0.07865763],
        [-0.00557369, -0.06851345,  0.10918   , ..., -0.08981633,
         -0.00113887,  0.09356903],
        ...,
        [-0.08082213,  0.03849262,  0.1

In [6]:
# Step 2 : Helper function
# Function to decode reviews
def decode_reviews(encoded_review):
    return " ".join([reverse_word_index.get(i - 3, "?") for i in encoded_review])

# Function to preprocess user input
def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word, 2) + 3 for word in words] 
    padded_review = sequence.pad_sequences([encoded_review], maxlen = 500)
    return padded_review

In [7]:
# Prediction function

def predict_sentiment(review):
    preprocessed_input = preprocess_text(review)

    prediction = model.predict(preprocessed_input)

    sentiment = "Positive" if prediction[0][0] > 0.5 else "Negative"
    
    return sentiment, prediction[0][0]

In [8]:
# Step 4 : User input and prediction
# Example review for prediction
example_review = "This movie was fantastic! The acting was great and the plot was thrilling."

sentiment, score = predict_sentiment(example_review)

print(f"Review : {example_review}")
print(f"Sentiment : {sentiment}")
print(f"Prediction Score : {score}")

Review : This movie was fantastic! The acting was great and the plot was thrilling.
Sentiment : Positive
Prediction Score : 0.778017520904541
