In [1]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model

In [2]:
# Load the IMDB dataset word index
word_index = imdb.get_word_index()
reverse_word_index = {value: key for key, value in word_index.items()}

In [3]:
# Laod the pre-trained model with ReLu activation
model = load_model('simple_rnn_imdb.h5')
model.summary()


Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [4]:
model.get_weights()

[array([[ 0.02078478,  0.03665311, -0.00302268, ...,  0.05957913,
         -0.03419689, -0.01107404],
        [-0.05030663, -0.03955369,  0.00844739, ...,  0.01146049,
         -0.00361926, -0.00612135],
        [ 0.02431214,  0.00854113,  0.01409184, ...,  0.01757726,
          0.04643181, -0.01086193],
        ...,
        [ 0.00507205,  0.00365536,  0.15096785, ...,  0.03417505,
         -0.12684153, -0.05364938],
        [-0.1975373 ,  0.16839786, -0.1892042 , ..., -0.21107922,
         -0.20151387,  0.12011069],
        [ 0.25923312, -0.19805081,  0.12683399, ...,  0.22024494,
         -0.2394033 , -0.22664091]], dtype=float32),
 array([[ 5.7021908e-02, -6.0477080e-03, -7.6542579e-02, ...,
          2.4824578e-02, -1.2140416e-01,  5.5245712e-02],
        [ 4.7968782e-02,  1.3917769e-01, -8.1076264e-02, ...,
          4.5881525e-02,  1.0535072e-02,  3.8073894e-02],
        [ 8.0815412e-02, -1.5788752e-01, -4.8700623e-02, ...,
         -7.1299434e-02,  1.8163763e-01, -6.1274555e-02]

In [5]:
# Step 2: helper Functions
# Function to decode reviews

def decode_review(encoded_review):
    return ' '.join([reverse_word_index.get(i - 3, '?') for i in encoded_review])

# Function to preprocess user input
def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word, 2) + 3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review], maxlen=500)
    return padded_review


In [6]:
### Predicion Function

def predict_sentiment(review):
    preprocessed_input = preprocess_text(review)

    prediction = model.predict(preprocessed_input)
    
    sentiment = 'Positive' if prediction[0][0]> 0.5 else 'Negative'

    return sentiment, prediction[0][0]

In [7]:
# Step 4: User Input and Prediction
# Example review for prediction

example_review = "This movie was fantastic! The acting was great and the plot was thrilling."

sentiment, score = predict_sentiment(example_review)

print(f'Review: {example_review}')
print(f'Sentiment: {sentiment}')
print(f'Prediction Score: {score}')

Review: This movie was fantastic! The acting was great and the plot was thrilling.
Sentiment: Positive
Prediction Score: 0.9014578461647034
