In [25]:
import numpy as np
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model



In [26]:
# Load the IMDB dataset word index
word_index = imdb.get_word_index()
reverse_word_index = {value: key for key, value in word_index.items()}

In [27]:
model = load_model('simple_RNN_IMDB.h5')
model.summary()

Model: "sequential_2"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding_2 (Embedding)     (None, 500, 128)          1280000   
                                                                 
 simple_rnn_2 (SimpleRNN)    (None, 128)               32896     
                                                                 
 dense_2 (Dense)             (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [28]:
model.get_weights()

[array([[-0.01255068, -0.01177229,  0.01401186, ..., -0.04311793,
         -0.04528725, -0.0213562 ],
        [ 0.02712433,  0.06570248,  0.0148854 , ...,  0.02023057,
         -0.02767831, -0.01745383],
        [-0.01915758,  0.00435224,  0.00491284, ...,  0.01328172,
          0.03584548, -0.01242628],
        ...,
        [ 0.02198854, -0.01505796, -0.06275222, ...,  0.05600437,
         -0.02695091,  0.06045551],
        [-0.00704556, -0.0446912 , -0.058924  , ...,  0.01897049,
          0.01116615,  0.03636946],
        [ 0.00751915,  0.02038316,  0.00561873, ...,  0.03550854,
          0.01868449,  0.15146314]], dtype=float32),
 array([[-0.10730301,  0.07374957,  0.01766495, ..., -0.16314045,
         -0.11231025,  0.07471647],
        [ 0.01646808,  0.05469098,  0.02389727, ..., -0.0941212 ,
          0.02638509,  0.0440498 ],
        [-0.00601865,  0.10234173,  0.15494603, ...,  0.04669923,
          0.10889851,  0.13159375],
        ...,
        [-0.0508864 ,  0.09890266,  0.1

In [29]:
## Step 2:helper functions
# Function to decode reviews

def decode_review(encoded_review):
    return " ".join([reverse_word_index.get(i - 3, '?') for i in encoded_review])

# Function to preprocess user input

def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word, 2) + 3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review], maxlen=500)
    return padded_review

In [30]:
### Prediction Function

def predict_sentiment(review):
    preprocessed_input = preprocess_text(review)
    prediction = model.predict(preprocessed_input)
    
    sentiment = 'Postive' if prediction[0][0] > 0.5 else 'Negative'
    
    return sentiment, prediction[0][0]

In [31]:
### Step 4: User Input and predcition
# Example review for prediciton

example_review = "This movie was fantastic! The acting was great and the plot was thrilling."

sentiment, score = predict_sentiment(example_review)

print(f'Review: {example_review}')
print(f'Sentiment: {sentiment}')
print(f'Prediciton Score: {score}')

Review: This movie was fantastic! The acting was great and the plot was thrilling.
Sentiment: Postive
Prediciton Score: 0.6127640008926392
