In [20]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model

In [21]:
## mapping of word index back to words for better understanding
word_index = imdb.get_word_index()

reverse_word_index = dict((value, key) for (key, value) in word_index.items())


In [22]:
model = load_model('simple_rnn_imdb.h5')
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [23]:
model.get_weights()

[array([[-0.05754893,  0.00465252, -0.03639083, ...,  0.0645531 ,
          0.01964178,  0.01570315],
        [-0.02834357, -0.03361292,  0.00292905, ...,  0.00363235,
          0.0243489 ,  0.01335125],
        [ 0.02305565,  0.03130459, -0.03670143, ...,  0.04845603,
         -0.03574843, -0.00366456],
        ...,
        [-0.04728448,  0.03628258, -0.0122586 , ...,  0.02893184,
          0.04375948, -0.05499761],
        [-0.02625564,  0.0249668 , -0.01619824, ...,  0.0040842 ,
         -0.01752632, -0.08214568],
        [ 0.06280711,  0.03689718, -0.05596733, ..., -0.05065775,
          0.02137072, -0.05246853]], dtype=float32),
 array([[ 0.13683027,  0.158071  ,  0.16309999, ..., -0.11373451,
          0.1328951 , -0.01520081],
        [ 0.12161562, -0.1272239 , -0.10078335, ..., -0.08147402,
          0.0157907 ,  0.05536897],
        [-0.06244615,  0.01567652,  0.06306451, ...,  0.12627009,
          0.09435153,  0.06903812],
        ...,
        [ 0.01299568,  0.02591524, -0.1

In [24]:
def decode_review(encoded_review):
    # Decode the review back to words
    return ' '.join([reverse_word_index.get(i - 3, '?') for i in encoded_review])

# Function to preprocess the user input
def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word, 2) + 3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review], maxlen=500)
    return padded_review

In [25]:
## prediction function
def predict_sentiment(review):
    preprocessed_input = preprocess_text(review)
    prediction = model.predict(preprocessed_input)
    sentiment = 'positive' if prediction[0][0] > 0.5 else 'negative'
    return sentiment, prediction[0][0]

In [27]:
example_review = "This movie was fantastic! I loved it. The acting was great and the plot was engaging."
sentiment, score = predict_sentiment(example_review)
print(f"Review: {example_review}")
print(f"Predicted Sentiment: {sentiment} \nScore: {score:.2f}")

Review: This movie was fantastic! I loved it. The acting was great and the plot was engaging.
Predicted Sentiment: positive 
Score: 0.76
