In [1]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model




In [2]:
# Fetch the word -> integer index mapping that ships with the IMDB dataset,
# then invert it so integer indices can be turned back into words.
word_index = imdb.get_word_index()
reverse_word_index = dict((idx, word) for word, idx in word_index.items())

In [3]:
# Restore the previously saved network from disk and print its layer summary.
MODEL_PATH = 'simple_rnn_imdb.h5'
model = load_model(MODEL_PATH)
model.summary()


Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [4]:
# Display the loaded model's weight arrays (the cell's last expression is its output).
model.get_weights()

[array([[-4.93707657e-02,  2.50790417e-02,  2.66644470e-02, ...,
         -1.84293017e-02, -1.04592385e-04, -9.98556148e-03],
        [-3.70272025e-02, -4.04514968e-02, -2.90390383e-02, ...,
         -2.66347919e-02, -2.12386716e-02,  8.49924609e-02],
        [-1.02916129e-01, -7.42307082e-02, -2.82645915e-02, ...,
         -4.17614281e-02, -8.89028087e-02, -4.10050303e-02],
        ...,
        [ 6.60253242e-02, -6.40225187e-02, -2.33778842e-02, ...,
         -2.04749443e-02,  3.81352156e-02,  1.24454461e-01],
        [ 2.11126089e-01,  1.86445042e-01,  1.02863580e-01, ...,
          2.74475902e-01, -1.72293231e-01,  7.03025609e-02],
        [-5.99953905e-02, -2.23696202e-01, -2.40374014e-01, ...,
         -1.94142655e-01,  2.45562047e-01,  2.41989419e-01]], dtype=float32),
 array([[-0.00028673, -0.0112287 , -0.02021839, ...,  0.07615379,
          0.06775907,  0.08278631],
        [ 0.15726498, -0.10141496,  0.00174407, ..., -0.08503257,
          0.10853493,  0.21599816],
        [ 

In [5]:
# Helper Functions

# 1. Function to decode reviews
def decode_review(encoded_review):
    """Turn a sequence of integer token ids back into a space-separated string.

    Each id is shifted down by 3 before being looked up in
    ``reverse_word_index``; ids with no entry are rendered as ``'?'``.
    """
    words = []
    for token_id in encoded_review:
        words.append(reverse_word_index.get(token_id - 3, '?'))
    return ' '.join(words)


# 2. Function to preprocess user input
def preprocess_text(text, maxlen=500, vocab_size=10000):
    """Encode raw review text into a padded integer sequence for the model.

    The text is lower-cased and split on whitespace. Each word found in
    ``word_index`` is encoded as its index plus 3 (the inverse of the
    ``i - 3`` shift used by ``decode_review``). Words that are missing from
    ``word_index``, or whose shifted id would fall outside the embedding
    table, are encoded as the out-of-vocabulary id 2.

    Args:
        text: Review text to encode.
        maxlen: Length the sequence is padded/truncated to. Defaults to 500,
            matching the model's input length shown in its summary.
        vocab_size: Number of rows in the model's embedding table. Defaults
            to 10000 (1,280,000 embedding parameters / 128 dimensions).

    Returns:
        The array produced by ``sequence.pad_sequences`` for a single
        review, i.e. one row of ``maxlen`` token ids.
    """
    oov_id = 2        # id reserved for unknown words
    index_offset = 3  # ids 0-2 are reserved, so real words start at 3

    encoded_review = []
    for word in text.lower().split():
        rank = word_index.get(word)
        # The original `word_index.get(word, 2) + 3` turned unknown words
        # into id 5 (a real word) instead of the out-of-vocabulary id.
        token_id = oov_id if rank is None else rank + index_offset
        # Ids beyond the embedding table cannot be looked up by the model;
        # treat such rare words as unknown.
        if token_id >= vocab_size:
            token_id = oov_id
        encoded_review.append(token_id)

    # NOTE(review): the Keras IMDB loader prepends a start token (id 1) by
    # default; this function does not. Confirm against the training setup.
    padded_review = sequence.pad_sequences([encoded_review], maxlen=maxlen)
    return padded_review

In [6]:
# Prediction Function

def predict_sentiment(review):
    """Classify a raw review string with the loaded model.

    The review is encoded with ``preprocess_text`` and passed to
    ``model.predict``.

    Returns:
        A ``(label, score)`` tuple. ``score`` is the first value of the
        model's output for the review; ``label`` is ``'Positive'`` when
        that value is above 0.5 and ``'Negative'`` otherwise.
    """
    model_input = preprocess_text(review)
    score = model.predict(model_input)[0][0]

    if score > 0.5:
        label = 'Positive'
    else:
        label = 'Negative'

    return label, score

In [19]:
# User Input and Prediction

example_review = "This movie was Entertaining"

# Unpack the (label, score) pair returned for the sample review.
sentiment, score = predict_sentiment(example_review)

# A single newline-separated print emits the same three report lines.
print(
    f'Review: {example_review}',
    f'Sentiment: {sentiment}',
    f'Prediction Score: {score}',
    sep='\n',
)

Review: This movie was Entertaining
Sentiment: Positive
Prediction Score: 0.5980027318000793
Review: This movie was Entertaining
Sentiment: Positive
Prediction Score: 0.5980027318000793
