In [1]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model




In [2]:
word_index = imdb.get_word_index()
reverse_word_index = {value: key for key, value in word_index.items()}

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/imdb_word_index.json


In [3]:
model = load_model('simple_rnn_imdb.h5')
model.summary()


Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [4]:
model.get_weights()

[array([[ 0.00851537, -0.03892183, -0.03195516, ...,  0.03849715,
         -0.05407899, -0.0240601 ],
        [ 0.10639954,  0.17138165,  0.00561702, ..., -0.04643449,
         -0.03907331,  0.10271819],
        [ 0.10764227,  0.01103903, -0.01936407, ..., -0.0180254 ,
         -0.007372  ,  0.05562874],
        ...,
        [-0.00912896, -0.076694  , -0.00046052, ...,  0.08211396,
          0.08517012,  0.02167956],
        [ 0.04870542,  0.07832369,  0.11307038, ..., -0.03506981,
          0.0539668 , -0.04065448],
        [-0.1193752 , -0.08581609, -0.00186431, ...,  0.07510299,
          0.08287833, -0.06929346]], dtype=float32),
 array([[-0.06413068,  0.05543423,  0.02367918, ...,  0.01734109,
          0.03306309,  0.23075975],
        [-0.13871552,  0.15357639,  0.01778751, ..., -0.1023709 ,
          0.04640111,  0.11174115],
        [-0.08505128,  0.01650616, -0.13553405, ...,  0.04100905,
          0.02344285,  0.05151066],
        ...,
        [-0.07340669,  0.07806746, -0.2

In [5]:
# Function to decode reviews
def decode_review(encoded_review):
    return ' '.join([reverse_word_index.get(i - 3, '?') for i in encoded_review])

# Function to preprocess user input
def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word, 2) + 3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review], maxlen=500)
    return padded_review

In [6]:
def predict_sentiment(review):
    preprocessed_input=preprocess_text(review)

    prediction=model.predict(preprocessed_input)

    sentiment = 'Positive' if prediction[0][0] > 0.5 else 'Negative'
    
    return sentiment, prediction[0][0]

In [7]:
example_review = "This movie was fantastic! The acting was great and the plot was thrilling."

sentiment,score=predict_sentiment(example_review)

print(f'Review: {example_review}')
print(f'Sentiment: {sentiment}')
print(f'Prediction Score: {score}')

Review: This movie was fantastic! The acting was great and the plot was thrilling.
Sentiment: Positive
Prediction Score: 0.9587916731834412
