In [5]:
import numpy as np
import pandas as pd
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import Sequential, load_model
from tensorflow.keras.layers import Embedding, SimpleRNN, Dense

In [6]:
#Mapping of word index back to words

word_index = imdb.get_word_index()
reverse_word_index = {value: key for key, value in word_index.items()}

In [8]:
model = load_model('simple_rnn_imdb.h5')
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [10]:
model.get_weights()

[array([[ 0.03243158,  0.00224091, -0.01559729, ...,  0.05313546,
         -0.03449006, -0.00922514],
        [-0.04575593,  0.01432513, -0.00919037, ...,  0.03509814,
          0.01319049, -0.02920637],
        [-0.0471844 ,  0.0020656 , -0.01529548, ..., -0.00799191,
          0.00271448, -0.01452106],
        ...,
        [-0.01808481, -0.03838668,  0.04801741, ...,  0.03054458,
          0.03238704, -0.0905014 ],
        [-0.15885875, -0.01270267,  0.00145487, ..., -0.10172118,
         -0.16274066,  0.05494296],
        [ 0.05156705,  0.0437537 , -0.12566394, ..., -0.08489514,
          0.03362164,  0.06298032]], dtype=float32),
 array([[-0.16472124, -0.06840443,  0.06577741, ...,  0.06698578,
         -0.00073238, -0.14158133],
        [ 0.12161295, -0.00763061, -0.06991029, ..., -0.07633532,
         -0.01104696,  0.00600125],
        [ 0.14329532, -0.11774715, -0.0356289 , ..., -0.00139726,
          0.09563536,  0.0927795 ],
        ...,
        [ 0.13308978, -0.14076723,  0.1

In [14]:
#Step2: Helper Functions

#Function to decode review
def decode_review(encoded_review):
    return ' '.join([reverse_word_index.get(i - 3,'?') for i in encoded_review])

#Function to preprocess the input
def preprocess_text(text):
    words=text.lower().split()
    encoded_review = [word_index.get(word,2) + 3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review], maxlen=500)
    return padded_review

In [15]:
## Prediction function

def predict_sentiment(review):
    preprocessed_input = preprocess_text(review)
    prediction = model.predict(preprocessed_input)
    sentiment = 'Possitive' if prediction[0][0] > 0.5 else 'Negative'
    return sentiment, prediction[0][0]

In [17]:
## Review Example

#example_review = 'This movie is fantastic !! The acting was great and the plot was thrilling'
example_review = 'This movie is Pathetic !! The acting was worse and the plot was disgusting'

sentiment, score = predict_sentiment(example_review)

print(f'Review: {example_review}')
print(f'Sentiment: {sentiment}')
print(f'Prediction Score: {score}')

Review: This movie is Pathetic !! The acting was worse and the plot was disgusting
Sentiment: Negative
Prediction Score: 0.44417300820350647
