In [16]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model


In [17]:
## load the IMDB dataset 
word_index=imdb.get_word_index()
reverse_word_index={value:key for key,value in word_index.items()}

In [18]:
model=load_model('simple_rnn_imdb.h5')
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [19]:
model.get_weights()

[array([[ 0.01608222, -0.00232146,  0.02007602, ..., -0.04309461,
         -0.00077243,  0.02266626],
        [ 0.03736301,  0.01098465, -0.02132717, ...,  0.04152368,
          0.05937279,  0.04836767],
        [-0.03847177,  0.04194459, -0.02534053, ...,  0.02865404,
          0.06643952,  0.04106462],
        ...,
        [-0.08389651,  0.08655689,  0.08909348, ..., -0.00340404,
          0.06198435,  0.0330187 ],
        [ 0.09271717, -0.03847655, -0.11873026, ..., -0.01123095,
         -0.05050033, -0.12110952],
        [-0.08896454,  0.08833558,  0.08402719, ...,  0.14504662,
          0.1317441 ,  0.14978604]], dtype=float32),
 array([[ 0.08383862,  0.16028605,  0.05798643, ..., -0.04114209,
          0.03293208, -0.101602  ],
        [ 0.09562114,  0.07611097, -0.04637082, ...,  0.09126115,
         -0.16158205,  0.09098836],
        [ 0.03350146, -0.04465936, -0.07521499, ..., -0.05054178,
          0.10744353,  0.0193169 ],
        ...,
        [-0.11874765, -0.09412359,  0.0

In [20]:
##function to decode reviews
def decode_review(encoded_review):
    return ' '.join([reverse_word_index.get(i-3,'?') for i in encoded_review])

#function to preproces user input
def preprocess_text(text):
    words=text.lower().split()
    encoded_review=[word_index.get(word,2)+3 for word in words]
    padded_review=sequence.pad_sequences([encoded_review],maxlen=500)
    return padded_review

In [21]:
##prediction function

def predict_sentiment(review):
    preprocessed_input=preprocess_text(review)
    prediction=model.predict(preprocessed_input)
    sentiment='Positive' if prediction[0][0]>0.5 else 'Negative'
    return sentiment,prediction[0][0]

In [22]:
##Example

example_review='Movie was fantastic and I liked it.'

sentiment,score=predict_sentiment(example_review)

print(f'Review: {example_review}')
print(f'Sentiment: {sentiment}')
print(f'Prediction Score: {score}')


Review: Movie was fantastic and I liked it.
Sentiment: Positive
Prediction Score: 0.9894087910652161
