In [1]:
### End to end deep learning project using simple RNN
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model 

In [2]:
##Load the imdb dataset word index
word_index=imdb.get_word_index()
## word_index
revrese_word_index= {value:key for key, value in word_index.items()}

In [8]:
model = load_model('simplernn_rnn_imdn.h5')
model.summary()


Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding_1 (Embedding)     (None, 500, 128)          1280000   
                                                                 
 simple_rnn_1 (SimpleRNN)    (None, 128)               32896     
                                                                 
 dense_1 (Dense)             (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [9]:
model.get_weights()

[array([[ 0.06707461,  0.00586419, -0.04503753, ...,  0.05577635,
         -0.04116806,  0.06172702],
        [ 0.01498441,  0.07038636, -0.03924245, ...,  0.01364108,
         -0.06795142,  0.00722646],
        [-0.0190648 ,  0.08427708, -0.06039049, ..., -0.02710036,
          0.00676285,  0.01394366],
        ...,
        [-0.00827246, -0.01376081, -0.04587322, ..., -0.0548214 ,
          0.03322185,  0.00408244],
        [ 0.12221344,  0.10632707, -0.12251056, ...,  0.13060431,
          0.0604091 ,  0.09993586],
        [ 0.0616362 , -0.12951621,  0.16870065, ..., -0.03832517,
         -0.02454342, -0.14904141]], dtype=float32),
 array([[-0.02573374, -0.20050247,  0.1458445 , ...,  0.11676878,
         -0.09951234,  0.03469783],
        [-0.09293783,  0.12264612, -0.10118192, ..., -0.00161549,
          0.09100421, -0.0493921 ],
        [ 0.18751982,  0.08719517,  0.12217574, ..., -0.01045969,
         -0.01803541,  0.17306228],
        ...,
        [ 0.10657918,  0.04614231,  0.0

In [10]:
# Step 2: Helper functions 
## function to decode reviews
def decode_review(encoded_review):
    return ' '.join([revrese_word_index.get('i - 3','?') for i in encoded_review])

## function to preprocess user input
def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word,2) + 3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review],maxlen=500)
    return padded_review

In [11]:
## Predicition fucntion

def predict_sentiment(review):
    preprocessed_input = preprocess_text(review)

    prediction=model.predict(preprocessed_input)

    sentiment= 'Positive' if prediction[0][0] > 0.5 else 'Negative'
    return sentiment,prediction[0][0]

In [12]:
## Step 4 : User Input and Prediction
## Example review for prediction

example_review= "This movie was fantastic! The acting was great and the plot was thrilling."

sentiment, score=predict_sentiment(example_review)

print(f'Review: {example_review}')
print(f'Sentiment: {sentiment}')
print(f'Prediction Score: {score}')

Review: This movie was fantastic! The acting was great and the plot was thrilling.
Sentiment: Positive
Prediction Score: 0.7454075217247009
