In [1]:
# import libraries
import numpy as np
import tensorflow as tf
from tensorflow.keras.datasets import imdb
from tensorflow.keras.preprocessing import sequence
from tensorflow.keras.models import load_model

2024-12-30 21:25:46.749826: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


In [2]:
# load word index
word_index = imdb.get_word_index()
reverse_word_index = {value: key for key, value in word_index.items()}

In [4]:
# load model
model = load_model('simple_run_imdb.h5')
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 embedding (Embedding)       (None, 500, 128)          1280000   
                                                                 
 simple_rnn (SimpleRNN)      (None, 128)               32896     
                                                                 
 dense (Dense)               (None, 1)                 129       
                                                                 
Total params: 1313025 (5.01 MB)
Trainable params: 1313025 (5.01 MB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [6]:
model.get_weights()

[array([[ 4.9473312e-02,  5.5655017e-02,  5.0414845e-02, ...,
         -4.6104968e-02,  3.4781769e-02, -6.3962489e-03],
        [ 4.7350161e-02, -2.3491604e-02, -4.4174576e-03, ...,
          3.3427820e-02, -1.0791651e-02,  2.5382694e-02],
        [ 7.5496035e-03,  3.0295897e-02,  3.5931557e-02, ...,
         -8.0197831e-05,  4.0462220e-04, -6.7505829e-02],
        ...,
        [-5.1413365e-03,  9.0993136e-02, -7.6773956e-02, ...,
          7.4955270e-02,  4.0193401e-02, -2.2164470e-02],
        [ 8.2465019e-03, -4.6319295e-02,  3.8868625e-02, ...,
         -3.1016741e-02,  3.2395527e-02, -3.1013401e-02],
        [-8.5598193e-02, -3.0892745e-02,  8.2163140e-02, ...,
         -4.4233326e-02, -5.2002650e-02,  6.3030340e-02]], dtype=float32),
 array([[-0.0621236 ,  0.08419833,  0.00648172, ..., -0.05748236,
          0.01140529,  0.06203992],
        [ 0.06657384, -0.05001218, -0.05869251, ...,  0.07808294,
         -0.13124111,  0.01623084],
        [ 0.01333027, -0.02140141,  0.08329075

In [7]:
# function to decode review
def decode_review(encoded_review):
    return ' '.join([reverse_word_index.get(i - 3, '?') for i in encoded_review])

In [14]:
def preprocess_text(text):
    words = text.lower().split()
    encoded_review = [word_index.get(word, 2)+3 for word in words]
    padded_review = sequence.pad_sequences([encoded_review], maxlen = 500)

    return padded_review

In [15]:
def predict_sentiment(review):
    preprocessed_input = preprocess_text(review)

    prediction = model.predict(preprocessed_input)

    sentiment = 'Positive' if prediction[0][0] >0.5 else 'Negative'

    return sentiment, prediction[0][0]

In [18]:
# user input and prediction
example_review = 'This movie was fantastic! The acting was great and the plot was thrilling.'
sentiment, score = predict_sentiment(example_review)



In [19]:
print(example_review, sentiment, score)

This movie was fantastic! The acting was great and the plot was thrilling. Positive 0.71328056
