In [1]:
# Import Datasets
from keras.datasets import imdb

In [3]:
vocabulary_size = 5000
(X_tr, y_tr), (X_te, y_te) = imdb.load_data(num_words = vocabulary_size)
(X_train, y_train), (X_test, y_test) = imdb.load_data(num_words = vocabulary_size)

word2id = imdb.get_word_index()
id2word = {i: word for word, i in word2id.items()}

In [4]:
print('Maximum  length: {}'.format(
len(max((X_train + X_test), key=len))))
print('Minimum  length: {}'.format(
len(min((X_test + X_test), key=len))))

Maximum  length: 2697
Minimum  length: 14


In [5]:
from keras.preprocessing import sequence
max_words = 500
X_train = sequence.pad_sequences(X_train, maxlen=max_words)
X_test = sequence.pad_sequences(X_test, maxlen=max_words)

In [6]:
from keras import Sequential
from keras.layers import Embedding, LSTM, Dense, Dropout
embedding_size=32
model=Sequential()
model.add(Embedding(vocabulary_size, embedding_size, input_length=max_words))
model.add(LSTM(100))
model.add(Dense(1, activation='sigmoid'))
print(model.summary())

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
embedding (Embedding)        (None, 500, 32)           160000    
_________________________________________________________________
lstm (LSTM)                  (None, 100)               53200     
_________________________________________________________________
dense (Dense)                (None, 1)                 101       
Total params: 213,301
Trainable params: 213,301
Non-trainable params: 0
_________________________________________________________________
None


In [7]:
model.compile(loss='binary_crossentropy', 
             optimizer='adam', 
             metrics=['accuracy'])

In [8]:
batch_size = 32
num_epochs = 2
X_valid, y_valid = X_train[:batch_size], y_train[:batch_size]
X_train2, y_train2 = X_train[batch_size:], y_train[batch_size:]
results=model.fit(X_train2, y_train2, validation_data=(X_valid, y_valid), batch_size=batch_size, epochs=num_epochs)

Epoch 1/2
Epoch 2/2


In [9]:
#Predicting classes
scores = model.predict_classes(X_test)

Instructions for updating:
Please use instead:* `np.argmax(model.predict(x), axis=-1)`,   if your model does multi-class classification   (e.g. if it uses a `softmax` last-layer activation).* `(model.predict(x) > 0.5).astype("int32")`,   if your model does binary classification   (e.g. if it uses a `sigmoid` last-layer activation).


In [10]:
print('---Review---')
print([id2word.get(i, ' ') for i in X_te[6]])
print('---Actual Result---')
print(y_te[6])
print('---prediction---')
print(scores[6])

---Review---
['the', 'instance', 'absolutely', 'in', 'at', 'out', 'is', 'lot', 'br', 'is', 'mostly', 'humans', 'of', 'someone', 'and', 'and', 'of', 'wear', 'br', 'and', 'and', 'it', 'of', 'their', 'br', 'of', 'and', 'br', 'of', 'ended', 'br', 'of', 'and', 'this', 'and', 'and', 'of', 'you', 'debut', 'film', 'of', 'ended', 'and', 'sacrifice', 'to', 'of', 'energy', 'and', 'of', 'proud', 'br', 'of', 'so', 'and', 'beautiful', 'put', 'special', 'really', 'of', 'brooklyn', 'strength', 'it', 'age', 'as', 'and', 'it', 'released', 'in', 'of', 'and', 'in', 'wave', 'this', 'trouble', 'no', 'of', 'and', 'and', 'are', 'is', 'mostly', 'johnson', 'br', 'letting', 'and', 'of', 'and', 'and', 'bands', 'girlfriend', 'to', 'mann', 'things', 'of', 'letting', 'anna', 'she', 'of', 'correct', 'is', 'and', 'and', 'it', 'cry', 'in', 'and', 'of', 'and', 'not', 'they', 'of', 'writer', 'no', 'of', 'and', 'saw', 'first', 'costs', 'were', 'and', 'unnecessary', 'of', 'in', 'surely', "i'm", 'and', 'country', 'hello', '

In [11]:
print('---Review---')
print([id2word.get(i, ' ') for i in X_te[7]])
print('---Actual Result---')
print(y_te[7])
print('---prediction---')
print(scores[7])

---Review---
['the', 'of', 'and', 'animation', 'and', 'male', 'it', 'and', 'in', 'and', 'explanation', 'and', 'male', 'take', 'no', 'and', 'and', 'and', 'risk', 'this', 'kill', 'in', 'exploitation', 'is', 'vhs', 'fred', 'in', 'of', 'and', 'be', 'male', 'it', 'mentally', 'who', 'and', 'male', 'watch', 'is', 'popular', 'catch', 'know', 'and', 'it', 'and', 'or', 'kill', 'is', 'and', 'and', 'for', 'and', 'male', "isn't", 'and', 'male', 'her', 'for', 'would', 'well', 'thousands', 'about', 'and', 'heat', 'as', 'it', 'and', 'to', 'of', 'universe', 'form', 'this', 'did', 'her', 'people', 'and', 'to', 'and', 'of', 'hollywood', 'br', 'of', 'you', 'furthermore', 'who', 'film', 'reading', 'to', 'they', 'of', 'here', 'and', 'male', 'lines', 'enemy', 'not', 'like', 'it', 'of', 'help', 'i', 'i', 'of', 'male', 'their', 'it', 'of', 'time', 'buy', 'treatment', 'for', 'it', 'short', 'in', 'classic', 'to', 'pay', 'is', 'their', 'may', 'comedic', 'make', 'is', 'getting', 'using', 'more', 'he', 'either', 'w

In [13]:
print('---Review---')
print([id2word.get(i, ' ') for i in X_te[9]])
print('---Actual Result---')
print(y_te[9])
print('---prediction---')
print(scores[9])

---Review---
['the', 'as', 'you', 'it', 'know', 'of', 'soul', 'separate', 'web', 'in', 'one', 'fill', 'old', 'was', 'into', 'and', 'for', 'of', 'front', 'side', 'soul', 'victim', 'than', 'shot', 'to', 'after', 'one', 'will', 'miss', 'and', 'who', 'is', 'andrew', 'going', 'movie', 'that', 'modern', 'some', 'as', 'with', 'his', 'in', 'at', 'of', 'liked', 'i', 'i', 'events', 'fortunately', 'entirely', 'and', 'than', 'due', 'film', "don't", 'seemed', 'as', 'father', 'soul', 'you', 'or', 'technical', 'aforementioned', 'modern', 'some', 'joke', 'or', 'of', 'and', 'br', 'talented', 'last', 'fan', 'or', 'aforementioned', 'to', 'of', 'stevens', 'and', 'br', 'were', 'exaggerated', 'fault', 'in', "i'd", 'of', 'separate', 'first', 'so', 'mafia', 'in', 'of', 'resulting', 'day', 'original', 'was', 'knowledge', 'in', 'terrible', "don't", 'soul', 'teacher', 'well', 'at', 'sick', 'they', 'an', 'harry', 'i', 'i', "wasn't", 'that', 'it', 'his', 'world', 'of', 'stretch', 'br', 'of', 'how', 'you', 'old', '