In [1]:
import numpy
from keras.datasets import imdb
from keras.models import Sequential
from keras.layers import Dense
from keras.layers import LSTM, Convolution1D, Flatten, Dropout
from keras.layers.embeddings import Embedding
from keras.preprocessing import sequence
from keras.callbacks import TensorBoard

  from ._conv import register_converters as _register_converters
Using TensorFlow backend.


In [2]:
# Using keras to load the dataset with the top_words
top_words = 10000
(X_train, y_train), (X_test, y_test) = imdb.load_data(num_words=top_words)

In [3]:
# Pad the sequence to the same length
max_review_length = 1600
X_train = sequence.pad_sequences(X_train, maxlen=max_review_length)
X_test = sequence.pad_sequences(X_test, maxlen=max_review_length)

In [4]:
# Using embedding from keras
embedding_vector_length = 300
model = Sequential()
model.add(Embedding(top_words, embedding_vector_length, input_length=max_review_length))

In [5]:
# Convolutional model (3x conv, flatten, 2x dense)
model.add(Convolution1D(64, 3, padding='same'))
model.add(Convolution1D(32, 3, padding='same'))
model.add(Convolution1D(16, 3, padding='same'))
model.add(Flatten())
model.add(Dropout(0.2))
model.add(Dense(180, activation='sigmoid'))
model.add(Dropout(0.2))
model.add(Dense(1, activation='sigmoid'))

In [None]:
# Log to tensorboard
tensorBoardCallback = TensorBoard(log_dir='./logs', write_graph=True)
model.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])
model.fit(X_train, y_train, epochs=7, callbacks=[tensorBoardCallback], batch_size=64)

Epoch 1/7
Epoch 2/7
Epoch 3/7
Epoch 4/7
   64/25000 [..............................] - ETA: 29s - loss: 2.5742e-04 - acc: 1.0000  128/25000 [..............................] - ETA: 29s - loss: 7.0349e-04 - acc: 1.0000  192/25000 [..............................] - ETA: 29s - loss: 8.8739e-04 - acc: 1.0000  256/25000 [..............................] - ETA: 29s - loss: 0.0124 - acc: 0.9961      320/25000 [..............................] - ETA: 29s - loss: 0.0100 - acc: 0.9969  384/25000 [..............................] - ETA: 29s - loss: 0.0086 - acc: 0.9974

In [None]:
# Evaluation on the test set
scores = model.evaluate(X_test, y_test, verbose=0)
print('Accuracy: %.2f%%' % (scores[1]*100))