In [3]:
from __future__ import absolute_import
from __future__ import print_function
import numpy as np
np.random.seed(1337)  # for reproducibility

from keras.preprocessing import sequence
from keras.optimizers import SGD, RMSprop, Adagrad
from keras.utils import np_utils
from keras.models import Sequential
from keras.layers.core import Dense, Dropout, Activation
from keras.layers.embeddings import Embedding
from keras.layers.recurrent import LSTM, GRU
from keras.datasets import imdb



max_features = 10000
maxlen = 500  # cut texts after this number of words (among top max_features most common words)
batch_size = 32
embedding_vector_length=32
print("Loading data...")
(X_train, y_train), (X_test, y_test) = imdb.load_data(num_words=max_features)
print(len(X_train), 'train sequences')
print(len(X_test), 'test sequences')



Loading data...




25000 train sequences
25000 test sequences


In [4]:
print("Pad sequences (samples x time)")
X_train = sequence.pad_sequences(X_train, maxlen=maxlen)
X_test = sequence.pad_sequences(X_test, maxlen=maxlen)
print('X_train shape:', X_train.shape)
print('X_test shape:', X_test.shape)

print('Build model...')
model = Sequential()
model.add(Embedding(max_features,embedding_vector_length, input_length=maxlen))
model.add(LSTM(128))  # try using a GRU instead, for fun
model.add(Dropout(0.2))
model.add(Dense(1))
model.add(Activation('sigmoid'))

# try using different optimizers and different optimizer configs
model.compile(loss='binary_crossentropy', optimizer='adam',metrics=['accuracy'])

print("Train...")
model.fit(X_train, y_train, batch_size=batch_size,epochs=5, validation_data=(X_test, y_test),verbose=True)
score= model.evaluate(X_test, y_test, batch_size=batch_size)
print('Test score:', score)


Pad sequences (samples x time)
X_train shape: (25000, 500)
X_test shape: (25000, 500)
Build model...
Train...




Train on 25000 samples, validate on 25000 samples
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Test score: 0.35371619759082795


In [5]:
print('Build model GRU')
model = Sequential()
model.add(Embedding(max_features,embedding_vector_length, input_length=maxlen))
model.add(GRU(128))  # try using a GRU instead, for fun
model.add(Dropout(0.2))
model.add(Dense(1))
model.add(Activation('sigmoid'))

# try using different optimizers and different optimizer configs
model.compile(loss='binary_crossentropy', optimizer='adam',metrics=['accuracy'])

print("Train..")
model.fit(X_train, y_train, batch_size=batch_size,epochs=5, validation_data=(X_test, y_test),verbose=True)
score= model.evaluate(X_test, y_test, batch_size=batch_size)
print('Test score:', score)

Build model GRU
Train...
Train on 25000 samples, validate on 25000 samples
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5
Test score: [0.37019708607673646, 0.87672]
