In [2]:
import tensorflow as tf
import tensorflow_datasets as tfds

In [3]:
from tensorflow import keras
from keras import datasets, layers, models, preprocessing

In [4]:
MAX_LEN = 200
N_WORDS = 10000
DIM_EMBEDDING = 256
EPOCHS = 20
BATCH_SIZE = 500

In [5]:
def load_data():
    (X_train, Y_train), (X_test, Y_test) = datasets.imdb.load_data(num_words=N_WORDS)
    X_train = preprocessing.sequence.pad_sequences(X_train, MAX_LEN)
    X_test = preprocessing.sequence.pad_sequences(X_test, MAX_LEN)
    
    return (X_train, Y_train), (X_test, Y_test)

In [6]:
def build_model():
    model = models.Sequential([
        layers.Embedding(N_WORDS, DIM_EMBEDDING, input_length=MAX_LEN),
        layers.Dropout(0.3),
        
        layers.GlobalAveragePooling1D(),
        layers.Dense(128, activation='relu'),
        layers.Dropout(0.5),
        layers.Dense(1, activation='sigmoid')
    ])
    
    return model

In [7]:
(X_train, Y_train), (X_test, Y_test) = load_data()

Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/imdb.npz


In [8]:
model = build_model()

In [9]:
model.summary()

Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
embedding (Embedding)        (None, 200, 256)          2560000   
_________________________________________________________________
dropout (Dropout)            (None, 200, 256)          0         
_________________________________________________________________
global_average_pooling1d (Gl (None, 256)               0         
_________________________________________________________________
dense (Dense)                (None, 128)               32896     
_________________________________________________________________
dropout_1 (Dropout)          (None, 128)               0         
_________________________________________________________________
dense_1 (Dense)              (None, 1)                 129       
Total params: 2,593,025
Trainable params: 2,593,025
Non-trainable params: 0
______________________________________________

In [11]:
model.compile(optimizer = 'adam', loss = 'binary_crossentropy', metrics=['accuracy'])

In [12]:
score = model.fit(X_train, Y_train, epochs = EPOCHS, batch_size = BATCH_SIZE, validation_data = (X_test, Y_test))

Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [13]:
score2 = model.evaluate(X_test, Y_test, batch_size = BATCH_SIZE)
print('\nTest score:', score2[0])
print('Test Accuracy', score2[1])


Test score: 0.6668372750282288
Test Accuracy 0.8395199775695801
