## Creating the ML algorithm

#### Importing the relevant libraries

In [3]:
import numpy as np
import tensorflow as tf

### Data

In [9]:
def _load_split(path):
    """Read one dataset split from an .npz archive.

    The archive must contain an 'inputs' array and a 'targets' array.

    Returns:
        (inputs, targets): inputs cast to float, targets cast to int.
    """
    # The builtin float / int are what the removed aliases np.float / np.int
    # pointed to, so the resulting dtypes are unchanged while the code keeps
    # working on NumPy >= 1.24 (where the aliases raise AttributeError).
    # The context manager closes the archive's file handle once the arrays
    # have been copied out by astype().
    with np.load(path) as archive:
        return archive['inputs'].astype(float), archive['targets'].astype(int)


# Three separate archives: one each for training, validation and testing.
train_inputs, train_targets = _load_split('Audiobooks_data_train.npz')
validation_inputs, validation_targets = _load_split('Audiobooks_validation.npz')
test_inputs, test_targets = _load_split('Audiobooks_test.npz')

### Model
This cell outlines the model, chooses the optimizer and the loss, sets up early stopping, and trains the network.

In [30]:
# Network dimensions.
input_size = 10          # feature width the model is declared to accept
output_size = 2          # one output unit per class
hidden_layer_size = 50   # units in each hidden layer

# Declaring the input shape up front actually uses `input_size`: the model is
# built immediately and feeding it data with a different feature width fails
# with a clear shape error instead of being silently accepted.
model = tf.keras.Sequential([
    tf.keras.Input(shape=(input_size,)),
    tf.keras.layers.Dense(hidden_layer_size, activation='relu'),  # 1st hidden layer
    tf.keras.layers.Dense(hidden_layer_size, activation='relu'),  # 2nd hidden layer
    tf.keras.layers.Dense(output_size, activation='softmax'),     # output layer
])

# The sparse variant of the cross-entropy loss takes integer class labels
# rather than one-hot vectors.
model.compile(optimizer='adam', loss='sparse_categorical_crossentropy', metrics=['accuracy'])

batch_size = 100
max_epochs = 100  # upper bound; early stopping normally ends training sooner

# Set an early stopping mechanism on the validation loss.
# patience=2 makes it a bit tolerant against random validation loss increases.
early_stopping = tf.keras.callbacks.EarlyStopping(monitor='val_loss', patience=2)

# Left as the last expression of the cell so the History object is displayed.
model.fit(
    train_inputs,
    train_targets,
    batch_size=batch_size,
    epochs=max_epochs,
    callbacks=[early_stopping],
    validation_data=(validation_inputs, validation_targets),
    verbose=2,  # one summary line per epoch
)

Train on 3579 samples, validate on 447 samples
Epoch 1/100
3579/3579 - 1s - loss: 0.6165 - accuracy: 0.6734 - val_loss: 0.5100 - val_accuracy: 0.7562
Epoch 2/100
3579/3579 - 0s - loss: 0.4705 - accuracy: 0.7547 - val_loss: 0.4387 - val_accuracy: 0.7606
Epoch 3/100
3579/3579 - 0s - loss: 0.4133 - accuracy: 0.7930 - val_loss: 0.4084 - val_accuracy: 0.7919
Epoch 4/100
3579/3579 - 0s - loss: 0.3858 - accuracy: 0.8030 - val_loss: 0.3957 - val_accuracy: 0.7875
Epoch 5/100
3579/3579 - 0s - loss: 0.3706 - accuracy: 0.8053 - val_loss: 0.3816 - val_accuracy: 0.7763
Epoch 6/100
3579/3579 - 0s - loss: 0.3579 - accuracy: 0.8142 - val_loss: 0.3739 - val_accuracy: 0.7808
Epoch 7/100
3579/3579 - 0s - loss: 0.3534 - accuracy: 0.8083 - val_loss: 0.3779 - val_accuracy: 0.7964
Epoch 8/100
3579/3579 - 0s - loss: 0.3461 - accuracy: 0.8153 - val_loss: 0.3707 - val_accuracy: 0.7919
Epoch 9/100
3579/3579 - 0s - loss: 0.3433 - accuracy: 0.8175 - val_loss: 0.3715 - val_accuracy: 0.7808
Epoch 10/100
3579/3579 - 0

<tensorflow.python.keras.callbacks.History at 0x7f1048402748>

### Testing the model


In [31]:
# Score the trained model on the held-out test split; with the single
# 'accuracy' metric configured at compile time, evaluate() yields the loss
# followed by the accuracy.
test_loss, test_accuracy = model.evaluate(
    x=test_inputs,
    y=test_targets,
)



In [32]:
# Report the test metrics: loss to two decimals, accuracy as a percentage.
report_template = '\nTest loss: {0:.2f}. Test accuracy: {1:.2f}%'
print(report_template.format(test_loss, test_accuracy * 100.))


Test loss: 0.34. Test accuracy: 81.92%
