In [1]:
from __future__ import print_function

import keras
import numpy as np
from keras.datasets import mnist
from keras.models import Sequential
from keras.layers import Dense, Dropout
from keras.optimizers import RMSprop

Using TensorFlow backend.
  return f(*args, **kwds)


In [2]:
def unpickle(file):
    """Load and return the object stored in the pickle file at ``file``.

    The file is opened in binary mode and read with ``encoding='bytes'``;
    the notebook then indexes the result with byte-string keys such as
    ``b'data'`` and ``b'labels'``.

    NOTE: ``pickle.load`` can execute arbitrary code while loading, so this
    should only be pointed at files from a trusted source.
    """
    import pickle

    with open(file, 'rb') as handle:
        return pickle.load(handle, encoding='bytes')

In [3]:
# Load the five pickled training batches, in order, from the dataset folder.
data_batch_1, data_batch_2, data_batch_3, data_batch_4, data_batch_5 = (
    unpickle(batch_path)
    for batch_path in (
        "cifar-10-batches-py/data_batch_1",
        "cifar-10-batches-py/data_batch_2",
        "cifar-10-batches-py/data_batch_3",
        "cifar-10-batches-py/data_batch_4",
        "cifar-10-batches-py/data_batch_5",
    )
)

In [4]:
# Pull the feature array (b'data') and the label list (b'labels') out of
# each training batch dictionary.
data1, label1 = data_batch_1[b'data'], data_batch_1[b'labels']
data2, label2 = data_batch_2[b'data'], data_batch_2[b'labels']
data3, label3 = data_batch_3[b'data'], data_batch_3[b'labels']
data4, label4 = data_batch_4[b'data'], data_batch_4[b'labels']
data5, label5 = data_batch_5[b'data'], data_batch_5[b'labels']

In [5]:
# Join the five batch arrays along the first axis into one training array.
x_train = np.concatenate([data1, data2, data3, data4, data5], axis=0)

In [6]:
# Convert each batch's labels to a float array, then join them in the same
# batch order that was used for x_train.
label1, label2, label3, label4, label5 = (
    np.array(batch_labels, dtype=float)
    for batch_labels in (label1, label2, label3, label4, label5)
)
y_train = np.concatenate([label1, label2, label3, label4, label5], axis=0)

In [7]:
# Load the pickled test batch from the same dataset folder as the training batches.
test_data = unpickle("cifar-10-batches-py/test_batch")

In [8]:
# Test features are used as stored; test labels become a float array,
# matching how the training labels were converted.
x_test = test_data[b'data']
y_test = np.array(test_data[b'labels'], dtype=float)

In [9]:
# Cast the features to float32 and divide by 255 (this scales them into
# [0, 1] assuming 8-bit pixel values -- TODO confirm against the dataset).
# NOTE: x_train / x_test are rebound to the scaled arrays, so running this
# cell a second time would divide by 255 again.
x_train = x_train.astype('float32') / 255
x_test = x_test.astype('float32') / 255

# Report how many samples each split contains.
print(x_train.shape[0], 'train samples')
print(x_test.shape[0], 'test samples')

50000 train samples
10000 test samples


In [10]:
# Number of target classes; used as the one-hot width and the output layer size.
num_classes = 10

In [11]:
# One-hot encode the class labels of both splits.
# NOTE: y_train / y_test are rebound, so this cell is meant to run once.
y_train, y_test = (
    keras.utils.to_categorical(labels, num_classes)
    for labels in (y_train, y_test)
)

**The following configuration is the reference standard against which the models are evaluated**

**1. No of epochs: 20**

**2. Batch size: 128**

**3. Network configuration**

    a. Number of neurons in a layer: 512
    
    b. Number of layers: 3
    
**4. Learning rate: 0.001**

**5. Activation functions: relu**

**6. Dropout rates: 0.2**

In [12]:
# Reference training settings: mini-batch size and number of epochs.
batch_size, epochs = 128, 20

In [13]:
# Reference network: two 512-unit ReLU hidden layers, each followed by 20%
# dropout, and a softmax output layer with one unit per class.
model = Sequential([
    Dense(512, activation='relu', input_shape=(3072,)),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

In [14]:
# Print the layers of the reference model with their output shapes and parameter counts.
model.summary()

_________________________________________________________________
Layer (type)                 Output Shape              Param #   
dense_1 (Dense)              (None, 512)               1573376   
_________________________________________________________________
dropout_1 (Dropout)          (None, 512)               0         
_________________________________________________________________
dense_2 (Dense)              (None, 512)               262656    
_________________________________________________________________
dropout_2 (Dropout)          (None, 512)               0         
_________________________________________________________________
dense_3 (Dense)              (None, 10)                5130      
Total params: 1,841,162
Trainable params: 1,841,162
Non-trainable params: 0
_________________________________________________________________


In [15]:
# Reference optimizer: RMSprop with the reference learning rate (0.001) and a
# decay of 1e-6. The RMSprop class imported at the top of the notebook is
# used directly instead of the lowercase `keras.optimizers.rmsprop` alias.
opt = RMSprop(lr=0.001, decay=1e-6)

In [16]:
# Configure the reference model for multi-class training: categorical
# cross-entropy loss, the reference optimizer, accuracy as the metric.
model.compile(
    optimizer=opt,
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

In [17]:
# Train the reference model. The test split is also passed as validation
# data, so the per-epoch validation metrics are measured on the test set.
history = model.fit(
    x_train,
    y_train,
    epochs=epochs,
    batch_size=batch_size,
    validation_data=(x_test, y_test),
    verbose=1,
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [18]:
# Evaluate the reference model on the test split; the next cell prints
# score[0] as the loss and score[1] as the accuracy.
score = model.evaluate(x_test, y_test, verbose=0)

In [19]:
# Report the reference model's test loss and test accuracy.
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.53538006916
Test accuracy: 0.4586


**Change No. of epochs from 20 to 40**

In [21]:
# Experiment: same network and settings as the reference, trained for 40
# epochs instead of 20.
#
# A dedicated optimizer with the reference settings (lr=0.001, decay=1e-6) is
# created here instead of reusing the shared `opt` object that the reference
# model was already trained with, so that no optimizer state (e.g. the update
# counter that drives `decay`) carries over from an earlier run.
opt_epochs = RMSprop(lr=0.001, decay=1e-6)

model_epochs = Sequential([
    Dense(512, activation='relu', input_shape=(3072,)),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

model_epochs.compile(
    loss='categorical_crossentropy',
    optimizer=opt_epochs,
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_epochs = model_epochs.fit(
    x_train,
    y_train,
    batch_size=batch_size,
    epochs=40,
    verbose=1,
    validation_data=(x_test, y_test),
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/40
Epoch 2/40
Epoch 3/40
Epoch 4/40
Epoch 5/40
Epoch 6/40
Epoch 7/40
Epoch 8/40
Epoch 9/40
Epoch 10/40
Epoch 11/40
Epoch 12/40
Epoch 13/40
Epoch 14/40
Epoch 15/40
Epoch 16/40
Epoch 17/40
Epoch 18/40
Epoch 19/40
Epoch 20/40
Epoch 21/40
Epoch 22/40
Epoch 23/40
Epoch 24/40
Epoch 25/40
Epoch 26/40
Epoch 27/40
Epoch 28/40
Epoch 29/40
Epoch 30/40
Epoch 31/40
Epoch 32/40
Epoch 33/40
Epoch 34/40
Epoch 35/40
Epoch 36/40
Epoch 37/40
Epoch 38/40
Epoch 39/40
Epoch 40/40


In [22]:
# Test-set loss and accuracy of the 40-epoch model.
score = model_epochs.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.49912586746
Test accuracy: 0.469


**The accuracy increased and the loss decreased, so training for more epochs produced a better model in this experiment.**

**Change batch size from 128 to 256**

In [24]:
# Experiment: same network and settings as the reference, trained with a
# batch size of 256 instead of 128.
#
# A dedicated optimizer with the reference settings (lr=0.001, decay=1e-6) is
# created here instead of reusing the shared `opt` object that earlier models
# were already trained with, so that no optimizer state (e.g. the update
# counter that drives `decay`) carries over from an earlier run.
opt_batch = RMSprop(lr=0.001, decay=1e-6)

model_batch = Sequential([
    Dense(512, activation='relu', input_shape=(3072,)),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

model_batch.compile(
    loss='categorical_crossentropy',
    optimizer=opt_batch,
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_batch = model_batch.fit(
    x_train,
    y_train,
    batch_size=256,
    epochs=epochs,
    verbose=1,
    validation_data=(x_test, y_test),
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [25]:
# Test-set loss and accuracy of the batch-size-256 model.
score = model_batch.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.5599057848
Test accuracy: 0.44


**The accuracy decreased and the loss increased.**

**Change number of neurons in a layer from 512 to 1024**

In [26]:
# Experiment: same settings as the reference, but with 1024 units per hidden
# layer instead of 512.
#
# A dedicated optimizer with the reference settings (lr=0.001, decay=1e-6) is
# created here instead of reusing the shared `opt` object that earlier models
# were already trained with, so that no optimizer state (e.g. the update
# counter that drives `decay`) carries over from an earlier run.
opt_neuron = RMSprop(lr=0.001, decay=1e-6)

model_neuron = Sequential([
    Dense(1024, activation='relu', input_shape=(3072,)),
    Dropout(0.2),
    Dense(1024, activation='relu'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

model_neuron.compile(
    loss='categorical_crossentropy',
    optimizer=opt_neuron,
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_neuron = model_neuron.fit(
    x_train,
    y_train,
    batch_size=batch_size,
    epochs=epochs,
    verbose=1,
    validation_data=(x_test, y_test),
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [27]:
# Test-set loss and accuracy of the 1024-unit model.
score = model_neuron.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.48965818634
Test accuracy: 0.4825


**The accuracy increased, so using more neurons per layer produced a better model in this experiment.**

**Change number of layers from 3 to 5**

In [28]:
# Experiment: same settings as the reference, but with four 512-unit hidden
# layers (five Dense layers in total) instead of two.
#
# A dedicated optimizer with the reference settings (lr=0.001, decay=1e-6) is
# created here instead of reusing the shared `opt` object that earlier models
# were already trained with, so that no optimizer state (e.g. the update
# counter that drives `decay`) carries over from an earlier run.
opt_layer = RMSprop(lr=0.001, decay=1e-6)

model_layer = Sequential([
    Dense(512, activation='relu', input_shape=(3072,)),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

model_layer.compile(
    loss='categorical_crossentropy',
    optimizer=opt_layer,
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_layer = model_layer.fit(
    x_train,
    y_train,
    batch_size=batch_size,
    epochs=epochs,
    verbose=1,
    validation_data=(x_test, y_test),
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [29]:
# Test-set loss and accuracy of the deeper model.
score = model_layer.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.55837705841
Test accuracy: 0.4531


**The accuracy decreased and the loss increased.**

**Change learning rate from 0.001 to 0.0001**

In [30]:
# Experiment: same network and settings as the reference, but with a learning
# rate of 0.0001 instead of 0.001 (decay unchanged).
opt_lr = RMSprop(lr=0.0001, decay=1e-6)

model_lr = Sequential([
    Dense(512, activation='relu', input_shape=(3072,)),
    Dropout(0.2),
    Dense(512, activation='relu'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

model_lr.compile(
    optimizer=opt_lr,
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_lr = model_lr.fit(
    x_train,
    y_train,
    epochs=epochs,
    batch_size=batch_size,
    validation_data=(x_test, y_test),
    verbose=1,
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [31]:
# Test-set loss and accuracy of the lower-learning-rate model.
score = model_lr.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.35183344975
Test accuracy: 0.5204


**The accuracy increased and the loss decreased. An appropriate learning rate can increase the accuracy of the model.**

**Change activation function from relu to tanh**

In [32]:
# Experiment: same settings as the reference, but with tanh instead of relu
# as the hidden-layer activation.
#
# A dedicated optimizer with the reference settings (lr=0.001, decay=1e-6) is
# created here instead of reusing the shared `opt` object that earlier models
# were already trained with, so that no optimizer state (e.g. the update
# counter that drives `decay`) carries over from an earlier run.
opt_activation = RMSprop(lr=0.001, decay=1e-6)

model_activation = Sequential([
    Dense(512, activation='tanh', input_shape=(3072,)),
    Dropout(0.2),
    Dense(512, activation='tanh'),
    Dropout(0.2),
    Dense(num_classes, activation='softmax'),
])

model_activation.compile(
    loss='categorical_crossentropy',
    optimizer=opt_activation,
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_activation = model_activation.fit(
    x_train,
    y_train,
    batch_size=batch_size,
    epochs=epochs,
    verbose=1,
    validation_data=(x_test, y_test),
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [33]:
# Test-set loss and accuracy of the tanh model.
score = model_activation.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.65307708321
Test accuracy: 0.4056


**The accuracy decreased and the loss increased. In this experiment, the 'relu' activation function performs better than 'tanh'.**

**Change dropout rates from 0.2 to 0.1**

In [34]:
# Experiment: same settings as the reference, but with a dropout rate of 0.1
# instead of 0.2 after each hidden layer.
#
# A dedicated optimizer with the reference settings (lr=0.001, decay=1e-6) is
# created here instead of reusing the shared `opt` object that earlier models
# were already trained with, so that no optimizer state (e.g. the update
# counter that drives `decay`) carries over from an earlier run.
opt_dropout = RMSprop(lr=0.001, decay=1e-6)

model_dropout = Sequential([
    Dense(512, activation='relu', input_shape=(3072,)),
    Dropout(0.1),
    Dense(512, activation='relu'),
    Dropout(0.1),
    Dense(num_classes, activation='softmax'),
])

model_dropout.compile(
    loss='categorical_crossentropy',
    optimizer=opt_dropout,
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_dropout = model_dropout.fit(
    x_train,
    y_train,
    batch_size=batch_size,
    epochs=epochs,
    verbose=1,
    validation_data=(x_test, y_test),
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/20
Epoch 2/20
Epoch 3/20
Epoch 4/20
Epoch 5/20
Epoch 6/20
Epoch 7/20
Epoch 8/20
Epoch 9/20
Epoch 10/20
Epoch 11/20
Epoch 12/20
Epoch 13/20
Epoch 14/20
Epoch 15/20
Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [35]:
# Test-set loss and accuracy of the dropout-0.1 model.
score = model_dropout.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 1.44377016029
Test accuracy: 0.4839


**The accuracy increased and the loss decreased. An appropriate dropout rate can increase the accuracy of the model.**

**My best model is as follows**

In [36]:
# Combined configuration: four 1024-unit ReLU hidden layers with 10% dropout,
# RMSprop with a learning rate of 0.0001, batch size 128, 100 epochs.
opt_best = RMSprop(lr=0.0001, decay=1e-6)

model_best = Sequential([
    Dense(1024, activation='relu', input_shape=(3072,)),
    Dropout(0.1),
    Dense(1024, activation='relu'),
    Dropout(0.1),
    Dense(1024, activation='relu'),
    Dropout(0.1),
    Dense(1024, activation='relu'),
    Dropout(0.1),
    Dense(num_classes, activation='softmax'),
])

model_best.compile(
    optimizer=opt_best,
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

# The test split doubles as validation data for per-epoch monitoring.
history_best = model_best.fit(
    x_train,
    y_train,
    epochs=100,
    batch_size=128,
    validation_data=(x_test, y_test),
    verbose=1,
)

Train on 50000 samples, validate on 10000 samples
Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100


Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 75/100
Epoch 76/100
Epoch 77/100
Epoch 78/100
Epoch 79/100
Epoch 80/100
Epoch 81/100
Epoch 82/100
Epoch 83/100
Epoch 84/100
Epoch 85/100
Epoch 86/100
Epoch 87/100
Epoch 88/100
Epoch 89/100
Epoch 90/100
Epoch 91/100
Epoch 92/100
Epoch 93/100
Epoch 94/100
Epoch 95/100
Epoch 96/100
Epoch 97/100
Epoch 98/100
Epoch 99/100
Epoch 100/100


In [37]:
# Test-set loss and accuracy of the combined "best" model.
score = model_best.evaluate(x_test, y_test, verbose=0)
test_loss, test_accuracy = score[0], score[1]
print('Test loss:', test_loss)
print('Test accuracy:', test_accuracy)

Test loss: 2.25705060596
Test accuracy: 0.5659


**• You are expected to provide a recommendation for the best model you would recommend for classification. Which model (with parameter values) would you choose and why?**

According to the tests above, I would recommend a model trained for 100 epochs with a batch size of 128, 1024 neurons per layer, 5 layers, a learning rate of 0.0001, the 'relu' activation function, and a dropout rate of 0.1.

**• Comment on how good your model is ? Does it overfit/underfit data ? What could you do to improve the model?**

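My model reaches a test accuracy of about 56.6%, the highest of all the configurations tried, but it does not fit the data well in absolute terms. Its test loss (2.26) is much higher than the test losses of the 20-epoch experiments (roughly 1.35–1.65), which suggests that the model overfits the training data after 100 epochs. Possible improvements include stopping training earlier (early stopping on a separate validation split), using stronger regularization such as a higher dropout rate, and switching to a convolutional architecture, which is better suited to image data.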