# G Neural Networks Overfitting
_6 points_

- Train a neural net and prevent overfitting by regularization. 
- You can use any combination of regularizers we saw in class.
- Use the train and test splits in the data to evaluate the model.

In [1]:
import keras
from keras.datasets import cifar10
from keras.models import Sequential
from keras.layers import Dense, Flatten, BatchNormalization
from keras.layers import Conv2D, MaxPooling2D, Dropout, Activation
from keras import backend as K
from keras.utils import to_categorical
from keras import regularizers

Using TensorFlow backend.


In [None]:
# Training hyperparameters: epochs and batch_size may be tuned freely.
epochs = 20
batch_size = 64

# Number of label classes. This value MUST remain at 10!
image_classes = 10

In [None]:
# Load the predefined CIFAR-10 train/test split.
(x_train, y_train), (x_test, y_test) = cifar10.load_data()

# Scale the pixel values from the 0..255 integer range to floats in [0, 1].
# Feeding raw 0..255 inputs into the first convolution pushes its saturating
# activation to the flat regions and makes optimisation needlessly hard.
x_train = x_train.astype("float32") / 255.0
x_test = x_test.astype("float32") / 255.0

# One-hot encode the integer class labels for categorical cross-entropy.
y_train = to_categorical(y_train, image_classes)
y_test = to_categorical(y_test, image_classes)

In [None]:
# Convolutional classifier for the CIFAR data: three stages of
# Conv -> BatchNorm -> Conv -> BatchNorm -> MaxPool -> Dropout, followed by a
# softmax classification layer.
#
# Regularisers in use: L2 weight decay on the convolution kernels of the first
# two stages, batch normalisation after every convolution, and dropout with an
# increasing rate after every stage.
decay = 1e-4  # L2 penalty factor for the regularised convolution kernels


def _add_conv_stage(net, filters, kernel_sizes, dropout_rate,
                    l2_decay=None, input_shape=None):
    """Append one convolutional stage to ``net``.

    A stage is one ``Conv2D`` + ``BatchNormalization`` pair per entry in
    ``kernel_sizes``, followed by 2x2 max pooling and dropout.

    Args:
        net: The ``Sequential`` model to extend in place.
        filters: Number of filters for every convolution in the stage.
        kernel_sizes: Sequence of kernel sizes, one per convolution.
        dropout_rate: Dropout rate applied after the pooling layer.
        l2_decay: L2 penalty factor for the convolution kernels, or ``None``
            to leave the kernels unregularised.
        input_shape: Shape of one input sample; only pass this for the very
            first stage of the model.
    """
    for position, kernel_size in enumerate(kernel_sizes):
        conv_kwargs = {
            "kernel_size": kernel_size,
            "activation": "hard_sigmoid",
            # "same" padding keeps the spatial size through each convolution.
            # With the default "valid" padding the feature map shrinks
            # 32 -> 28 -> 26 -> 13 -> 11 -> 9 -> 4 -> 2 -> 0, so the last
            # convolution cannot be built.
            "padding": "same",
        }
        if l2_decay is not None:
            # A fresh regulariser instance per layer, as in the original code.
            conv_kwargs["kernel_regularizer"] = regularizers.l2(l2_decay)
        if position == 0 and input_shape is not None:
            # Only the first layer of a Sequential model needs the input shape.
            conv_kwargs["input_shape"] = input_shape
        net.add(Conv2D(filters, **conv_kwargs))
        net.add(BatchNormalization())
    net.add(MaxPooling2D(pool_size=(2, 2)))
    net.add(Dropout(dropout_rate))


model = Sequential()
_add_conv_stage(model, 32, [(5, 5), (3, 3)], 0.2,
                l2_decay=decay, input_shape=(32, 32, 3))
_add_conv_stage(model, 64, [(3, 3), (3, 3)], 0.4, l2_decay=decay)
# NOTE(review): the last stage carried no L2 penalty in the original
# configuration; that is preserved here - confirm it is deliberate.
_add_conv_stage(model, 128, [(3, 3), (3, 3)], 0.5)

model.add(Flatten())
# Softmax yields a probability distribution over the classes, which is what
# the categorical cross-entropy loss expects; a per-unit sigmoid does not.
model.add(Dense(image_classes, activation="softmax"))

In [None]:
# Configure training: categorical cross-entropy loss, the Adam optimiser,
# and accuracy reported alongside the loss.
model.compile(
    optimizer="adam",
    loss="categorical_crossentropy",
    metrics=["accuracy"],
)

# Print the layer-by-layer overview of the network.
model.summary()

In [None]:
# Sample budget: the first `train_size` training samples are used for fitting
# and the first `test_size` test samples for per-epoch validation.
train_size, test_size = 5000, 8000

# Fail fast when the test labels do not have the expected shape.
if y_test.shape != (10000, 10):
    raise AttributeError("y_test.shape must be (10000, 10) but is {}".format(y_test.shape))

# The trailing ';' keeps the notebook from echoing the return value of fit().
model.fit(
    x_train[:train_size],
    y_train[:train_size],
    batch_size=batch_size,
    epochs=epochs,
    shuffle=True,
    validation_data=(x_test[:test_size], y_test[:test_size]),
);

In [None]:
# Score the model on the test samples from index `test_size` onwards.
score = model.evaluate(
    x_test[test_size:],
    y_test[test_size:],
    verbose=0,
)

# score[0] is printed as the loss, score[1] as the accuracy.
test_loss, test_accuracy = score[0], score[1]
print("Test loss:", test_loss)
print("Test accuracy:", test_accuracy)