In [4]:
""" DenseNet Model for cifar10 """

# Import libraries
import numpy as np
import tensorflow as tf
import keras
import keras.backend as K 
from keras.utils import np_utils
from keras.datasets import cifar10
from keras.models import Sequential
from keras.optimizers import Optimizer
from keras.callbacks import EarlyStopping
from keras.preprocessing.image import ImageDataGenerator
from keras.layers.core import Dense, Dropout, Activation, Flatten
from keras.layers.convolutional import Conv2D
from keras.layers.pooling import MaxPooling2D

import densenet

# Seed both NumPy and TensorFlow with the same value for reproducibility
SEED = 42
np.random.seed(SEED)
tf.set_random_seed(SEED)

In [2]:
# Load CIFAR-10 and convert both image arrays to float32
(x_train, y_train), (x_test, y_test) = cifar10.load_data()
x_train, x_test = (images.astype('float32') for images in (x_train, x_test))

# z-score: a single scalar mean/std is computed over every axis of the
# training images, then applied to both the train and the test images
mean = np.mean(x_train, axis=(0, 1, 2, 3))
std = np.std(x_train, axis=(0, 1, 2, 3))
x_train, x_test = (
    (images - mean) / (std + 1e-7)  # small epsilon guards against division by zero
    for images in (x_train, x_test)
)

# One-hot encode the integer labels
num_classes = 10
y_train, y_test = (
    np_utils.to_categorical(labels, num_classes)
    for labels in (y_train, y_test)
)

In [5]:
# Data augmentation: random rotations, shifts and horizontal flips.
# Every centering / normalisation / whitening option is switched off here;
# the z-score normalisation is done by hand on the arrays instead.
datagen = ImageDataGenerator(
    # geometric augmentations
    rotation_range=15,
    width_shift_range=0.1,
    height_shift_range=0.1,
    horizontal_flip=True,
    vertical_flip=False,
    # statistics-based preprocessing (all disabled)
    featurewise_center=False,
    featurewise_std_normalization=False,
    samplewise_center=False,
    samplewise_std_normalization=False,
    zca_whitening=False
)
# NOTE(review): with all featurewise/ZCA options disabled this fit call
# presumably does not influence the generated batches - confirm and drop if so.
datagen.fit(x_train)

In [3]:
def swish(x):
    """Swish activation: the input scaled by its own sigmoid, x * sigmoid(x)."""
    gate = K.sigmoid(x)
    return x * gate

def e_swish_1(x):
    """Custom activation 1: max(0, x * (2 - sigmoid(x))).

    Negative inputs are clamped to zero (as relu does); for non-negative
    inputs the value equals 2*x - swish(x).
    """
    mirrored = x * (2 - K.sigmoid(x))
    return K.maximum(0.0, mirrored)

def e_swish_2(x):
    """Custom activation 2: element-wise max of swish(x) and x * (2 - sigmoid(x)).

    For negative inputs the swish term x * sigmoid(x) is the larger one; for
    positive inputs the mirrored term 2*x - swish(x) is.
    """
    gate = K.sigmoid(x)
    plain = x * gate
    mirrored = x * (2 - gate)
    return K.maximum(plain, mirrored)

In [4]:
# Activations under comparison: custom callables plus Keras built-ins given by name
activations = [e_swish_1, e_swish_2, swish, "relu", "sigmoid", "tanh"]
# Printable label for each entry: strings stay as they are, callables use __name__
names = [act_fn if isinstance(act_fn, str) else act_fn.__name__
         for act_fn in activations]
print(names)

['e_swish_1', 'e_swish_2', 'swish', 'relu', 'sigmoid', 'tanh']


In [8]:
###################
# Construct model #
###################

# Hyper-parameters forwarded to densenet.DenseNet below
act = "relu"          # activation passed as the first argument of the model builder
depth = 40
nb_dense_block = 3
nb_filter = 16
growth_rate = 12
dropout_rate = 0.0
weight_decay = 1e-4

# The class count comes from `num_classes` (the same value used to one-hot
# encode the labels) instead of a second hard-coded 10, so the label encoding
# and the model's class-count argument cannot drift apart.
model = densenet.DenseNet(
                          act, num_classes,
                          (32, 32, 3),
                          depth,
                          nb_dense_block,
                          growth_rate,
                          nb_filter,
                          dropout_rate=dropout_rate,
                          weight_decay=weight_decay
                         )

# Model output
model.summary()

__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input_1 (InputLayer)            (None, 32, 32, 3)    0                                            
__________________________________________________________________________________________________
initial_conv2D (Conv2D)         (None, 32, 32, 16)   432         input_1[0][0]                    
__________________________________________________________________________________________________
batch_normalization_1 (BatchNor (None, 32, 32, 16)   128         initial_conv2D[0][0]             
__________________________________________________________________________________________________
activation_1 (Activation)       (None, 32, 32, 16)   0           batch_normalization_1[0][0]      
__________________________________________________________________________________________________
conv2d_1 (

In [None]:
####################
# Network training #
####################
# Mini-batch size and number of epochs per fit_generator call
batch_size = 64
epochs = 30

# Build optimizer: SGD with Nesterov momentum and learning-rate decay.
# The instance has to be bound to `opt` because model.compile() reads it.
opt = keras.optimizers.SGD(lr=0.1, momentum=0.9, decay=1e-4, nesterov=True)
model.compile(loss='categorical_crossentropy', optimizer=opt, metrics=["accuracy"])

print("Training up to 50%")
# Five back-to-back rounds of `epochs` epochs each. After every round the
# weights are written to the same file (overwriting the previous round) and
# the per-epoch metric history of that round is printed.
for i in range(5):
    his = model.fit_generator(
        datagen.flow(x_train, y_train, batch_size=batch_size),
        steps_per_epoch=x_train.shape[0] // batch_size,
        epochs=epochs,
        verbose=1,
        validation_data=(x_test, y_test))
    model.save_weights('densenet.h5')
    print(his.history)

In [10]:


# One more training run on augmented batches with the current
# `batch_size` / `epochs` settings, then persist the weights.
print("Training")
model.fit_generator(
    datagen.flow(x_train, y_train, batch_size=batch_size),
    steps_per_epoch=x_train.shape[0] // batch_size,
    epochs=epochs,
    verbose=1,
    validation_data=(x_test, y_test))
model.save_weights('densenet.h5')

Training
Epoch 1/1


In [12]:
####################
# Network training #
####################
batch_size = 64
epochs = 15

# Number of training rounds. The original loop header (`for i in range()`)
# was incomplete and did not parse.
# NOTE(review): 20 is taken from the 20 "Training" lines in this cell's saved
# output - confirm the intended number of rounds.
n_rounds = 20

# Each round trains for `epochs` epochs and saves its own checkpoint, so the
# weights of every round are kept in a separate file (densenet_<i>.h5).
for i in range(n_rounds):
    print("Training")
    his = model.fit_generator(
        datagen.flow(x_train, y_train, batch_size=batch_size),
        steps_per_epoch=x_train.shape[0] // batch_size,
        epochs=epochs,
        verbose=1,
        validation_data=(x_test, y_test))
    model.save_weights('densenet_'+str(i)+'.h5')

Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
Training
Epoch 1/1
