In [1]:
# https://keras.io/
!pip install -q keras
import keras

Using TensorFlow backend.


In [2]:
from google.colab import drive
drive.mount('/content/drive/')

Go to this URL in a browser: https://accounts.google.com/o/oauth2/auth?client_id=947318989803-6bn6qk8qdgf4n4g3pfee6491hc0brc4i.apps.googleusercontent.com&redirect_uri=urn%3Aietf%3Awg%3Aoauth%3A2.0%3Aoob&scope=email%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fdocs.test%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fdrive%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fdrive.photos.readonly%20https%3A%2F%2Fwww.googleapis.com%2Fauth%2Fpeopleapi.readonly&response_type=code

Enter your authorization code:
··········
Mounted at /content/drive/


In [3]:
import os
os.getcwd()

'/content'

In [0]:
os.chdir("./drive/My Drive/Colab Notebooks")

In [0]:
import keras
from keras.datasets import cifar10
from keras.models import Model, Sequential
from keras.layers import Dense, Dropout, Flatten, Input, AveragePooling2D, merge, Activation
from keras.layers import Conv2D, MaxPooling2D, BatchNormalization
from keras.layers import Concatenate
from keras.optimizers import Adam
from keras.regularizers import l2
from keras.preprocessing.image import ImageDataGenerator

In [0]:
# this part will prevent tensorflow to allocate all the avaliable GPU Memory
# backend
import tensorflow as tf
from keras import backend as K

# Don't pre-allocate memory; allocate as-needed
config = tf.ConfigProto()
config.gpu_options.allow_growth = True

# Create a session with the above options specified.
K.tensorflow_backend.set_session(tf.Session(config=config))

In [7]:
num_classes = 10
# Load CIFAR10 Data
(x_train, y_train), (x_test, y_test) = cifar10.load_data()
img_height, img_width, channel = x_train.shape[1],x_train.shape[2],x_train.shape[3]

# convert to one hot encoing 
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)

Downloading data from https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz


In [0]:
x_train_mean = x_train.mean(axis =0)
x_test_mean = x_test.mean(axis=0)
x_train_std = x_train.std(axis=0)
x_test_std = x_test.std(axis=0)
x_train = (x_train - x_train_mean)/x_train_std
x_test = (x_test - x_test_mean)/x_test_std

In [0]:
# Hyperparameters
batch_size = 64
l = 16
num_filter = 12
compression = 0.5
dropout_rate = 0.2

In [0]:
def conv_layer(input, num_filter, dropout_rate, l2_reg, kernel_size =3):
  BatchNorm = BatchNormalization(gamma_regularizer=l2(l2_reg), beta_regularizer=l2(l2_reg))(input)
  relu = Activation('relu')(BatchNorm)
  conv = Conv2D(num_filter, kernel_size, padding = 'same', kernel_regularizer = l2(l2_reg), use_bias = False)(relu)
  if dropout_rate>0:
    conv = Dropout(dropout_rate)(conv)
  return conv

In [0]:
# bottleneck layer
def bottleneck_layer(input, num_filter, dropout_rate, l2_reg, kernel_size=3):
  conv1 = conv_layer(input, num_filter*4, dropout_rate, l2_reg, kernel_size=1)
  conv3 = conv_layer(conv1, num_filter, dropout_rate, l2_reg, kernel_size=kernel_size)
  return conv3

In [0]:
# Dense Block
def add_denseblock(input, num_filter, dropout_rate, l2_reg, bottleneck=False, kernel_size=3):
    temp = input
    for _ in range(l):
        if bottleneck:
          output = bottleneck_layer(temp, num_filter, dropout_rate, l2_reg, kernel_size=kernel_size)
        else:
          output = conv_layer(temp, num_filter, dropout_rate, l2_reg, kernel_size=3)
    
        concat = Concatenate(axis=-1)([temp,output])
        temp = concat
        
    return temp

In [0]:
def add_transition(input, num_filter, dropout_rate, l2_reg):
    output = conv_layer(input, num_filter, dropout_rate, l2_reg, kernel_size=1)
    avg = AveragePooling2D(pool_size=(2,2))(output)
    return avg

In [0]:
def output_layer(input, l2_reg):
    BatchNorm = BatchNormalization(gamma_regularizer=l2(l2_reg), beta_regularizer=l2(l2_reg))(input)
    relu = Activation('relu')(BatchNorm)
    AvgPooling = AveragePooling2D(pool_size=(2,2))(relu)
    flat = Flatten()(AvgPooling)
    output = Dense(num_classes, activation='softmax')(flat)
    
    return output

In [0]:
num_blocks = 3
num_channels = 32
l2_reg = 1e-4
input = Input(shape=(img_height, img_width, channel,))
out = Conv2D(num_channels, (3,3), use_bias=False, kernel_regularizer = l2(l2_reg), padding='same')(input)

for i in range(num_blocks-1):
  out = add_denseblock(out, num_filter=num_filter, dropout_rate=dropout_rate, l2_reg= l2_reg, bottleneck=True)
  num_channels += l*num_filter
  num_channels = int(num_channels*compression)
  out = add_transition(out, num_filter=num_channels, dropout_rate=dropout_rate, l2_reg= l2_reg)

out = add_denseblock(out, num_filter=num_filter, dropout_rate=dropout_rate, l2_reg= l2_reg, bottleneck=True)

output = output_layer(out, l2_reg = 1e-4,)


In [16]:
model = Model(inputs=[input], outputs=[output])
model.summary()

__________________________________________________________________________________________________
Layer (type)                    Output Shape         Param #     Connected to                     
input_1 (InputLayer)            (None, 32, 32, 3)    0                                            
__________________________________________________________________________________________________
conv2d_1 (Conv2D)               (None, 32, 32, 32)   864         input_1[0][0]                    
__________________________________________________________________________________________________
batch_normalization_1 (BatchNor (None, 32, 32, 32)   128         conv2d_1[0][0]                   
__________________________________________________________________________________________________
activation_1 (Activation)       (None, 32, 32, 32)   0           batch_normalization_1[0][0]      
__________________________________________________________________________________________________
conv2d_2 (

In [0]:
from keras import optimizers
from keras import callbacks

In [0]:
# from keras import backend as K
# def scheduler(epoch):
#   if epoch > 50 and epoch <= 100:
#     K.set_value(model.optimizer.lr, 0.01)
#   elif epoch >100:
#     K.set_value(model.optimizer.lr, 0.001)
#   return K.get_value(model.optimizer.lr)

# change_lr = callbacks.LearningRateScheduler(scheduler)

In [0]:
checkpointer = callbacks.ModelCheckpoint(filepath= 'DNST_NO_AUG.{epoch:02d}-{val_loss:.2f}.hdf5', 
                                         monitor = 'val_acc',
                                         mode = 'max',
                                         save_best_only = True,
                                         save_weights_only = True,
                                         period =10)

In [0]:
sgd = optimizers.SGD(lr = 0.1, decay = 1e-6, momentum=0.9, nesterov=True )

In [0]:
# determine Loss function and Optimizer
model.compile(loss='categorical_crossentropy',
              optimizer=sgd,
              metrics=['accuracy'])

In [22]:
model.fit(x_train, y_train,
          batch_size=64,
          epochs=50,
          verbose=1,
          validation_data=(x_test, y_test),
          callbacks=[checkpointer])

Train on 50000 samples, validate on 10000 samples
Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


<keras.callbacks.History at 0x7f2215f84908>

In [23]:
model.save("DNST_No_Aug_epochs_50.h5")
print("Saved model to disk")

Saved model to disk


In [0]:
from keras.models import load_model
model = load_model("DNST_No_Aug_epochs_80.h5")

In [0]:
model.fit(x_train, y_train,
          batch_size=64,
          epochs=55,
          verbose=1,
          validation_data=(x_test, y_test),
          callbacks=[checkpointer])

In [22]:
# Test the model
score = model.evaluate(x_test, y_test, verbose=1)
print('Test loss:', score[0])
print('Test accuracy:', score[1])

Test loss: 1.1033497195243835
Test accuracy: 0.7567


In [23]:
# Save the trained weights in to .h5 format
model.save("./DNST_No_Aug_Epoch_125.h5")
print("Saved model to disk")

Saved model to disk


In [0]:
from keras.models import load_model
model = load_model('DNST_No_Aug_Epoch_125.h5')

In [21]:
# Changing learning rate to 0.01
print(K.get_value(model.optimizer.lr)) # current learning rate
K.set_value(model.optimizer.lr, 0.01)
K.get_value(model.optimizer.lr)

0.1


In [0]:
model.fit(x_train, y_train,
          batch_size=64,
          epochs=65,
          verbose=1,
          validation_data=(x_test, y_test),
          callbacks=[checkpointer])

  


Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50


In [0]:
# Test the model
score = model.evaluate(x_test, y_test, verbose=1)
print('Test loss:', score[0])
print('Test accuracy:', score[1])

In [0]:
# Save the trained weights in to .h5 format
model.save("./DNST_No_Aug_Epoch_190.h5")
print("Saved model to disk")

In [26]:
model = load_model('DNST_No_Aug_Epoch_190.h5')
# Changing learning rate to 0.001
print(K.get_value(model.optimizer.lr)) # current learning rate
K.set_value(model.optimizer.lr, 0.001)
K.get_value(model.optimizer.lr)

  


Epoch 1/30
Epoch 2/30
Epoch 3/30
Epoch 4/30
Epoch 5/30
Epoch 6/30
Epoch 7/30
Epoch 8/30
Epoch 9/30
Epoch 10/30
Epoch 11/30
Epoch 12/30
Epoch 13/30
Epoch 14/30
Epoch 15/30
Epoch 16/30
Epoch 17/30
Epoch 18/30
Epoch 19/30
Epoch 20/30
Epoch 22/30
Epoch 23/30
Epoch 24/30
Epoch 25/30
Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


<keras.callbacks.History at 0x7fe7f8684358>

In [0]:
model.fit(x_train, y_train,
          batch_size=64,
          epochs=60,
          verbose=1,
          validation_data=(x_test, y_test),
          callbacks=[checkpointer])

In [27]:
# Test the model
score = model.evaluate(x_test, y_test, verbose=1)
print('Test loss:', score[0])
print('Test accuracy:', score[1])

Test loss: 0.5625957227706909
Test accuracy: 0.8707


In [0]:
# Save the trained weights in to .h5 format
model.save("./DNST_No_Aug_Epoch_250.h5")
print("Saved model to disk")