In [1]:
import tensorflow as tf
import matplotlib.pyplot as plt
from tensorflow import keras
from tensorflow.keras import layers

In [2]:
# Training hyperparameters, kept equal to the values the training cell passes
# to model.fit (batch_size=64, epochs=50) so this cell describes the run that
# actually happens.
batch_size = 64
num_classes = 100  # Number of classes in the dataset
epochs = 50

# Load the CIFAR-100 train/test splits as (images, labels) pairs.
(x_train, y_train), (x_test, y_test) = tf.keras.datasets.cifar100.load_data()
print('x_train shape:', x_train.shape)
print('y_train shape:', y_train.shape)
print(x_train.shape[0], 'train samples')
print(x_test.shape[0], 'test samples')

Downloading data from https://www.cs.toronto.edu/~kriz/cifar-100-python.tar.gz
x_train shape: (50000, 32, 32, 3)
y_train shape: (50000, 1)
50000 train samples
10000 test samples


In [3]:
# Cast the images to float32 and divide by 255 (maps 8-bit pixel values into
# [0, 1] -- assumes the loader returns 0..255 intensities).
# NOTE: x_train / x_test are rebound here, so running this cell a second time
# would divide by 255 again.
x_train = x_train.astype('float32') / 255
x_test = x_test.astype('float32') / 255

# One-hot encode the class labels: each label array becomes a binary class
# matrix with `num_classes` columns.
y_train, y_test = (
    tf.keras.utils.to_categorical(labels, num_classes)
    for labels in (y_train, y_test)
)

In [4]:
def efficonvres(projection_dim):
    """Create a two-branch block that can be applied to a Keras tensor.

    The block starts with a grouped 3x3 convolution ("stem") and then splits:

    * convolutional branch: DepthwiseConv2D -> BatchNormalization -> swish,
      then DepthwiseConv2D -> LayerNormalization -> GELU;
    * dense branch: LayerNormalization -> Dense(4 * projection_dim) -> GELU
      -> Dense(projection_dim).

    The two branch outputs are summed. The block input itself is not added
    back into the result.

    Args:
        projection_dim: Used as both `filters` and `groups` of the stem
            convolution and as the width of the final Dense layer.

    Returns:
        A function `apply(inputs)` that builds the layers, wires them onto
        `inputs`, and returns the summed output tensor.
    """

    def apply(inputs):
        # Stem: 3x3 convolution with one group per output filter.
        stem = layers.Conv2D(
            filters=projection_dim,
            kernel_size=3,
            padding="same",
            groups=projection_dim,
        )(inputs)

        # Convolutional branch. Layers are created in the order they are
        # applied so auto-generated layer names follow the data flow.
        conv_branch = stem
        for layer in (
            layers.DepthwiseConv2D(kernel_size=3, padding="same", use_bias=False),
            layers.BatchNormalization(axis=3),  # axis 3 = channels for NHWC input
            layers.Activation("swish"),
            layers.DepthwiseConv2D(kernel_size=3, padding="same", use_bias=False),
            layers.LayerNormalization(epsilon=1e-6),
            layers.Activation("gelu"),
        ):
            conv_branch = layer(conv_branch)

        # Dense branch: normalise, expand to 4x width, then project back.
        dense_branch = stem
        for layer in (
            layers.LayerNormalization(epsilon=1e-6),
            layers.Dense(4 * projection_dim),
            layers.Activation("gelu"),
            layers.Dense(projection_dim),
        ):
            dense_branch = layer(dense_branch)

        # Merge the two branches by element-wise addition.
        return layers.Add()([dense_branch, conv_branch])

    return apply

# Channel width of each stage. Every stage is a 3x3 GELU convolution that sets
# the width, followed by one efficonvres block of the same width.
dims = [32, 64, 128, 256]

inputs = tf.keras.Input(shape=(32, 32, 3))
x = layers.Conv2D(filters=128, kernel_size=3, padding="same", activation='gelu')(inputs)
# Iterate over the widths directly so the number of stages always follows
# `dims` instead of a separately hard-coded loop bound.
for dim in dims:
    x = layers.Conv2D(filters=dim, kernel_size=3, padding="same", activation='gelu')(x)
    x = efficonvres(dim)(x)
x = layers.GlobalAveragePooling2D(name="avg_pool")(x)
# The head width comes from `num_classes`, the same constant used to one-hot
# encode the labels, so the two cannot drift apart.
output = layers.Dense(num_classes, activation='softmax')(x)
model = keras.Model(inputs=inputs, outputs=output)

In [5]:
# Adam optimizer with a fixed learning rate of 1e-4.
opt = keras.optimizers.Adam(learning_rate=1e-4)

# Categorical cross-entropy matches the one-hot labels and softmax output.
model.compile(
    optimizer=opt,
    loss="categorical_crossentropy",
    metrics=["accuracy"],
)

In [6]:
# Train for 50 epochs with mini-batches of 64. The test split is passed as
# validation data, so the per-epoch validation metrics are computed on the
# test set.
model.fit(
    x=x_train,
    y=y_train,
    batch_size=64,
    epochs=50,
    validation_data=(x_test, y_test),
)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


<keras.callbacks.History at 0x7f2e7aba7a50>

In [7]:
# Write the trained model to "efficonvres_100.h5" (a path relative to the
# current working directory).
model.save(filepath="efficonvres_100.h5")