TensorLayer provides two ways to define a model. A static model lets you build the network declaratively, layer by layer, while a dynamic model gives you full control over the forward pass.
import tensorflow as tf
from tensorlayer.layers import Input, Dropout, Dense
from tensorlayer.models import Model

def get_model(inputs_shape):
    ni = Input(inputs_shape)
    nn = Dropout(keep=0.8)(ni)
    nn = Dense(n_units=800, act=tf.nn.relu, name="dense1")(nn)  # "name" is optional
    nn = Dropout(keep=0.8)(nn)
    nn = Dense(n_units=800, act=tf.nn.relu)(nn)
    nn = Dropout(keep=0.8)(nn)
    nn = Dense(n_units=10, act=None)(nn)
    M = Model(inputs=ni, outputs=nn, name="mlp")  # "name" is optional
    return M

MLP = get_model([None, 784])
MLP.eval()  # set the model to evaluation (inference) mode
outputs = MLP(data)
The example above is a static model. A dynamic model, by contrast, is defined by subclassing Model. In this case, shapes cannot be inferred automatically, so you need to manually pass the output size of the previous layer to each new layer via the in_channels argument.
class CustomModel(Model):

    def __init__(self):
        super(CustomModel, self).__init__()
        self.dropout1 = Dropout(keep=0.8)
        self.dense1 = Dense(n_units=800, act=tf.nn.relu, in_channels=784)
        self.dropout2 = Dropout(keep=0.8)
        self.dense2 = Dense(n_units=800, act=tf.nn.relu, in_channels=800)
        self.dropout3 = Dropout(keep=0.8)
        self.dense3 = Dense(n_units=10, act=None, in_channels=800)

    def forward(self, x, foo=False):
        z = self.dropout1(x)
        z = self.dense1(z)
        z = self.dropout2(z)
        z = self.dense2(z)
        z = self.dropout3(z)
        out = self.dense3(z)
        if foo:
            out = tf.nn.softmax(out)
        return out

MLP = CustomModel()
MLP.eval()
outputs = MLP(data, foo=True)   # controls the forward here
outputs = MLP(data, foo=False)
A model behaves differently in training and evaluation: for example, dropout and the moving averages of batch normalization are active during training but disabled during evaluation. There are two ways to switch modes, shown here on the MLP model defined above:

# method 1: switch before forward
MLP.train()  # enable dropout, batch norm moving avg ...
output = MLP(train_data)
...  # training code here
MLP.eval()   # disable dropout, batch norm moving avg ...
output = MLP(test_data)
...  # testing code here

# method 2: switch while forward
output = MLP(train_data, is_train=True)
output = MLP(test_data, is_train=False)
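To make the mode switch concrete, below is a minimal sketch of one training step for the MLP. The names optimizer, train_step, x_batch, and y_batch are placeholders introduced here for illustration; the sketch assumes integer class labels and that tl.cost.cross_entropy and Model.trainable_weights behave as in the TensorLayer 2.x examples.

import tensorflow as tf
import tensorlayer as tl

optimizer = tf.optimizers.Adam(learning_rate=1e-4)

def train_step(model, x_batch, y_batch):
    model.train()  # enable dropout before the forward pass
    with tf.GradientTape() as tape:
        logits = model(x_batch)
        # y_batch: integer class labels; cross_entropy computes softmax cross entropy from logits
        loss = tl.cost.cross_entropy(logits, y_batch, name='train_loss')
    grads = tape.gradient(loss, model.trainable_weights)
    optimizer.apply_gradients(zip(grads, model.trainable_weights))
    return loss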
For a static model, share weights by calling the same layer multiple times during model creation.
# create siamese network
from tensorlayer.layers import Flatten

def create_base_network(input_shape):
    '''Base network to be shared (eq. to feature extraction).
    '''
    input = Input(shape=input_shape)
    x = Flatten()(input)
    x = Dense(128, act=tf.nn.relu)(x)
    x = Dropout(0.9)(x)
    x = Dense(128, act=tf.nn.relu)(x)
    x = Dropout(0.9)(x)
    x = Dense(128, act=tf.nn.relu)(x)
    return Model(input, x)

def get_siamese_network(input_shape):
    """Create siamese network with shared base network as layer
    """
    base_layer = create_base_network(input_shape).as_layer()  # convert model as layer
    ni_1 = Input(input_shape)
    ni_2 = Input(input_shape)
    nn_1 = base_layer(ni_1)  # call base_layer twice
    nn_2 = base_layer(ni_2)
    return Model(inputs=[ni_1, ni_2], outputs=[nn_1, nn_2])

siamese_net = get_siamese_network([None, 784])
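As a quick usage sketch, the siamese model takes a list of two input batches and returns one embedding per branch; the random inputs x1 and x2 below are placeholders assumed to be [batch, 784] float tensors.

import numpy as np
import tensorflow as tf

x1 = np.random.rand(32, 784).astype(np.float32)
x2 = np.random.rand(32, 784).astype(np.float32)

siamese_net.eval()
e1, e2 = siamese_net([x1, x2])  # both branches use the same shared weights
dist = tf.norm(e1 - e2, axis=1)  # e.g. compare embeddings with an L2 distance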
For a dynamic model, share weights by calling the same layer multiple times in the forward function.
from tensorlayer.layers import Concat

class MyModel(Model):

    def __init__(self):
        super(MyModel, self).__init__()
        self.dense_shared = Dense(n_units=800, act=tf.nn.relu, in_channels=784)
        self.dense1 = Dense(n_units=10, act=tf.nn.relu, in_channels=800)
        self.dense2 = Dense(n_units=10, act=tf.nn.relu, in_channels=800)
        self.cat = Concat()

    def forward(self, x):
        x1 = self.dense_shared(x)  # call dense_shared twice
        x2 = self.dense_shared(x)
        x1 = self.dense1(x1)
        x2 = self.dense2(x2)
        out = self.cat([x1, x2])
        return out

model = MyModel()
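A quick sanity check of the shared-weight model; the random input below is a placeholder assumed to be a [batch, 784] float tensor.

import numpy as np

data = np.random.rand(32, 784).astype(np.float32)

model.eval()
out = model(data)
print(out.shape)  # (32, 20): the two 10-unit heads concatenated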
We can inspect the model architecture by simply calling the print function.

print(MLP)
# Model(
#   (_inputlayer): Input(shape=[None, 784], name='_inputlayer')
#   (dropout): Dropout(keep=0.8, name='dropout')
#   (dense): Dense(n_units=800, relu, in_channels='784', name='dense')
#   (dropout_1): Dropout(keep=0.8, name='dropout_1')
#   (dense_1): Dense(n_units=800, relu, in_channels='800', name='dense_1')
#   (dropout_2): Dropout(keep=0.8, name='dropout_2')
#   (dense_2): Dense(n_units=10, None, in_channels='800', name='dense_2')
# )
import pprint
pprint.pprint(MLP.config) # print the model architecture
# {'inputs': '_inputlayer_1_node_0',
#  'model_architecture': [{'args': {'dtype': tf.float32,
#                                   'layer_type': 'normal',
#                                   'name': '_inputlayer_1',
#                                   'shape': [None, 784]},
#                          'class': '_InputLayer',
#                          'prev_layer': None},
#                         {'args': {'keep': 0.8,
#                                   'layer_type': 'normal',
#                                   'name': 'dropout_1'},
#                          'class': 'Dropout',
#                          'prev_layer': ['_inputlayer_1_node_0']},
#                         {'args': {'act': 'relu',
#                                   'layer_type': 'normal',
#                                   'n_units': 800,
#                                   'name': 'dense_1'},
#                          'class': 'Dense',
#                          'prev_layer': ['dropout_1_node_0']},
#                         {'args': {'keep': 0.8,
#                                   'layer_type': 'normal',
#                                   'name': 'dropout_2'},
#                          'class': 'Dropout',
#                          'prev_layer': ['dense_1_node_0']},
#                         {'args': {'act': 'relu',
#                                   'layer_type': 'normal',
#                                   'n_units': 800,
#                                   'name': 'dense_2'},
#                          'class': 'Dense',
#                          'prev_layer': ['dropout_2_node_0']},
#                         {'args': {'keep': 0.8,
#                                   'layer_type': 'normal',
#                                   'name': 'dropout_3'},
#                          'class': 'Dropout',
#                          'prev_layer': ['dense_2_node_0']},
#                         {'args': {'act': None,
#                                   'layer_type': 'normal',
#                                   'n_units': 10,
#                                   'name': 'dense_3'},
#                          'class': 'Dense',
#                          'prev_layer': ['dropout_3_node_0']}],
#  'name': 'mlp',
#  'outputs': 'dense_3_node_0',
#  'version_info': {'backend': 'tensorflow',
#                   'backend_version': '2.0.0-alpha0',
#                   'save_date': None,
#                   'tensorlayer_version': '2.1.0',
#                   'training_device': 'gpu'}}
We can get specific weights by indexing or by layer name.
# indexing
all_weights = MLP.all_weights
some_weights = MLP.all_weights[1:3]
# naming
some_weights = MLP.get_layer('dense1').all_weights
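Each entry in these lists is a tf.Variable, so a small sketch like the one below can be used to inspect what the model holds; the exact variable names depend on the layer names chosen above.

for w in MLP.all_weights:
    print(w.name, w.shape)  # prints each variable's name and shape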
We provide two ways to save and restore models:
# save weights only; the architecture must be re-created in code before loading
MLP.save_weights('model_weights.h5')  # by default, file will be in hdf5 format
MLP.load_weights('model_weights.h5')

# save the whole model (architecture + weights); when using Model.load(),
# there is no need to re-implement or declare the architecture of the model explicitly in code
MLP.save('model.h5', save_weights=True)
MLP = Model.load('model.h5', load_weights=True)
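To illustrate the difference between the two approaches, here is a sketch of restoring in a fresh session. It assumes the static MLP from the beginning of this section, so the get_model helper is available for the weights-only path.

# weights-only restore: re-create the architecture first, then load weights into it
MLP = get_model([None, 784])
MLP.load_weights('model_weights.h5')

# whole-model restore: architecture and weights both come from the file
MLP = Model.load('model.h5', load_weights=True)
MLP.eval()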