In [1]:
import tensorflow as tf
import tensorflow_datasets as tfds
import numpy as np
import pandas as pd

### Helper Functions

Function to help intialize random weights for fully connected or convolutional layers, we leave the shape attribute as a parameter for this.

In [2]:
def init_weights(shape):
    init_random_dist = tf.random.truncated_normal(shape, stddev=0.1)
    return tf.Variable(init_random_dist)

Same as init_weights, but for the biases

In [3]:
def init_bias(shape):
    init_bias_vals = tf.constant(0.1, shape=shape)
    return tf.Variable(init_bias_vals)

Create a 2D convolution using builtin conv2d from TF. From those docs:

Computes a 2-D convolution given 4-D `input` and `filter` tensors.

Given an input tensor of shape `[batch, in_height, in_width, in_channels]`
and a filter / kernel tensor of shape
`[filter_height, filter_width, in_channels, out_channels]`, this op
performs the following:

1. Flattens the filter to a 2-D matrix with shape
   `[filter_height * filter_width * in_channels, output_channels]`.
2. Extracts image patches from the input tensor to form a *virtual*
   tensor of shape `[batch, out_height, out_width,
   filter_height * filter_width * in_channels]`.
3. For each patch, right-multiplies the filter matrix and the image patch
   vector.


In [4]:
def conv2d(x, W):
    return tf.nn.conv2d(x, W, strides=[1, 1, 1, 1], padding='SAME')

Create a max pooling layer, again using built in TF functions:

Performs the max pooling on the input.

    Args:
      value: A 4-D `Tensor` with shape `[batch, height, width, channels]` and
        type `tf.float32`.
      ksize: A list of ints that has length >= 4.  The size of the window for
        each dimension of the input tensor.
      strides: A list of ints that has length >= 4.  The stride of the sliding
        window for each dimension of the input tensor.
      padding: A string, either `'VALID'` or `'SAME'`. 

In [5]:
def max_pool_2by2(x):
    return tf.nn.max_pool(x, ksize=[1, 2, 2, 1],
                          strides=[1, 2, 2, 1], padding='SAME')

Using the conv2d function, we'll return an actual convolutional layer here that uses an ReLu activation.

In [6]:
def convolutional_layer(input_x, shape):
    W = init_weights(shape)
    b = init_bias([shape[3]])
    return tf.nn.relu(conv2d(input_x, W) + b)

This is a normal fully connected layer

In [7]:
def normal_full_layer(input_layer, size):
    input_size = int(input_layer.get_shape()[1])
    W = init_weights([input_size, size])
    b = init_bias([size])
    return tf.matmul(input_layer, W) + b

### Layers

In [8]:
@tf.function
def layers(x_image, rate):
    # Using a 6by6 filter here, used 5by5 in video, you can play around with the filter size
    # You can change the 32 output, that essentially represents the amount of filters used
    # You need to pass in 32 to the next input though, the 1 comes from the original input of 
    # a single image.
    convo_1 = convolutional_layer(x_image,shape=[6,6,1,32])
    convo_1_pooling = max_pool_2by2(convo_1)
    # Using a 6by6 filter here, used 5by5 in video, you can play around with the filter size
    # You can actually change the 64 output if you want, you can think of that as a representation
    # of the amount of 6by6 filters used.
    convo_2 = convolutional_layer(convo_1_pooling,shape=[6,6,32,64])
    convo_2_pooling = max_pool_2by2(convo_2)
    # Why 7 by 7 image? Because we did 2 pooling layers, so (28/2)/2 = 7
    # 64 then just comes from the output of the previous Convolution
    convo_2_flat = tf.reshape(convo_2_pooling,[-1,7*7*64])
    full_layer_one = tf.nn.relu(normal_full_layer(convo_2_flat,1024))
    
    full_one_dropout = tf.nn.dropout(full_layer_one, rate=rate)
    
    y_pred = normal_full_layer(full_one_dropout,10)
    
    return y_pred

### Loss Function

In [9]:
@tf.function
def loss(x, rate, y_true):
    y_pred = layers(x, rate)
    cross_entropy = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y_true, logits=y_pred))
        
    return cross_entropy

### Optimizer

In [10]:
optimizer = tf.optimizers.Adam(learning_rate=0.0001)

### Load Data

In [11]:
ds_train, ds_test = tfds.load(name="mnist", split=["train", "test"])

In [12]:
# Reserve 5,000 samples for validation
ds_validation = ds_train.take(5000)
ds_train = ds_train.skip(5000)

In [13]:
train_images = []
train_labels = []

In [14]:
for features in ds_train.take(-1):
    image, label = features["image"], features["label"]
    train_images.append(image)
    train_labels.append(label)

In [15]:
# One hot encoding label
label_pd = pd.DataFrame(np.asarray(train_labels))
label_pd = pd.get_dummies(label_pd, columns=[0],prefix='', prefix_sep='')

In [16]:
encode_label = label_pd.values.tolist()

In [21]:
def do_train():
    steps = 5000
    batch = 50
    index = 0

    for i in range(steps):
        
        image_batch = train_images[index:(index+batch)]
        label_batch = train_labels[index:(index+batch)]
        rate = tf.cast(0.5, tf.float32)

        for j in range(len(image_batch)):
            x = tf.Variable(image_batch[j])
            y_true = tf.Variable(tf.cast(label_batch[j], tf.float16))
            loss_fn = loss(x, rate, y_true)
            
            train = optimizer.minimize(loss_fn,[x, y_true, rate])
            print(train)
        
        # PRINT OUT A MESSAGE EVERY 100 STEPS
        if i%100 == 0:
            
            print('Currently on step {}'.format(i))
            print('Accuracy is:')
            # Test the Train Model
            rate = tf.cast(1.0, tf.float32)
            y_pred = layers(image_batch, rate)
            
            matches = tf.equal(tf.argmax(y_pred,1),tf.argmax(label_batch,1))
            acc = tf.reduce_mean(tf.cast(matches,tf.float32))

            train = optimizer.minimize(loss,[x_image, y_true, rate])
            print('\n')
            
        index+=batch

In [22]:
do_train()

TypeError: in user code:

    <ipython-input-9-351042113305>:3 loss  *
        y_pred = layers(x, rate)
    c:\users\admin\appdata\local\programs\python\python38\lib\site-packages\tensorflow\python\eager\def_function.py:780 __call__  **
        result = self._call(*args, **kwds)
    c:\users\admin\appdata\local\programs\python\python38\lib\site-packages\tensorflow\python\eager\def_function.py:807 _call
        return self._stateless_fn(*args, **kwds)  # pylint: disable=not-callable

    TypeError: 'NoneType' object is not callable
