# Chapter 3 Deep Learning with Python

Some code snippets from chapter 3 of Deep Learning with Python. 

In [1]:
import tensorflow as tf

In [2]:
# Check for TensorFlow GPU access
print(f"TensorFlow has access to the following devices:\n{tf.config.list_physical_devices()}")

# See TensorFlow version
print(f"TensorFlow version: {tf.__version__}")

TensorFlow has access to the following devices:
[PhysicalDevice(name='/physical_device:CPU:0', device_type='CPU'), PhysicalDevice(name='/physical_device:GPU:0', device_type='GPU')]
TensorFlow version: 2.8.0


In [15]:
print("Num GPUs Available: ", len(tf.config.list_physical_devices('GPU')))

Num GPUs Available:  1


# Benchmarking CPU cs GPU performance on M1 macs

Run the Keras MNIST example on both CPU and GPU and compare the time taken for each.

In [4]:
import numpy as np
from tensorflow import keras
from tensorflow.keras import layers


In [5]:
# Model / data parameters
num_classes = 10
input_shape = (28, 28, 1)

# the data, split between train and test sets
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()

# Scale images to the [0, 1] range
x_train = x_train.astype("float32") / 255
x_test = x_test.astype("float32") / 255
# Make sure images have shape (28, 28, 1)
x_train = np.expand_dims(x_train, -1)
x_test = np.expand_dims(x_test, -1)
print("x_train shape:", x_train.shape)
print(x_train.shape[0], "train samples")
print(x_test.shape[0], "test samples")


# convert class vectors to binary class matrices
y_train = keras.utils.to_categorical(y_train, num_classes)
y_test = keras.utils.to_categorical(y_test, num_classes)


Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/mnist.npz
x_train shape: (60000, 28, 28, 1)
60000 train samples
10000 test samples


In [10]:
model = keras.Sequential(
    [
        keras.Input(shape=input_shape),
        layers.Conv2D(32, kernel_size=(3, 3), activation="relu"),
        layers.MaxPooling2D(pool_size=(2, 2)),
        layers.Conv2D(64, kernel_size=(3, 3), activation="relu"),
        layers.MaxPooling2D(pool_size=(2, 2)),
        layers.Flatten(),
        layers.Dropout(0.5),
        layers.Dense(num_classes, activation="softmax"),
    ]
)

model.summary()


Model: "sequential_1"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 conv2d_2 (Conv2D)           (None, 26, 26, 32)        320       
                                                                 
 max_pooling2d_2 (MaxPooling  (None, 13, 13, 32)       0         
 2D)                                                             
                                                                 
 conv2d_3 (Conv2D)           (None, 11, 11, 64)        18496     
                                                                 
 max_pooling2d_3 (MaxPooling  (None, 5, 5, 64)         0         
 2D)                                                             
                                                                 
 flatten_1 (Flatten)         (None, 1600)              0         
                                                                 
 dropout_1 (Dropout)         (None, 1600)             

In [8]:
import time 

In [9]:
batch_size = 128
epochs = 15

model.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])
start_time = time.time()
model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, validation_split=0.1)
print("Time Taken is {}".format(time.time() - start_time))

Epoch 1/15


2022-05-02 12:48:17.771780: W tensorflow/core/platform/profile_utils/cpu_utils.cc:128] Failed to get CPU frequency: 0 Hz
2022-05-02 12:48:18.011626: I tensorflow/core/grappler/optimizers/custom_graph_optimizer_registry.cc:113] Plugin optimizer for device_type GPU is enabled.




2022-05-02 12:48:27.017258: I tensorflow/core/grappler/optimizers/custom_graph_optimizer_registry.cc:113] Plugin optimizer for device_type GPU is enabled.


Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15
Time Taken is 97.5620768070221


In [14]:
batch_size = 128
epochs = 15

model.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])
start_time = time.time()
with tf.device('/cpu:0'):
    model.fit(x_train, y_train, batch_size=batch_size, epochs=epochs, validation_split=0.1)
print("Time Taken is {}".format(time.time() - start_time))

Epoch 1/15
  7/422 [..............................] - ETA: 7s - loss: 0.0178 - accuracy: 0.9922

2022-05-02 14:00:00.292156: I tensorflow/core/grappler/optimizers/custom_graph_optimizer_registry.cc:113] Plugin optimizer for device_type GPU is enabled.




2022-05-02 14:00:07.751927: I tensorflow/core/grappler/optimizers/custom_graph_optimizer_registry.cc:113] Plugin optimizer for device_type GPU is enabled.


Epoch 2/15
Epoch 3/15
Epoch 4/15
Epoch 5/15
Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15
Time Taken is 119.56062173843384


## Base Layer class in Keras

Everything in Keras is either a Layer class or something that interacts with the layer class.

Layer encapsulates some state (weights) and some computation (Forward Pass).

Following is a Naive Dense Layer implementation

In [23]:
class SimpleDense(keras.layers.Layer):
    
    def __init__(self, units, activation = None):
        
        super().__init__() # Run the constructor for the inherited class
        self.units = units
        self.activation = activation
        
    # Build the weights, used in a seperate function to infer weights from previous layer
    def build(self, input_shape):
        
        input_dim = input_shape[-1]
        self.W = self.add_weight(shape=(input_dim, self.units), initializer = "random_normal")
        self.b = self.add_weight(shape = (self.units, ), initializer = "zeros")
    
    # Run the forward action in this case forward pass
    def call(self, inputs):
        
        out = tf.matmul(inputs, self.W) + self.b
        
        if self.activation is not None: 
            
            out = self.activation(out)
        
        return out
        

In [24]:
mydense = SimpleDense(32, activation=tf.nn.relu)
input_tensor = tf.ones(shape=(2,784))
output_tensor = mydense(input_tensor)

In [26]:
output_tensor.shape

TensorShape([2, 32])