In [1]:
from datetime import datetime
import math
import time
import tensorflow as tf

# Helper that prints a layer's op name and output shape

In [2]:
def print_activations(t):
    """Print a tensor's op name followed by its static shape as a list."""
    layer_name = t.op.name
    dims = t.get_shape().as_list()
    # Three-space separator reproduces the "name   [shape]" layout.
    print(layer_name, dims, sep='   ')

# Build the AlexNet network

In [3]:
def _conv_relu(inputs, name, kernel_shape, strides, parameters):
    """Add a conv2d + bias + ReLU layer inside name scope `name`.

    Args:
        inputs: tensor passed to tf.nn.conv2d.
        name: name scope for the layer; the ReLU op is named after the scope.
        kernel_shape: filter shape handed to tf.truncated_normal; its last
            entry is used as the number of biases.
        strides: strides list passed to tf.nn.conv2d.
        parameters: list that receives the new kernel and bias variables.

    Returns:
        The ReLU output tensor.
    """
    with tf.name_scope(name) as scope:
        kernel = tf.Variable(tf.truncated_normal(kernel_shape,
                             dtype=tf.float32, stddev=1e-1), name='weights')
        conv = tf.nn.conv2d(inputs, kernel, strides, padding='SAME')
        biases = tf.Variable(tf.constant(0.0, shape=[kernel_shape[-1]],
                             dtype=tf.float32), trainable=True, name='biases')
        activation = tf.nn.relu(tf.nn.bias_add(conv, biases), name=scope)
        parameters.extend([kernel, biases])
    print_activations(activation)
    return activation


def _max_pool(inputs, name):
    """Add a 3x3, stride-2, VALID max-pooling op called `name` and print its shape."""
    pooled = tf.nn.max_pool(inputs, ksize=[1, 3, 3, 1], strides=[1, 2, 2, 1],
                            padding='VALID', name=name)
    print_activations(pooled)
    return pooled


def _fc_relu(inputs, name, in_dim, out_dim, parameters):
    """Add a fully connected + ReLU layer inside name scope `name`.

    Args:
        inputs: tensor that is reshaped to [-1, in_dim] before the matmul.
        name: name scope for the layer.
        in_dim: number of input features per example.
        out_dim: number of output units.
        parameters: list that receives the new kernel and bias variables.

    Returns:
        The ReLU output tensor.
    """
    with tf.name_scope(name):
        kernel = tf.Variable(tf.truncated_normal([in_dim, out_dim],
                             dtype=tf.float32, stddev=1e-1), name='weights')
        biases = tf.Variable(tf.constant(0.0, shape=[out_dim], dtype=tf.float32),
                             trainable=True, name='biases')
        flat = tf.reshape(inputs, [-1, in_dim])
        activation = tf.nn.relu(tf.matmul(flat, kernel) + biases)
        parameters.extend([kernel, biases])
    print_activations(activation)
    return activation


def inference(images, keep_prob=1.0):
    """Build the AlexNet-style graph and print each layer's output shape.

    Args:
        images: input tensor fed to the first convolution (3 input channels).
        keep_prob: keep probability passed to the three tf.nn.dropout calls.
            Defaults to 1.0, the value previously hard-coded.

    Returns:
        A tuple (output, parameters): the tensor after the last dropout and
        the list of every kernel and bias variable in creation order.
    """
    parameters = []

    # conv1 -> lrn (Local Response Normalization) -> max_pool
    conv1 = _conv_relu(images, 'conv1', [11, 11, 3, 64], [1, 4, 4, 1], parameters)
    lrn1 = tf.nn.lrn(conv1, 4, bias=1.0, alpha=0.001/9, beta=0.75, name='lrn1')
    pool1 = _max_pool(lrn1, 'pool1')

    # conv2 -> lrn -> max_pool
    conv2 = _conv_relu(pool1, 'conv2', [5, 5, 64, 192], [1, 1, 1, 1], parameters)
    lrn2 = tf.nn.lrn(conv2, 4, bias=1.0, alpha=0.001/9, beta=0.75, name='lrn2')
    pool2 = _max_pool(lrn2, 'pool2')

    # conv3 -> conv4 -> conv5 -> max_pool
    conv3 = _conv_relu(pool2, 'conv3', [3, 3, 192, 384], [1, 1, 1, 1], parameters)
    conv4 = _conv_relu(conv3, 'conv4', [3, 3, 384, 256], [1, 1, 1, 1], parameters)
    conv5 = _conv_relu(conv4, 'conv5', [3, 3, 256, 256], [1, 1, 1, 1], parameters)
    pool5 = _max_pool(conv5, 'pool5')

    # Fully connected layers 6-8, each followed by dropout.
    # 6*6*256 is pool5's flattened size for the 224x224 images the benchmark feeds in.
    fc6 = _fc_relu(pool5, 'fc6', 6*6*256, 4096, parameters)
    fc6_drop = tf.nn.dropout(fc6, keep_prob)

    fc7 = _fc_relu(fc6_drop, 'fc7', 4096, 4096, parameters)
    fc7_drop = tf.nn.dropout(fc7, keep_prob)

    # NOTE(review): the output layer keeps the ReLU and dropout it always had;
    # confirm that is intended before reusing this graph outside the benchmark.
    fc8 = _fc_relu(fc7_drop, 'fc8', 4096, 1000, parameters)
    fc8_drop = tf.nn.dropout(fc8, keep_prob)

    return fc8_drop, parameters

# Function that measures the time per step

In [4]:
def time_tensorflow_run(session, target, info_string):
    """Time repeated `session.run(target)` calls and print summary statistics.

    Runs `num_batches` timed steps (read from the module-level global of that
    name) after 10 untimed burn-in steps, printing every tenth timed step and
    finally the mean and standard deviation of the step duration.

    Args:
        session: object whose `run(target)` method executes one step.
        target: value passed unchanged to `session.run`.
        info_string: label included in the summary line.
    """
    num_steps_burn_in = 10
    total_duration = 0.0
    total_duration_squared = 0.0

    for i in range(num_batches + num_steps_burn_in):
        start_time = time.time()
        _ = session.run(target)
        duration = time.time() - start_time
        # Burn-in steps are executed but excluded from the statistics.
        if i >= num_steps_burn_in:
            if not i % 10:
                print('%s: step %d, duration = %.3f' %
                      (datetime.now(), i - num_steps_burn_in, duration))
            total_duration += duration
            total_duration_squared += duration * duration

    # calculate average time and standard deviation
    mn = total_duration / num_batches
    vr = total_duration_squared / num_batches - mn * mn
    # Rounding can push E[x^2] - E[x]^2 slightly below zero when the durations
    # are (almost) identical; clamp so math.sqrt does not raise ValueError.
    sd = math.sqrt(max(vr, 0.0))
    print('%s: %s across %d steps, %.3f +/- %.3f sec/batch' %
          (datetime.now(), info_string, num_batches, mn, sd))

# Benchmark driver function

In [5]:
def run_benchmark():
    """Build the network on random images and time forward and forward-backward passes.

    Reads the module-level global `batch_size` for the batch dimension of the
    synthetic input; the timing helper reads `num_batches`.
    """
    with tf.Graph().as_default():
        image_size = 224
        images = tf.Variable(tf.random_normal(
            [batch_size, image_size, image_size, 3], dtype=tf.float32, stddev=1e-1))

        # `inference` returns the tensor after the last dropout, not pool5.
        output, parameters = inference(images)

        # init
        init = tf.global_variables_initializer()

        # Use the session as a context manager so it is closed even if a
        # timing run raises.
        with tf.Session() as sess:
            sess.run(init)

            # time evaluation of forward and backward
            time_tensorflow_run(sess, output, "Forward")

            objective = tf.nn.l2_loss(output)
            grad = tf.gradients(objective, parameters)
            time_tensorflow_run(sess, grad, "Forward-backward")

# Run the benchmark

In [6]:
# Benchmark settings: both names are read as module-level globals by the
# functions defined in the earlier cells, so they must be set before the call.
num_batches = 100  # timed steps per pass (10 burn-in steps run in addition)
batch_size = 32    # leading dimension of the synthetic image tensor
run_benchmark()

conv1   [32, 56, 56, 64]
pool1   [32, 27, 27, 64]
conv2   [32, 27, 27, 192]
pool2   [32, 13, 13, 192]
conv3   [32, 13, 13, 384]
conv4   [32, 13, 13, 256]
conv5   [32, 13, 13, 256]
pool5   [32, 6, 6, 256]
fc6/Relu   [32, 4096]
fc7/Relu   [32, 4096]
fc8/Relu   [32, 1000]
2017-06-20 19:17:53.282997: step 0, duration = 1.610
2017-06-20 19:18:10.625997: step 10, duration = 1.693
2017-06-20 19:18:27.878084: step 20, duration = 1.706
2017-06-20 19:18:45.118179: step 30, duration = 1.822
2017-06-20 19:19:01.943945: step 40, duration = 1.725
2017-06-20 19:19:18.957362: step 50, duration = 1.753
2017-06-20 19:19:36.648059: step 60, duration = 1.809
2017-06-20 19:19:53.091543: step 70, duration = 1.555
2017-06-20 19:20:09.661809: step 80, duration = 1.615
2017-06-20 19:20:28.804743: step 90, duration = 2.181
2017-06-20 19:20:52.018289: Forward across 100 steps, 1.803 +/- 0.302 sec/batch
2017-06-20 19:22:18.549148: step 0, duration = 7.622
2017-06-20 19:23:35.050716: step 10, duration = 8.511
2017