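## Math-based differentiation

Here `f` is the closed-form expression `x**n`; its automatic-differentiation gradient is compared against the analytic derivative `n * x**(n-1)`.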

In [86]:
def f(x, n):
    """Return x raised to the power n using the ``**`` operator."""
    return x ** n


def df_th(x, n):
    """Analytic derivative of f with respect to x, computed as n * f(x, n-1)."""
    return n * f(x, n - 1)

def df_ad(x, n):
    """Differentiate f(x, n) with respect to x using TensorFlow autodiff.

    x is wrapped in a tf.Variable, f is evaluated on it inside a
    tf.GradientTape context, and the tape's gradient of that result with
    respect to the variable is returned.
    """
    point = tf.Variable(x)
    with tf.GradientTape() as recorder:
        value = f(point, n)
    # The gradient is requested after the recording context has closed.
    grad = recorder.gradient(value, point)
    return grad

# Evaluate at x = 2 with exponent 10: the value, the analytic derivative,
# and the autodiff derivative, printed in that order.
x = 2.0
print(
    "f(x,10) = 2^10 = ",
    f(x, 10),
)
print(
    "Theory: df(x,10)/dx = 10 x 2^9 = ",
    df_th(x, 10),
)
print(
    "AD: df(x,10) = ",
    df_ad(x, 10),
)

f(x,10) = 2^10 =  1024.0
Theory: df(x,10)/dx = 10 x 2^9 =  5120.0
AD: df(x,10) =  tf.Tensor(5120.0, shape=(), dtype=float32)


In [87]:
# Draw 1000 sample points from a standard normal distribution
# (no seed is set here, so the points differ from run to run).
x_all = np.random.randn(1000)
# Time one df_ad call per sample point with exponent 10; every call creates
# its own tf.Variable and tf.GradientTape. The results are kept in y_all.
%time y_all = list(map(lambda x: df_ad(x,10), x_all))

CPU times: user 511 ms, sys: 2.65 ms, total: 514 ms
Wall time: 514 ms


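## Code-based differentiation

Here `f` is a Python loop that multiplies by `x` a total of `n` times; the gradient is taken through the executed loop rather than through a single power expression.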

In [88]:
def f(x, n):
    """Return the product of n copies of x, accumulated in a Python loop.

    The accumulator starts at the integer 1, so when range(n) is empty
    (n <= 0) that 1 is returned unchanged.
    """
    product = 1
    for _ in range(n):
        product *= x
    return product


def df_th(x, n):
    """Analytic derivative of f with respect to x, computed as n * f(x, n-1)."""
    return n * f(x, n - 1)

def df_ad(x, n):
    """Differentiate f(x, n) with respect to x using TensorFlow autodiff.

    x is wrapped in a tf.Variable, f is evaluated on it inside a
    tf.GradientTape context, and the tape's gradient of that result with
    respect to the variable is returned. f is looked up when df_ad is
    called, so this uses the loop-based f defined in this cell.
    """
    point = tf.Variable(x)
    with tf.GradientTape() as recorder:
        value = f(point, n)
    # The gradient is requested after the recording context has closed.
    grad = recorder.gradient(value, point)
    return grad

# Evaluate at x = 2 with exponent 10: the value, the analytic derivative,
# and the autodiff derivative, printed in that order.
x = 2.0
print(
    "f(x,10) = 2^10 = ",
    f(x, 10),
)
print(
    "Theory: df(x,10)/dx = 10 x 2^9 = ",
    df_th(x, 10),
)
print(
    "AD: df(x,10) = ",
    df_ad(x, 10),
)

f(x,10) = 2^10 =  1024.0
Theory: df(x,10)/dx = 10 x 2^9 =  5120.0
AD: df(x,10) =  tf.Tensor(5120.0, shape=(), dtype=float32)


In [89]:
# Draw 1000 sample points from a standard normal distribution
# (no seed is set here, so the points differ from run to run).
x_all = np.random.randn(1000)
# Time one df_ad call per sample point with exponent 10; every call creates
# its own tf.Variable and tf.GradientTape. The results are kept in y_all.
%time y_all = list(map(lambda x: df_ad(x,10), x_all))
# Show how many gradients were collected (one per entry of x_all).
len(y_all)

CPU times: user 2.24 s, sys: 5.18 ms, total: 2.25 s
Wall time: 2.25 s


1000