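## Math-based differentiation

Here $f(x, n) = x^n$ is written as a single closed-form expression, and its analytic derivative $n\,x^{n-1}$ is compared with the gradient obtained from TensorFlow automatic differentiation.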

In [1]:
import tensorflow as tf
import numpy as np
tf.__version__

'2.4.1'

In [63]:
# NOTE: the @tf.function decorator is left disabled, so this runs as plain Python.
def f_fn(x, n):
    """Return ``x`` raised to the power ``n``."""
    return pow(x, n)

def f(x, n):
    """Return ``x**n``, the closed-form function being differentiated."""
    return x**n


def df_th(x, n):
    """Return the analytic derivative of ``f`` with respect to ``x``.

    Uses the power rule, ``d(x**n)/dx = n * x**(n - 1)``, and delegates the
    power to ``f``. ``f`` is looked up when ``df_th`` is called, so whichever
    definition of ``f`` is current at that moment is the one used.
    """
    return n * f(x, n - 1)

def df_ad(x, n):
    """Differentiate ``f(x, n)`` with respect to ``x`` by automatic differentiation.

    ``x`` is wrapped in a fresh ``tf.Variable``, ``f`` is evaluated while a
    ``tf.GradientTape`` is recording, and the tape's gradient of that result
    with respect to the variable is returned.
    """
    point = tf.Variable(x)
    with tf.GradientTape() as recorder:
        value = f(point, n)
    grad = recorder.gradient(value, point)
    return grad

# Evaluate the function, its analytic derivative and its autodiff derivative
# at x = 2, n = 10, printing each next to its label.
x = 2.0
for label, fn in (
    ("f(x,10) = 2^10 = ", f),
    ("Theory: df(x,10)/dx = 10 x 2^9 = ", df_th),
    ("AD: df(x,10) = ", df_ad),
):
    print(label, fn(x, 10))

f(x,10) = 2^10 =  1024.0
Theory: df(x,10)/dx = 10 x 2^9 =  5120.0
AD: df(x,10) =  tf.Tensor(5120.0, shape=(), dtype=float32)


In [64]:
# Draw 1000 standard-normal sample points (unseeded, so the values differ between runs).
x_all = np.random.randn(1000)
# Time the forward evaluation through f_fn, one element at a time.
%time y_all = list(map(lambda x: f_fn(x,10), x_all))
# Same timing through f (whichever definition of f is current in the kernel).
%time y_all = list(map(lambda x: f(x,10), x_all))
# Time the per-element autodiff gradient; each call to df_ad builds its own
# tf.Variable and GradientTape. y_all is overwritten each time and ends up
# holding the gradients from this last line.
%time y_all = list(map(lambda x: df_ad(x,10), x_all))

CPU times: user 981 µs, sys: 0 ns, total: 981 µs
Wall time: 986 µs
CPU times: user 401 µs, sys: 0 ns, total: 401 µs
Wall time: 406 µs
CPU times: user 540 ms, sys: 8.76 ms, total: 548 ms
Wall time: 544 ms


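## Code-based differentiation

Here $f(x, n) = x^n$ is computed by a loop of repeated multiplications inside a `@tf.function`, and the same comparison between the analytic derivative and automatic differentiation is repeated.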

In [65]:
@tf.function
def f(x, n):
    """Compute ``x**n`` by multiplying an accumulator by ``x`` ``n`` times.

    The accumulator starts at the integer ``1``, so when ``range(n)`` is empty
    (``n <= 0``) that initial value is what is returned.
    """
    product = 1
    for _step in range(n):
        product = product * x
    return product
def df_th(x, n):
    """Return the analytic derivative of ``f`` with respect to ``x``.

    Uses the power rule, ``d(x**n)/dx = n * x**(n - 1)``, and delegates the
    power to ``f``, which is looked up when ``df_th`` is called.
    """
    return n * f(x, n - 1)

def df_ad(x, n):
    """Differentiate ``f(x, n)`` with respect to ``x`` by automatic differentiation.

    ``x`` is wrapped in a fresh ``tf.Variable``, ``f`` is evaluated while a
    ``tf.GradientTape`` is recording, and the tape's gradient of that result
    with respect to the variable is returned.
    """
    point = tf.Variable(x)
    with tf.GradientTape() as recorder:
        value = f(point, n)
    grad = recorder.gradient(value, point)
    return grad

# Evaluate the function, its analytic derivative and its autodiff derivative
# at x = 2, n = 10, printing each next to its label.
x = 2.0
for label, fn in (
    ("f(x,10) = 2^10 = ", f),
    ("Theory: df(x,10)/dx = 10 x 2^9 = ", df_th),
    ("AD: df(x,10) = ", df_ad),
):
    print(label, fn(x, 10))

f(x,10) = 2^10 =  tf.Tensor(1024.0, shape=(), dtype=float32)
Theory: df(x,10)/dx = 10 x 2^9 =  tf.Tensor(5120.0, shape=(), dtype=float32)
AD: df(x,10) =  tf.Tensor(5120.0, shape=(), dtype=float32)


In [66]:
# Draw just two standard-normal sample points (unseeded, so the values differ between runs).
x_all = np.random.randn(2)
# Time the per-element autodiff gradient; assuming the preceding cell has been
# run, df_ad here differentiates through the @tf.function loop version of f.
%time y_all = list(map(lambda x: df_ad(x,10), x_all))
# Display how many gradients were produced.
len(y_all)









CPU times: user 292 ms, sys: 124 µs, total: 292 ms
Wall time: 286 ms


2