# Forward auto-diff through Dual Numbers

In [1]:
import numpy as np

Let us define a class `DualNumber` that represents a dual number

$$
a + b \epsilon 
$$

where $a$ is the "real" part and $b$ is the "dual" part.

In [2]:
class DualNumber:
  def __init__(self, real, dual):
    # dual number: 'real' + 'dual' * eps
    self.real = real
    self.dual = dual

  def __repr__(self):
    return repr(self.real) + ' + ' + repr(self.dual) + ' epsilon'

Define the dual numbers

$$
\begin{split}
x &= 1 + 2 \epsilon \\
y &= 1.5 + 3.1 \epsilon \\
\end{split}
$$

In [30]:
x = DualNumber(1, 2)
y = DualNumber(1.5, 3.1)
print(x)
print(y)
# x + y TypeError: unsupported operand type(s) for +: 'DualNumber' and 'DualNumber'

1 + 2 epsilon
1.5 + 3.1 epsilon


Implement the operator sum `__add__` for this class.

In [4]:
class DualNumber:
  def __init__(self, real, dual):
    # dual number: 'real' + 'dual' * eps
    self.real = real
    self.dual = dual

  def __repr__(self):
    return repr(self.real) + ' + ' + repr(self.dual) + ' epsilon'

  def __add__(self, other):
    # implement the operation "self + other"
    return DualNumber(self.real + other.real, self.dual + other.dual)

Define the dual numbers

$$
\begin{split}
x &= 1 + 2 \epsilon \\
y &= 1.5 + 3.1 \epsilon \\
\end{split}
$$

Then, compute $z = x + y$ and display the result.

In [5]:
x = DualNumber(1, 2)
y = DualNumber(1.5, 3.1)
z = x + y
print(z)

2.5 + 5.1 epsilon


Define now the dual number

$$
\begin{split}
x &= 1 + 2 \epsilon \\
\end{split}
$$

and try to compute $w = x + 1$. What is going on?

In [29]:
x = DualNumber(1, 2)
# w = x + 1

Try now to compute $w = 1 + x$ (in this specific order). What is going on this time?

In [31]:
# w = 1 + x 
#TypeError: unsupported operand type(s) for +: 'int' and 'DualNumber'

To overcome the above inconvenient, introduce a check (inside the definition of `__add__`) on the type of `other`. Moroever, define the operator `__radd__`, besides `__add__`.

In [39]:
class DualNumber:
  def __init__(self, real, dual):
    # dual number: 'real' + 'dual' * eps
    self.real = real
    self.dual = dual

  def __repr__(self):
    return repr(self.real) + ' + ' + repr(self.dual) + ' epsilon'

  def __add__(self, other):
    # implement the operation "self + other"
    if isinstance(other, DualNumber):
      return DualNumber(self.real + other.real, self.dual + other.dual)
    else:
      return DualNumber(self.real + other, self.dual)

  def __radd__(self, other):
    # implement the operation "other + self"
    return self.__add__(other)

Try again to compute $w = x + 1$

In [40]:
x = DualNumber(1, 2)
w = x + 1
print(w)

2 + 2 epsilon


Try again to compute $w = 1 + x$

In [41]:
w = 1 + x
print(w)

2 + 2 epsilon


Now that we have learnt how to treat the operator "+", let us define the full class `DualNumber`, implementing also the operators "-", "*", "/", "**".

In [11]:
class DualNumber:
  def __init__(self, real, dual):
    # dual number: 'real' + 'dual' * eps
    self.real = real
    self.dual = dual

  def __add__(self, other):
    # implement the operation "self + other"
    if isinstance(other, DualNumber):
      return DualNumber(self.real + other.real,
                        self.dual + other.dual)
    else:
      return DualNumber(self.real + other, self.dual)
  
  def __radd__(self, other):
    # implement the operation "other + self"
    return self.__add__(other)

  def __sub__(self, other):
    # implement the operation "self - other"
    if isinstance(other, DualNumber):
      return DualNumber(self.real - other.real,
                        self.dual - other.dual)
    else:
      return DualNumber(self.real - other, self.dual)

  def __rsub__(self, other):
    # implement the operation "other - self"
    return DualNumber(other, 0.0) - self

  def __mul__(self, other):
    # implement the operation "self * other"
    if isinstance(other, DualNumber):
      return DualNumber(self.real * other.real,
                        self.real * other.dual + self.dual * other.real)
    else:
      return DualNumber(self.real * other, self.dual * other)

  def __rmul__(self, other):
    # implement the operation "other * self"
    return self.__mul__(other)

  def __truediv__(self, other):
    # implement the operation "self / other"
    if isinstance(other, DualNumber):
      return DualNumber(self.real/other.real, (self.dual*other.real - self.real*other.dual)/(other.real**2))
    else:
      return (1/other) * self

  def __rtruediv__(self, other):
    # implement the operation "other / self"
    return DualNumber(other, 0.0).__truediv__(self)

  def __pow__(self, other):
    # implement the operation "self ** other"
    return DualNumber(self.real**other,
                      self.dual * other * self.real**(other - 1))

  def __repr__(self):
    return repr(self.real) + ' + ' + repr(self.dual) + ' epsilon'


Define the dual numbers

$$
\begin{split}
x &= 1 + 2 \epsilon \\
y &= 1.5 + 3.1 \epsilon \\
\end{split}
$$

Then, compute the result of the following operations:
- $x + y$
- $x - y$
- $x y$
- $x / y$
- $x + 1$
- $2 x$
- $x ^ 3$

In [12]:
x = DualNumber(1.0, 2.0)
y = DualNumber(1.5, 3.1)
z = x + y
print("x     = %s" % x)
print("y     = %s" % y)
print("x + y = %s" % (x + y))
print("x - y = %s" % (x - y))
print("x * y = %s" % (x * y))
print("x / y = %s" % (x / y))
print("x + 1 = %s" % (x + 1))
print("2 * x = %s" % (2 * x))
print("x ^ 3 = %s" % (x ** 3))

x     = 1.0 + 2.0 epsilon
y     = 1.5 + 3.1 epsilon
x + y = 2.5 + 5.1 epsilon
x - y = -0.5 + -1.1 epsilon
x * y = 1.5 + 6.1 epsilon
x / y = 0.6666666666666666 + -0.04444444444444448 epsilon
x + 1 = 2.0 + 2.0 epsilon
2 * x = 2.0 + 4.0 epsilon
x ^ 3 = 1.0 + 6.0 epsilon


Define now the functions `my_sin`, `my_cos` and `my_exp`, implementing the operations sinus, cosinus and exponential, respectively.

In [13]:
import numpy as np
def my_sin(x):
  if isinstance(x, DualNumber):
    return DualNumber(np.sin(x.real), np.cos(x.real) * x.dual)
  else:
    return np.sin(x)

def my_cos(x):
  if isinstance(x, DualNumber):
    return DualNumber(np.cos(x.real), -np.sin(x.real) * x.dual)
  else:
    return np.cos(x)

def my_exp(x):
  if isinstance(x, DualNumber):
    return DualNumber(np.exp(x.real), np.exp(x.real) * x.dual)
  else:
    return np.exp(x)

Define the dual number

$$
\begin{split}
x &= 1 + 2.3 \epsilon \\
\end{split}
$$

Then, compute the result of the following operations:
- $\sin(x)$
- $\exp(x)$

In [14]:
x = DualNumber(1, 2.3)
print(my_sin(x))
print(my_exp(x))

0.8414709848078965 + 1.2426953034967214 epsilon
2.718281828459045 + 6.252048205455803 epsilon


Define now a function `auto_diff` that, given a function $f \colon \mathbb{R} \to \mathbb{R}$ and a real number $x$, returns $f'(x)$, exploiting the class `DualNumber`. The function must have the following signature:
```python
def auto_diff(f, x):
  ...
```


In [15]:
def auto_diff(f,x):
  return f(DualNumber(x, 1.0)).dual  

Consider the function 

$$
f(x) = x \sin(x^2)
$$

and use the function implemented above to compute $f'(x_0)$ for $x_0 = 0.13$. Compare the result with the analytical solution and compute the relative error.



In [21]:
func = lambda x : x*my_sin(x**2)
x0 = 0.13
df_AD = auto_diff(func, x0)
print('f\'(x0) (AD): %f' % df_AD)

dfunc = lambda x : np.sin(x**2)+2 * x**2 * np.cos(x**2)
df_ex = dfunc(x0)
print('f\'(x0) (ex): %f' % df_ex)
print('err (AD): %e' % (abs(df_AD - df_ex)/abs(df_ex)))

f'(x0) (AD): 0.050694
f'(x0) (ex): 0.050694
err (AD): 1.368770e-16


Repeat the previous point, this time by computing the numerical derivative (i.e. through finite differences).

In [22]:
import scipy.misc
df_FD = scipy.misc.derivative(func, x0, dx=1e-6)
print('f\'(x0) (FD): %f' % df_FD)
print('err (FD): %e' % (abs(df_FD - df_ex)/abs(df_ex)))

f'(x0) (FD): 0.050694
err (FD): 2.195234e-11


  df_FD = scipy.misc.derivative(func, x0, dx=1e-6)


Repeat the previous point, this time by computing the symbolic derivative (module `sympy` = **sym**bolic **py**thon)

In [42]:
import sympy
x = sympy.symbols('x')
func_sym = x*sympy.sin(x**2)
x0 = 0.13

dfunc_sym = sympy.diff(func_sym, x)
print(dfunc_sym)
df_sy = dfunc_sym.subs(x, x0)

print('f\'(x0) (sy): %f' % df_sy)
print('err (sy): %e' % (abs(df_sy - df_ex)/abs(df_ex)))

2*x**2*cos(x**2) + sin(x**2)
f'(x0) (sy): 0.050694
err (sy): 1.000000e+00


Evaluate and compare the execution time of the different approaches.
To compute the execution time of a line of code, prepend IPython [magic command](https://ipython.readthedocs.io/en/stable/interactive/magics.html) `%timeit` to the line.

Example:
```python
%timeit np.random.rand(1000)
```

In [24]:
%timeit sympy.diff(func_sym, x).subs(x, x0)

75.2 µs ± 1.76 µs per loop (mean ± std. dev. of 7 runs, 10,000 loops each)


In [25]:
%timeit scipy.misc.derivative(func, x0, dx=1e-6)



10.7 µs ± 627 ns per loop (mean ± std. dev. of 7 runs, 100,000 loops each)


In [26]:
%timeit auto_diff(func, x0)

2.82 µs ± 66 ns per loop (mean ± std. dev. of 7 runs, 100,000 loops each)


In [27]:
%timeit dfunc(x0)

1.39 µs ± 106 ns per loop (mean ± std. dev. of 7 runs, 1,000,000 loops each)


Consider now the function 
$$
f(x) = \frac{1}{x^5}
$$
compute the derivative in the point $x_0 = 10^{-2}$ with AD and FD and compare the results with the exact solution.

In [28]:
func = lambda x : 1 / x**5
dfunc = lambda x : -5 / x**6
x0 = 0.01

df_ex = dfunc(x0)
df_FD = scipy.misc.derivative(func, x0, dx=1e-6)
df_AD = auto_diff(func, x0)
print('f\'(x0) (ex): %f' % df_ex)
print('f\'(x0) (FD): %f' % df_FD)
print('f\'(x0) (AD): %f' % df_AD)

f'(x0) (ex): -4999999999999.999023
f'(x0) (FD): -5000000349996.567383
f'(x0) (AD): -4999999999999.998047


  df_FD = scipy.misc.derivative(func, x0, dx=1e-6)
