# "Bayesian Parameter Estimation"
> "We follow Chapters 2 and 3 of Sivia and Skilling's book to illustrate a simple Bayesian Parameter Estimation workflow"

- toc: true
- branch: master
- badges: true
- comments: true
- author: John J. Molina
- categories: [Data Analysis, Parameter Estimation]

In [2]:
import numpy as np
import matplotlib as mpl
import matplotlib.pyplot as plt

#hide

$
\renewcommand{\vec}[1]{\mathbf{#1}}
\newcommand{\df}[1]{\textrm{d}{#1}}
\newcommand{\vdf}[1]{\df{\vec{#1}}}
$

$$\begin{align}
P(\vec{X}\lvert I) + P(\overline{\vec{X}}\lvert I) &= 1 &\textrm{(Sum Rule)}\label{e:sum_rule}\\
P(\vec{X},\vec{Y}\lvert I) &= P(\vec{X}\lvert \vec{Y}, I)\times P(\vec{Y}\lvert I) &\textrm{(Product Rule)}\notag\\
&=P(\vec{Y}\lvert\vec{X}, I)\times P(\vec{X}\lvert I) \label{e:product_rule}
\end{align}$$

$$\begin{align}
\overbrace{P(\vec{X} \lvert \vec{Y}, I)}^{\small{\mathrm{posterior}}} &= \frac{\overbrace{P(\vec{Y}\lvert \vec{X},I)}^{\small{\mathrm{likelihood}}} 
                                          \times\overbrace{P(\vec{X}\lvert I)}^{\small{\mathrm{prior}}}}{\underbrace{P(\vec{Y}\lvert I)}_{\small{\mathrm{evidence}}}}&\textrm{(Bayes' Theorem)}\label{e:bayes} \\
P(\vec{X}\lvert I) &= \int\vdf{Y} P(\vec{X}, \vec{Y}\lvert I) =\int\vdf{Y} P(\vec{X}\lvert\vec{Y}, I)\times P(\vec{Y}\lvert I) &\textrm{(Marginalization)}
\label{e:marginalization}
\end{align}$$

$$\begin{align}
P(\textrm{Hypothesis}\lvert \textrm{Data}, I) &= \frac{P(\textrm{Data}\lvert \textrm{Hypothesis}, I)\times P(\textrm{Hypothesis}\lvert I)}{P(\textrm{Data}\lvert I)}\label{e:bayes_hypothesis}
\end{align}$$

$$\begin{align}
P(\vec{\Theta}\lvert \vec{D}, I) &= \frac{P(\vec{D}\lvert\vec{\Theta}, I) \times P(\vec{\Theta}\lvert I)}{P(\vec{D}\lvert I)} \label{e:bayes_theta}\\
&\propto P(\vec{D}\lvert\vec{\Theta}, I)\times P(\vec{\Theta}\lvert I)
\end{align}$$

$\vec{D} = \{D_k\}_{k=1}^N$
$$\begin{align*}
P(\vec{\Theta}\lvert \vec{D},I) &\propto P(\{D_k\}_{k=1}^N\lvert \vec{\Theta}, I)\times P(\vec{\Theta}\lvert I) \\
&= P(\{D_k\}_{k=2}^N\lvert D_1, \vec{\Theta}, I) \times P(D_1\lvert \vec{\Theta}, I)\times P(\vec{\Theta}\lvert I) \\
&= P(\{D_k\}_{k=2}^N\lvert \vec{\Theta}, I)\times P(D_1\lvert \vec{\Theta}, I)\times P(\vec{\Theta}\lvert I) \\ 
&= P(\{D_k\}_{k=3}^N\lvert \vec{\Theta}, I)\times P(D_2\lvert \vec{\Theta}, I)\times P(D_1\lvert \vec{\Theta}, I) \times P(\vec{\Theta}\lvert I) \\
&\vdots \\
&= \big(\prod_{k=1}^N P(D_k\lvert \vec{\Theta}, I)\big) \times P(\vec{\Theta}\lvert I)
\end{align*}$$

$$\begin{align*}
P(\vec{\Theta}\lvert \vec{D},I)&\propto \big(\prod_{k=m+1}^{N} P(D_k\lvert \vec{\Theta}, I)\big) \big(\prod_{j=1}^{m} P(D_j\lvert\vec{\Theta}, I)\big) P(\vec{\Theta}\lvert I) \\
&\propto\big(\prod_{k=m+1}^{N} P(D_k\lvert \vec{\Theta}, I)\big) \times P(\vec{\Theta}\lvert \{D_j\}_{j=1}^m, I)
\end{align*}$$

$$\begin{align}
L &= \ln{P(\vec{\Theta}\lvert \vec{D}, I)} = \ln P \\
&= L\lvert_{\vec{\Theta}_0} + \vec{\nabla}L\lvert_{\vec{\Theta}_0}\cdot(\vec{\Theta} - \vec{\Theta}_0) 
+ \frac{1}{2} (\vec{\Theta}-\vec{\Theta}_0)^{t}\cdot\vec{\nabla}\vec{\nabla}L\lvert_{\vec{\Theta}_0}\cdot(\vec{\Theta}-\vec{\Theta}_0) + \mathcal{O}((\vec{\Theta}-\vec{\Theta}_0)^3) \\
&\simeq L\lvert_{\vec{\Theta}_0} + \frac{1}{2} (\vec{\Theta}-\vec{\Theta}_0)^{t}\cdot\vec{\nabla}\vec{\nabla}L\lvert_{\vec{\Theta}_0}\cdot(\vec{\Theta}-\vec{\Theta}_0)
\end{align}
$$

$$\begin{align}
P(\vec{\Theta}\lvert \vec{D},I)\propto \exp{\left[-\frac{1}{2} \left(\vec{\Theta}-\vec{\Theta}_0\right)^t \cdot 
\left(-\vec{\nabla}\vec{\nabla}L\lvert_{\vec{\Theta}_0}\right)\cdot\left(\vec{\Theta}-\vec{\Theta}_0\right)\right]}
\end{align}$$

$$\begin{align}
P_{\textrm{Gaussian}}(\vec{x}\lvert \vec{\mu}, \vec{\Sigma}) &=
\frac{1}{\sqrt{(2\pi)^n \det{\vec{\Sigma}}}} \exp{\left[-\frac{1}{2}\left(\vec{x}-\vec{\mu}\right)^t \cdot\vec{\Sigma}^{-1}\cdot\left(\vec{x}-\vec{\mu}\right)\right]} \\
\left\langle\vec{x} \right\rangle &= \vec{\mu} \\
\left\langle(x_i - \mu_i)(x_j - \mu_j)\right\rangle &= \Sigma_{ij}
\end{align}$$

$$\begin{align}
\vec{\mu}&\rightarrow \vec{\Theta}_0 \\
\vec{\Sigma}&\rightarrow (-\vec{\nabla}\vec{\nabla}L\lvert_{\vec{\Theta}_0})^{-1}
\end{align}$$