# "Bayesian Parameter Estimation"
> "We follow Chapters 2 and 3 of Sivia and Skilling's book to illustrate a simple Bayesian Parameter Estimation workflow"

- toc: true
- branch: master
- badges: true
- comments: true
- author: John J. Molina
- categories: [Data Analysis, Parameter Estimation]

In [1]:
import numpy as np
import matplotlib as mpl
import matplotlib.pyplot as plt

$$\begin{align*}
P(X\lvert I) + P(\overline{X}\lvert I) &= 1 &\textrm{(Sum Rule)}\label{e:sum_rule}\\
P(X,Y\lvert I) &= P(X\lvert Y, I)\times P(Y\lvert I) &\textrm{(Product Rule)}\notag\\
&=P(Y\lvert X, I)\times P(X\lvert I) \label{e:product_rule} \\
\end{align*}$$

$$\begin{align*}
\overbrace{P(X \lvert Y, I)}^{\small{\mathrm{posterior}}} &= \frac{\overbrace{P(Y\lvert X,I)}^{\small{\mathrm{likelihood}}} 
                                          \times\overbrace{P(X\lvert I)}^{\small{\mathrm{prior}}}}{\underbrace{P(Y\lvert I)}_{\small{\mathrm{evidence}}}}&\textrm{(Bayes' Theorem)}\label{e:bayes} \\
P(X\lvert I) &= \int\textrm{d}Y P(X, Y\lvert I) =\int\textrm{d}Y P(X\lvert Y, I)\times P(Y\lvert I) &\textrm{(Marginalization)}
\label{e:marginalization}
\end{align*}$$

$$\begin{align*}
P(\textrm{Hypothesis}\lvert \textrm{Data}, I) &= \frac{P(\textrm{Data}\lvert \textrm{Hypothesis}, I)\times P(\textrm{Hypothesis}\lvert I)}{P(\textrm{Data}\lvert I)}\label{e:bayes_hypothesis}
\end{align*}$$

$$\begin{align*}
P(\Theta\lvert D, I) &= \frac{P(D\lvert\Theta, I) \times P(\Theta\lvert I)}{P(D\lvert I)} \label{e:bayes_theta}\\
&\propto P(D\lvert\Theta, I)\times P(\Theta\lvert I)
\end{align*}$$

$D = \{D_k\}_{k=1}^N$

$$\begin{align*}
P(\Theta\lvert D,I) &\propto P(\{D_k\}_{k=1}^N\lvert \Theta, I)\times P(\Theta\lvert I) \\
&= P(\{D_k\}_{k=2}^N\lvert D_1, \Theta, I) \times P(D_1\lvert \Theta, I)\times P(\Theta\lvert I) \\
&= P(\{D_k\}_{k=2}^N\lvert \Theta, I)\times P(D_1\lvert \Theta, I)\times P(\Theta\lvert I) \\ 
&= P(\{D_k\}_{k=3}^N\lvert \Theta, I)\times P(D_2\lvert \Theta, I)\times P(D_1\lvert \Theta, I) \times P(\Theta\lvert I) \\
&\vdots \\
&= \left(\prod_{k=1}^N P(D_k\lvert \Theta, I)\right) \times P(\Theta\lvert I)
\end{align*}$$


$$\begin{align*}
P(\Theta\lvert D,I)&\propto \big(\prod_{k=m+1}^{N} P(D_k\lvert \Theta, I)\big) \big(\prod_{j=1}^{m} P(D_j\lvert\Theta, I)\big) P(\Theta\lvert I) \\
&\propto\big(\prod_{k=m+1}^{N} P(D_k\lvert \Theta, I)\big) \times P(\Theta\lvert \{D_j\}_{j=1}^m, I)
\end{align*}$$

$$\begin{align*}
L &= \ln{P(\Theta\lvert D, I)} = \ln P \\
&= L\lvert_{\Theta_0} + \nabla L\lvert_{\Theta_0}\cdot(\Theta - \Theta_0) 
+ \frac{1}{2} (\Theta-\Theta_0)^{t}\cdot\nabla\nabla L\lvert_{\Theta_0}\cdot(\Theta-\Theta_0) + \mathcal{O}\big((\Theta-\Theta_0)^3\big) \\
&\simeq L\lvert_{\Theta_0} + \frac{1}{2} (\Theta-\Theta_0)^{t}\cdot\nabla\nabla L\lvert_{\Theta_0}\cdot(\Theta-\Theta_0) &\left(\nabla L\lvert_{\Theta_0} = 0\right)
\end{align*}$$

$$\begin{align*}
P(\Theta\lvert D,I)\propto \exp{\left[-\frac{1}{2} \left(\Theta-\Theta_0\right)^t \cdot 
\left(-\nabla\nabla L\lvert_{\Theta_0}\right)\cdot\left(\Theta-\Theta_0\right)\right]}
\end{align*}$$

$$\begin{align*}
P_{\textrm{Gaussian}}(X \lvert \mu, \Sigma) &=
\frac{1}{\sqrt{(2\pi)^n \det{\Sigma}}} \exp{\left[-\frac{1}{2}\left(X-\mu\right)^t \cdot \Sigma^{-1}\cdot\left(X-\mu\right)\right]} \\
\left\langle X \right\rangle &= \mu \\
\left\langle(X^i - \mu^i)(X^j - \mu^j)\right\rangle &= \Sigma^{ij}
\end{align*}$$

$$\begin{align*}
\mu&\rightarrow \Theta_0 \\
\Sigma&\rightarrow (-\nabla\nabla L\lvert_{\Theta_0})^{-1}
\end{align*}$$