In [1]:
# import packages 
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
%matplotlib inline

# Markov Reward Process
## TSMC

**only one recurrent state**

$$
P = 
\begin{array}{c c} 
& \begin{array}{c c c} G & A & B \\ \end{array} \\
\begin{array}{c c c}G \\ A \\ B \end{array} &
\left
[
\begin{array}{c c c}
.3 & .6 & .1 \\
.2 & .5 & .3 \\
.3 & .5 & .2
\end{array}
\right
]
\end{array}
$$


In [2]:
# the TSMC profit matrix
P = np.array(
    [[.3, .6, .1],
    [.2, .5, .2],
    [.3, .5, .2]])
Pt = np.matrix(P).reshape(3,3)
Pt

matrix([[0.3, 0.6, 0.1],
        [0.2, 0.5, 0.2],
        [0.3, 0.5, 0.2]])

In [11]:
#r = np.array([10,3,1]).matrix().reshape(3,1)
R = np.matrix([10,3,1]).reshape(3,1)
r = .9
I3 = np.identity(3)
I3 - r*Pt

matrix([[ 0.73, -0.54, -0.09],
        [-0.18,  0.55, -0.18],
        [-0.27, -0.45,  0.82]])

In [12]:

np.linalg.inv(I3 - r*Pt)*R

matrix([[36.91087619],
        [26.70787543],
        [28.02985428]])

# MC processes & Transient to Recurrent Probability
 - **it is transient(1) and recurrent(2) MC**
 - *at least one absorbing state*
  


$$
P = 
\begin{array}{c c } 
 & \begin{array}{c c c c} S1 & S2 & D1 & F \\ \end{array} \\
\begin{array}{c c c c}S1 \\ S2 \\ D1 \\ F \end{array} &
\left
[
\begin{array}{c c c}
.5 & .5 & 0 & 0 \\
.4 & .6 & 0 & 0 \\
.1 & .5 & .6 & .15 \\
0 & 0 & 0 & 1
\end{array}
\right
]
\end{array}
\\
$$

- The revenue is 
$$
R(s) = 
\begin{array}{c c}
X_t & R(X_t)\\
S1 & 20 \\
S2 & 10 \\
D1 & -15 \\
F  & 0
\end{array}
$$
---

In [15]:

P = np.array(
    [[.5, .5, 0, 0],
    [.4, .6, 0, 0],
    [.1, .15, .6, .15],
    [0, 0, 0, 1]])
Pt = np.matrix(P).reshape(4,4)
Pt

matrix([[0.5 , 0.5 , 0.  , 0.  ],
        [0.4 , 0.6 , 0.  , 0.  ],
        [0.1 , 0.15, 0.6 , 0.15],
        [0.  , 0.  , 0.  , 1.  ]])

## The similar example for recurrent and transient state MC
![image.png](attachment:85f8b170-f427-4fbf-ad2a-5276b6758c11.png)
![image.png](attachment:cd482b3e-2cdc-4881-b205-ca950c43ee9f.png)