# USE HMM network to inference 

1. Since max step =2, each room can generate a HMM with neibours room in previous time state and relevant sensors at current and all previous  time stamp.
2. we use a binary situation for outcome space {0,1} 
3. Based on the network, we will learn P(X_1={0/1} | X ={0/1}}, note the state will determine the action directly
4. Then we can inference B(X_t) by passage of time and observations Topic 8 from page 28


In [1]:
from __future__ import division
from __future__ import print_function

# Allowed libraries 
import numpy as np
import pandas as pd
import scipy as sp
import scipy.special
import heapq as pq
import matplotlib as mp
import matplotlib.pyplot as plt
import math
from itertools import product, combinations
from collections import OrderedDict as odict
import collections
from graphviz import Digraph, Graph
from tabulate import tabulate
import copy
import sys
import os
import datetime
import sklearn
import ast
import re

In [2]:
data = pd.read_csv("data.csv")

In [3]:
data.columns

Index(['Unnamed: 0', 'reliable_sensor1', 'reliable_sensor2',
       'reliable_sensor3', 'reliable_sensor4', 'unreliable_sensor1',
       'unreliable_sensor2', 'unreliable_sensor3', 'unreliable_sensor4',
       'robot1', 'robot2', 'door_sensor1', 'door_sensor2', 'door_sensor3',
       'door_sensor4', 'time', 'electricity_price', 'r1', 'r2', 'r3', 'r4',
       'r5', 'r6', 'r7', 'r8', 'r9', 'r10', 'r11', 'r12', 'r13', 'r14', 'r15',
       'r16', 'r17', 'r18', 'r19', 'r20', 'r21', 'r22', 'r23', 'r24', 'r25',
       'r26', 'r27', 'r28', 'r29', 'r30', 'r31', 'r32', 'r33', 'r34', 'r35',
       'c1', 'c2', 'c3', 'c4', 'o1', 'outside'],
      dtype='object')

In [4]:
data_copy = copy.deepcopy(data)

In [5]:
MAP = {
    "r1":["r2","r3"],
    "r2":["r1","r4"],
    "r3":["r1","r7"],
    "r4":["r2","r8"],
    "r5":["r6","r9","c3"],
    "r6":["r5","c3"],
    "r7":["r3","c1"],
    "r8":["r4","r9"],
    "r9":["r5","r8","r13"],
    "r10":["c3"],
    "r11":["c3"],
    "r12":["outside","r22"],
    "r13":["r9","r24"],
    "r14":["r24"],
    "r15":["c3"],
    "r16":["c3"],
    "r17":["c3"],
    "r18":["c3"],
    "r19":["c3"],
    "r20":["c3"],
    "r21":["c3"],
    "r22":["r12","r25"],
    "r23":["r24"],
    "r24":["r13","r14","r23"],
    "r25":["r22","r26","c1"],
    "r26":["r25","r27"],
    "r27":["r26","r32"],
    "r28":["c4"],
    "r29":["c4","r30"],
    "r30":["r29"],
    "r31":["r32"],
    "r32":["r27","r31","r33"],
    "r33":["r32"],
    "r34":["c2"],
    "r35":["c4"],
    "c1":["r7","r25","c2"],
    "c2":["c1","r34","c4"],
    "c3": ["r5","r6","r10","r11","r15","r16","r17","r18","r19","r20","r21","o1"],
    "c4":["r29","c2","r35","r28","o1"],
    "o1":["c3","c4"],
    "outside":["r12"]  
}
censor_dict =  {
    "r1": "us3", #us for unreliable_sensor
    "r5": "rs2" ,#rs for reliable_sensor
    "r8": "ds1", #ds for door sensor
    "r9": "ds1",
    "r16": "rs1",
    "r24" : "us4",
    "r25" : "rs3",
    "r26" : "ds3", 
    "r27" : "ds3",
    "r31" : "rs4",
    "r35" : "ds4",
    "c1" : "ds2",
    "c2" : "ds2",
    "c3" : "us2",
    "c4" : "ds4",
    "o1" : "us1"
}

In [6]:
def n_step_neighbour(node,n,G):
    neighbour_list = []
    neighbour_list = neighbour_list + G[node]
    while n > 1:
        for new_node in neighbour_list:
            neighbour_list = neighbour_list+ G[new_node]
        n = n -1 
    n_list = list(set(neighbour_list))
    n_list.remove(node)
    return(n_list)

In [7]:
def generate_HMM(node,G,censors):
    HMM = {}
    curr_node = "current_" + node
    node_neighbour = n_step_neighbour(node,2,G)
    HMM = {i:[curr_node] for i in node_neighbour}
    HMM[node] = [curr_node]
    
    related_censor = [censors.get(node)] + [censors.get(i) for i in node_neighbour]
    related_censor = [x for x in related_censor  if x is not None]
    
    for i in related_censor:
        if i[0] =="d":
            if sum([censor == i for censor in related_censor]) < 2:
                related_censor.remove(i) #drop door censor when you only at one side
    
    
    
    HMM[curr_node] = list(set(related_censor))
    for censor_evi in related_censor: 
        HMM[censor_evi] = []
    
    return(HMM)
    
    
#def learn_prob(G,data):
    

In [8]:
generate_HMM('r25',MAP,censor_dict)


{'r7': ['current_r25'],
 'r27': ['current_r25'],
 'r26': ['current_r25'],
 'c2': ['current_r25'],
 'r22': ['current_r25'],
 'r12': ['current_r25'],
 'c1': ['current_r25'],
 'r25': ['current_r25'],
 'current_r25': ['ds2', 'rs3', 'ds3'],
 'rs3': [],
 'ds3': [],
 'ds2': []}

In [9]:
def learn_tranisition(curr_node,pre_node,data):
    new_df = pd.DataFrame()
    new_df['curr'] = data[curr_node][1:]
    new_df['pre'] = data[pre_node].shift(1)[:-1]
    
    
    prob_ct = pd.crosstab(new_df['pre'] > 0 , new_df['curr'] > 0, normalize = "index")
    
    tran_table = odict()
    
    tran_table[(1,1)] = prob_ct.loc[True,True] # p(current = 1 | previous = 1)
    tran_table[(1,0)] = prob_ct.loc[True,False]
    tran_table[(0,1)] =prob_ct.loc[False,True]# p(current = 1 | previous = 0)
    tran_table[(0,0)] =  prob_ct.loc[False,False]
    
    
    return ({'dom': (pre_node,curr_node), 'table':tran_table})

def learn_censor_prob(node, censor, data):
    
    prob_ct = pd.crosstab(data[node] > 0 , data[censor] == "motion", normalize = "index")
    
    tran_table = odict()
    
    tran_table[(1,1)] = prob_ct.loc[True,True] # p(current = 1 | previous = 1)
    tran_table[(1,0)] = prob_ct.loc[True,False]
    tran_table[(0,1)] =prob_ct.loc[False,True]# p(current = 1 | previous = 0)
    tran_table[(0,0)] =  prob_ct.loc[False,False]
    
    return ({'dom': (node,censor), 'table':tran_table})

In [10]:
learn_tranisition('r22','r25',data)

{'dom': ('r25', 'r22'),
 'table': OrderedDict([((1, 1), 0.10268378063010501),
              ((1, 0), 0.897316219369895),
              ((0, 1), 0.13933895009721323),
              ((0, 0), 0.8606610499027868)])}

In [11]:
learn_censor_prob('r25','reliable_sensor3',data)

{'dom': ('r25', 'reliable_sensor3'),
 'table': OrderedDict([((1, 1), 0.9568261376896149),
              ((1, 0), 0.043173862310385065),
              ((0, 1), 0.03367875647668394),
              ((0, 0), 0.966321243523316)])}

For one room:
    1. generate the network 
    2. Assign the conditional prob (factor tables) 
    3. Find P(X=1| other nodes, e) and P(X=0| other nodes, e) by HMM algorithm;
    4. Make decicions (threshold) 
 
Entire inference process: 
    1. calculate all the probabilities 
    2. For t = 1, ... T: 
        a. Do inference for each room
        b. Store the decision 
        c. move to next timestep 
             
  
  

In [123]:
# room 25 P(x= 1 | A) and P(x= 0|A)
rooms_df = pd.read_csv("rooms_tran.csv")
censor_df= pd.read_csv("censor_prob.csv")


In [14]:
room = 'r25'
room_prob = rooms_df.loc[rooms_tran['current_room'] == room, :]
censor_prob = censor_df.loc[censor_tran['room'] == room, :] #extract relevant probabilities 

censor_prob_tem = censor_prob.set_index('censor')

Next step
1. reset index for room_prob and censor_prob
2. extract the probabilities from the dataset
3. compute the P(x=1) and P(x=0) with conditions
4. log likelihood sum 
5. return the prob of room 

In [29]:
def prob_have_people(state,trans, room):
    "trans is the dictionary from rooms_tran/ censor trans; state is a dictionary with room as key and (p(0), p(1)) as value "
    prob_have = trans['(1, 1)']*state[room][1] +  trans["(1, 0)"]*state[room][0]
    return (prob_have)
    
def prob_no_people(state,trans, room):    
    prob_no = trans["(0, 1)"]*state[room][1] +  trans["(0, 0)"]*state[room][0] 
    return (prob_no)


state_tem = {'c1': (1.0,0)}
trans_tem = room_prob_tem.loc['c1',:].to_dict()
#print(trans_tem)

print(prob_have_people(state_tem, trans_tem,"c1"))

print(prob_no_people(state_tem, trans_tem,"c1"))

0.634494575
0.665639445


In [72]:
def joint_prob_room(curr_room, room_prob_df, state):
    list_have_people = []
    list_no_people = []
    room_prob_tem =room_prob_df.set_index('previous_room')
    for rooms in room_prob_df['previous_room']:
        room_dict = room_prob_tem.loc[rooms,:].to_dict()
        have_people = prob_have_people(state,room_dict, rooms)
        no_people =  prob_no_people(state,room_dict, rooms)
        list_have_people.append(have_people)
        list_no_people.append(no_people)
    
    prob_have = np.prod(list_have_people)
    prob_no = np.prod(list_no_people)
    
    prob_have = prob_have/ (prob_have+ prob_no)
    prob_no = 1- prob_have  
    
    return(( prob_no,prob_have))
    

In [73]:
state_tem = {room : (0.8,0.2) for room in room_prob['previous_room'] }
print(state_tem)

probability_room = joint_prob_room(room, room_prob, state_tem)
probability_room

{'c1': (0.8, 0.2), 'r26': (0.8, 0.2), 'r7': (0.8, 0.2), 'c2': (0.8, 0.2), 'r22': (0.8, 0.2), 'r27': (0.8, 0.2), 'r12': (0.8, 0.2)}


(0.5492262332959444, 0.45077376670405556)

1. censors 
2. combine the prob
3. iterate all rooms in one timestep 
4. all rooms all time 


In [71]:
def censor_cal(curr_room, censor_prob_df, state):
    list_have_people = []
    list_no_people = []
    censor_prob_tem = censor_prob_df.set_index('censor')
    for censors in censor_prob_df['censor']:
        censor_dict = censor_prob_tem.loc[censors,:].to_dict()
        have_people = prob_have_people(state, censor_dict, censors )
        no_people = prob_no_people(state, censor_dict, censors )
        list_have_people.append(have_people)
        list_no_people.append(no_people)
    
    prob_have = np.prod(list_have_people)
    prob_no = np.prod(list_no_people)

    
    prob_have = prob_have/ (prob_have+ prob_no)
    prob_no = 1- prob_have  
    return(( prob_no, prob_have))
    

In [74]:
state_temp = {'reliable_sensor3': (0.0,1.0)} 
probability_censor = censor_cal('r25',censor_prob,state_temp)
probability_censor

(0.03400160531769114, 0.9659983946823089)

In [75]:
def make_decision(prob_room, prob_censor, weight, theta):
    people = 0
    no_people = prob_room[0] * weight[0] * prob_censor[0] * weight[1]
    have_people = prob_room[1] * weight[0] * prob_censor[1] * weight[1]
    
    prob_have = have_people/ (have_people+ no_people)
    if prob_have > theta: 
        people = 1
    return(people)
    
make_decision(probability_room, probability_censor, [1,9], 0.5)    

1

Now let's do all rooms at one time stamp given previous time step

In [86]:
data_sample = data.sample(1)
censor_sample = data_sample.iloc[:,1:9]
room_sample = data_sample.iloc[:,17:]

In [114]:
room_dict = room_sample.to_dict()
room_state = {k: list(v.values())[0] for k, v in room_dict.items()}
room_state2 = {k: (0,1) if v > 0 else (1,0) for k,v in room_state.items() }

censor_dict = censor_sample.to_dict()
censor_state = {k: list(v.values())[0] for k, v in censor_dict.items()}
censor_state2 = {k: (0,1) if v == "motion" else (1,0) for k,v in censor_state.items() }
censor_state2

{'reliable_sensor1': (0, 1),
 'reliable_sensor2': (1, 0),
 'reliable_sensor3': (0, 1),
 'reliable_sensor4': (1, 0),
 'unreliable_sensor1': (0, 1),
 'unreliable_sensor2': (1, 0),
 'unreliable_sensor3': (0, 1),
 'unreliable_sensor4': (1, 0)}

In [117]:
[room for room in list(room_state2.keys()) if room[0] == 'r']

['r1',
 'r2',
 'r3',
 'r4',
 'r5',
 'r6',
 'r7',
 'r8',
 'r9',
 'r10',
 'r11',
 'r12',
 'r13',
 'r14',
 'r15',
 'r16',
 'r17',
 'r18',
 'r19',
 'r20',
 'r21',
 'r22',
 'r23',
 'r24',
 'r25',
 'r26',
 'r27',
 'r28',
 'r29',
 'r30',
 'r31',
 'r32',
 'r33',
 'r34',
 'r35']

In [138]:
def all_room_predict(room_state, censors_state, room_prob_df, censor_prob_df, w, theta = 0.5):
    room_predict_dict = {}
    room_list = list(room_state.keys())
    room_list = [room for room in room_list if room[0] == 'r']
    for room in room_list: 
        room_prob = room_prob_df.loc[room_prob_df['current_room'] == room, :]
        censor_prob =  censor_prob_df.loc[censor_prob_df['room'] == room, :]
        probability_room = joint_prob_room(room, room_prob, room_state)
        probability_censor = censor_cal(room,censor_prob,censors_state)
        room_predict_dict[room] = make_decision(probability_room , probability_censor, w , theta)
        
    return room_predict_dict

In [139]:
all_room_predict(room_state2,censor_state2, rooms_df,censor_df, [1,9]  )

{'r1': 1,
 'r2': 0,
 'r3': 1,
 'r4': 1,
 'r5': 0,
 'r6': 1,
 'r7': 1,
 'r8': 0,
 'r9': 0,
 'r10': 1,
 'r11': 1,
 'r12': 1,
 'r13': 0,
 'r14': 1,
 'r15': 1,
 'r16': 1,
 'r17': 0,
 'r18': 0,
 'r19': 1,
 'r20': 0,
 'r21': 1,
 'r22': 0,
 'r23': 0,
 'r24': 0,
 'r25': 1,
 'r26': 1,
 'r27': 1,
 'r28': 1,
 'r29': 0,
 'r30': 1,
 'r31': 0,
 'r32': 0,
 'r33': 1,
 'r34': 1,
 'r35': 1}

In [106]:
list(room_dict['r1'].values())[0]

2

In [88]:
censor_sample

Unnamed: 0,reliable_sensor1,reliable_sensor2,reliable_sensor3,reliable_sensor4,unreliable_sensor1,unreliable_sensor2,unreliable_sensor3,unreliable_sensor4
1211,motion,no motion,motion,no motion,motion,no motion,motion,no motion


In [81]:
state = {}

{'Unnamed: 0': {1051: 1051},
 'reliable_sensor1': {1051: 'motion'},
 'reliable_sensor2': {1051: 'no motion'},
 'reliable_sensor3': {1051: 'no motion'},
 'reliable_sensor4': {1051: 'motion'},
 'unreliable_sensor1': {1051: 'motion'},
 'unreliable_sensor2': {1051: 'motion'},
 'unreliable_sensor3': {1051: 'motion'},
 'unreliable_sensor4': {1051: 'motion'},
 'robot1': {1051: "('r1', 1)"},
 'robot2': {1051: "('r35', 0)"},
 'door_sensor1': {1051: 0},
 'door_sensor2': {1051: 0},
 'door_sensor3': {1051: 0},
 'door_sensor4': {1051: 0},
 'time': {1051: '12:23:00'},
 'electricity_price': {1051: 1.0624824690392611},
 'r1': {1051: 1},
 'r2': {1051: 0},
 'r3': {1051: 1},
 'r4': {1051: 0},
 'r5': {1051: 0},
 'r6': {1051: 0},
 'r7': {1051: 3},
 'r8': {1051: 0},
 'r9': {1051: 0},
 'r10': {1051: 3},
 'r11': {1051: 3},
 'r12': {1051: 0},
 'r13': {1051: 0},
 'r14': {1051: 0},
 'r15': {1051: 1},
 'r16': {1051: 1},
 'r17': {1051: 0},
 'r18': {1051: 0},
 'r19': {1051: 1},
 'r20': {1051: 0},
 'r21': {1051: 1},

In [79]:
def prob_have_people(state,trans):
    "trans is the dictionary from rooms_tran; state is a dictionary with room as key and (p(0), p(1)) as value "
    prob_have = trans['(1,1)']*state[1] +  trans["(1,0)"]*state[0] 
    return (prob_have)
    
def prob_no_people(state,trans):    
    prob_no = trans["(0,1)"]*state[1] +  trans["(0,0)"]*state[0] 
    return (prob_no)


state_tem = {'c1': (1.0,0)}
trans_tem = room_prob.loc[ room_prob['previous_room'] == 'c1',:].to_dict()
print(trans_tem)

print(prob_have_people(state_tem, trans_tem))

{'Unnamed: 0': {193: 193}, 'previous_room': {193: 'c1'}, 'current_room': {193: 'r25'}, '(1, 1)': {193: 0.365505425}, '(1, 0)': {193: 0.634494575}, '(0, 1)': {193: 0.334360555}, '(0, 0)': {193: 0.665639445}}


KeyError: '(1,1)'

In [57]:
for rooms in room_prob['previous_room']:
    room_tran = room_prob.loc[ room_prob['previous_room'] == rooms,:].to_dict
    room_state = current_state['rooms']

0.3655

In [None]:
def state_generator(room):
    state_dict = {'dom': (room,),    
                  'table': odict([
        ((1,), 0.0),
        ((0,), 1.0),
    ])}
    return (state_dict)
state_info = []
for rooms in room_prob['previous_room']:
    state_info.append(state_generator(rooms))
    
state_info

In [None]:
def printFactor(f):
    """
    argument 
    `f`, a factor to print on screen
    """
    # Create a empty list that we will fill in with the probability table entries
    table = list()
    
    # Iterate over all keys and probability values in the table
    for key, item in f['table'].items():
        # Convert the tuple to a list to be able to manipulate it
        k = list(key)
        # Append the probability value to the list with key values
        k.append(item)
        # Append an entire row to the table
        table.append(k)
    # dom is used as table header. We need it converted to list
    dom = list(f['dom'])
    # Append a 'Pr' to indicate the probabity column
    dom.append('Pr')
    print(tabulate(table,headers=dom,tablefmt='orgtbl'))

def prob(factor, *entry):
    """
    argument 
    `factor`, a dictionary of domain and probability values,
    `entry`, a list of values, one for each variable in the same order as specified in the factor domain.
    
    Returns p(entry)
    """

    return factor['table'][entry]     # insert your code here, 1 line   

def join(f1, f2, outcomeSpace):
    """
    argument 
    `f1`, first factor to be joined.
    `f2`, second factor to be joined.
    `outcomeSpace`, dictionary with the domain of each variable
    
    Returns a new factor with a join of f1 and f2
    """
    
    # First, we need to determine the domain of the new factor. It will be union of the domain in f1 and f2
    # But it is important to eliminate the repetitions
    common_vars = list(f1['dom']) + list(set(f2['dom']) - set(f1['dom']))
    
    # We will build a table from scratch, starting with an empty list. Later on, we will transform the list into a odict
    table = list()
    
    # Here is where the magic happens. The product iterator will generate all combinations of varible values 
    # as specified in outcomeSpace. Therefore, it will naturally respect observed values
    for entries in product(*[outcomeSpace[node] for node in common_vars]):
        
        # We need to map the entries to the domain of the factors f1 and f2
        entryDict = dict(zip(common_vars, entries))
        f1_entry = (entryDict[var] for var in f1['dom'])
        f2_entry = (entryDict[var] for var in f2['dom'])
        
        # Insert your code here
        p1 = prob(f1, *f1_entry)           # Use the fuction prob to calculate the probability in factor f1 for entry f1_entry 
        p2 = prob(f2, *f2_entry)           # Use the fuction prob to calculate the probability in factor f2 for entry f2_entry 
        
        # Create a new table entry with the multiplication of p1 and p2
        table.append((entries, p1 * p2))
    return {'dom': tuple(common_vars), 'table': odict(table)}


def marginalize(f, var, outcomeSpace):
    """
    argument 
    `f`, factor to be marginalized.
    `var`, variable to be summed out.
    `outcomeSpace`, dictionary with the domain of each variable
    
    Returns a new factor f' with dom(f') = dom(f) - {var}
    """    
    
    # Let's make a copy of f domain and convert it to a list. We need a list to be able to modify its elements
    new_dom = list(f['dom'])
    
    new_dom.remove(var)            # Remove var from the list new_dom by calling the method remove(). 1 line
    table = list()                 # Create an empty list for table. We will fill in table from scratch. 1 line
    for entries in product(*[outcomeSpace[node] for node in new_dom]):
        s = 0;                     # Initialize the summation variable s. 1 line

        # We need to iterate over all possible outcomes of the variable var
        for val in outcomeSpace[var]:
            # To modify the tuple entries, we will need to convert it to a list
            entriesList = list(entries)
            # We need to insert the value of var in the right position in entriesList
            entriesList.insert(f['dom'].index(var), val)
            
            p = prob(f, *tuple(entriesList))     # Calculate the probability of factor f for entriesList. 1 line
            s = s + p                            # Sum over all values of var by accumulating the sum in s. 1 line
            
        # Create a new table entry with the multiplication of p1 and p2
        table.append((entries, s))
    return {'dom': tuple(new_dom), 'table': odict(table)}

In [None]:
c1_trans = {
    'dom': ('previous', 'current'), 
    'table': odict([
        (((1,1),), 0.3655),
        (((1,0),), 0.6345),
        (((0,1),), 0.3344),
        (((0,0),), 0.6656),
    ])
}
state_current = {'dom': ('c1',), 'table': odict([((1,), 0.0), ((0,), 1.0)])}

prob(c1_trans , (1,1))
current_state = {'c1': (0,1)}


In [None]:
def prob_have_people(state,trans):
    prob_have = prob(trans, (1,1))*state[1] +  prob(trans, (1,0))*state[0] 
    return (prob_have)

def prob_no_people(state,trans):    
    prob_no = prob(trans, (0,1))*prob(state,(1)) +  prob(trans, (0,0))*prob(state,(0))
    return (prob_no)

print(prob_have_people(state_current,c1_trans))
print(prob_no_people(state_current,c1_trans))