In [95]:
import numpy as np
import random
from sklearn.utils import shuffle

%load_ext autoreload
%autoreload 2

from Node import Node
from SumNode import SumNode
from ProductNode import ProductNode
from Node import LeafNode
from SPN import SPN

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


# Generative

In [96]:
x1 = np.array([0.0,0.0,0.0])
x2 = np.array([0.0,1.0,0.0])
x3 = np.array([1.0,0.0,0.0])
x4 = np.array([1.0,1.0,0.0])

x5 = np.array([0.0,0.0,1.0])
x6 = np.array([0.0,1.0,1.0])
x7 = np.array([1.0,0.0,1.0])
x8 = np.array([1.0,1.0,1.0])

### Define XOR structure

In [97]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))

# Sum nodes 3 and 4
sum_node3 = SumNode(3,1)
sum_node4 = SumNode(4,2)
spn.add_node(sum_node3)
spn.add_node(sum_node4)

# Product nodes 5-8
prod_node5 = ProductNode(5,4)
prod_node6 = ProductNode(6,4)
prod_node7 = ProductNode(7,3)
prod_node8 = ProductNode(8,3)
spn.add_node(prod_node5, random.randint(1,9))
spn.add_node(prod_node6, random.randint(1,9))
spn.add_node(prod_node7, random.randint(1,9))
spn.add_node(prod_node8, random.randint(1,9))

# Add leaf nodes
X1 = LeafNode(9,np.array([6,7]), 0, False)
X_1 = LeafNode(10,np.array([5,8]), 0, True)
X2 = LeafNode(11,np.array([5,7]), 1, False)
X_2 = LeafNode(12,np.array([6,8]), 1, True)
X3 = LeafNode(13,np.array([2]), 2, False)
X_3 = LeafNode(14,np.array([1]), 2, True)
spn.add_node(X1)
spn.add_node(X_1)
spn.add_node(X2)
spn.add_node(X_2)
spn.add_node(X3)
spn.add_node(X_3)
spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.3571
To node 2 :    0.6429

Node ID 3
To node 7 :    0.7778
To node 8 :    0.2222

Node ID 4
To node 5 :    0.8000
To node 6 :    0.2000


### Untrained forward pass

In [98]:
print("Evaluate Forward Passes")
z = spn.compute_marginal()
print("Probability x1",np.exp(spn.evaluate(x1)))
print("Probability x2",np.exp(spn.evaluate(x2)))
print("Probability x3",np.exp(spn.evaluate(x3)))
print("Probability x4",np.exp(spn.evaluate(x4)))
print("Probability x5",np.exp(spn.evaluate(x5)))
print("Probability x6",np.exp(spn.evaluate(x6)))
print("Probability x7",np.exp(spn.evaluate(x7)))
print("Probability x8",np.exp(spn.evaluate(x8)))

print()
print("Probability x3=1 given x1's first two indicators", np.exp(spn.map_inference(x1)))
print("Probability x3=1 given x2's first two indicators", np.exp(spn.map_inference(x2)))
print("Probability x3=1 given x3's first two indicators", np.exp(spn.map_inference(x3)))
print("Probability x3=1 given x4's first two indicators", np.exp(spn.map_inference(x4)))
print("Probability x3=1 given x5's first two indicators", np.exp(spn.map_inference(x5)))
print("Probability x3=1 given x6's first two indicators", np.exp(spn.map_inference(x6)))
print("Probability x3=1 given x7's first two indicators", np.exp(spn.map_inference(x7)))
print("Probability x3=1 given x8's first two indicators", np.exp(spn.map_inference(x8)))

Evaluate Forward Passes
Probability x1 0.0793651373016
Probability x2 0.0
Probability x3 0.0
Probability x4 0.27777789127
Probability x5 0.0
Probability x6 0.514285858571
Probability x7 0.128571512857
Probability x8 0.0

Probability x3=1 given x1's first two indicators 1.0
Probability x3=1 given x2's first two indicators 0.0
Probability x3=1 given x3's first two indicators 0.0
Probability x3=1 given x4's first two indicators 1.0
Probability x3=1 given x5's first two indicators 0.0
Probability x3=1 given x6's first two indicators 1.0
Probability x3=1 given x7's first two indicators 1.0
Probability x3=1 given x8's first two indicators 0.0


### Train model

In [100]:
data = np.array([x1,x2,x3,x4,x5,x6,x7,x8])

print("Training...")
for i in range(10):
    #spn.generative_hard_gd(data)
    spn.generative_soft_gd(data)
    
print("Probability x1",np.exp(spn.evaluate(x1)))
print("Probability x2",np.exp(spn.evaluate(x2)))
print("Probability x3",np.exp(spn.evaluate(x3)))
print("Probability x4",np.exp(spn.evaluate(x4)))
print("Probability x5",np.exp(spn.evaluate(x5)))
print("Probability x6",np.exp(spn.evaluate(x6)))
print("Probability x7",np.exp(spn.evaluate(x7)))
print("Probability x8",np.exp(spn.evaluate(x8)))

spn.print_weights()

Training...
Probability x1 0.246293180029
Probability x2 0.0
Probability x3 0.0
Probability x4 0.25353627759
Probability x5 0.0
Probability x6 0.253999416064
Probability x7 0.246171526317
Probability x8 0.0

Node ID 0
To node 1 :    0.4998
To node 2 :    0.5002

Node ID 3
To node 7 :    0.5072
To node 8 :    0.4928

Node ID 4
To node 5 :    0.5078
To node 6 :    0.4922


In [30]:
print("Probability x3=1 given x1's first two indicators", np.exp(spn.map_inference(x1)))
print("Probability x3=1 given x2's first two indicators", np.exp(spn.map_inference(x2)))
print("Probability x3=1 given x3's first two indicators", np.exp(spn.map_inference(x3)))
print("Probability x3=1 given x4's first two indicators", np.exp(spn.map_inference(x4)))
print("Probability x3=1 given x5's first two indicators", np.exp(spn.map_inference(x5)))
print("Probability x3=1 given x6's first two indicators", np.exp(spn.map_inference(x6)))
print("Probability x3=1 given x7's first two indicators", np.exp(spn.map_inference(x7)))
print("Probability x3=1 given x8's first two indicators", np.exp(spn.map_inference(x8)))

Probability x3=1 given x1's first two indicators 1.0
Probability x3=1 given x2's first two indicators 0.0
Probability x3=1 given x3's first two indicators 0.0
Probability x3=1 given x4's first two indicators 1.0
Probability x3=1 given x5's first two indicators 0.0
Probability x3=1 given x6's first two indicators 1.0
Probability x3=1 given x7's first two indicators 1.0
Probability x3=1 given x8's first two indicators 0.0


# Example 2

### Define Example 2 structure

In [78]:
# generate new dataset
x1 = np.array([0.0,0.0,0.0])
x2 = np.array([0.0,0.0,1.0])
x3 = np.array([0.0,1.0,0.0])
x4 = np.array([0.0,1.0,1.0])

x5 = np.array([1.0,0.0,0.0])
x6 = np.array([1.0,0.0,1.0])
x7 = np.array([1.0,1.0,0.0])
x8 = np.array([1.0,1.0,1.0])

data = []
y = []
for i in range(10):
    data.append(x1)
    y.append(0)
for i in range(90):
    data.append(x2)
    y.append(0)
for i in range(10):
    data.append(x3)
    y.append(0)
for i in range(90):
    data.append(x4)
    y.append(0)
for i in range(224):
    data.append(x5)
for i in range(336):
    data.append(x6)
for i in range(96):
    data.append(x7)
for i in range(144):
    data.append(x8)
# make arrays
data = np.array(data)

data = shuffle(data, random_state=0)
print(data.shape)

(1000, 3)


In [82]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))

# Sum nodes 3 - 6
sum_node3 = SumNode(3,1)
sum_node4 = SumNode(4,2)
sum_node5 = SumNode(5,1)
sum_node6 = SumNode(6,2)
spn.add_node(sum_node3)
spn.add_node(sum_node4)
spn.add_node(sum_node5)
spn.add_node(sum_node6)

# Add leaf nodes
X1 = LeafNode(7,np.array([1]), 0, False)
X_1 = LeafNode(8,np.array([2]), 0, True)
X2 = LeafNode(9,np.array([3,4]), 1, False)
X_2 = LeafNode(10,np.array([3,4]), 1, True)
X3 = LeafNode(11,np.array([5,6]), 2, False)
X_3 = LeafNode(12,np.array([5,6]), 2, True)
spn.add_node(X1,  np.array([random.randint(1,9)]) )
spn.add_node(X_1, np.array([random.randint(1,9)]))
spn.add_node(X2, np.array([random.randint(1,9), random.randint(1,9)]) )
spn.add_node(X_2, np.array([random.randint(1,9), random.randint(1,9)]))
spn.add_node(X3, np.array([random.randint(1,9), random.randint(1,9)]))
spn.add_node(X_3, np.array([random.randint(1,9), random.randint(1,9)]))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.3077
To node 2 :    0.6923

Node ID 3
To node 9 :    0.3636
To node 10 :    0.6364

Node ID 4
To node 9 :    0.5385
To node 10 :    0.4615

Node ID 5
To node 11 :    0.6429
To node 12 :    0.3571

Node ID 6
To node 11 :    0.6667
To node 12 :    0.3333


In [83]:
for i in range(100):
    spn.generative_soft_gd(data, batch=True)
    #spn.generative_hard_gd(data, batch=False)
    
print("\nProbability x1",np.exp(spn.evaluate(x1)))
print("Probability x2",np.exp(spn.evaluate(x2)))
print("Probability x3",np.exp(spn.evaluate(x3)))
print("Probability x4",np.exp(spn.evaluate(x4)))
print("Probability x5",np.exp(spn.evaluate(x5)))
print("Probability x6",np.exp(spn.evaluate(x6)))
print("Probability x7",np.exp(spn.evaluate(x7)))
print("Probability x8",np.exp(spn.evaluate(x8)))

spn.print_weights()
print("\nShould be:")
print("0: 0.8, 0.2")
print("3: 0.3, 0.7")
print("4: 0.5, 0.5")
print("5: 0.6, 0.4")
print("6: 0.9, 0.1")


Probability x1 0.010000017
Probability x2 0.090000073
Probability x3 0.010000017
Probability x4 0.090000073
Probability x5 0.224000116
Probability x6 0.336000146
Probability x7 0.096000068
Probability x8 0.14400009

Node ID 0
To node 1 :    0.8000
To node 2 :    0.2000

Node ID 3
To node 9 :    0.3000
To node 10 :    0.7000

Node ID 4
To node 9 :    0.5000
To node 10 :    0.5000

Node ID 5
To node 11 :    0.6000
To node 12 :    0.4000

Node ID 6
To node 11 :    0.9000
To node 12 :    0.1000

Should be:
0: 0.8, 0.2
3: 0.3, 0.7
4: 0.5, 0.5
5: 0.6, 0.4
6: 0.9, 0.1


# Test with correct weights

In [20]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, 0.8)
spn.add_node(prod_node2, 0.2)

# Sum nodes 3 - 6
sum_node3 = SumNode(3,1)
sum_node4 = SumNode(4,2)
sum_node5 = SumNode(5,1)
sum_node6 = SumNode(6,2)
spn.add_node(sum_node3)
spn.add_node(sum_node4)
spn.add_node(sum_node5)
spn.add_node(sum_node6)

# Add leaf nodes
X1 = LeafNode(7,np.array([1]), 0, False)
X_1 = LeafNode(8,np.array([2]), 0, True)
X2 = LeafNode(9,np.array([3,4]), 1, False)
X_2 = LeafNode(10,np.array([3,4]), 1, True)
X3 = LeafNode(11,np.array([5,6]), 2, False)
X_3 = LeafNode(12,np.array([5,6]), 2, True)
spn.add_node(X1,  np.array([random.randint(1,9)]) )
spn.add_node(X_1, np.array([random.randint(1,9)]))
spn.add_node(X2, np.array([0.3, 0.5]) )
spn.add_node(X_2, np.array([0.7, 0.5]))
spn.add_node(X3, np.array([0.6, 0.9]))
spn.add_node(X_3, np.array([0.4, 0.1]))

spn.normalise_weights()
spn.print_weights()
print()
print("\nProbability x1",np.exp(spn.evaluate(x1)))
print("Probability x2",np.exp(spn.evaluate(x2)))
print("Probability x3",np.exp(spn.evaluate(x3)))
print("Probability x4",np.exp(spn.evaluate(x4)))
print("Probability x5",np.exp(spn.evaluate(x5)))
print("Probability x6",np.exp(spn.evaluate(x6)))
print("Probability x7",np.exp(spn.evaluate(x7)))
print("Probability x8",np.exp(spn.evaluate(x8)))


Node ID 0
To node 1 :    0.8000
To node 2 :    0.2000

Node ID 3
To node 9 :    0.3000
To node 10 :    0.7000

Node ID 4
To node 9 :    0.5000
To node 10 :    0.5000

Node ID 5
To node 11 :    0.6000
To node 12 :    0.4000

Node ID 6
To node 11 :    0.9000
To node 12 :    0.1000


Probability x1 0.010000017
Probability x2 0.090000073
Probability x3 0.010000017
Probability x4 0.090000073
Probability x5 0.224000116
Probability x6 0.336000146
Probability x7 0.096000068
Probability x8 0.14400009


In [21]:
for i in range(10):
    spn.generative_soft_gd(data)
    #spn.generative_hard_gd(data)
    spn.normalise_weights()
    
print("Probability x1",spn.evaluate(x1)/spn.compute_marginal())
print("Probability x2",spn.evaluate(x2)/spn.compute_marginal())
print("Probability x3",spn.evaluate(x3)/spn.compute_marginal())
print("Probability x4",spn.evaluate(x4)/spn.compute_marginal())
print("Probability x5",spn.evaluate(x5)/spn.compute_marginal())
print("Probability x6",spn.evaluate(x6)/spn.compute_marginal())
print("Probability x7",spn.evaluate(x7)/spn.compute_marginal())
print("Probability x8",spn.evaluate(x8)/spn.compute_marginal())

spn.print_weights()

Probability x1 -7675281.57952
Probability x2 -4013241.73161
Probability x3 -7675281.57952
Probability x4 -4013241.73161
Probability x5 -2493514.76545
Probability x6 -1817739.65641
Probability x7 -3905677.69022
Probability x8 -3229902.58118

Node ID 0
To node 1 :    0.8000
To node 2 :    0.2000

Node ID 3
To node 9 :    0.3000
To node 10 :    0.7000

Node ID 4
To node 9 :    0.5000
To node 10 :    0.5000

Node ID 5
To node 11 :    0.6000
To node 12 :    0.4000

Node ID 6
To node 11 :    0.9000
To node 12 :    0.1000


# Really Basic Example

In [85]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(3):
    data.append(x1)
for i in range(7):
    data.append(x4)
    
data = np.array(data)
data = shuffle(data, random_state=0)

In [86]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))

# Add leaf nodes
X1 = LeafNode(3, 2, 0, False)
X_1 = LeafNode(4, 1, 0, True)
X2 = LeafNode(5, 2, 1, False)
X_2 = LeafNode(6, 1, 1, True )

spn.add_node(X1)
spn.add_node(X_1)
spn.add_node(X2)
spn.add_node(X_2)

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.6364
To node 2 :    0.3636


In [94]:
for i in range(5):
    spn.generative_soft_gd(data)
    #spn.generative_hard_gd(data)
    
print("\nProbability x1", np.exp(spn.evaluate(x1)))
print("Probability x2", np.exp(spn.evaluate(x2)))
print("Probability x3", np.exp(spn.evaluate(x3)))
print("Probability x4", np.exp(spn.evaluate(x4)))

spn.print_weights()


Probability x1 0.636363736364
Probability x2 0.0
Probability x3 0.0
Probability x4 0.363636463636

Node ID 0
To node 1 :    0.6364
To node 2 :    0.3636


# Example 3

In [27]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(603):
    data.append(x1)
for i in range(207):
    data.append(x2)
for i in range(147):
    data.append(x3)
for i in range(43):
    data.append(x4)
    
data = np.array(data)
data = shuffle(data)
print(data.shape)

(1000, 2)


In [28]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
prod_node3 = ProductNode(3, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))
spn.add_node(prod_node3, random.randint(1,9))

# Sum nodes 4 - 7

sum_node4 = SumNode(4,np.array([1,2]))
sum_node5 = SumNode(5,3)
sum_node6 = SumNode(6,1)
sum_node7 = SumNode(7,np.array([2,3]))

spn.add_node(sum_node4)
spn.add_node(sum_node5)
spn.add_node(sum_node6)
spn.add_node(sum_node7)

# Add leaf nodes
X1 = LeafNode(8,np.array([4,5]), 0, False)
X_1 = LeafNode(9,np.array([4,5]), 0, True)
X2 = LeafNode(10,np.array([6,7]), 1, False)
X_2 = LeafNode(11,np.array([6,7]), 1, True)
spn.add_node(X1,  np.array([random.randint(1,9),random.randint(1,9)]) )
spn.add_node(X_1, np.array([random.randint(1,9),random.randint(1,9)]))
spn.add_node(X2, np.array([random.randint(1,9), random.randint(1,9)]) )
spn.add_node(X_2, np.array([random.randint(1,9), random.randint(1,9)]))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.2222
To node 2 :    0.3333
To node 3 :    0.4444

Node ID 4
To node 8 :    0.3636
To node 9 :    0.6364

Node ID 5
To node 8 :    0.9000
To node 9 :    0.1000

Node ID 6
To node 10 :    0.6667
To node 11 :    0.3333

Node ID 7
To node 10 :    0.5000
To node 11 :    0.5000


In [31]:
for i in range(10):
    #spn.generative_soft_gd(data)
    spn.generative_hard_gd(data)
    
print("\nProbability x1", np.exp(spn.evaluate(x1)))
print("Probability x2", np.exp(spn.evaluate(x2)))
print("Probability x3", np.exp(spn.evaluate(x3)))
print("Probability x4", np.exp(spn.evaluate(x4)))


spn.print_weights()


Probability x1 0.922180468754
Probability x2 0.057820121246
Probability x3 0.018820101746
Probability x4 0.00118000825401

Node ID 0
To node 1 :    0.3340
To node 2 :    0.3339
To node 3 :    0.3321

Node ID 4
To node 8 :    0.0200
To node 9 :    0.9800

Node ID 5
To node 8 :    0.0200
To node 9 :    0.9800

Node ID 6
To node 10 :    0.0590
To node 11 :    0.9410

Node ID 7
To node 10 :    0.0590
To node 11 :    0.9410


# Example 4

In [273]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(3):
    data.append(x1)
for i in range(1):
    data.append(x2)
for i in range(2):
    data.append(x3)
for i in range(4):
    data.append(x4)
    
data = np.array(data)
data = shuffle(data)
print(data.shape)

(10, 2)


In [317]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))


# Sum nodes 4 - 7
sum_node3 = SumNode(3,1)
sum_node4 = SumNode(4,2)

spn.add_node(sum_node3)
spn.add_node(sum_node4)

# Add leaf nodes
X1 = LeafNode(5,1, 0, False)
X_1 = LeafNode(6,2, 0, True)
X2 = LeafNode(7,np.array([3,4]), 1, False)
X_2 = LeafNode(8,np.array([3,4]), 1, True)
spn.add_node(X1, random.randint(1,9))
spn.add_node(X_1, random.randint(1,9))
spn.add_node(X2, random.randint(1,9))
spn.add_node(X_2, random.randint(1,9))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.3636
To node 2 :    0.6364

Node ID 3
To node 7 :    0.2500
To node 8 :    0.7500

Node ID 4
To node 7 :    0.2500
To node 8 :    0.7500


In [318]:
for i in range(10):
    #spn.generative_soft_gd(data)
    spn.generative_hard_gd(data)

print("\nProbability x1", np.exp(spn.evaluate(x1)))
print("Probability x2", np.exp(spn.evaluate(x2)))
print("Probability x3", np.exp(spn.evaluate(x3)))
print("Probability x4", np.exp(spn.evaluate(x4)))

spn.print_weights()

AttributeError: 'SPN' object has no attribute 'update_weights_gen_hard1'