In [1]:
import numpy as np
import random

%load_ext autoreload
%autoreload 2

from Node import Node
from Node import SumNode
from Node import ProductNode
from Node import LeafNode
from SPN import SPN

%matplotlib inline

# Generative

In [2]:
# The eight binary assignments of three variables, grouped by the value of
# the third one: x1-x4 have it at 0.0, x5-x8 have it at 1.0.
_first_two = ((0.0, 0.0), (0.0, 1.0), (1.0, 0.0), (1.0, 1.0))

x1, x2, x3, x4 = [np.array([a, b, 0.0]) for a, b in _first_two]

x5, x6, x7, x8 = [np.array([a, b, 1.0]) for a, b in _first_two]

### Define XOR structure

In [3]:
# Build the XOR network. Constructor arguments are presumably
# (node id, parent id(s), ...) -- confirm against Node.py.
spn = SPN()

# Root sum node (id 0).
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2 hang off the root; each gets a random integer
# weight in [1, 9] that is normalised at the end of the cell.
prod_node1, prod_node2 = ProductNode(1, 0), ProductNode(2, 0)
for node in (prod_node1, prod_node2):
    spn.add_node(node, random.randint(1,9))

# Sum nodes 3 and 4, one under each product node.
sum_node3, sum_node4 = SumNode(3,1), SumNode(4,2)
for node in (sum_node3, sum_node4):
    spn.add_node(node)

# Product nodes 5-8: 5 and 6 under sum node 4, 7 and 8 under sum node 3,
# again with random integer weights.
prod_node5, prod_node6 = ProductNode(5,4), ProductNode(6,4)
prod_node7, prod_node8 = ProductNode(7,3), ProductNode(8,3)
for node in (prod_node5, prod_node6, prod_node7, prod_node8):
    spn.add_node(node, random.randint(1,9))

# Leaf nodes 9-14. The third argument looks like the variable index and the
# boolean like a "negated" flag (X_k vs Xk) -- TODO confirm in LeafNode.
X1 = LeafNode(9,np.array([6,7]), 0, False)
X_1 = LeafNode(10,np.array([5,8]), 0, True)
X2 = LeafNode(11,np.array([5,7]), 1, False)
X_2 = LeafNode(12,np.array([6,8]), 1, True)
X3 = LeafNode(13,np.array([2]), 2, False)
X_3 = LeafNode(14,np.array([1]), 2, True)
for leaf in (X1, X_1, X2, X_2, X3, X_3):
    spn.add_node(leaf)

# Rescale the random weights, then show them.
spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.5000
To node 2 :    0.5000

Node ID 3
To node 7 :    0.2000
To node 8 :    0.8000

Node ID 4
To node 5 :    0.6667
To node 6 :    0.3333


### Untrained forward pass

In [4]:
print("Evaluate Forward Passes")
# The marginal is stored in `z` but not used further in this cell.
z = spn.compute_marginal()

# Network output for each of the eight assignments, in x1..x8 order.
for sample in (x1, x2, x3, x4, x5, x6, x7, x8):
    print(spn.evaluate(sample))

print()
print(spn.map_inference())

Evaluate Forward Passes
0.4
0.0
0.0
0.1
0.0
0.333333333333
0.166666666667
0.0

parts
-1.12393009665
-0.994252273344
-0.129677823309
0.878378378378


### Train model

In [32]:
# One row per assignment; all eight assignments appear exactly once.
data = np.array([x1,x2,x3,x4,x5,x6,x7,x8])

print("Training...")
for epoch in range(10):
    # Soft gradient step followed by re-normalisation of the weights.
    # (spn.generative_hard_gd(data) is the alternative update rule.)
    spn.generative_soft_gd(data)
    spn.normalise_weights()

# Report the network output for every assignment after training.
_labelled_samples = (
    ("Probability x1", x1),
    ("Probability x2", x2),
    ("Probability x3", x3),
    ("Probability x4", x4),
    ("Probability x5", x5),
    ("Probability x6", x6),
    ("Probability x7", x7),
    ("Probability x8", x8),
)
for label, sample in _labelled_samples:
    print(label, spn.evaluate(sample))

spn.print_weights()

Training...
Probability x1 0.250149076418
Probability x2 0.0
Probability x3 0.0
Probability x4 0.249850923582
Probability x5 0.0
Probability x6 0.250082820232
Probability x7 0.249917179768
Probability x8 0.0

Node ID 0
To node 1 :    0.5000
To node 2 :    0.5000

Node ID 3
To node 7 :    0.4997
To node 8 :    0.5003

Node ID 4
To node 5 :    0.5002
To node 6 :    0.4998


# Example 2

### Define Example 2 structure

In [33]:
# generate new dataset
x1 = np.array([0.0,0.0,0.0])
x2 = np.array([0.0,0.0,1.0])
x3 = np.array([0.0,1.0,0.0])
x4 = np.array([0.0,1.0,1.0])

x5 = np.array([1.0,0.0,0.0])
x6 = np.array([1.0,0.0,1.0])
x7 = np.array([1.0,1.0,0.0])
x8 = np.array([1.0,1.0,1.0])

data = []
y = []
for i in range(10):
    data.append(x1)
    y.append(0)
for i in range(90):
    data.append(x2)
    y.append(0)
for i in range(10):
    data.append(x3)
    y.append(0)
for i in range(90):
    data.append(x4)
    y.append(0)
for i in range(224):
    data.append(x5)
for i in range(336):
    data.append(x6)
for i in range(96):
    data.append(x7)
for i in range(144):
    data.append(x8)
# make arrays
data = np.array(data)
random.shuffle(data)
print(data.shape)

(1000, 3)


In [34]:
# Example 2 network. Constructor arguments are presumably
# (node id, parent id(s), ...) -- confirm against Node.py.
spn = SPN()

# Root sum node (id 0).
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2 under the root, with random integer weights in [1, 9].
prod_node1, prod_node2 = ProductNode(1, 0), ProductNode(2, 0)
for node in (prod_node1, prod_node2):
    spn.add_node(node, random.randint(1,9))

# Sum nodes 3-6: 3 and 5 under product node 1, 4 and 6 under product node 2.
sum_node3, sum_node4 = SumNode(3,1), SumNode(4,2)
sum_node5, sum_node6 = SumNode(5,1), SumNode(6,2)
for node in (sum_node3, sum_node4, sum_node5, sum_node6):
    spn.add_node(node)

# Leaf nodes 7-12. The third argument looks like the variable index and the
# boolean like a "negated" flag -- TODO confirm in LeafNode.
X1 = LeafNode(7,np.array([1]), 0, False)
X_1 = LeafNode(8,np.array([2]), 0, True)
X2 = LeafNode(9,np.array([3,4]), 1, False)
X_2 = LeafNode(10,np.array([3,4]), 1, True)
X3 = LeafNode(11,np.array([5,6]), 2, False)
X_3 = LeafNode(12,np.array([5,6]), 2, True)

# One random integer weight per listed parent of each leaf.
_leaves_and_weight_counts = ((X1, 1), (X_1, 1), (X2, 2), (X_2, 2), (X3, 2), (X_3, 2))
for leaf, n_weights in _leaves_and_weight_counts:
    spn.add_node(leaf, np.array([random.randint(1,9) for _ in range(n_weights)]))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.8000
To node 2 :    0.2000

Node ID 3
To node 9 :    0.3077
To node 10 :    0.6923

Node ID 4
To node 9 :    0.5000
To node 10 :    0.5000

Node ID 5
To node 11 :    0.7273
To node 12 :    0.2727

Node ID 6
To node 11 :    0.5294
To node 12 :    0.4706


In [35]:
# 200 soft gradient steps, re-normalising the weights after each one.
# (spn.generative_hard_gd(data) is the alternative update rule.)
for epoch in range(200):
    spn.generative_soft_gd(data)
    spn.normalise_weights()

# Network output for each of the eight assignments after training.
_labelled_samples = (
    ("Probability x1", x1),
    ("Probability x2", x2),
    ("Probability x3", x3),
    ("Probability x4", x4),
    ("Probability x5", x5),
    ("Probability x6", x6),
    ("Probability x7", x7),
    ("Probability x8", x8),
)
for label, sample in _labelled_samples:
    print(label, spn.evaluate(sample))

spn.print_weights()

# Reference weights to compare the learned ones against.
print("\nShould be:")
for expected_line in (
    "0: 0.8, 0.2",
    "3: 0.3, 0.7",
    "4: 0.5, 0.5",
    "5: 0.6, 0.4",
    "6: 0.9, 0.1",
):
    print(expected_line)

Probability x1 0.122377276909
Probability x2 0.122503535635
Probability x3 0.122377276909
Probability x4 0.122503535635
Probability x5 0.127502661766
Probability x6 0.127984177015
Probability x7 0.127135703353
Probability x8 0.127615832779

Node ID 0
To node 1 :    0.5102
To node 2 :    0.4898

Node ID 3
To node 9 :    0.4993
To node 10 :    0.5007

Node ID 4
To node 9 :    0.5000
To node 10 :    0.5000

Node ID 5
To node 11 :    0.5009
To node 12 :    0.4991

Node ID 6
To node 11 :    0.5003
To node 12 :    0.4997

Should be:
0: 0.8, 0.2
3: 0.3, 0.7
4: 0.5, 0.5
5: 0.6, 0.4
6: 0.9, 0.1


# Test with correct weights

In [36]:
# Same structure as the Example 2 network, but with hand-picked weights
# instead of random ones. Constructor arguments are presumably
# (node id, parent id(s), ...) -- confirm against Node.py.
spn = SPN()

# Root sum node (id 0).
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2 under the root with fixed weights 0.8 and 0.2.
prod_node1, prod_node2 = ProductNode(1, 0), ProductNode(2, 0)
for node, weight in ((prod_node1, 0.8), (prod_node2, 0.2)):
    spn.add_node(node, weight)

# Sum nodes 3-6: 3 and 5 under product node 1, 4 and 6 under product node 2.
sum_node3, sum_node4 = SumNode(3,1), SumNode(4,2)
sum_node5, sum_node6 = SumNode(5,1), SumNode(6,2)
for node in (sum_node3, sum_node4, sum_node5, sum_node6):
    spn.add_node(node)

# Leaf nodes 7-12.
X1 = LeafNode(7,np.array([1]), 0, False)
X_1 = LeafNode(8,np.array([2]), 0, True)
X2 = LeafNode(9,np.array([3,4]), 1, False)
X_2 = LeafNode(10,np.array([3,4]), 1, True)
X3 = LeafNode(11,np.array([5,6]), 2, False)
X_3 = LeafNode(12,np.array([5,6]), 2, True)

# The two leaves of variable 0 keep a random weight; the others get fixed
# per-parent weights.
spn.add_node(X1, np.array([random.randint(1,9)]))
spn.add_node(X_1, np.array([random.randint(1,9)]))
_fixed_leaf_weights = (
    (X2, [0.3, 0.5]),
    (X_2, [0.7, 0.5]),
    (X3, [0.6, 0.9]),
    (X_3, [0.4, 0.1]),
)
for leaf, weights in _fixed_leaf_weights:
    spn.add_node(leaf, np.array(weights))

spn.normalise_weights()
spn.print_weights()
print()

# Network output divided by the marginal, for every assignment.
_labelled_samples = (
    ("Probability x1", x1),
    ("Probability x2", x2),
    ("Probability x3", x3),
    ("Probability x4", x4),
    ("Probability x5", x5),
    ("Probability x6", x6),
    ("Probability x7", x7),
    ("Probability x8", x8),
)
for label, sample in _labelled_samples:
    print(label, spn.evaluate(sample)/spn.compute_marginal())


Node ID 0
To node 1 :    0.8000
To node 2 :    0.2000

Node ID 3
To node 9 :    0.3000
To node 10 :    0.7000

Node ID 4
To node 9 :    0.5000
To node 10 :    0.5000

Node ID 5
To node 11 :    0.6000
To node 12 :    0.4000

Node ID 6
To node 11 :    0.9000
To node 12 :    0.1000

Probability x1 0.01
Probability x2 0.09
Probability x3 0.01
Probability x4 0.09
Probability x5 0.224
Probability x6 0.336
Probability x7 0.096
Probability x8 0.144


In [37]:
# 10 hard gradient steps starting from the hand-picked weights,
# re-normalising after each step.
# (spn.generative_soft_gd(data) is the alternative update rule.)
for epoch in range(10):
    spn.generative_hard_gd(data)
    spn.normalise_weights()

# Network output divided by the marginal, for every assignment.
_labelled_samples = (
    ("Probability x1", x1),
    ("Probability x2", x2),
    ("Probability x3", x3),
    ("Probability x4", x4),
    ("Probability x5", x5),
    ("Probability x6", x6),
    ("Probability x7", x7),
    ("Probability x8", x8),
)
for label, sample in _labelled_samples:
    print(label, spn.evaluate(sample)/spn.compute_marginal())

spn.print_weights()

Probability x1 0.0527659574468
Probability x2 0.288234042553
Probability x3 0.0272340425532
Probability x4 0.148765957447
Probability x5 0.251552795031
Probability x6 0.198447204969
Probability x7 0.0184472049689
Probability x8 0.0145527950311

Node ID 0
To node 1 :    0.4830
To node 2 :    0.5170

Node ID 3
To node 9 :    0.0683
To node 10 :    0.9317

Node ID 4
To node 9 :    0.3404
To node 10 :    0.6596

Node ID 5
To node 11 :    0.4410
To node 12 :    0.5590

Node ID 6
To node 11 :    0.8453
To node 12 :    0.1547


# Desperate Example

In [38]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(3):
    data.append(x1)
for i in range(7):
    data.append(x4)
    
data = np.array(data)

In [39]:
# Minimal network: a root sum node over two product nodes, each with leaves.
# Constructor arguments are presumably (node id, parent id, ...) -- confirm
# against Node.py.
spn = SPN()

# Root sum node (id 0).
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2 under the root, with random integer weights in [1, 9].
prod_node1, prod_node2 = ProductNode(1, 0), ProductNode(2, 0)
for node in (prod_node1, prod_node2):
    spn.add_node(node, random.randint(1,9))

# Leaf nodes 3-6: the False-flagged leaves attach to product node 2 and the
# True-flagged ones to product node 1.
X1 = LeafNode(3, 2, 0, False)
X_1 = LeafNode(4, 1, 0, True)
X2 = LeafNode(5, 2, 1, False)
X_2 = LeafNode(6, 1, 1, True )

for leaf in (X1, X_1, X2, X_2):
    spn.add_node(leaf)

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.4000
To node 2 :    0.6000


In [40]:
# 10 soft gradient steps, re-normalising the weights after each one.
# (spn.generative_hard_gd(data) is the alternative update rule.)
for epoch in range(10):
    spn.generative_soft_gd(data)
    spn.normalise_weights()

# Network output divided by the marginal, for each of the four assignments.
_labelled_samples = (
    ("Probability x1", x1),
    ("Probability x2", x2),
    ("Probability x3", x3),
    ("Probability x4", x4),
)
for label, sample in _labelled_samples:
    print(label, spn.evaluate(sample)/spn.compute_marginal())

spn.print_weights()

Probability x1 0.300000000004
Probability x2 0.0
Probability x3 0.0
Probability x4 0.699999999996

Node ID 0
To node 1 :    0.3000
To node 2 :    0.7000


# Example 3

In [41]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(603):
    data.append(x1)
for i in range(207):
    data.append(x2)
for i in range(147):
    data.append(x3)
for i in range(43):
    data.append(x4)
    
data = np.array(data)
random.shuffle(data)
print(data.shape)

(1000, 2)


In [45]:
# Example 3 network: three product nodes under the root, sharing sum nodes.
# Constructor arguments are presumably (node id, parent id(s), ...) --
# confirm against Node.py.
spn = SPN()

# Root sum node (id 0).
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1-3 under the root, with random integer weights in [1, 9].
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
prod_node3 = ProductNode(3, 0)
for node in (prod_node1, prod_node2, prod_node3):
    spn.add_node(node, random.randint(1,9))

# Sum nodes 4-7. Nodes 4 and 7 list two parents each (products 1,2 and 2,3);
# nodes 5 and 6 have a single parent (products 3 and 1).
sum_node4 = SumNode(4,np.array([1,2]))
sum_node5 = SumNode(5,3)
sum_node6 = SumNode(6,1)
sum_node7 = SumNode(7,np.array([2,3]))
for node in (sum_node4, sum_node5, sum_node6, sum_node7):
    spn.add_node(node)

# Leaf nodes 8-11, each listing two sum-node parents and receiving one random
# integer weight per parent.
X1 = LeafNode(8,np.array([4,5]), 0, False)
X_1 = LeafNode(9,np.array([4,5]), 0, True)
X2 = LeafNode(10,np.array([6,7]), 1, False)
X_2 = LeafNode(11,np.array([6,7]), 1, True)
for leaf in (X1, X_1, X2, X_2):
    spn.add_node(leaf, np.array([random.randint(1,9), random.randint(1,9)]))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.4375
To node 2 :    0.5625

Node ID 3
To node 7 :    0.4000
To node 8 :    0.6000

Node ID 4
To node 7 :    0.4000
To node 8 :    0.6000


In [46]:
# 10 soft gradient steps, re-normalising the weights after each one.
# (spn.generative_hard_gd(data) is the alternative update rule.)
for i in range(10):
    spn.generative_soft_gd(data)
    spn.normalise_weights()

# Report every assignment on the same scale. The original cell divided the
# x2..x4 outputs by the marginal but printed the raw output for x1, so the
# four numbers were not directly comparable.
for label, sample in (
    ("Probability x1", x1),
    ("Probability x2", x2),
    ("Probability x3", x3),
    ("Probability x4", x4),
):
    print(label, spn.evaluate(sample)/spn.compute_marginal())


spn.print_weights()

Probability x1 0.256069211191
Probability x2 0.202291137596
Probability x3 0.30289107833
Probability x4 0.238748572883

Node ID 0
To node 1 :    0.5416
To node 2 :    0.4584

Node ID 3
To node 7 :    0.4408
To node 8 :    0.5592

Node ID 4
To node 7 :    0.4413
To node 8 :    0.5587


# Example 4

In [47]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(30):
    data.append(x1)
for i in range(10):
    data.append(x2)
for i in range(20):
    data.append(x3)
for i in range(40):
    data.append(x4)
    
data = np.array(data)
random.shuffle(data)
print(data.shape)

(100, 2)


In [48]:
# Example 4 network. Constructor arguments are presumably
# (node id, parent id(s), ...) -- confirm against Node.py.
spn = SPN()

# Root sum node (id 0).
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2 under the root, with random integer weights in [1, 9].
prod_node1, prod_node2 = ProductNode(1, 0), ProductNode(2, 0)
for node in (prod_node1, prod_node2):
    spn.add_node(node, random.randint(1,9))


# Sum nodes 3 and 4, one under each product node.
sum_node3, sum_node4 = SumNode(3,1), SumNode(4,2)

for node in (sum_node3, sum_node4):
    spn.add_node(node)

# Leaf nodes 5-8. The leaves of variable 0 attach directly to a product node;
# the leaves of variable 1 list both sum nodes as parents.
X1 = LeafNode(5,1, 0, False)
X_1 = LeafNode(6,2, 0, True)
X2 = LeafNode(7,np.array([3,4]), 1, False)
X_2 = LeafNode(8,np.array([3,4]), 1, True)

# Each leaf gets a single scalar random weight, including the two-parent
# leaves -- presumably add_node applies it to every parent; confirm in SPN.
for leaf in (X1, X_1, X2, X_2):
    spn.add_node(leaf, random.randint(1,9))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.5000
To node 2 :    0.5000

Node ID 3
To node 7 :    0.4167
To node 8 :    0.5833

Node ID 4
To node 7 :    0.4167
To node 8 :    0.5833


In [68]:
# 10 soft gradient steps, re-normalising the weights after each one.
# (spn.generative_hard_gd(data) is the alternative update rule.)
for i in range(10):
    spn.generative_soft_gd(data)
    spn.normalise_weights()

# Report every assignment on the same scale. The original cell divided the
# x2..x4 outputs by the marginal but printed the raw output for x1, so the
# four numbers were not directly comparable.
for label, sample in (
    ("Probability x1", x1),
    ("Probability x2", x2),
    ("Probability x3", x3),
    ("Probability x4", x4),
):
    print(label, spn.evaluate(sample)/spn.compute_marginal())


spn.print_weights()

Probability x1 0.201680631498
Probability x2 0.201660270174
Probability x3 0.298330018408
Probability x4 0.29832907992

Node ID 0
To node 1 :    0.5967
To node 2 :    0.4033

Node ID 3
To node 7 :    0.5000
To node 8 :    0.5000

Node ID 4
To node 7 :    0.5000
To node 8 :    0.5000
