In [1]:
import numpy as np
import random

%load_ext autoreload
%autoreload 2

from Node import Node
from Node import SumNode
from Node import ProductNode
from Node import LeafNode
from SPN import SPN

%matplotlib inline

# Generative

In [2]:
x1 = np.array([0.0,0.0,0.0])
x2 = np.array([0.0,1.0,0.0])
x3 = np.array([1.0,0.0,0.0])
x4 = np.array([1.0,1.0,0.0])

x5 = np.array([0.0,0.0,1.0])
x6 = np.array([0.0,1.0,1.0])
x7 = np.array([1.0,0.0,1.0])
x8 = np.array([1.0,1.0,1.0])

### Define XOR structure

In [3]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))

# Sum nodes 3 and 4
sum_node3 = SumNode(3,1)
sum_node4 = SumNode(4,2)
spn.add_node(sum_node3)
spn.add_node(sum_node4)

# Product nodes 5-8
prod_node5 = ProductNode(5,4)
prod_node6 = ProductNode(6,4)
prod_node7 = ProductNode(7,3)
prod_node8 = ProductNode(8,3)
spn.add_node(prod_node5, random.randint(1,9))
spn.add_node(prod_node6, random.randint(1,9))
spn.add_node(prod_node7, random.randint(1,9))
spn.add_node(prod_node8, random.randint(1,9))

# Add leaf nodes
X1 = LeafNode(9,np.array([6,7]), 0, False)
X_1 = LeafNode(10,np.array([5,8]), 0, True)
X2 = LeafNode(11,np.array([5,7]), 1, False)
X_2 = LeafNode(12,np.array([6,8]), 1, True)
X3 = LeafNode(13,np.array([2]), 2, False)
X_3 = LeafNode(14,np.array([1]), 2, True)
spn.add_node(X1)
spn.add_node(X_1)
spn.add_node(X2)
spn.add_node(X_2)
spn.add_node(X3)
spn.add_node(X_3)
spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.2000
To node 2 :    0.8000

Node ID 3
To node 7 :    0.5000
To node 8 :    0.5000

Node ID 4
To node 5 :    0.3000
To node 6 :    0.7000


### Untrained forward pass

In [4]:
print("Evaluate Forward Passes")
z = spn.compute_marginal()
print(spn.evaluate(x1))
print(spn.evaluate(x2))
print(spn.evaluate(x3))
print(spn.evaluate(x4))
print(spn.evaluate(x5))
print(spn.evaluate(x6))
print(spn.evaluate(x7))
print(spn.evaluate(x8))

print()
print(spn.map_inference())

Evaluate Forward Passes
0.1
0.0
0.0
0.1
0.0
0.24
0.56
0.0

parts
-2.50103603172
-1.87080267657
-0.630233355149
0.532467532468


### Train model

In [37]:
data = np.array([x1,x2,x3,x4,x5,x6,x7,x8])
#data = np.array([x1,x2])

print("Training...")
for i in range(10):
    #spn.generative_hard_gd(data)
    spn.generative_soft_gd(data)
    spn.normalise_weights()
    
print("Probability x1",spn.evaluate(x1)/spn.compute_marginal())
print("Probability x2",spn.evaluate(x2)/spn.compute_marginal())
print("Probability x3",spn.evaluate(x3)/spn.compute_marginal())
print("Probability x4",spn.evaluate(x4)/spn.compute_marginal())
print("Probability x5",spn.evaluate(x5)/spn.compute_marginal())
print("Probability x6",spn.evaluate(x6)/spn.compute_marginal())
print("Probability x7",spn.evaluate(x7)/spn.compute_marginal())
print("Probability x8",spn.evaluate(x8)/spn.compute_marginal())

spn.print_weights()

Training...
Probability x1 0.24997676937
Probability x2 0.0
Probability x3 0.0
Probability x4 0.24997676937
Probability x5 0.0
Probability x6 0.244155084163
Probability x7 0.255891377096
Probability x8 0.0

Node ID 0
To node 1 :    0.5000
To node 2 :    0.5000

Node ID 3
To node 7 :    0.5000
To node 8 :    0.5000

Node ID 4
To node 5 :    0.4883
To node 6 :    0.5117


  d_ds = np.log(output)


# Example 2

### Define Example 2 structure

In [38]:
# generate new dataset
x1 = np.array([0.0,0.0,0.0])
x2 = np.array([0.0,0.0,1.0])
x3 = np.array([0.0,1.0,0.0])
x4 = np.array([0.0,1.0,1.0])

x5 = np.array([1.0,0.0,0.0])
x6 = np.array([1.0,0.0,1.0])
x7 = np.array([1.0,1.0,0.0])
x8 = np.array([1.0,1.0,1.0])

data = []
y = []
for i in range(10):
    data.append(x1)
    y.append(0)
for i in range(90):
    data.append(x2)
    y.append(0)
for i in range(10):
    data.append(x3)
    y.append(0)
for i in range(90):
    data.append(x4)
    y.append(0)
for i in range(224):
    data.append(x5)
for i in range(336):
    data.append(x6)
for i in range(96):
    data.append(x7)
for i in range(144):
    data.append(x8)
# make arrays
data = np.array(data)
random.shuffle(data)
print(data.shape)

(1000, 3)


In [39]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))

# Sum nodes 3 - 6
sum_node3 = SumNode(3,1)
sum_node4 = SumNode(4,2)
sum_node5 = SumNode(5,1)
sum_node6 = SumNode(6,2)
spn.add_node(sum_node3)
spn.add_node(sum_node4)
spn.add_node(sum_node5)
spn.add_node(sum_node6)

# Add leaf nodes
X1 = LeafNode(7,np.array([1]), 0, False)
X_1 = LeafNode(8,np.array([2]), 0, True)
X2 = LeafNode(9,np.array([3,4]), 1, False)
X_2 = LeafNode(10,np.array([3,4]), 1, True)
X3 = LeafNode(11,np.array([5,6]), 2, False)
X_3 = LeafNode(12,np.array([5,6]), 2, True)
spn.add_node(X1,  np.array([random.randint(1,9)]) )
spn.add_node(X_1, np.array([random.randint(1,9)]))
spn.add_node(X2, np.array([random.randint(1,9), random.randint(1,9)]) )
spn.add_node(X_2, np.array([random.randint(1,9), random.randint(1,9)]))
spn.add_node(X3, np.array([random.randint(1,9), random.randint(1,9)]))
spn.add_node(X_3, np.array([random.randint(1,9), random.randint(1,9)]))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.6923
To node 2 :    0.3077

Node ID 3
To node 9 :    0.5455
To node 10 :    0.4545

Node ID 4
To node 9 :    0.3333
To node 10 :    0.6667

Node ID 5
To node 11 :    0.6154
To node 12 :    0.3846

Node ID 6
To node 11 :    0.5556
To node 12 :    0.4444


In [42]:
for i in range(200):
    spn.generative_soft_gd(data)
    #spn.generative_hard_gd(data)
    spn.normalise_weights()
    
print("Probability x1",spn.evaluate(x1)/spn.compute_marginal())
print("Probability x2",spn.evaluate(x2)/spn.compute_marginal())
print("Probability x3",spn.evaluate(x3)/spn.compute_marginal())
print("Probability x4",spn.evaluate(x4)/spn.compute_marginal())
print("Probability x5",spn.evaluate(x5)/spn.compute_marginal())
print("Probability x6",spn.evaluate(x6)/spn.compute_marginal())
print("Probability x7",spn.evaluate(x7)/spn.compute_marginal())
print("Probability x8",spn.evaluate(x8)/spn.compute_marginal())

spn.print_weights()
print("\nShould be:")
print("0: 0.8, 0.2")
print("3: 0.3, 0.7")
print("4: 0.5, 0.5")
print("5: 0.6, 0.4")
print("6: 0.9, 0.1")

Probability x1 0.122205039901
Probability x2 0.123325162447
Probability x3 0.119754027334
Probability x4 0.120851684077
Probability x5 0.127243854093
Probability x6 0.128849958676
Probability x7 0.128076827443
Probability x8 0.12969344603

Node ID 0
To node 1 :    0.5139
To node 2 :    0.4861

Node ID 3
To node 9 :    0.5016
To node 10 :    0.4984

Node ID 4
To node 9 :    0.4949
To node 10 :    0.5051

Node ID 5
To node 11 :    0.5031
To node 12 :    0.4969

Node ID 6
To node 11 :    0.5023
To node 12 :    0.4977

Should be:
0: 0.8, 0.2
3: 0.3, 0.7
4: 0.5, 0.5
5: 0.6, 0.4
6: 0.9, 0.1


In [43]:
print(x3)

[ 0.  1.  0.]


# Test with correct weights

In [38]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, 0.8)
spn.add_node(prod_node2, 0.2)

# Sum nodes 3 - 6
sum_node3 = SumNode(3,1)
sum_node4 = SumNode(4,2)
sum_node5 = SumNode(5,1)
sum_node6 = SumNode(6,2)
spn.add_node(sum_node3)
spn.add_node(sum_node4)
spn.add_node(sum_node5)
spn.add_node(sum_node6)

# Add leaf nodes
X1 = LeafNode(7,np.array([1]), 0, False)
X_1 = LeafNode(8,np.array([2]), 0, True)
X2 = LeafNode(9,np.array([3,4]), 1, False)
X_2 = LeafNode(10,np.array([3,4]), 1, True)
X3 = LeafNode(11,np.array([5,6]), 2, False)
X_3 = LeafNode(12,np.array([5,6]), 2, True)
spn.add_node(X1,  np.array([random.randint(1,9)]) )
spn.add_node(X_1, np.array([random.randint(1,9)]))
spn.add_node(X2, np.array([0.3, 0.5]) )
spn.add_node(X_2, np.array([0.7, 0.5]))
spn.add_node(X3, np.array([0.6, 0.9]))
spn.add_node(X_3, np.array([0.4, 0.1]))

spn.normalise_weights()
spn.print_weights()
print()
print("Probability x1",spn.evaluate(x1)/spn.compute_marginal())
print("Probability x2",spn.evaluate(x2)/spn.compute_marginal())
print("Probability x3",spn.evaluate(x3)/spn.compute_marginal())
print("Probability x4",spn.evaluate(x4)/spn.compute_marginal())
print("Probability x5",spn.evaluate(x5)/spn.compute_marginal())
print("Probability x6",spn.evaluate(x6)/spn.compute_marginal())
print("Probability x7",spn.evaluate(x7)/spn.compute_marginal())
print("Probability x8",spn.evaluate(x8)/spn.compute_marginal())


Node ID 0
To node 1 :    0.8000
To node 2 :    0.2000

Node ID 3
To node 9 :    0.3000
To node 10 :    0.7000

Node ID 4
To node 9 :    0.5000
To node 10 :    0.5000

Node ID 5
To node 11 :    0.6000
To node 12 :    0.4000

Node ID 6
To node 11 :    0.9000
To node 12 :    0.1000

Probability x1 0.01
Probability x2 0.09
Probability x3 0.01
Probability x4 0.09
Probability x5 0.224
Probability x6 0.336
Probability x7 0.096
Probability x8 0.144


In [39]:
for i in range(10):
    #spn.generative_soft_gd(data)
    spn.generative_hard_gd(data)
    spn.normalise_weights()
    
print("Probability x1",spn.evaluate(x1)/spn.compute_marginal())
print("Probability x2",spn.evaluate(x2)/spn.compute_marginal())
print("Probability x3",spn.evaluate(x3)/spn.compute_marginal())
print("Probability x4",spn.evaluate(x4)/spn.compute_marginal())
print("Probability x5",spn.evaluate(x5)/spn.compute_marginal())
print("Probability x6",spn.evaluate(x6)/spn.compute_marginal())
print("Probability x7",spn.evaluate(x7)/spn.compute_marginal())
print("Probability x8",spn.evaluate(x8)/spn.compute_marginal())

spn.print_weights()

Probability x1 0.0485139664804
Probability x2 0.28548603352
Probability x3 0.0294860335196
Probability x4 0.17351396648
Probability x5 0.235278617711
Probability x6 0.198721382289
Probability x7 0.0157213822894
Probability x8 0.0132786177106

Node ID 0
To node 1 :    0.4630
To node 2 :    0.5370

Node ID 3
To node 9 :    0.0626
To node 10 :    0.9374

Node ID 4
To node 9 :    0.3780
To node 10 :    0.6220

Node ID 5
To node 11 :    0.4579
To node 12 :    0.5421

Node ID 6
To node 11 :    0.8547
To node 12 :    0.1453


# Desperate Example

In [40]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(3):
    data.append(x1)
for i in range(7):
    data.append(x4)
    
data = np.array(data)

In [41]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))

# Add leaf nodes
X1 = LeafNode(3, 2, 0, False)
X_1 = LeafNode(4, 1, 0, True)
X2 = LeafNode(5, 2, 1, False)
X_2 = LeafNode(6, 1, 1, True )

spn.add_node(X1)
spn.add_node(X_1)
spn.add_node(X2)
spn.add_node(X_2)

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.5294
To node 2 :    0.4706


In [42]:
for i in range(10):
    #spn.generative_soft_gd(data)
    spn.generative_hard_gd(data)
    spn.normalise_weights()
    
print("Probability x1",spn.evaluate(x1)/spn.compute_marginal())
print("Probability x2",spn.evaluate(x2)/spn.compute_marginal())
print("Probability x3",spn.evaluate(x3)/spn.compute_marginal())
print("Probability x4",spn.evaluate(x4)/spn.compute_marginal())

spn.print_weights()

Probability x1 0.300000000009
Probability x2 0.0
Probability x3 0.0
Probability x4 0.699999999991

Node ID 0
To node 1 :    0.3000
To node 2 :    0.7000


# Example 3

In [57]:
# generate new dataset
x1 = np.array([0.0,0.0])
x2 = np.array([0.0,1.0])
x3 = np.array([1.0,0.0])
x4 = np.array([1.0,1.0])


data = []
for i in range(603):
    data.append(x1)
for i in range(207):
    data.append(x2)
for i in range(147):
    data.append(x3)
for i in range(43):
    data.append(x4)
    
data = np.array(data)
random.shuffle(data)
print(data.shape)

(1000, 2)


In [106]:
spn = SPN()
# root node id = 0
root_node = SumNode(0, 0)
spn.add_node(root_node)

# Product nodes 1 and 2
prod_node1 = ProductNode(1, 0)
prod_node2 = ProductNode(2, 0)
prod_node3 = ProductNode(3, 0)
spn.add_node(prod_node1, random.randint(1,9))
spn.add_node(prod_node2, random.randint(1,9))
spn.add_node(prod_node3, random.randint(1,9))

# Sum nodes 4 - 7

sum_node4 = SumNode(4,np.array([1,2]))
sum_node5 = SumNode(5,3)
sum_node6 = SumNode(6,1)
sum_node7 = SumNode(7,np.array([2,3]))

spn.add_node(sum_node4)
spn.add_node(sum_node5)
spn.add_node(sum_node6)
spn.add_node(sum_node7)

# Add leaf nodes
X1 = LeafNode(8,np.array([4,5]), 0, False)
X_1 = LeafNode(9,np.array([4,5]), 0, True)
X2 = LeafNode(10,np.array([6,7]), 1, False)
X_2 = LeafNode(11,np.array([6,7]), 1, True)
spn.add_node(X1,  np.array([random.randint(1,9),random.randint(1,9)]) )
spn.add_node(X_1, np.array([random.randint(1,9),random.randint(1,9)]))
spn.add_node(X2, np.array([random.randint(1,9), random.randint(1,9)]) )
spn.add_node(X_2, np.array([random.randint(1,9), random.randint(1,9)]))

spn.normalise_weights()
spn.print_weights()


Node ID 0
To node 1 :    0.2308
To node 2 :    0.0769
To node 3 :    0.6923

Node ID 4
To node 8 :    0.4000
To node 9 :    0.6000

Node ID 5
To node 8 :    0.6000
To node 9 :    0.4000

Node ID 6
To node 10 :    0.3333
To node 11 :    0.6667

Node ID 7
To node 10 :    0.6923
To node 11 :    0.3077


In [115]:
for i in range(10):
    spn.generative_soft_gd(data)
    #spn.generative_hard_gd(data)
    spn.normalise_weights()
    
print("Probability x1",spn.evaluate(x1))
print("Probability x2",spn.evaluate(x2)/spn.compute_marginal())
print("Probability x3",spn.evaluate(x3)/spn.compute_marginal())
print("Probability x4",spn.evaluate(x4)/spn.compute_marginal())


spn.print_weights()

Probability x1 1.0
Probability x2 1.0
Probability x3 1.0
Probability x4 1.0


In [114]:
x = np.log(0.5)
y = Node.LOG_ZERO
print (np.logaddexp(x,y))
print (np.exp(np.logaddexp(x,y)))

-0.69314718056
0.5
