From 5b48e94933344471233afdcea8bdf592eb90efb5 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 8 Jul 2020 20:23:04 -0700
Subject: [PATCH 001/131] refactoring LogicNode hierarchy

---
 src/IO/CircuitLineCompiler.jl            |  6 +-
 src/IO/CircuitSaver.jl                   | 28 ++++-----
 src/IO/IO.jl                             |  2 +-
 src/Logistic/Logistic.jl                 |  2 +-
 src/Logistic/LogisticCircuits.jl         | 26 ++++----
 src/Probabilistic/ProbCircuits.jl        | 78 ++++++++++++------------
 src/Probabilistic/ProbFlowCircuits.jl    |  4 +-
 src/Probabilistic/Probabilistic.jl       |  2 +-
 src/Probabilistic/Queries.jl             | 48 +++++++--------
 src/Probabilistic/VtreeLearner.jl        |  2 +-
 src/Reasoning/ExpFlowCircuits.jl         | 28 ++++-----
 src/Reasoning/Expectation.jl             |  8 +--
 src/StructureLearner/CircuitBuilder.jl   | 14 ++---
 src/StructureLearner/PSDDInitializer.jl  | 50 +++++++--------
 test/Logistic/LogisticCircuitTest.jl     |  4 +-
 test/Probabilistic/CircuitQueriesTest.jl |  4 +-
 test/Probabilistic/EntropyKLDTest.jl     |  6 +-
 test/Probabilistic/PrConstraintTest.jl   |  4 +-
 18 files changed, 158 insertions(+), 158 deletions(-)

diff --git a/src/IO/CircuitLineCompiler.jl b/src/IO/CircuitLineCompiler.jl
index 32abf1a2..ed689467 100644
--- a/src/IO/CircuitLineCompiler.jl
+++ b/src/IO/CircuitLineCompiler.jl
@@ -35,7 +35,7 @@ function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::Vtr
     return prob_circuit, vtree
 end
 
-function decorate_prob(lines::CircuitFormatLines, logical_circuit::LogicalΔ, id2lognode::Dict{ID,<:LogicalΔNode})::ProbΔ
+function decorate_prob(lines::CircuitFormatLines, logical_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicNode})::ProbΔ
     # set up cache mapping logical circuit nodes to their probabilistic decorator
     lognode2probnode = ProbCache()
     # build a corresponding probabilistic circuit
@@ -68,8 +68,8 @@ function decorate_prob(lines::CircuitFormatLines, logical_circuit::LogicalΔ, id
 end
 
 
-function decorate_logistic(lines::CircuitFormatLines, logical_circuit::LogicalΔ, 
-                            classes::Int, id2lognode::Dict{ID,<:LogicalΔNode})::LogisticΔ
+function decorate_logistic(lines::CircuitFormatLines, logical_circuit::LogicΔ, 
+                            classes::Int, id2lognode::Dict{ID,<:LogicNode})::LogisticΔ
                         
     # set up cache mapping logical circuit nodes to their logistic decorator
     log2logistic = LogisticCache()
diff --git a/src/IO/CircuitSaver.jl b/src/IO/CircuitSaver.jl
index 9bba0d78..149d6d55 100644
--- a/src/IO/CircuitSaver.jl
+++ b/src/IO/CircuitSaver.jl
@@ -24,12 +24,12 @@ decompile(n::ProbLiteral, node2id, vtree2id)::UnweightedLiteralLine =
 make_element(n::Prob⋀, w::AbstractFloat, node2id) = 
     PSDDElement(node2id[n.children[1]],  node2id[n.children[2]], w)
 
-is_true_node(n)::Bool = 
+istrue_node(n)::Bool = 
     GateType(n) isa ⋁Gate && num_children(n) == 2 && GateType(children(n)[1]) isa LiteralGate && GateType(children(n)[2]) isa LiteralGate && 
-    positive(children(n)[1]) && negative(children(n)[2])
+    ispositive(children(n)[1]) && isnegative(children(n)[2])
 
 function decompile(n::Prob⋁, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
-    if is_true_node(n)
+    if istrue_node(n)
         WeightedNamedConstantLine(node2id[n], vtree2id[n.origin.vtree], lit2var(n.children[1].origin.literal), n.log_thetas[1]) # TODO
     else
         DecisionLine(node2id[n], vtree2id[n.origin.vtree], UInt32(num_children(n)), map(x -> make_element(x[1], x[2], node2id), zip(children(n), n.log_thetas)))
@@ -52,8 +52,8 @@ function get_node2id(ln::AbstractVector{X}, T::Type)where X #<: T#::Dict{T, ID}
     node2id
 end
 
-function get_vtree2id(ln::PlainVtree):: Dict{PlainVtreeNode, ID}
-    vtree2id = Dict{PlainVtreeNode, ID}()
+function get_vtree2id(ln::PlainVtree):: Dict{PlainVTree, ID}
+    vtree2id = Dict{PlainVTree, ID}()
     sizehint!(vtree2id, length(ln))
     index = ID(0) # vtree id start from 0
 
@@ -86,9 +86,9 @@ end
 
 function save_psdd_file(name::String, ln::ProbΔ, vtree::PlainVtree)
     # TODO add method isstructured
-    @assert ln[end].origin isa StructLogicalΔNode "PSDD should decorate on StructLogicalΔ"
+    @assert ln[end].origin isa StructLogicNode "PSDD should decorate on StructLogicΔ"
     @assert endswith(name, ".psdd")
-    node2id = get_node2id(ln, ProbΔNode)
+    node2id = get_node2id(ln, ProbNode)
     vtree2id = get_vtree2id(vtree)
     formatlines = Vector{CircuitFormatLine}()
     append!(formatlines, parse_psdd_file(IOBuffer(psdd_header())))
@@ -122,9 +122,9 @@ function lc_header()
 end
     
 function save_lc_file(name::String, ln::LogisticΔ, vtree)
-    @assert ln[end].origin isa StructLogicalΔNode "LC should decorate on StructLogicalΔ"
+    @assert ln[end].origin isa StructLogicNode "LC should decorate on StructLogicΔ"
     @assert endswith(name, ".circuit")
-    node2id = get_node2id(ln, ProbΔNode)
+    node2id = get_node2id(ln, ProbNode)
     vtree2id = get_vtree2id(vtree)
     formatlines = Vector{CircuitFormatLine}()
     append!(formatlines, parse_lc_file(IOBuffer(lc_header())))
@@ -150,14 +150,14 @@ function save_circuit(name::String, circuit, vtree=nothing)
 end
 
 "Save prob circuit to .dot file"
-function save_as_dot(root::ProbΔNode, file::String)
-    return save_as_dot(node2dag(root), file)
+function save_as_dot(root::ProbNode, file::String)
+    return save_as_dot(linearize(root), file)
 end
 
 "Save prob circuits to .dot file"
 function save_as_dot(circuit::ProbΔ, file::String)
     # TODO (https://github.com/Juice-jl/LogicCircuits.jl/issues/7)
-    node_cache = Dict{ProbΔNode, Int64}()
+    node_cache = Dict{ProbNode, Int64}()
     for (i, n) in enumerate(circuit)
         node_cache[n] = i
     end
@@ -183,9 +183,9 @@ function save_as_dot(circuit::ProbΔ, file::String)
             write(f, "$(node_cache[n]) [label=\"*$(node_cache[n])\"]\n")
         elseif n isa Prob⋁
             write(f, "$(node_cache[n]) [label=\"+$(node_cache[n])\"]\n")
-        elseif n isa ProbLiteral && positive(n)
+        elseif n isa ProbLiteral && ispositive(n)
             write(f, "$(node_cache[n]) [label=\"+$(variable(n.origin))\"]\n")
-        elseif n isa ProbLiteral && negative(n)
+        elseif n isa ProbLiteral && isnegative(n)
             write(f, "$(node_cache[n]) [label=\"-$(variable(n.origin))\"]\n")
         else
             throw("unknown ProbNode type")
diff --git a/src/IO/IO.jl b/src/IO/IO.jl
index c670cac8..538edc8a 100644
--- a/src/IO/IO.jl
+++ b/src/IO/IO.jl
@@ -15,7 +15,7 @@ load_logistic_circuit,
 parse_clt,
 
 # CircuitSaver
-save_as_dot, is_true_node, save_circuit,
+save_as_dot, istrue_node, save_circuit,
 # get_node2id,get_vtree2id,vtree_node, decompile, make_element, save_lines, save_psdd_comment_line, save_sdd_comment_line, 
 # save_line, to_string
 
diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index 433c9ad5..e5871408 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -4,7 +4,7 @@ using LogicCircuits
 using ..Utils
 
 export 
-    LogisticΔNode, 
+    LogisticNode, 
     LogisticLeafNode, 
     LogisticInnerNode, 
     LogisticLiteral,
diff --git a/src/Logistic/LogisticCircuits.jl b/src/Logistic/LogisticCircuits.jl
index 4e40f70b..8632abca 100644
--- a/src/Logistic/LogisticCircuits.jl
+++ b/src/Logistic/LogisticCircuits.jl
@@ -3,9 +3,9 @@
 #######################
 
 
-abstract type LogisticΔNode{O} <: DecoratorΔNode{O} end
-abstract type LogisticLeafNode{O} <: LogisticΔNode{O} end
-abstract type LogisticInnerNode{O} <: LogisticΔNode{O} end
+abstract type LogisticNode{O} <: DecoratorNode{O} end
+abstract type LogisticLeafNode{O} <: LogisticNode{O} end
+abstract type LogisticInnerNode{O} <: LogisticNode{O} end
 
 struct LogisticLiteral{O} <: LogisticLeafNode{O}
     origin::O
@@ -13,18 +13,18 @@ end
 
 struct Logistic⋀{O} <: LogisticInnerNode{O}
     origin::O
-    children::Vector{<:LogisticΔNode{<:O}}
+    children::Vector{<:LogisticNode{<:O}}
 end
 
 mutable struct Logistic⋁{O} <: LogisticInnerNode{O}
     origin::O
-    children::Vector{<:LogisticΔNode{<:O}}
+    children::Vector{<:LogisticNode{<:O}}
     thetas::Array{Float64, 2}
 end
 
 
 
-const LogisticΔ{O} = AbstractVector{<:LogisticΔNode{O}}
+const LogisticΔ{O} = AbstractVector{<:LogisticNode{O}}
 
 #####################
 # traits
@@ -47,7 +47,7 @@ function Logistic⋁(::Type{O}, origin, children, classes::Int) where {O}
 end
 
 
-const LogisticCache = Dict{ΔNode, LogisticΔNode}
+const LogisticCache = Dict{Node, LogisticNode}
 
 function LogisticΔ(circuit::Δ, classes::Int, cache::LogisticCache = LogisticCache())
 
@@ -55,15 +55,15 @@ function LogisticΔ(circuit::Δ, classes::Int, cache::LogisticCache = LogisticCa
     
     O = grapheltype(circuit) # type of node in the origin
 
-    pc_node(::LiteralGate, n::ΔNode) = LogisticLiteral{O}(n)
-    pc_node(::ConstantGate, n::ΔNode) = error("Cannot construct a logistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    pc_node(::LiteralGate, n::LogicNode) = LogisticLiteral{O}(n)
+    pc_node(::ConstantGate, n::LogicNode) = error("Cannot construct a logistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
 
-    pc_node(::⋀Gate, n::ΔNode) = begin
+    pc_node(::⋀Gate, n::LogicNode) = begin
         children = map(c -> cache[c], n.children)
         Logistic⋀{O}(n, children)
     end
 
-    pc_node(::⋁Gate, n::ΔNode) = begin
+    pc_node(::⋁Gate, n::LogicNode) = begin
         children = map(c -> cache[c], n.children)
         Logistic⋁(O, n, children, classes)
     end
@@ -93,10 +93,10 @@ num_parameters_perclass(n::Logistic⋁) = num_children(n)
 num_parameters_perclass(c::LogisticΔ) = sum(n -> num_parameters_perclass(n), ⋁_nodes(c))
 
 "Return the first origin that is a Logistic circuit node"
-logistic_origin(n::DecoratorΔNode)::LogisticΔNode = origin(n,LogisticΔNode)
+logistic_origin(n::DecoratorNode)::LogisticNode = origin(n,LogisticNode)
 
 "Return the first origin that is a Logistic circuit"
-logistic_origin(c::DecoratorΔ)::LogisticΔ = origin(c, LogisticΔNode)
+logistic_origin(c::DecoratorΔ)::LogisticΔ = origin(c, LogisticNode)
 
 
 # TODO Learning
diff --git a/src/Probabilistic/ProbCircuits.jl b/src/Probabilistic/ProbCircuits.jl
index c6156eb6..f5e1dffe 100644
--- a/src/Probabilistic/ProbCircuits.jl
+++ b/src/Probabilistic/ProbCircuits.jl
@@ -1,84 +1,84 @@
 #####################
 # Probabilistic circuits
 #####################
-abstract type ProbΔNode{O} <: DecoratorΔNode{O} end
-abstract type ProbLeafNode{O} <: ProbΔNode{O} end
-abstract type ProbInnerNode{O} <: ProbΔNode{O} end
+abstract type ProbNode{O} <: DecoratorNode{O} end
+abstract type ProbLeafNode{O} <: ProbNode{O} end
+abstract type ProbInnerNode{O} <: ProbNode{O} end
 
 mutable struct ProbLiteral{O} <: ProbLeafNode{O}
     origin::O
     data
     bit::Bool
-    ProbLiteral(n) = new{node_type(n)}(n, nothing, false)
+    ProbLiteral(n) = new{node_type_deprecated(n)}(n, nothing, false)
 end
 
 mutable struct Prob⋀{O} <: ProbInnerNode{O}
     origin::O
-    children::Vector{<:ProbΔNode{<:O}}
+    children::Vector{<:ProbNode{<:O}}
     data
     bit::Bool
     Prob⋀(n, children) = begin
-        new{node_type(n)}(n, convert(Vector{ProbΔNode{node_type(n)}},children), nothing, false)
+        new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), nothing, false)
     end
 end
 
 mutable struct Prob⋁{O} <: ProbInnerNode{O}
     origin::O
-    children::Vector{<:ProbΔNode{<:O}}
+    children::Vector{<:ProbNode{<:O}}
     log_thetas::Vector{Float64}
     data
     bit::Bool
-    Prob⋁(n, children) = new{node_type(n)}(n, convert(Vector{ProbΔNode{node_type(n)}},children), some_vector(Float64, length(children)), nothing, false)
+    Prob⋁(n, children) = new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), init_array(Float64, length(children)), nothing, false)
 end
 
-const ProbΔ{O} = AbstractVector{<:ProbΔNode{<:O}}
+const ProbΔ{O} = AbstractVector{<:ProbNode{<:O}}
 
-Base.eltype(::Type{ProbΔ{O}}) where {O} = ProbΔNode{<:O}
+Base.eltype(::Type{ProbΔ{O}}) where {O} = ProbNode{<:O}
 
 #####################
 # traits
 #####################
 
 import LogicCircuits.GateType # make available for extension
-import LogicCircuits.node_type
+import LogicCircuits.node_type_deprecated
 
 @inline GateType(::Type{<:ProbLiteral}) = LiteralGate()
 @inline GateType(::Type{<:Prob⋀}) = ⋀Gate()
 @inline GateType(::Type{<:Prob⋁}) = ⋁Gate()
 
-@inline node_type(::ProbΔNode) = ProbΔNode
+@inline node_type_deprecated(::ProbNode) = ProbNode
 
 #####################
 # constructors and conversions
 #####################
 
-const ProbCache = Dict{ΔNode, ProbΔNode}
+const ProbCache = Dict{Node, ProbNode}
 
 function ProbΔ2(circuit::Δ)::ProbΔ
-    node2dag(ProbΔ2(circuit[end]))
+    linearize(ProbΔ2(circuit[end]))
 end
 
-function ProbΔ2(circuit::ΔNode)::ProbΔNode
+function ProbΔ2(circuit::LogicNode)::ProbNode
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
     f_lit(n) = ProbLiteral(n)
     f_a(n, cn) = Prob⋀(n, cn)
     f_o(n, cn) = Prob⋁(n, cn)
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbΔNode{node_type(circuit)})
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbNode{node_type_deprecated(circuit)})
 end
 
 function ProbΔ(circuit::Δ, cache::ProbCache = ProbCache())
 
     sizehint!(cache, length(circuit)*4÷3)
 
-    pc_node(::LiteralGate, n::ΔNode) = ProbLiteral(n)
-    pc_node(::ConstantGate, n::ΔNode) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    pc_node(::LiteralGate, n::LogicNode) = ProbLiteral(n)
+    pc_node(::ConstantGate, n::LogicNode) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
 
-    pc_node(::⋀Gate, n::ΔNode) = begin
+    pc_node(::⋀Gate, n::LogicNode) = begin
         children = map(c -> cache[c], n.children)
         Prob⋀(n, children)
     end
 
-    pc_node(::⋁Gate, n::ΔNode) = begin
+    pc_node(::⋁Gate, n::LogicNode) = begin
         children = map(c -> cache[c], n.children)
         Prob⋁(n, children)
     end
@@ -103,13 +103,13 @@ num_parameters(n::Prob⋁) = num_children(n)
 num_parameters(c::ProbΔ) = sum(n -> num_parameters(n), ⋁_nodes(c))
 
 "Return the first origin that is a probabilistic circuit node"
-prob_origin(n::DecoratorΔNode)::ProbΔNode = origin(n, ProbΔNode)
+prob_origin(n::DecoratorNode)::ProbNode = origin(n, ProbNode)
 
 "Return the first origin that is a probabilistic circuit"
-prob_origin(c::DecoratorΔ)::ProbΔ = origin(c, ProbΔNode)
+prob_origin(c::DecoratorΔ)::ProbΔ = origin(c, ProbNode)
 
 function estimate_parameters2(pc::ProbΔ, data::XData{Bool}; pseudocount::Float64)
-    Logical.pass_up_down2(pc, data)
+    Logic.pass_up_down2(pc, data)
     w = (data isa PlainXData) ? nothing : weights(data)
     estimate_parameters_cached2(pc, w; pseudocount=pseudocount)
 end
@@ -125,7 +125,7 @@ function estimate_parameters_cached2(pc::ProbΔ, w; pseudocount::Float64)
         children_flows = children_flows_w
     end
 
-    estimate_parameters_node2(n::ProbΔNode) = ()
+    estimate_parameters_node2(n::ProbNode) = ()
     function estimate_parameters_node2(n::Prob⋁)
         if num_children(n) == 1
             n.log_thetas .= 0.0
@@ -143,13 +143,13 @@ function estimate_parameters_cached2(pc::ProbΔ, w; pseudocount::Float64)
 end
 
 function log_likelihood_per_instance2(pc::ProbΔ, data::XData{Bool})
-    Logical.pass_up_down2(pc, data)
+    Logic.pass_up_down2(pc, data)
     log_likelihood_per_instance_cached(pc, data)
 end
 
 function log_likelihood_per_instance_cached(pc::ProbΔ, data::XData{Bool})
     log_likelihoods = zeros(num_examples(data))
-    indices = some_vector(Bool, num_examples(data))::BitVector
+    indices = init_array(Bool, num_examples(data))::BitVector
     for n in pc
          if n isa Prob⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
             foreach(n.children, n.log_thetas) do c, log_theta
@@ -164,7 +164,7 @@ end
 import LogicCircuits: conjoin_like, disjoin_like, literal_like, copy_node, normalize, replace_node # make available for extension
 
 "Conjoin nodes in the same way as the example"
-@inline function conjoin_like(example::ProbΔNode, arguments::Vector)
+@inline function conjoin_like(example::ProbNode, arguments::Vector)
     if isempty(arguments)
         # @assert false "Probabilistic circuit does not have anonymous true node"
         nothing
@@ -177,7 +177,7 @@ import LogicCircuits: conjoin_like, disjoin_like, literal_like, copy_node, norma
 end
 
 "Disjoin nodes in the same way as the example"
-@inline function disjoin_like(example::ProbΔNode, arguments::Vector)
+@inline function disjoin_like(example::ProbNode, arguments::Vector)
     if isempty(arguments)
         # @assert false "Probabilistic circuit does not have false node"
         nothing
@@ -205,7 +205,7 @@ end
 end
 
 "Construct a new literal node like the given node's type"
-@inline literal_like(::ProbΔNode, lit::Lit) = ProbLiteral(lit)
+@inline literal_like(::ProbNode, lit::Lit) = ProbLiteral(lit)
 
 @inline copy_node(n::Prob⋁, cns) = begin
     orig = copy_node(origin(n), origin.(cns))
@@ -232,7 +232,7 @@ end
 
 function estimate_parameters(afc::AggregateFlowΔ, data::XBatches{Bool}; pseudocount::Float64)
     @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
-    @assert (afc[end].origin isa ProbΔNode) "AggregateFlowΔ must originate in a ProbΔ"
+    @assert (afc[end].origin isa ProbNode) "AggregateFlowΔ must originate in a ProbΔ"
     collect_aggr_flows(afc, data)
     estimate_parameters_cached(afc; pseudocount=pseudocount)
     afc
@@ -240,7 +240,7 @@ end
 
 function estimate_parameters(fc::FlowΔ, data::XBatches{Bool}; pseudocount::Float64)
     @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
-    @assert (prob_origin(afc[end]) isa ProbΔNode) "FlowΔ must originate in a ProbΔ"
+    @assert (prob_origin(afc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
     collect_aggr_flows(fc, data)
     estimate_parameters_cached(origin(fc); pseudocount=pseudocount)
 end
@@ -250,7 +250,7 @@ function estimate_parameters_cached(afc::AggregateFlowΔ; pseudocount::Float64)
     foreach(n -> estimate_parameters_node(n; pseudocount=pseudocount), afc)
 end
 
-estimate_parameters_node(::AggregateFlowΔNode; pseudocount::Float64) = () # do nothing
+estimate_parameters_node(::AggregateFlowNode; pseudocount::Float64) = () # do nothing
 function estimate_parameters_node(n::AggregateFlow⋁; pseudocount)
     origin = n.origin::Prob⋁
     if num_children(n) == 1
@@ -283,7 +283,7 @@ function log_likelihood(afc::AggregateFlowΔ)
     sum(n -> log_likelihood(n), afc)
 end
 
-log_likelihood(::AggregateFlowΔNode) = 0.0
+log_likelihood(::AggregateFlowNode) = 0.0
 log_likelihood(n::AggregateFlow⋁) = sum(n.origin.log_thetas .* n.aggr_flow_children)
 
 """
@@ -315,10 +315,10 @@ Calculate log likelihood for a batch of fully observed samples.
 (This is for when you already have a FlowΔ)
 """
 function log_likelihood_per_instance(fc::FlowΔ, batch::PlainXData{Bool})
-    @assert (prob_origin(fc[end]) isa ProbΔNode) "FlowΔ must originate in a ProbΔ"
+    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
     pass_up_down(fc, batch)
     log_likelihoods = zeros(num_examples(batch))
-    indices = some_vector(Bool, flow_length(fc))::BitVector
+    indices = init_array(Bool, flow_length(fc))::BitVector
     for n in fc
          if n isa DownFlow⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
             origin = prob_origin(n)::Prob⋁
@@ -353,7 +353,7 @@ Calculate log likelihood for a batch of samples with partial evidence P(e).
 To indicate a variable is not observed, pass -1 for that variable.
 """
 function marginal_log_likelihood_per_instance(fc::UpFlowΔ, batch::PlainXData{Int8})
-    @assert (prob_origin(fc[end]) isa ProbΔNode) "FlowΔ must originate in a ProbΔ"
+    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
     marginal_pass_up(fc, batch)
     pr(fc[end])
 end
@@ -399,7 +399,7 @@ function sample(probs::AbstractVector{<:Number})::Int32
 end
 
 function simulate(node::ProbLiteral, inst::Dict{Var,Int64})
-    if positive(node)
+    if ispositive(node)
         inst[variable(node.origin)] = 1
     else
         inst[variable(node.origin)] = 0
@@ -443,7 +443,7 @@ function sample(circuit::UpFlowΔ)::AbstractVector{Bool}
 end
 
 function simulate2(node::UpFlowLiteral, inst::Dict{Var,Int64})
-    if positive(node)
+    if ispositive(node)
         #TODO I don't think we need these 'grand_origin' parts below
         inst[variable(grand_origin(node))] = 1
     else
@@ -490,7 +490,7 @@ active_samples: bool vector indicating which samples are active for this node du
 result: Matrix (num_samples, num_variables) indicating the final result of mpe
 """
 function mpe_simulate(node::UpFlowLiteral, active_samples::Vector{Bool}, result::Matrix{Bool})
-    if positive(node)
+    if ispositive(node)
         result[active_samples, variable(node)] .= 1
     else
         result[active_samples, variable(node)] .= 0
diff --git a/src/Probabilistic/ProbFlowCircuits.jl b/src/Probabilistic/ProbFlowCircuits.jl
index dc145e35..00916954 100644
--- a/src/Probabilistic/ProbFlowCircuits.jl
+++ b/src/Probabilistic/ProbFlowCircuits.jl
@@ -4,7 +4,7 @@
 function marginal_pass_up(circuit::UpFlowΔ{O,F}, data::XData{E}) where {E <: eltype(F)} where {O,F}
     resize_flows(circuit, num_examples(data))
     cache = zeros(Float64, num_examples(data)) #TODO: fix type later
-    marginal_pass_up_node(n::UpFlowΔNode, ::PlainXData) = ()
+    marginal_pass_up_node(n::UpFlowNode, ::PlainXData) = ()
 
     function marginal_pass_up_node(n::UpFlowLiteral{O,F}, cache::Array{Float64}, data::PlainXData{E}) where {E <: eltype(F)} where {O,F}
         pass_up_node(n, data)
@@ -63,7 +63,7 @@ function marginal_pass_down(circuit::DownFlowΔ{O,F}) where {O,F}
     end
 end
 
-marginal_pass_down_node(n::DownFlowΔNode) = () # do nothing
+marginal_pass_down_node(n::DownFlowNode) = () # do nothing
 marginal_pass_down_node(n::DownFlowLeaf) = ()
 
 function marginal_pass_down_node(n::DownFlow⋀Cached)
diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index 376467f2..9dd95e70 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -6,7 +6,7 @@ using ..Utils
 export
 
 # ProbCircuits
-ProbΔNode, ProbΔ, ProbΔ, ProbLeafNode, ProbInnerNode,
+ProbNode, ProbΔ, ProbΔ, ProbLeafNode, ProbInnerNode,
 ProbLiteral, Prob⋀, Prob⋁, ProbCache, variable, num_parameters, compute_log_likelihood,
 log_proba,
 log_likelihood, estimate_parameters, log_likelihood_per_instance, marginal_log_likelihood_per_instance,
diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index c960ed6c..45d7b238 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -3,13 +3,13 @@ using DataStructures
 # Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
 # spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
 "Calculate the probability of the logic formula given by sdd for the psdd"
-function pr_constraint(psdd_node::ProbΔNode, sdd_node::Union{ProbΔNode, StructLogicalΔNode})
-    cache = Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64}()
+function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicNode})
+    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
 
     return pr_constraint(psdd_node, sdd_node, cache)
 end
-function pr_constraint(psdd_node::ProbΔNode, sdd_node::Union{ProbΔNode, StructLogicalΔNode},
-                       cache::Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64})::Float64
+function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicNode},
+                       cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})::Float64
     if (psdd_node, sdd_node) in keys(cache) # Cache hit
         return cache[psdd_node, sdd_node]
     elseif psdd_node isa ProbLiteral # Boundary cases
@@ -55,12 +55,12 @@ end
 
 
 "Entropy of the distribution of the input psdd."
-function psdd_entropy(psdd_node::ProbΔNode)::Float64
-    psdd_entropy_cache = Dict{ProbΔNode, Float64}()
+function psdd_entropy(psdd_node::ProbNode)::Float64
+    psdd_entropy_cache = Dict{ProbNode, Float64}()
 
     return psdd_entropy(psdd_node, psdd_entropy_cache)
 end
-function psdd_entropy(psdd_node::Prob⋁, psdd_entropy_cache::Dict{ProbΔNode, Float64})::Float64
+function psdd_entropy(psdd_node::Prob⋁, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
     elseif psdd_node.children[1] isa ProbLiteral
@@ -80,31 +80,31 @@ function psdd_entropy(psdd_node::Prob⋁, psdd_entropy_cache::Dict{ProbΔNode, F
         return get!(psdd_entropy_cache, psdd_node, local_entropy)
     end
 end
-function psdd_entropy(psdd_node::Prob⋀, psdd_entropy_cache::Dict{ProbΔNode, Float64})::Float64
+function psdd_entropy(psdd_node::Prob⋀, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
     return get!(psdd_entropy_cache, psdd_node.children[1], psdd_entropy(psdd_node.children[1], psdd_entropy_cache)) +
         get!(psdd_entropy_cache, psdd_node.children[2], psdd_entropy(psdd_node.children[2], psdd_entropy_cache))
 end
-function psdd_entropy(psdd_node::ProbLiteral, psdd_entropy_cache::Dict{ProbΔNode, Float64})::Float64
+function psdd_entropy(psdd_node::ProbLiteral, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
     return get!(psdd_entropy_cache, psdd_node, 0.0)
 end
 
 
 "KL divergence calculation for psdds that are not necessarily identical"
-function psdd_kl_divergence(psdd_node1::ProbΔNode, psdd_node2::ProbΔNode)::Float64
-    kl_divergence_cache = Dict{Tuple{ProbΔNode, ProbΔNode}, Float64}()
-    pr_constraint_cache = Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64}()
+function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode)::Float64
+    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
 
     return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
 end
-function psdd_kl_divergence(psdd_node1::ProbΔNode, psdd_node2::ProbΔNode,
-        kl_divergence_cache::Dict{Tuple{ProbΔNode, ProbΔNode}, Float64})::Float64
-    pr_constraint_cache = Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64}()
+function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64})::Float64
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
 
     return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
 end
-function psdd_kl_divergence(psdd_node1::ProbΔNode, psdd_node2::ProbΔNode,
-        kl_divergence_cache::Dict{Tuple{ProbΔNode, ProbΔNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64})
+function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
     @assert !(psdd_node1 isa Prob⋀ || psdd_node2 isa Prob⋀) "Prob⋀ not a valid PSDD node for KL-Divergence"
 
     # Check if both nodes are normalized for same vtree node
@@ -174,8 +174,8 @@ function psdd_kl_divergence(psdd_node1::ProbΔNode, psdd_node2::ProbΔNode,
     end
 end
 function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
-        kl_divergence_cache::Dict{Tuple{ProbΔNode, ProbΔNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64})
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
     # Check if literals are over same variables in vtree
    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
@@ -187,8 +187,8 @@ function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
     end
 end
 function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
-        kl_divergence_cache::Dict{Tuple{ProbΔNode, ProbΔNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64})
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
     @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
@@ -208,8 +208,8 @@ function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
     end
 end
 function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::Prob⋁,
-        kl_divergence_cache::Dict{Tuple{ProbΔNode, ProbΔNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64})
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
     @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
diff --git a/src/Probabilistic/VtreeLearner.jl b/src/Probabilistic/VtreeLearner.jl
index 3fd4f719..86d91169 100644
--- a/src/Probabilistic/VtreeLearner.jl
+++ b/src/Probabilistic/VtreeLearner.jl
@@ -224,7 +224,7 @@ function learn_vtree_bottom_up(train_x::PlainXData; α)
     (_, mi) = mutual_information(feature_matrix(train_x), Data.weights(train_x); α = α)
     vars = Var.(collect(1:num_features(train_x)))
     context = BlossomContext(vars, mi)
-    vtree = bottom_up_vtree(PlainVtreeNode, vars, blossom_bottom_up_curry(context))
+    vtree = bottom_up_vtree(PlainVTree, vars, blossom_bottom_up_curry(context))
 end
 
 #############
diff --git a/src/Reasoning/ExpFlowCircuits.jl b/src/Reasoning/ExpFlowCircuits.jl
index 869cd966..8c3011ea 100644
--- a/src/Reasoning/ExpFlowCircuits.jl
+++ b/src/Reasoning/ExpFlowCircuits.jl
@@ -7,16 +7,16 @@
 #####################
 
 "A expectation circuit node that has pair of origins of type PC and type LC"
-abstract type DecoratorΔNodePair{PC<:ΔNode, LC<:ΔNode} <: ΔNode end
+abstract type DecoratorNodePair{PC<:Node, LC<:Node} <: Node end
 
-abstract type ExpFlowΔNode{PC, LC, F} <: DecoratorΔNodePair{PC, LC} end
+abstract type ExpFlowNode{PC, LC, F} <: DecoratorNodePair{PC, LC} end
 
-const ExpFlowΔ{O} = AbstractVector{<:ExpFlowΔNode{<:O}}
+const ExpFlowΔ{O} = AbstractVector{<:ExpFlowNode{<:O}}
 
-struct UpExpFlow{PC, LC, F} <: ExpFlowΔNode{PC, LC, F}
+struct UpExpFlow{PC, LC, F} <: ExpFlowNode{PC, LC, F}
     p_origin::PC
     f_origin::LC
-    children::Vector{<:ExpFlowΔNode{<:PC, <:LC, <:F}}
+    children::Vector{<:ExpFlowNode{<:PC, <:LC, <:F}}
     f::F
     fg::F
 end
@@ -31,15 +31,15 @@ function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) wher
     lc_type = grapheltype(lc)
 
     F = Array{El, 2}
-    fmem = () -> zeros(1, batch_size) #Vector{El}(undef, batch_size)  #some_vector(El, batch_size) # note: fmem's return type will determine type of all UpFlows in the circuit (should be El)
+    fmem = () -> zeros(1, batch_size) #Vector{El}(undef, batch_size)  #init_array(El, batch_size) # note: fmem's return type will determine type of all UpFlows in the circuit (should be El)
     fgmem = () -> zeros(classes(lc[end]), batch_size)
 
     root_pc = pc[end]
     root_lc = lc[end- 1]
     
-    cache = Dict{Pair{ΔNode, ΔNode}, ExpFlowΔNode}()
+    cache = Dict{Pair{Node, Node}, ExpFlowNode}()
     sizehint!(cache, (length(pc) + length(lc))*4÷3)
-    expFlowCircuit = Vector{ExpFlowΔNode}()
+    expFlowCircuit = Vector{ExpFlowNode}()
 
     function ExpflowTraverse(n::Prob⋁, m::Logistic⋁) 
         get!(cache, Pair(n, m)) do
@@ -59,7 +59,7 @@ function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) wher
     end
     function ExpflowTraverse(n::ProbLiteral, m::Logistic⋁) 
         get!(cache, Pair(n, m)) do
-            children = Vector{ExpFlowΔNode{pc_type,lc_type, F}}() # TODO
+            children = Vector{ExpFlowNode{pc_type,lc_type, F}}() # TODO
             node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
@@ -67,7 +67,7 @@ function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) wher
     end
     function ExpflowTraverse(n::ProbLiteral, m::LogisticLiteral) 
         get!(cache, Pair(n, m)) do
-            children = Vector{ExpFlowΔNode{pc_type,lc_type, F}}() # TODO
+            children = Vector{ExpFlowNode{pc_type,lc_type, F}}() # TODO
             node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
@@ -95,12 +95,12 @@ function exp_pass_up(fc::ExpFlowΔ, data::XData{E}) where{E <: eltype(F)} where{
     end
 end
 
-function exp_pass_up_node(node::ExpFlowΔNode{PC,LC,F}, data::XData{E}) where{E <: eltype(F)} where{PC, LC, F}
+function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <: eltype(F)} where{PC, LC, F}
     pType = typeof(node.p_origin)
     fType = typeof(node.f_origin)
 
     if node.p_origin isa Prob⋁ && node.f_origin isa Logistic⋁
-        #todo this ordering might be different than the ExpFlowΔNode children
+        #todo this ordering might be different than the ExpFlowNode children
         pthetas = [exp(node.p_origin.log_thetas[i])
                     for i in 1:length(node.p_origin.children) for j in 1:length(node.f_origin.children)]
         fthetas = [node.f_origin.thetas[j,:] # only taking the first class for now
@@ -129,10 +129,10 @@ function exp_pass_up_node(node::ExpFlowΔNode{PC,LC,F}, data::XData{E}) where{E
 
         var = lit2var(literal(m))
         X = feature_matrix(data)
-        if positive(node.p_origin) && positive(m)
+        if ispositive(node.p_origin) && ispositive(m)
             node.f[:, X[:, var] .!= 0 ] .= 1.0 # positive and missing observations
             node.f[:, X[:, var] .== 0 ] .= 0.0
-        elseif negative(node.p_origin) && negative(m)
+        elseif isnegative(node.p_origin) && isnegative(m)
             node.f[:, X[:, var] .!= 1 ] .= 1.0 # negative and missing observations
             node.f[:, X[:, var] .== 1 ] .= 0.0
         else
diff --git a/src/Reasoning/Expectation.jl b/src/Reasoning/Expectation.jl
index 783dc923..43a410b6 100644
--- a/src/Reasoning/Expectation.jl
+++ b/src/Reasoning/Expectation.jl
@@ -1,5 +1,5 @@
-ExpCacheDict = Dict{Pair{ProbΔNode, LogisticΔNode}, Array{Float64, 2}}
-MomentCacheDict = Dict{Tuple{ProbΔNode, LogisticΔNode, Int64}, Array{Float64, 2}}
+ExpCacheDict = Dict{Pair{ProbNode, LogisticNode}, Array{Float64, 2}}
+MomentCacheDict = Dict{Tuple{ProbNode, LogisticNode, Int64}, Array{Float64, 2}}
 
 struct ExpectationCache 
     f::ExpCacheDict
@@ -122,11 +122,11 @@ end
         value = zeros(1 , num_examples(data) )
         var = lit2var(literal(m))
         X = feature_matrix(data)
-        if positive(n) && positive(m) 
+        if ispositive(n) && ispositive(m) 
             # value[1, X[:, var] .== -1 ] .= 1.0  # missing observation always agrees
             # value[1, X[:, var] .== 1 ] .= 1.0 # positive observations
             value[1, X[:, var] .!= 0 ] .= 1.0 # positive or missing observations
-        elseif negative(n) && negative(m)
+        elseif isnegative(n) && isnegative(m)
             # value[1, X[:, var] .== -1 ] .= 1.0  # missing observation always agrees
             # value[1, X[:, var] .== 0 ] .= 1.0 # negative observations
             value[1, X[:, var] .!= 1 ] .= 1.0 # negative or missing observations
diff --git a/src/StructureLearner/CircuitBuilder.jl b/src/StructureLearner/CircuitBuilder.jl
index 8d3c8c96..b21b47d2 100644
--- a/src/StructureLearner/CircuitBuilder.jl
+++ b/src/StructureLearner/CircuitBuilder.jl
@@ -23,13 +23,13 @@ end
 "Build decomposable probability circuits from Chow-Liu tree"
 function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
     topo_order = Var.(reverse(topological_sort_by_dfs(clt::CLT))) #order to parse the node
-    lin = Vector{ProbΔNode}()
-    node_cache = Dict{Lit, LogicalΔNode}()
+    lin = Vector{ProbNode}()
+    node_cache = Dict{Lit, LogicNode}()
     prob_cache = ProbCache()
     parent = parent_vector(clt)
 
-    prob_children(n)::Vector{<:ProbΔNode{<:node_type(n)}} =  
-        copy_with_eltype(map(c -> prob_cache[c], n.children), ProbΔNode{<:node_type(n)})
+    prob_children(n)::Vector{<:ProbNode{<:node_type_deprecated(n)}} =  
+        collect(ProbNode{<:node_type_deprecated(n)}, map(c -> prob_cache[c], n.children))
 
     "default order of circuit node, from left to right: +/1 -/0"
 
@@ -100,19 +100,19 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
         return n
     end
 
-    function compile_independent_roots(roots::Vector{ProbΔNode})
+    function compile_independent_roots(roots::Vector{ProbNode})
         temp = ⋀Node([c.origin for c in roots])
         n = Prob⋀(temp, prob_children(temp))
         prob_cache[temp] = n
         push!(lin, n)
         temp = ⋁Node([temp])
-        n = Prob⋁{LogicalΔNode}(temp, prob_children(temp))
+        n = Prob⋁{LogicNode}(temp, prob_children(temp))
         prob_cache[temp] = n
         n.log_thetas = [0.0]
         push!(lin, n)
     end
 
-    roots = Vector{ProbΔNode}()
+    roots = Vector{ProbNode}()
     for id in topo_order
         children = Var.(outneighbors(clt, id))
         if isequal(children, [])
diff --git a/src/StructureLearner/PSDDInitializer.jl b/src/StructureLearner/PSDDInitializer.jl
index 439b691a..cb1bd27c 100644
--- a/src/StructureLearner/PSDDInitializer.jl
+++ b/src/StructureLearner/PSDDInitializer.jl
@@ -1,7 +1,7 @@
 using ..Utils
 
-"Map from literal to LogicalΔNode"
-const LitCache = Dict{Lit, LogicalΔNode}
+"Map from literal to LogicNode"
+const LitCache = Dict{Lit, LogicNode}
 
 "Use literal to represent constraint (1 to X, -1 to not X), 0 to represent true"
 const ⊤ = convert(Lit, 0)
@@ -34,10 +34,10 @@ function learn_vtree_from_clt(clt::CLT; vtree_mode::String)::PlainVtree
     roots = [i for (i, x) in enumerate(parent_vector(clt)) if x == 0]
     rootnode = construct_children(Var.(roots), clt, vtree_mode)
 
-    return node2dag(rootnode)
+    return linearize(rootnode)
 end
 
-function construct_node(v::Var, clt::CLT, strategy::String)::PlainVtreeNode
+function construct_node(v::Var, clt::CLT, strategy::String)::PlainVTree
     children = Var.(outneighbors(clt, v))
     if isempty(children) # leaf node
         return PlainVtreeLeafNode(v)
@@ -47,9 +47,9 @@ function construct_node(v::Var, clt::CLT, strategy::String)::PlainVtreeNode
     end
 end
 
-function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::PlainVtreeNode
+function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::PlainVTree
     sorted_vars = sort(collect(children))
-    children_nodes = Vector{PlainVtreeNode}()
+    children_nodes = Vector{PlainVTree}()
     foreach(x -> push!(children_nodes, construct_node(x, clt, strategy)), sorted_vars)
 
     if strategy == "linear"
@@ -61,7 +61,7 @@ function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::
     end
 end
 
-function construct_children_linear(children_nodes::Vector{PlainVtreeNode}, clt::CLT)::PlainVtreeNode
+function construct_children_linear(children_nodes::Vector{PlainVTree}, clt::CLT)::PlainVTree
     children_nodes = Iterators.Stateful(reverse(children_nodes))
 
     right = popfirst!(children_nodes)
@@ -71,7 +71,7 @@ function construct_children_linear(children_nodes::Vector{PlainVtreeNode}, clt::
     return right
 end
 
-function construct_children_balanced(children_nodes::Vector{PlainVtreeNode}, clt::CLT)::PlainVtreeNode
+function construct_children_balanced(children_nodes::Vector{PlainVTree}, clt::CLT)::PlainVTree
     if length(children_nodes) == 1
         return children_nodes[1]
     elseif length(children_nodes) == 2
@@ -84,7 +84,7 @@ function construct_children_balanced(children_nodes::Vector{PlainVtreeNode}, clt
     end
 end
 
-function add_parent(parent::Var, children::PlainVtreeNode)
+function add_parent(parent::Var, children::PlainVTree)
     return PlainVtreeInnerNode(PlainVtreeLeafNode(parent), children)
 end
 
@@ -94,17 +94,17 @@ end
 
 "Compile a psdd circuit from clt and vtree"
 function compile_psdd_from_clt(clt::MetaDiGraph, vtree::PlainVtree)
-    order = node2dag(vtree[end])
+    order = linearize(vtree[end])
     parent_clt = Var.(parent_vector(clt))
 
-    lin = Vector{ProbΔNode}()
+    lin = Vector{ProbNode}()
     prob_cache = ProbCache()
     lit_cache = LitCache()
-    v2p = Dict{PlainVtreeNode, ProbΔ}()
+    v2p = Dict{PlainVTree, ProbΔ}()
 
     get_params(cpt::Dict) = length(cpt) == 2 ? [cpt[1], cpt[0]] : [cpt[(1,1)], cpt[(0,1)], cpt[(1,0)], cpt[(0,0)]]
-    function add_mapping!(v::PlainVtreeNode, circuits::ProbΔ)
-        if !haskey(v2p, v); v2p[v] = Vector{ProbΔNode}(); end
+    function add_mapping!(v::PlainVTree, circuits::ProbΔ)
+        if !haskey(v2p, v); v2p[v] = Vector{ProbNode}(); end
         foreach(c -> if !(c in v2p[v]) push!(v2p[v], c);end, circuits)
     end
 
@@ -124,8 +124,8 @@ function compile_psdd_from_clt(clt::MetaDiGraph, vtree::PlainVtree)
 
     # compile to decision node
     function compile_from_vtree_node(v::PlainVtreeInnerNode)
-        left_var = left_most_child(v.left).var
-        right_var = left_most_child(v.right).var
+        left_var = left_most_descendent(v.left).var
+        right_var = left_most_descendent(v.right).var
         left_circuit = v2p[v.left]
         right_circuit = v2p[v.right]
 
@@ -149,12 +149,12 @@ end
 #####################
 
 prob_children(n, prob_cache) =  
-    copy_with_eltype(map(c -> prob_cache[c], n.children), ProbΔNode{<:StructLogicalΔNode})
+    collect(ProbNode{<:StructLogicNode}, map(c -> prob_cache[c], n.children))
 
 "Add leaf nodes to circuit `lin`"
 function add_prob_leaf_node(var::Var, vtree::PlainVtreeLeafNode, lit_cache::LitCache, prob_cache::ProbCache, lin)
-    pos = StructLiteralNode{PlainVtreeNode}( var2lit(var), vtree)
-    neg = StructLiteralNode{PlainVtreeNode}(-var2lit(var), vtree)
+    pos = StructLiteralNode{PlainVTree}( var2lit(var), vtree)
+    neg = StructLiteralNode{PlainVTree}(-var2lit(var), vtree)
     lit_cache[var2lit(var)] = pos
     lit_cache[-var2lit(var)] = neg
     pos2 = ProbLiteral(pos)
@@ -168,7 +168,7 @@ end
 
 "Add prob⋀ node to circuit `lin`"
 function add_prob⋀_node(children::ProbΔ, vtree::PlainVtreeInnerNode, prob_cache::ProbCache, lin)::Prob⋀
-    logic = Struct⋀Node{PlainVtreeNode}([c.origin for c in children], vtree)
+    logic = Struct⋀Node{PlainVTree}([c.origin for c in children], vtree)
     prob = Prob⋀(logic, prob_children(logic, prob_cache))
     prob_cache[logic] = prob
     push!(lin, prob)
@@ -176,8 +176,8 @@ function add_prob⋀_node(children::ProbΔ, vtree::PlainVtreeInnerNode, prob_cac
 end
 
 "Add prob⋁ node to circuit `lin`"
-function add_prob⋁_node(children::ProbΔ, vtree::PlainVtreeNode, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
-    logic = Struct⋁Node{PlainVtreeNode}([c.origin for c in children], vtree)
+function add_prob⋁_node(children::ProbΔ, vtree::PlainVTree, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
+    logic = Struct⋁Node{PlainVTree}([c.origin for c in children], vtree)
     prob = Prob⋁(logic, prob_children(logic, prob_cache))
     prob.log_thetas = log.(thetas)
     prob_cache[logic] = prob
@@ -213,7 +213,7 @@ end
 #####################
 
 function set_base(index, n::StructLiteralNode, bases)
-    if positive(n)
+    if ispositive(n)
         bases[n][variable(n)] = 1
     else
         bases[n][variable(n)] = -1
@@ -262,10 +262,10 @@ function compile_fully_factorized_psdd_from_vtree(vtree::PlainVtree)::ProbΔ
         nothing
     end
 
-    lin = Vector{ProbΔNode}()
+    lin = Vector{ProbNode}()
     prob_cache = ProbCache()
     lit_cache = LitCache()
-    v2n = Dict{PlainVtreeNode, ProbΔNode}()
+    v2n = Dict{PlainVTree, ProbNode}()
 
     for v in vtree
         ful_factor_node(v, lit_cache, prob_cache, v2n, lin)
diff --git a/test/Logistic/LogisticCircuitTest.jl b/test/Logistic/LogisticCircuitTest.jl
index 5ca7ab24..7802c012 100644
--- a/test/Logistic/LogisticCircuitTest.jl
+++ b/test/Logistic/LogisticCircuitTest.jl
@@ -13,10 +13,10 @@ using ProbabilisticCircuits
             compact⋁=false)
         
     logistic_circuit = zoo_lc("little_4var.circuit", 2);
-    @test logistic_circuit isa Vector{<:LogisticΔNode};
+    @test logistic_circuit isa Vector{<:LogisticNode};
 
     flow_circuit = FlowΔ(logistic_circuit, 16, Float64, my_opts)
-    @test flow_circuit isa Vector{<:FlowΔNode};
+    @test flow_circuit isa Vector{<:FlowNode};
 
     # Step 1. Check Probabilities for 3 samples
     data = XData(Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]));
diff --git a/test/Probabilistic/CircuitQueriesTest.jl b/test/Probabilistic/CircuitQueriesTest.jl
index 26a31784..4b1bd1f4 100644
--- a/test/Probabilistic/CircuitQueriesTest.jl
+++ b/test/Probabilistic/CircuitQueriesTest.jl
@@ -9,10 +9,10 @@ using ProbabilisticCircuits
 
     EPS = 1e-7;
     prob_circuit = zoo_psdd("little_4var.psdd");
-    @test prob_circuit isa Vector{<:ProbΔNode};
+    @test prob_circuit isa Vector{<:ProbNode};
 
     flow_circuit = FlowΔ(prob_circuit, 16, Bool)
-    @test flow_circuit isa Vector{<:FlowΔNode};
+    @test flow_circuit isa Vector{<:FlowNode};
 
 
     # Step 1. Check Probabilities for 3 samples
diff --git a/test/Probabilistic/EntropyKLDTest.jl b/test/Probabilistic/EntropyKLDTest.jl
index ad459fcf..0c7542e9 100644
--- a/test/Probabilistic/EntropyKLDTest.jl
+++ b/test/Probabilistic/EntropyKLDTest.jl
@@ -16,8 +16,8 @@ using ProbabilisticCircuits
 
     # KLD Tests #
     # KLD base tests
-    pr_constraint_cache = Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64}()
-    kl_divergence_cache = Dict{Tuple{ProbΔNode, ProbΔNode}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
+    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
 
     @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
     @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
@@ -39,7 +39,7 @@ using ProbabilisticCircuits
     @test abs(psdd_kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
     @test abs(psdd_kl_divergence(pc1[end], pc2[end]) - 0.5672800167911778) < 1e-8
 
-    kl_divergence_cache = Dict{Tuple{ProbΔNode, ProbΔNode}, Float64}()
+    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
     @test abs(psdd_kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
     @test abs(psdd_kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
     @test abs(psdd_kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
diff --git a/test/Probabilistic/PrConstraintTest.jl b/test/Probabilistic/PrConstraintTest.jl
index b7ea73fb..ceb6fcb5 100644
--- a/test/Probabilistic/PrConstraintTest.jl
+++ b/test/Probabilistic/PrConstraintTest.jl
@@ -9,7 +9,7 @@ using ProbabilisticCircuits
     pc, vtree = load_struct_prob_circuit(
                     zoo_psdd_file("simple2.4.psdd"), simplevtree)
 
-    cache = Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64}()
+    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
 
     @test abs(pr_constraint(pc[end], pc[end], cache) - 1.0) < 1e-8
     @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
@@ -28,7 +28,7 @@ using ProbabilisticCircuits
     pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
     pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
 
-    pr_constraint_cache = Dict{Tuple{ProbΔNode, Union{ProbΔNode, StructLogicalΔNode}}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
     pr_constraint(pc1[end], pc2[end], pr_constraint_cache)
     @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
     @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8

From cf90550a14d51f9c171c54fd2e4422a436d2b3d5 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Fri, 10 Jul 2020 21:33:56 -0700
Subject: [PATCH 002/131] reinstating vtrees

---
 src/IO/CircuitLineCompiler.jl                |  4 +--
 src/IO/CircuitParser.jl                      |  2 +-
 src/IO/CircuitSaver.jl                       |  8 ++---
 src/Logistic/LogisticCircuits.jl             |  8 ++---
 src/Probabilistic/ProbCircuits.jl            | 10 +++---
 src/Probabilistic/Queries.jl                 | 20 +++++------
 src/Probabilistic/VtreeLearner.jl            |  2 +-
 src/StructureLearner/CircuitBuilder.jl       |  4 +--
 src/StructureLearner/PSDDInitializer.jl      | 38 ++++++++++----------
 test/Probabilistic/EntropyKLDTest.jl         |  2 +-
 test/Probabilistic/PrConstraintTest.jl       |  4 +--
 test/StructureLearner/PSDDInitializerTest.jl |  2 +-
 12 files changed, 52 insertions(+), 52 deletions(-)

diff --git a/src/IO/CircuitLineCompiler.jl b/src/IO/CircuitLineCompiler.jl
index ed689467..9f14d375 100644
--- a/src/IO/CircuitLineCompiler.jl
+++ b/src/IO/CircuitLineCompiler.jl
@@ -35,7 +35,7 @@ function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::Vtr
     return prob_circuit, vtree
 end
 
-function decorate_prob(lines::CircuitFormatLines, logical_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicNode})::ProbΔ
+function decorate_prob(lines::CircuitFormatLines, logical_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicCircuit})::ProbΔ
     # set up cache mapping logical circuit nodes to their probabilistic decorator
     lognode2probnode = ProbCache()
     # build a corresponding probabilistic circuit
@@ -69,7 +69,7 @@ end
 
 
 function decorate_logistic(lines::CircuitFormatLines, logical_circuit::LogicΔ, 
-                            classes::Int, id2lognode::Dict{ID,<:LogicNode})::LogisticΔ
+                            classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticΔ
                         
     # set up cache mapping logical circuit nodes to their logistic decorator
     log2logistic = LogisticCache()
diff --git a/src/IO/CircuitParser.jl b/src/IO/CircuitParser.jl
index e76e28f5..589d1bb2 100644
--- a/src/IO/CircuitParser.jl
+++ b/src/IO/CircuitParser.jl
@@ -23,7 +23,7 @@ Load a structured probabilistic circuit from file.
 Support circuit file formats:
  * ".psdd" for PSDD files
 Supported vtree file formats:
- * ".vtree" for VTree files
+ * ".vtree" for Vtree files
 """
 function load_struct_prob_circuit(circuit_file::String, vtree_file::String)::Tuple{ProbΔ,PlainVtree}
     @assert endswith(circuit_file,".psdd")
diff --git a/src/IO/CircuitSaver.jl b/src/IO/CircuitSaver.jl
index 149d6d55..8d35f964 100644
--- a/src/IO/CircuitSaver.jl
+++ b/src/IO/CircuitSaver.jl
@@ -52,8 +52,8 @@ function get_node2id(ln::AbstractVector{X}, T::Type)where X #<: T#::Dict{T, ID}
     node2id
 end
 
-function get_vtree2id(ln::PlainVtree):: Dict{PlainVTree, ID}
-    vtree2id = Dict{PlainVTree, ID}()
+function get_vtree2id(ln::PlainVtree):: Dict{PlainVtree, ID}
+    vtree2id = Dict{PlainVtree, ID}()
     sizehint!(vtree2id, length(ln))
     index = ID(0) # vtree id start from 0
 
@@ -86,7 +86,7 @@ end
 
 function save_psdd_file(name::String, ln::ProbΔ, vtree::PlainVtree)
     # TODO add method isstructured
-    @assert ln[end].origin isa StructLogicNode "PSDD should decorate on StructLogicΔ"
+    @assert ln[end].origin isa StructLogicCircuit "PSDD should decorate on StructLogicΔ"
     @assert endswith(name, ".psdd")
     node2id = get_node2id(ln, ProbNode)
     vtree2id = get_vtree2id(vtree)
@@ -122,7 +122,7 @@ function lc_header()
 end
     
 function save_lc_file(name::String, ln::LogisticΔ, vtree)
-    @assert ln[end].origin isa StructLogicNode "LC should decorate on StructLogicΔ"
+    @assert ln[end].origin isa StructLogicCircuit "LC should decorate on StructLogicΔ"
     @assert endswith(name, ".circuit")
     node2id = get_node2id(ln, ProbNode)
     vtree2id = get_vtree2id(vtree)
diff --git a/src/Logistic/LogisticCircuits.jl b/src/Logistic/LogisticCircuits.jl
index 8632abca..98239895 100644
--- a/src/Logistic/LogisticCircuits.jl
+++ b/src/Logistic/LogisticCircuits.jl
@@ -55,15 +55,15 @@ function LogisticΔ(circuit::Δ, classes::Int, cache::LogisticCache = LogisticCa
     
     O = grapheltype(circuit) # type of node in the origin
 
-    pc_node(::LiteralGate, n::LogicNode) = LogisticLiteral{O}(n)
-    pc_node(::ConstantGate, n::LogicNode) = error("Cannot construct a logistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    pc_node(::LiteralGate, n::LogicCircuit) = LogisticLiteral{O}(n)
+    pc_node(::ConstantGate, n::LogicCircuit) = error("Cannot construct a logistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
 
-    pc_node(::⋀Gate, n::LogicNode) = begin
+    pc_node(::⋀Gate, n::LogicCircuit) = begin
         children = map(c -> cache[c], n.children)
         Logistic⋀{O}(n, children)
     end
 
-    pc_node(::⋁Gate, n::LogicNode) = begin
+    pc_node(::⋁Gate, n::LogicCircuit) = begin
         children = map(c -> cache[c], n.children)
         Logistic⋁(O, n, children, classes)
     end
diff --git a/src/Probabilistic/ProbCircuits.jl b/src/Probabilistic/ProbCircuits.jl
index f5e1dffe..07b08bda 100644
--- a/src/Probabilistic/ProbCircuits.jl
+++ b/src/Probabilistic/ProbCircuits.jl
@@ -58,7 +58,7 @@ function ProbΔ2(circuit::Δ)::ProbΔ
     linearize(ProbΔ2(circuit[end]))
 end
 
-function ProbΔ2(circuit::LogicNode)::ProbNode
+function ProbΔ2(circuit::LogicCircuit)::ProbNode
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
     f_lit(n) = ProbLiteral(n)
     f_a(n, cn) = Prob⋀(n, cn)
@@ -70,15 +70,15 @@ function ProbΔ(circuit::Δ, cache::ProbCache = ProbCache())
 
     sizehint!(cache, length(circuit)*4÷3)
 
-    pc_node(::LiteralGate, n::LogicNode) = ProbLiteral(n)
-    pc_node(::ConstantGate, n::LogicNode) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    pc_node(::LiteralGate, n::LogicCircuit) = ProbLiteral(n)
+    pc_node(::ConstantGate, n::LogicCircuit) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
 
-    pc_node(::⋀Gate, n::LogicNode) = begin
+    pc_node(::⋀Gate, n::LogicCircuit) = begin
         children = map(c -> cache[c], n.children)
         Prob⋀(n, children)
     end
 
-    pc_node(::⋁Gate, n::LogicNode) = begin
+    pc_node(::⋁Gate, n::LogicCircuit) = begin
         children = map(c -> cache[c], n.children)
         Prob⋁(n, children)
     end
diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index 45d7b238..2d6c9bb4 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -3,13 +3,13 @@ using DataStructures
 # Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
 # spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
 "Calculate the probability of the logic formula given by sdd for the psdd"
-function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicNode})
-    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
+function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit})
+    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
 
     return pr_constraint(psdd_node, sdd_node, cache)
 end
-function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicNode},
-                       cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})::Float64
+function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit},
+                       cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})::Float64
     if (psdd_node, sdd_node) in keys(cache) # Cache hit
         return cache[psdd_node, sdd_node]
     elseif psdd_node isa ProbLiteral # Boundary cases
@@ -92,19 +92,19 @@ end
 "KL divergence calculation for psdds that are not necessarily identical"
 function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode)::Float64
     kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
 
     return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
 end
 function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
         kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64})::Float64
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
 
     return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
 end
 function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
         kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
     @assert !(psdd_node1 isa Prob⋀ || psdd_node2 isa Prob⋀) "Prob⋀ not a valid PSDD node for KL-Divergence"
 
     # Check if both nodes are normalized for same vtree node
@@ -175,7 +175,7 @@ function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
 end
 function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
         kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
     # Check if literals are over same variables in vtree
    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
@@ -188,7 +188,7 @@ function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
 end
 function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
         kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
     @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
@@ -209,7 +209,7 @@ function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
 end
 function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::Prob⋁,
         kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64})
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
     @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
diff --git a/src/Probabilistic/VtreeLearner.jl b/src/Probabilistic/VtreeLearner.jl
index 86d91169..676f911c 100644
--- a/src/Probabilistic/VtreeLearner.jl
+++ b/src/Probabilistic/VtreeLearner.jl
@@ -224,7 +224,7 @@ function learn_vtree_bottom_up(train_x::PlainXData; α)
     (_, mi) = mutual_information(feature_matrix(train_x), Data.weights(train_x); α = α)
     vars = Var.(collect(1:num_features(train_x)))
     context = BlossomContext(vars, mi)
-    vtree = bottom_up_vtree(PlainVTree, vars, blossom_bottom_up_curry(context))
+    vtree = bottom_up_vtree(PlainVtree, vars, blossom_bottom_up_curry(context))
 end
 
 #############
diff --git a/src/StructureLearner/CircuitBuilder.jl b/src/StructureLearner/CircuitBuilder.jl
index b21b47d2..4591a3db 100644
--- a/src/StructureLearner/CircuitBuilder.jl
+++ b/src/StructureLearner/CircuitBuilder.jl
@@ -24,7 +24,7 @@ end
 function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
     topo_order = Var.(reverse(topological_sort_by_dfs(clt::CLT))) #order to parse the node
     lin = Vector{ProbNode}()
-    node_cache = Dict{Lit, LogicNode}()
+    node_cache = Dict{Lit, LogicCircuit}()
     prob_cache = ProbCache()
     parent = parent_vector(clt)
 
@@ -106,7 +106,7 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
         prob_cache[temp] = n
         push!(lin, n)
         temp = ⋁Node([temp])
-        n = Prob⋁{LogicNode}(temp, prob_children(temp))
+        n = Prob⋁{LogicCircuit}(temp, prob_children(temp))
         prob_cache[temp] = n
         n.log_thetas = [0.0]
         push!(lin, n)
diff --git a/src/StructureLearner/PSDDInitializer.jl b/src/StructureLearner/PSDDInitializer.jl
index cb1bd27c..354722d5 100644
--- a/src/StructureLearner/PSDDInitializer.jl
+++ b/src/StructureLearner/PSDDInitializer.jl
@@ -1,7 +1,7 @@
 using ..Utils
 
-"Map from literal to LogicNode"
-const LitCache = Dict{Lit, LogicNode}
+"Map from literal to LogicCircuit"
+const LitCache = Dict{Lit, LogicCircuit}
 
 "Use literal to represent constraint (1 to X, -1 to not X), 0 to represent true"
 const ⊤ = convert(Lit, 0)
@@ -37,7 +37,7 @@ function learn_vtree_from_clt(clt::CLT; vtree_mode::String)::PlainVtree
     return linearize(rootnode)
 end
 
-function construct_node(v::Var, clt::CLT, strategy::String)::PlainVTree
+function construct_node(v::Var, clt::CLT, strategy::String)::PlainVtree
     children = Var.(outneighbors(clt, v))
     if isempty(children) # leaf node
         return PlainVtreeLeafNode(v)
@@ -47,9 +47,9 @@ function construct_node(v::Var, clt::CLT, strategy::String)::PlainVTree
     end
 end
 
-function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::PlainVTree
+function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::PlainVtree
     sorted_vars = sort(collect(children))
-    children_nodes = Vector{PlainVTree}()
+    children_nodes = Vector{PlainVtree}()
     foreach(x -> push!(children_nodes, construct_node(x, clt, strategy)), sorted_vars)
 
     if strategy == "linear"
@@ -61,7 +61,7 @@ function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::
     end
 end
 
-function construct_children_linear(children_nodes::Vector{PlainVTree}, clt::CLT)::PlainVTree
+function construct_children_linear(children_nodes::Vector{PlainVtree}, clt::CLT)::PlainVtree
     children_nodes = Iterators.Stateful(reverse(children_nodes))
 
     right = popfirst!(children_nodes)
@@ -71,7 +71,7 @@ function construct_children_linear(children_nodes::Vector{PlainVTree}, clt::CLT)
     return right
 end
 
-function construct_children_balanced(children_nodes::Vector{PlainVTree}, clt::CLT)::PlainVTree
+function construct_children_balanced(children_nodes::Vector{PlainVtree}, clt::CLT)::PlainVtree
     if length(children_nodes) == 1
         return children_nodes[1]
     elseif length(children_nodes) == 2
@@ -84,7 +84,7 @@ function construct_children_balanced(children_nodes::Vector{PlainVTree}, clt::CL
     end
 end
 
-function add_parent(parent::Var, children::PlainVTree)
+function add_parent(parent::Var, children::PlainVtree)
     return PlainVtreeInnerNode(PlainVtreeLeafNode(parent), children)
 end
 
@@ -100,10 +100,10 @@ function compile_psdd_from_clt(clt::MetaDiGraph, vtree::PlainVtree)
     lin = Vector{ProbNode}()
     prob_cache = ProbCache()
     lit_cache = LitCache()
-    v2p = Dict{PlainVTree, ProbΔ}()
+    v2p = Dict{PlainVtree, ProbΔ}()
 
     get_params(cpt::Dict) = length(cpt) == 2 ? [cpt[1], cpt[0]] : [cpt[(1,1)], cpt[(0,1)], cpt[(1,0)], cpt[(0,0)]]
-    function add_mapping!(v::PlainVTree, circuits::ProbΔ)
+    function add_mapping!(v::PlainVtree, circuits::ProbΔ)
         if !haskey(v2p, v); v2p[v] = Vector{ProbNode}(); end
         foreach(c -> if !(c in v2p[v]) push!(v2p[v], c);end, circuits)
     end
@@ -117,7 +117,7 @@ function compile_psdd_from_clt(clt::MetaDiGraph, vtree::PlainVtree)
         if isequal(children, [])
             circuit = compile_true_nodes(var, v, get_params(cpt), lit_cache, prob_cache, lin)
         else
-            circuit = compile_literal_nodes(var, v, get_params(cpt), lit_cache, prob_cache, lin)
+            circuit = compile_canonical_literals(var, v, get_params(cpt), lit_cache, prob_cache, lin)
         end
         add_mapping!(v, circuit)
     end
@@ -149,12 +149,12 @@ end
 #####################
 
 prob_children(n, prob_cache) =  
-    collect(ProbNode{<:StructLogicNode}, map(c -> prob_cache[c], n.children))
+    collect(ProbNode{<:StructLogicCircuit}, map(c -> prob_cache[c], n.children))
 
 "Add leaf nodes to circuit `lin`"
 function add_prob_leaf_node(var::Var, vtree::PlainVtreeLeafNode, lit_cache::LitCache, prob_cache::ProbCache, lin)
-    pos = StructLiteralNode{PlainVTree}( var2lit(var), vtree)
-    neg = StructLiteralNode{PlainVTree}(-var2lit(var), vtree)
+    pos = StructLiteralNode{PlainVtree}( var2lit(var), vtree)
+    neg = StructLiteralNode{PlainVtree}(-var2lit(var), vtree)
     lit_cache[var2lit(var)] = pos
     lit_cache[-var2lit(var)] = neg
     pos2 = ProbLiteral(pos)
@@ -168,7 +168,7 @@ end
 
 "Add prob⋀ node to circuit `lin`"
 function add_prob⋀_node(children::ProbΔ, vtree::PlainVtreeInnerNode, prob_cache::ProbCache, lin)::Prob⋀
-    logic = Struct⋀Node{PlainVTree}([c.origin for c in children], vtree)
+    logic = Struct⋀Node{PlainVtree}([c.origin for c in children], vtree)
     prob = Prob⋀(logic, prob_children(logic, prob_cache))
     prob_cache[logic] = prob
     push!(lin, prob)
@@ -176,8 +176,8 @@ function add_prob⋀_node(children::ProbΔ, vtree::PlainVtreeInnerNode, prob_cac
 end
 
 "Add prob⋁ node to circuit `lin`"
-function add_prob⋁_node(children::ProbΔ, vtree::PlainVTree, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
-    logic = Struct⋁Node{PlainVTree}([c.origin for c in children], vtree)
+function add_prob⋁_node(children::ProbΔ, vtree::PlainVtree, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
+    logic = Struct⋁Node{PlainVtree}([c.origin for c in children], vtree)
     prob = Prob⋁(logic, prob_children(logic, prob_cache))
     prob.log_thetas = log.(thetas)
     prob_cache[logic] = prob
@@ -192,7 +192,7 @@ function compile_decision_node(primes::ProbΔ, subs::ProbΔ, vtree::PlainVtreeIn
 end
 
 "Construct literal nodes given variable `var`"
-function compile_literal_nodes(var::Var, vtree::PlainVtreeLeafNode, probs::Vector{Float64}, lit_cache::LitCache, prob_cache::ProbCache, lin)
+function compile_canonical_literals(var::Var, vtree::PlainVtreeLeafNode, probs::Vector{Float64}, lit_cache::LitCache, prob_cache::ProbCache, lin)
     (pos, neg) = add_prob_leaf_node(var, vtree, lit_cache, prob_cache, lin)
     return [pos, neg]
 end
@@ -265,7 +265,7 @@ function compile_fully_factorized_psdd_from_vtree(vtree::PlainVtree)::ProbΔ
     lin = Vector{ProbNode}()
     prob_cache = ProbCache()
     lit_cache = LitCache()
-    v2n = Dict{PlainVTree, ProbNode}()
+    v2n = Dict{PlainVtree, ProbNode}()
 
     for v in vtree
         ful_factor_node(v, lit_cache, prob_cache, v2n, lin)
diff --git a/test/Probabilistic/EntropyKLDTest.jl b/test/Probabilistic/EntropyKLDTest.jl
index 0c7542e9..aebd67ca 100644
--- a/test/Probabilistic/EntropyKLDTest.jl
+++ b/test/Probabilistic/EntropyKLDTest.jl
@@ -16,7 +16,7 @@ using ProbabilisticCircuits
 
     # KLD Tests #
     # KLD base tests
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
     kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
 
     @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
diff --git a/test/Probabilistic/PrConstraintTest.jl b/test/Probabilistic/PrConstraintTest.jl
index ceb6fcb5..248dc240 100644
--- a/test/Probabilistic/PrConstraintTest.jl
+++ b/test/Probabilistic/PrConstraintTest.jl
@@ -9,7 +9,7 @@ using ProbabilisticCircuits
     pc, vtree = load_struct_prob_circuit(
                     zoo_psdd_file("simple2.4.psdd"), simplevtree)
 
-    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
+    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
 
     @test abs(pr_constraint(pc[end], pc[end], cache) - 1.0) < 1e-8
     @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
@@ -28,7 +28,7 @@ using ProbabilisticCircuits
     pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
     pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
 
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicNode}}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
     pr_constraint(pc1[end], pc2[end], pr_constraint_cache)
     @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
     @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
diff --git a/test/StructureLearner/PSDDInitializerTest.jl b/test/StructureLearner/PSDDInitializerTest.jl
index 25a8690c..2065e894 100644
--- a/test/StructureLearner/PSDDInitializerTest.jl
+++ b/test/StructureLearner/PSDDInitializerTest.jl
@@ -19,7 +19,7 @@ using ProbabilisticCircuits
     # @test pc[28].log_thetas[1] ≈ -1.1870882896239272 atol=1.0e-7
 
     # is structured decomposable 
-    for (n, vars) in variable_scopes(pc)
+    for (n, vars) in variables_by_node(pc)
         @test vars == BitSet(variables(origin(n).vtree))
     end
 

From 8293f953b2659bdfdb6079e8bb15d2f710a56b35 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Mon, 13 Jul 2020 02:19:19 -0700
Subject: [PATCH 003/131] bugfixes to LoadSave

---
 src/IO/CircuitLineCompiler.jl          | 20 ++++++++++----------
 src/StructureLearner/CircuitBuilder.jl | 16 ++++++++--------
 test/Probabilistic/PrConstraintTest.jl |  4 ++--
 3 files changed, 20 insertions(+), 20 deletions(-)

diff --git a/src/IO/CircuitLineCompiler.jl b/src/IO/CircuitLineCompiler.jl
index 9f14d375..f0899984 100644
--- a/src/IO/CircuitLineCompiler.jl
+++ b/src/IO/CircuitLineCompiler.jl
@@ -13,8 +13,8 @@ Compile lines into a probabilistic circuit.
 """
 function compile_prob(lines::CircuitFormatLines)::ProbΔ
     # first compile a logical circuit
-    logical_circuit, id2lognode = compile_smooth_logical_m(lines)
-    decorate_prob(lines, logical_circuit, id2lognode)
+    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
+    decorate_prob(lines, logic_circuit, id2lognode)
 end
 
 """
@@ -22,24 +22,24 @@ Compile lines into a logistic circuit.
 """
 function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticΔ
     # first compile a logical circuit
-    logical_circuit, id2lognode = compile_smooth_logical_m(lines)
-    decorate_logistic(lines, logical_circuit, classes, id2lognode)
+    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
+    decorate_logistic(lines, logic_circuit, classes, id2lognode)
 end
 
 """
 Compile circuit and vtree lines into a structured probabilistic circuit (one whose logical circuit origin is structured).
 """
 function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::VtreeFormatLines)
-    logical_circuit, vtree, id2vtree, id2lognode = compile_smooth_struct_logical_m(circuit_lines, vtree_lines)
-    prob_circuit = decorate_prob(circuit_lines, logical_circuit, id2lognode)
+    logic_circuit, vtree, id2vtree, id2lognode = compile_smooth_struct_logical_m(circuit_lines, vtree_lines)
+    prob_circuit = decorate_prob(circuit_lines, logic_circuit, id2lognode)
     return prob_circuit, vtree
 end
 
-function decorate_prob(lines::CircuitFormatLines, logical_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicCircuit})::ProbΔ
+function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicCircuit})::ProbΔ
     # set up cache mapping logical circuit nodes to their probabilistic decorator
     lognode2probnode = ProbCache()
     # build a corresponding probabilistic circuit
-    prob_circuit = ProbΔ(logical_circuit,lognode2probnode)
+    prob_circuit = ProbΔ(logic_circuit,lognode2probnode)
     # map from line node ids to probabilistic circuit nodes
     id2probnode(id) = lognode2probnode[id2lognode[id]]
 
@@ -68,13 +68,13 @@ function decorate_prob(lines::CircuitFormatLines, logical_circuit::LogicΔ, id2l
 end
 
 
-function decorate_logistic(lines::CircuitFormatLines, logical_circuit::LogicΔ, 
+function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicΔ, 
                             classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticΔ
                         
     # set up cache mapping logical circuit nodes to their logistic decorator
     log2logistic = LogisticCache()
     # build a corresponding probabilistic circuit
-    logistic_circuit = LogisticΔ(logical_circuit, classes, log2logistic)
+    logistic_circuit = LogisticΔ(logic_circuit, classes, log2logistic)
     # map from line node ids to probabilistic circuit nodes
     id2logisticnode(id) = log2logistic[id2lognode[id]]
 
diff --git a/src/StructureLearner/CircuitBuilder.jl b/src/StructureLearner/CircuitBuilder.jl
index 4591a3db..cfdefccb 100644
--- a/src/StructureLearner/CircuitBuilder.jl
+++ b/src/StructureLearner/CircuitBuilder.jl
@@ -48,13 +48,13 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
     end
 
     "compile inner disjunction node"
-    function compile_⋁inner(ln::Lit, children::Vector{Var})::Vector{⋁Node}
-        logical_nodes = Vector{⋁Node}()
+    function compile_⋁inner(ln::Lit, children::Vector{Var})::Vector{Plain⋁Node}
+        logical_nodes = Vector{Plain⋁Node}()
         v = lit2value(ln)
 
         for c in children
             #build logical ciruits
-            temp = ⋁Node([node_cache[lit] for lit in [var2lit(c), - var2lit(c)]])
+            temp = Plain⋁Node([node_cache[lit] for lit in [var2lit(c), - var2lit(c)]])
             push!(logical_nodes, temp)
             n = Prob⋁(temp, prob_children(temp))
             prob_cache[temp] = n
@@ -69,9 +69,9 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
     end
 
     "compile inner conjunction node into circuits, left node is indicator, rest nodes are disjunction children nodes"
-    function compile_⋀inner(indicator::Lit, children::Vector{⋁Node})
+    function compile_⋀inner(indicator::Lit, children::Vector{Plain⋁Node})
         leaf = node_cache[indicator]
-        temp = ⋀Node(vcat([leaf], children))
+        temp = Plain⋀Node(vcat([leaf], children))
         node_cache[indicator] = temp
         n = Prob⋀(temp, prob_children(temp))
         prob_cache[temp] = n
@@ -89,7 +89,7 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
 
     "compile root, add another disjunction node"
     function compile_root(root::Var)
-        temp = ⋁Node([node_cache[s] for s in [var2lit(root), -var2lit(root)]])
+        temp = Plain⋁Node([node_cache[s] for s in [var2lit(root), -var2lit(root)]])
         n = Prob⋁(temp, prob_children(temp))
         prob_cache[temp] = n
         n.log_thetas = zeros(Float64, 2)
@@ -101,11 +101,11 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
     end
 
     function compile_independent_roots(roots::Vector{ProbNode})
-        temp = ⋀Node([c.origin for c in roots])
+        temp = Plain⋀Node([c.origin for c in roots])
         n = Prob⋀(temp, prob_children(temp))
         prob_cache[temp] = n
         push!(lin, n)
-        temp = ⋁Node([temp])
+        temp = Plain⋁Node([temp])
         n = Prob⋁{LogicCircuit}(temp, prob_children(temp))
         prob_cache[temp] = n
         n.log_thetas = [0.0]
diff --git a/test/Probabilistic/PrConstraintTest.jl b/test/Probabilistic/PrConstraintTest.jl
index 248dc240..e4554b8c 100644
--- a/test/Probabilistic/PrConstraintTest.jl
+++ b/test/Probabilistic/PrConstraintTest.jl
@@ -17,12 +17,12 @@ using ProbabilisticCircuits
 
     file_circuit = "little_4var.circuit"
     file_vtree = "little_4var.vtree"
-    logical_circuit, vtree = load_struct_smooth_logical_circuit(
+    logic_circuit, vtree = load_struct_smooth_logic_circuit(
                                 zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
 
     pc = zoo_psdd("little_4var.psdd")
 
-    @test abs(pr_constraint(pc[end], logical_circuit[end - 1], cache) - 1.0) < 1e-8
+    @test abs(pr_constraint(pc[end], logic_circuit[end - 1], cache) - 1.0) < 1e-8
 
     # Test with two psdds
     pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)

From 433088b0c2f34fb7b4ce5c53135bb75c3bce8ada Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Mon, 20 Jul 2020 22:31:46 -0700
Subject: [PATCH 004/131] redesign compilation API

---
 src/Probabilistic/Queries.jl            |  2 +-
 src/StructureLearner/PSDDInitializer.jl | 14 +++++++-------
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index 2d6c9bb4..cf059b4a 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -13,7 +13,7 @@ function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogi
     if (psdd_node, sdd_node) in keys(cache) # Cache hit
         return cache[psdd_node, sdd_node]
     elseif psdd_node isa ProbLiteral # Boundary cases
-        if sdd_node isa Union{ProbLiteral, StructLiteralNode} # Both are literals, just check whether they agrees with each other
+        if sdd_node isa Union{ProbLiteral, PlainStructLiteralNode} # Both are literals, just check whether they agrees with each other
             if literal(psdd_node) == literal(sdd_node)
                 return get!(cache, (psdd_node, sdd_node), 1.0)
             else
diff --git a/src/StructureLearner/PSDDInitializer.jl b/src/StructureLearner/PSDDInitializer.jl
index 354722d5..a394dac6 100644
--- a/src/StructureLearner/PSDDInitializer.jl
+++ b/src/StructureLearner/PSDDInitializer.jl
@@ -153,8 +153,8 @@ prob_children(n, prob_cache) =
 
 "Add leaf nodes to circuit `lin`"
 function add_prob_leaf_node(var::Var, vtree::PlainVtreeLeafNode, lit_cache::LitCache, prob_cache::ProbCache, lin)
-    pos = StructLiteralNode{PlainVtree}( var2lit(var), vtree)
-    neg = StructLiteralNode{PlainVtree}(-var2lit(var), vtree)
+    pos = PlainStructLiteralNode{PlainVtree}( var2lit(var), vtree)
+    neg = PlainStructLiteralNode{PlainVtree}(-var2lit(var), vtree)
     lit_cache[var2lit(var)] = pos
     lit_cache[-var2lit(var)] = neg
     pos2 = ProbLiteral(pos)
@@ -168,7 +168,7 @@ end
 
 "Add prob⋀ node to circuit `lin`"
 function add_prob⋀_node(children::ProbΔ, vtree::PlainVtreeInnerNode, prob_cache::ProbCache, lin)::Prob⋀
-    logic = Struct⋀Node{PlainVtree}([c.origin for c in children], vtree)
+    logic = PlainStruct⋀Node{PlainVtree}([c.origin for c in children], vtree)
     prob = Prob⋀(logic, prob_children(logic, prob_cache))
     prob_cache[logic] = prob
     push!(lin, prob)
@@ -177,7 +177,7 @@ end
 
 "Add prob⋁ node to circuit `lin`"
 function add_prob⋁_node(children::ProbΔ, vtree::PlainVtree, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
-    logic = Struct⋁Node{PlainVtree}([c.origin for c in children], vtree)
+    logic = PlainStruct⋁Node{PlainVtree}([c.origin for c in children], vtree)
     prob = Prob⋁(logic, prob_children(logic, prob_cache))
     prob.log_thetas = log.(thetas)
     prob_cache[logic] = prob
@@ -212,7 +212,7 @@ end
 # Map and cache constraints
 #####################
 
-function set_base(index, n::StructLiteralNode, bases)
+function set_base(index, n::PlainStructLiteralNode, bases)
     if ispositive(n)
         bases[n][variable(n)] = 1
     else
@@ -220,13 +220,13 @@ function set_base(index, n::StructLiteralNode, bases)
     end
 end
 
-function set_base(index, n::Struct⋁Node, bases)
+function set_base(index, n::PlainStruct⋁Node, bases)
     len = num_children(n)
     temp = sum([bases[c] for c in n.children])
     bases[n] = map(x-> if x == len 1; elseif -x == len; -1; else 0; end, temp)
 end
 
-function set_base(index, n::Struct⋀Node, bases)
+function set_base(index, n::PlainStruct⋀Node, bases)
     bases[n] = sum([bases[c] for c in n.children])
 end
 

From 718dc179ed2ed48e88103a8266ea16aa1f505a67 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 22 Jul 2020 19:53:00 -0700
Subject: [PATCH 005/131] change node flip field into counter

---
 src/Probabilistic/ProbCircuits.jl | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/src/Probabilistic/ProbCircuits.jl b/src/Probabilistic/ProbCircuits.jl
index 07b08bda..85a6e9b4 100644
--- a/src/Probabilistic/ProbCircuits.jl
+++ b/src/Probabilistic/ProbCircuits.jl
@@ -8,17 +8,17 @@ abstract type ProbInnerNode{O} <: ProbNode{O} end
 mutable struct ProbLiteral{O} <: ProbLeafNode{O}
     origin::O
     data
-    bit::Bool
-    ProbLiteral(n) = new{node_type_deprecated(n)}(n, nothing, false)
+    counter::UInt32
+    ProbLiteral(n) = new{node_type_deprecated(n)}(n, nothing, 0)
 end
 
 mutable struct Prob⋀{O} <: ProbInnerNode{O}
     origin::O
     children::Vector{<:ProbNode{<:O}}
     data
-    bit::Bool
+    counter::UInt32
     Prob⋀(n, children) = begin
-        new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), nothing, false)
+        new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), nothing, 0)
     end
 end
 
@@ -27,8 +27,8 @@ mutable struct Prob⋁{O} <: ProbInnerNode{O}
     children::Vector{<:ProbNode{<:O}}
     log_thetas::Vector{Float64}
     data
-    bit::Bool
-    Prob⋁(n, children) = new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), init_array(Float64, length(children)), nothing, false)
+    counter::UInt32
+    Prob⋁(n, children) = new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), init_array(Float64, length(children)), nothing, 0)
 end
 
 const ProbΔ{O} = AbstractVector{<:ProbNode{<:O}}

From 2e322e2add630e829930731f348470c4c924ebe7 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Thu, 23 Jul 2020 14:58:20 -0700
Subject: [PATCH 006/131] refactor LoadSave; probabilistic node methods

---
 src/IO/CircuitLineCompiler.jl                 | 117 ----
 src/IO/IO.jl                                  |  33 --
 src/IO/Loaders.jl                             |  22 -
 src/LoadSave/LoadSave.jl                      |  11 +
 src/LoadSave/circuit_line_compiler.jl         | 121 ++++
 .../circuit_loaders.jl}                       |  61 ++-
 .../circuit_savers.jl}                        | 118 ++--
 src/Probabilistic/ProbCircuits.jl             | 515 ------------------
 src/Probabilistic/Probabilistic.jl            |  18 +-
 src/Probabilistic/Queries.jl                  | 277 +++-------
 src/Probabilistic/flows.jl                    |   0
 src/Probabilistic/kld.jl                      | 230 ++++++++
 src/Probabilistic/parameters.jl               | 257 +++++++++
 src/Probabilistic/prob_nodes.jl               | 104 ++++
 src/ProbabilisticCircuits.jl                  |  19 +-
 src/Utils/Utils.jl                            |  72 +--
 src/Utils/decorators.jl                       |  65 +++
 src/Utils/misc.jl                             |  67 +++
 .../circuit_loaders_tests.jl}                 |  24 +-
 .../circuit_savers_test.jl}                   |   6 +-
 test/Probabilistic/prob_nodes_tests.jl        |  37 ++
 ...CircuitQueriesTest.jl => queries_tests.jl} |   5 +-
 test/helper/plain_logic_circuits.jl           |  68 +++
 23 files changed, 1158 insertions(+), 1089 deletions(-)
 delete mode 100644 src/IO/CircuitLineCompiler.jl
 delete mode 100644 src/IO/IO.jl
 delete mode 100644 src/IO/Loaders.jl
 create mode 100644 src/LoadSave/LoadSave.jl
 create mode 100644 src/LoadSave/circuit_line_compiler.jl
 rename src/{IO/CircuitParser.jl => LoadSave/circuit_loaders.jl} (58%)
 rename src/{IO/CircuitSaver.jl => LoadSave/circuit_savers.jl} (64%)
 delete mode 100644 src/Probabilistic/ProbCircuits.jl
 create mode 100644 src/Probabilistic/flows.jl
 create mode 100644 src/Probabilistic/kld.jl
 create mode 100644 src/Probabilistic/parameters.jl
 create mode 100644 src/Probabilistic/prob_nodes.jl
 create mode 100644 src/Utils/decorators.jl
 create mode 100644 src/Utils/misc.jl
 rename test/{IO/PSDDParserTest.jl => LoadSave/circuit_loaders_tests.jl} (61%)
 rename test/{IO/CircuitSaverTest.jl => LoadSave/circuit_savers_test.jl} (78%)
 create mode 100644 test/Probabilistic/prob_nodes_tests.jl
 rename test/Probabilistic/{CircuitQueriesTest.jl => queries_tests.jl} (96%)
 create mode 100644 test/helper/plain_logic_circuits.jl

diff --git a/src/IO/CircuitLineCompiler.jl b/src/IO/CircuitLineCompiler.jl
deleted file mode 100644
index f0899984..00000000
--- a/src/IO/CircuitLineCompiler.jl
+++ /dev/null
@@ -1,117 +0,0 @@
-using LogicCircuits.IO: constant
-
-#####################
-# Compilers to ProbabilisticCircuits data structures starting from already parsed line objects
-#####################
-
-# reuse some internal infrastructure of LogicCircuits' IO module
-using LogicCircuits.IO: CircuitFormatLines, CircuitFormatLine, VtreeFormatLines, CircuitHeaderLine, UnweightedLiteralLine, WeightedLiteralLine, DecisionLine, LCElement, BiasLine, WeightedNamedConstantLine, PSDDElement, CircuitCommentLine, ID,
-compile_smooth_struct_logical_m, compile_smooth_logical_m
-
-"""
-Compile lines into a probabilistic circuit.
-"""
-function compile_prob(lines::CircuitFormatLines)::ProbΔ
-    # first compile a logical circuit
-    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
-    decorate_prob(lines, logic_circuit, id2lognode)
-end
-
-"""
-Compile lines into a logistic circuit.
-"""
-function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticΔ
-    # first compile a logical circuit
-    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
-    decorate_logistic(lines, logic_circuit, classes, id2lognode)
-end
-
-"""
-Compile circuit and vtree lines into a structured probabilistic circuit (one whose logical circuit origin is structured).
-"""
-function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::VtreeFormatLines)
-    logic_circuit, vtree, id2vtree, id2lognode = compile_smooth_struct_logical_m(circuit_lines, vtree_lines)
-    prob_circuit = decorate_prob(circuit_lines, logic_circuit, id2lognode)
-    return prob_circuit, vtree
-end
-
-function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicCircuit})::ProbΔ
-    # set up cache mapping logical circuit nodes to their probabilistic decorator
-    lognode2probnode = ProbCache()
-    # build a corresponding probabilistic circuit
-    prob_circuit = ProbΔ(logic_circuit,lognode2probnode)
-    # map from line node ids to probabilistic circuit nodes
-    id2probnode(id) = lognode2probnode[id2lognode[id]]
-
-    # go through lines again and update the probabilistic circuit node parameters
-
-    function compile(ln::CircuitFormatLine)
-        error("Compilation of line $ln into probabilistic circuit is not supported")
-    end
-    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
-        # do nothing
-    end
-    function compile(ln::WeightedNamedConstantLine)
-        @assert constant(ln) == true
-        node = id2probnode(ln.node_id)::Prob⋁
-        node.log_thetas .= [ln.weight, log1p(-exp(ln.weight)) ]
-    end
-    function compile(ln::DecisionLine{<:PSDDElement})
-        node = id2probnode(ln.node_id)::Prob⋁
-        node.log_thetas .= [x.weight for x in ln.elements]
-    end
-    for ln in lines
-        compile(ln)
-    end
-
-    prob_circuit
-end
-
-
-function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicΔ, 
-                            classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticΔ
-                        
-    # set up cache mapping logical circuit nodes to their logistic decorator
-    log2logistic = LogisticCache()
-    # build a corresponding probabilistic circuit
-    logistic_circuit = LogisticΔ(logic_circuit, classes, log2logistic)
-    # map from line node ids to probabilistic circuit nodes
-    id2logisticnode(id) = log2logistic[id2lognode[id]]
-
-    # go through lines again and update the probabilistic circuit node parameters
-
-    function compile(ln::CircuitFormatLine)
-        error("Compilation of line $ln into logistic circuit is not supported")
-    end
-    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
-        # do nothing
-    end
-
-    function compile(ln::CircuitHeaderLine)
-        # do nothing
-    end
-
-    function compile(ln::WeightedLiteralLine)
-        node = id2logisticnode(ln.node_id)::Logistic⋁
-        node.thetas[1, :] .= ln.weights
-    end
-
-    function compile(ln::DecisionLine{<:LCElement})
-        node = id2logisticnode(ln.node_id)::Logistic⋁
-        for (ind, elem) in enumerate(ln.elements)
-            node.thetas[ind, :] .= elem.weights
-        end
-    end
-
-    function compile(ln::BiasLine)
-        node = id2logisticnode(ln.node_id)::Logistic⋁
-        # @assert length(node.thetas) == 1
-        node.thetas[1,:] .= ln.weights
-    end
-
-    for ln in lines
-        compile(ln)
-    end
-
-    logistic_circuit
-end
\ No newline at end of file
diff --git a/src/IO/IO.jl b/src/IO/IO.jl
deleted file mode 100644
index 538edc8a..00000000
--- a/src/IO/IO.jl
+++ /dev/null
@@ -1,33 +0,0 @@
-module IO
-
-using LogicCircuits
-using ..Utils
-using ..Probabilistic
-using ..Logistic
-
-export
-
-# CircuitParser
-load_prob_circuit, 
-load_struct_prob_circuit, 
-load_psdd_prob_circuit, 
-load_logistic_circuit,
-parse_clt,
-
-# CircuitSaver
-save_as_dot, istrue_node, save_circuit,
-# get_node2id,get_vtree2id,vtree_node, decompile, make_element, save_lines, save_psdd_comment_line, save_sdd_comment_line, 
-# save_line, to_string
-
-
-# Loaders
-zoo_psdd, zoo_lc, zoo_clt,
-zoo_clt_file
-
-include("CircuitLineCompiler.jl")
-include("CircuitParser.jl")
-include("CircuitSaver.jl")
-
-include("Loaders.jl")
-
-end
\ No newline at end of file
diff --git a/src/IO/Loaders.jl b/src/IO/Loaders.jl
deleted file mode 100644
index 719a1a60..00000000
--- a/src/IO/Loaders.jl
+++ /dev/null
@@ -1,22 +0,0 @@
-using LogicCircuits
-using Pkg.Artifacts
-
-
-#####################
-# Circuit loaders
-#####################
-
-zoo_lc(name, num_classes) = 
-    load_logistic_circuit(zoo_lc_file(name), num_classes)
-
-zoo_clt_file(name) = 
-    artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/clts/$name"
-
-zoo_clt(name) = 
-    parse_clt(zoo_clt_file(name))
-
-zoo_psdd_file(name) = 
-    artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/psdds/$name"
-
-zoo_psdd(name) = 
-    load_prob_circuit(zoo_psdd_file(name))
diff --git a/src/LoadSave/LoadSave.jl b/src/LoadSave/LoadSave.jl
new file mode 100644
index 00000000..defd7f35
--- /dev/null
+++ b/src/LoadSave/LoadSave.jl
@@ -0,0 +1,11 @@
+module LoadSave
+
+using LogicCircuits
+using ..Utils
+using ..Probabilistic
+# using ..Logistic
+
+include("circuit_line_compiler.jl")
+include("circuit_loaders.jl")
+include("circuit_savers.jl")
+end
\ No newline at end of file
diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
new file mode 100644
index 00000000..3e148c23
--- /dev/null
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -0,0 +1,121 @@
+#####################
+# Compilers to ProbabilisticCircuits data structures starting from already parsed line objects
+#####################
+
+# reuse some internal infrastructure of LogicCircuits' LoadSave module
+using LogicCircuits.LoadSave: CircuitFormatLines, CircuitFormatLine, constant,
+VtreeFormatLines, CircuitHeaderLine, UnweightedLiteralLine, WeightedLiteralLine, 
+DecisionLine, LCElement, BiasLine, WeightedNamedConstantLine, PSDDElement, 
+CircuitCommentLine, ID, compile_smooth_struct_logical_m, compile_smooth_logical_m
+
+"""
+Compile lines into a probabilistic circuit
+"""
+function compile_prob(lines::CircuitFormatLines)::ProbCircuit
+    # first compile a logical circuit
+    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
+    decorate_prob(lines, logic_circuit, id2lognode)
+end
+
+"""
+Compile lines into a logistic circuit.
+"""
+# TODO
+# function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticΔ
+#     # first compile a logical circuit
+#     logic_circuit, id2lognode = compile_smooth_logical_m(lines)
+#     decorate_logistic(lines, logic_circuit, classes, id2lognode)
+# end
+
+"""
+Compile circuit and vtree lines into a structured probabilistic circuit (one whose logical circuit origin is structured).
+"""
+function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::VtreeFormatLines)
+    logic_circuit, vtree, id2lognode, id2vtree = compile_smooth_struct_logical_m(circuit_lines, vtree_lines)
+    prob_circuit = decorate_prob(circuit_lines, logic_circuit, id2lognode)
+    return prob_circuit, vtree
+end
+
+function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, id2lognode::Dict{ID,<:LogicCircuit})::ProbCircuit
+    
+    # set up cache mapping logical circuit nodes to their probabilistic decorator
+    prob_circuit = ProbCircuit(logic_circuit)
+    lognode2probnode = Dict{LogicCircuit, ProbCircuit}()
+    foreach(pn -> (lognode2probnode[origin(pn)] = pn), prob_circuit) 
+
+    # map from line node ids to probabilistic circuit nodes
+    id2probnode(id) = lognode2probnode[id2lognode[id]]
+
+    root = nothing
+
+    # go through lines again and update the probabilistic circuit node parameters
+
+    function compile(ln::CircuitFormatLine)
+        error("Compilation of line $ln into probabilistic circuit is not supported")
+    end
+    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
+        # do nothing
+    end
+    function compile(ln::WeightedNamedConstantLine)
+        @assert constant(ln) == true
+        root = id2probnode(ln.node_id)::Prob⋁Node
+        root.log_thetas .= [ln.weight, log1p(-exp(ln.weight))]
+    end
+    function compile(ln::DecisionLine{<:PSDDElement})
+        root = id2probnode(ln.node_id)::Prob⋁Node
+        root.log_thetas .= [x.weight for x in ln.elements]
+    end
+
+    foreach(compile, lines)
+
+    root
+end
+
+# TODO
+# function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicΔ, 
+#                             classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticΔ
+                        
+#     # set up cache mapping logical circuit nodes to their logistic decorator
+#     log2logistic = LogisticCache()
+#     # build a corresponding probabilistic circuit
+#     logistic_circuit = LogisticΔ(logic_circuit, classes, log2logistic)
+#     # map from line node ids to probabilistic circuit nodes
+#     id2logisticnode(id) = log2logistic[id2lognode[id]]
+
+#     # go through lines again and update the probabilistic circuit node parameters
+
+#     function compile(ln::CircuitFormatLine)
+#         error("Compilation of line $ln into logistic circuit is not supported")
+#     end
+#     function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
+#         # do nothing
+#     end
+
+#     function compile(ln::CircuitHeaderLine)
+#         # do nothing
+#     end
+
+#     function compile(ln::WeightedLiteralLine)
+#         node = id2logisticnode(ln.node_id)::Logistic⋁
+#         node.thetas[1, :] .= ln.weights
+#     end
+
+#     function compile(ln::DecisionLine{<:LCElement})
+#         node = id2logisticnode(ln.node_id)::Logistic⋁
+#         for (ind, elem) in enumerate(ln.elements)
+#             node.thetas[ind, :] .= elem.weights
+#         end
+#     end
+
+#     function compile(ln::BiasLine)
+#         node = id2logisticnode(ln.node_id)::Logistic⋁
+#         # @assert length(node.thetas) == 1
+#         node.thetas[1,:] .= ln.weights
+#     end
+
+#     for ln in lines
+#         compile(ln)
+#     end
+
+#     logistic_circuit
+# end
\ No newline at end of file
diff --git a/src/IO/CircuitParser.jl b/src/LoadSave/circuit_loaders.jl
similarity index 58%
rename from src/IO/CircuitParser.jl
rename to src/LoadSave/circuit_loaders.jl
index 589d1bb2..b7ec85a1 100644
--- a/src/IO/CircuitParser.jl
+++ b/src/LoadSave/circuit_loaders.jl
@@ -1,5 +1,29 @@
+export zoo_clt, zoo_clt_file, zoo_psdd, zoo_lc, zoo_lc_file,
+    load_prob_circuit, load_struct_prob_circuit
 
-using MetaGraphs: MetaDiGraph, set_prop!, props
+using LogicCircuits
+using Pkg.Artifacts
+using LogicCircuits.LoadSave: parse_psdd_file, parse_circuit_file, parse_vtree_file
+
+#####################
+# circuit loaders from module zoo
+#####################
+
+# TODO
+# zoo_lc(name, num_classes) = 
+#     load_logistic_circuit(zoo_lc_file(name), num_classes)
+
+zoo_clt_file(name) = 
+    artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/clts/$name"
+
+zoo_clt(name) = 
+    parse_clt(zoo_clt_file(name))
+
+zoo_psdd_file(name) = 
+    artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/psdds/$name"
+
+zoo_psdd(name) = 
+    load_prob_circuit(zoo_psdd_file(name))
 
 #####################
 # general parser infrastructure for circuits
@@ -11,9 +35,9 @@ using MetaGraphs: MetaDiGraph, set_prop!, props
 """
 Load a probabilistic circuit from file.
 Support circuit file formats:
- * ".psdd" for PSDD files
+    * ".psdd" for PSDD files
 """
-function load_prob_circuit(file::String)::ProbΔ
+function load_prob_circuit(file::String)::ProbCircuit
     @assert endswith(file,".psdd")
     compile_prob(parse_psdd_file(file))
 end
@@ -21,40 +45,30 @@ end
 """
 Load a structured probabilistic circuit from file.
 Support circuit file formats:
- * ".psdd" for PSDD files
+    * ".psdd" for PSDD files
 Supported vtree file formats:
- * ".vtree" for Vtree files
+    * ".vtree" for Vtree files
 """
-function load_struct_prob_circuit(circuit_file::String, vtree_file::String)::Tuple{ProbΔ,PlainVtree}
+function load_struct_prob_circuit(circuit_file::String, vtree_file::String)::Tuple{ProbCircuit,PlainVtree}
     @assert endswith(circuit_file,".psdd")
     circuit_lines = parse_circuit_file(circuit_file)
     vtree_lines = parse_vtree_file(vtree_file)
     compile_struct_prob(circuit_lines, vtree_lines)
 end
 
-
-function load_logistic_circuit(circuit_file::String, classes::Int)::LogisticΔ
-    @assert endswith(circuit_file,".circuit")
-    circuit_lines = parse_circuit_file(circuit_file)
-    compile_logistic(circuit_lines, classes)
-end
+# TODO
+# function load_logistic_circuit(circuit_file::String, classes::Int)::LogisticΔ
+#     @assert endswith(circuit_file,".circuit")
+#     circuit_lines = parse_circuit_file(circuit_file)
+#     compile_logistic(circuit_lines, classes)
+# end
 
 
 #####################
 # parse based on file extension
 #####################
 
-function parse_circuit_file(file::String)::CircuitFormatLines
-    if endswith(file,".circuit")
-        parse_lc_file(file)
-    elseif endswith(file,".psdd")
-        parse_psdd_file(file)
-    elseif endswith(file,".sdd")
-        parse_sdd_file(file)
-    else
-        throw("Cannot parse this file type as a circuit: $file")
-    end
-end
+using MetaGraphs: MetaDiGraph, set_prop!, props, add_edge!
 
 "Parse a clt from given file"
 function parse_clt(filename::String)::MetaDiGraph
@@ -78,3 +92,4 @@ function parse_clt(filename::String)::MetaDiGraph
     end
     return clt
 end
+
diff --git a/src/IO/CircuitSaver.jl b/src/LoadSave/circuit_savers.jl
similarity index 64%
rename from src/IO/CircuitSaver.jl
rename to src/LoadSave/circuit_savers.jl
index 8d35f964..2ca61d00 100644
--- a/src/IO/CircuitSaver.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -1,34 +1,30 @@
-using Printf: @sprintf
+export save_circuit, save_as_dot, save_as_psdd
 
-import Base.copy
-import LogicCircuits.IO: SDDElement, 
+using LogicCircuits.LoadSave: SDDElement, 
     PSDDElement, 
-    save_lines, 
+    save_lines,
+    get_vtree2id,
     parse_psdd_file, 
     PsddHeaderLine, 
     LcHeaderLine, 
-    save_sdd_file, 
-    save_as_dot,
     get_nodes_level
 
-# Saving psdd
-
 #####################
 # decompile for nodes
 #####################
 
-# decompile for psdd
-decompile(n::ProbLiteral, node2id, vtree2id)::UnweightedLiteralLine = 
+"Decompile for psdd circuit, used during saving of circuits to file" 
+decompile(n::ProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine = 
     UnweightedLiteralLine(node2id[n], vtree2id[n.origin.vtree], literal(n), true)
 
-make_element(n::Prob⋀, w::AbstractFloat, node2id) = 
+make_element(n::Prob⋀Node, w::AbstractFloat, node2id) = 
     PSDDElement(node2id[n.children[1]],  node2id[n.children[2]], w)
 
 istrue_node(n)::Bool = 
     GateType(n) isa ⋁Gate && num_children(n) == 2 && GateType(children(n)[1]) isa LiteralGate && GateType(children(n)[2]) isa LiteralGate && 
     ispositive(children(n)[1]) && isnegative(children(n)[2])
 
-function decompile(n::Prob⋁, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
+function decompile(n::Prob⋁Node, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
     if istrue_node(n)
         WeightedNamedConstantLine(node2id[n], vtree2id[n.origin.vtree], lit2var(n.children[1].origin.literal), n.log_thetas[1]) # TODO
     else
@@ -40,9 +36,13 @@ end
 # build maping
 #####################
 
-function get_node2id(ln::AbstractVector{X}, T::Type)where X #<: T#::Dict{T, ID}
+# TODO same implementation, merge ?
+
+import LogicCircuits.LoadSave: get_node2id
+
+function get_node2id(circuit::ProbCircuit, T::Type) 
     node2id = Dict{T, ID}()
-    outnodes = filter(n -> !(GateType(n) isa ⋀Gate), ln)
+    outnodes = filter(n -> !is⋀gate(n), circuit)
     sizehint!(node2id, length(outnodes))
     index = ID(0) # node id start from 0
     for n in outnodes
@@ -52,23 +52,11 @@ function get_node2id(ln::AbstractVector{X}, T::Type)where X #<: T#::Dict{T, ID}
     node2id
 end
 
-function get_vtree2id(ln::PlainVtree):: Dict{PlainVtree, ID}
-    vtree2id = Dict{PlainVtree, ID}()
-    sizehint!(vtree2id, length(ln))
-    index = ID(0) # vtree id start from 0
-
-    for n in ln
-        vtree2id[n] = index
-        index += ID(1)
-    end
-    vtree2id
-end
-
 #####################
 # saver for circuits
 #####################
 
-
+"Returns header for PSDD file format"
 function psdd_header()
     """
     c ids of psdd nodes start at 0
@@ -84,16 +72,16 @@ function psdd_header()
     c"""
 end
 
-function save_psdd_file(name::String, ln::ProbΔ, vtree::PlainVtree)
+function save_as_psdd(name::String, circuit::ProbCircuit, vtree::PlainVtree)
     # TODO add method isstructured
-    @assert ln[end].origin isa StructLogicCircuit "PSDD should decorate on StructLogicΔ"
+    @assert circuit.origin isa StructLogicCircuit "PSDD should decorate on StructLogicΔ"
     @assert endswith(name, ".psdd")
-    node2id = get_node2id(ln, ProbNode)
+    node2id = get_node2id(circuit, ProbCircuit)
     vtree2id = get_vtree2id(vtree)
     formatlines = Vector{CircuitFormatLine}()
     append!(formatlines, parse_psdd_file(IOBuffer(psdd_header())))
-    push!(formatlines, PsddHeaderLine(num_nodes(ln)))
-    for n in filter(n -> !(GateType(n) isa ⋀Gate), ln)
+    push!(formatlines, PsddHeaderLine(num_nodes(circuit)))
+    for n in filter(n -> !is⋀gate(n), circuit)
         push!(formatlines, decompile(n, node2id, vtree2id))
     end
     save_lines(name, formatlines)
@@ -121,43 +109,35 @@ function lc_header()
     c"""
 end
     
-function save_lc_file(name::String, ln::LogisticΔ, vtree)
-    @assert ln[end].origin isa StructLogicCircuit "LC should decorate on StructLogicΔ"
-    @assert endswith(name, ".circuit")
-    node2id = get_node2id(ln, ProbNode)
-    vtree2id = get_vtree2id(vtree)
-    formatlines = Vector{CircuitFormatLine}()
-    append!(formatlines, parse_lc_file(IOBuffer(lc_header())))
-    push!(formatlines, LcHeaderLine())
-    for n in filter(n -> !(GateType(n) isa ⋀Gate), ln)
-        push!(formatlines, decompile(n, node2id, vtree2id))
-    end
-    save_lines(name, formatlines)
-end
-
-import LogicCircuits.save_circuit # make available for extension
-
-function save_circuit(name::String, circuit, vtree=nothing)
-    if endswith(name, ".circuit")
-        save_lc_file(name, circuit, vtree)
-    elseif endswith(name, ".psdd")
-        save_psdd_file(name, circuit, vtree)
-    elseif endswith(name, ".sdd")
-        save_sdd_file(name, circuit, vtree)
-    else
-        error("Cannot save circuit to file with this extensions: $name")
-    end
-end
-
-"Save prob circuit to .dot file"
-function save_as_dot(root::ProbNode, file::String)
-    return save_as_dot(linearize(root), file)
-end
+# function save_lc_file(name::String, ln::LogisticΔ, vtree)
+#     @assert ln[end].origin isa StructLogicCircuit "LC should decorate on StructLogicΔ"
+#     @assert endswith(name, ".circuit")
+#     node2id = get_node2id(ln, ProbNode)
+#     vtree2id = get_vtree2id(vtree)
+#     formatlines = Vector{CircuitFormatLine}()
+#     append!(formatlines, parse_lc_file(IOBuffer(lc_header())))
+#     push!(formatlines, LcHeaderLine())
+#     for n in filter(n -> !(GateType(n) isa ⋀Gate), ln)
+#         push!(formatlines, decompile(n, node2id, vtree2id))
+#     end
+#     save_lines(name, formatlines)
+# end
+
+import LogicCircuits.LoadSave: save_circuit, save_as_dot # make available for extension
+
+"Save a circuit to file"
+save_circuit(name::String, circuit::ProbCircuit, vtree::PlainVtree) =
+    save_as_psdd(name, circuit, vtree)
+
+# TODO
+# save_circuit(name::String, circuit::LogicCircuit) =
+#     save_as_psdd(name, circuit, vtree)
 
+using Printf: @sprintf
 "Save prob circuits to .dot file"
-function save_as_dot(circuit::ProbΔ, file::String)
+function save_as_dot(circuit::ProbCircuit, file::String)
     # TODO (https://github.com/Juice-jl/LogicCircuits.jl/issues/7)
-    node_cache = Dict{ProbNode, Int64}()
+    node_cache = Dict{ProbCircuit, Int64}()
     for (i, n) in enumerate(circuit)
         node_cache[n] = i
     end
@@ -179,13 +159,13 @@ function save_as_dot(circuit::ProbΔ, file::String)
     end
 
     for n in reverse(circuit)
-        if n isa Prob⋀
+        if n isa Prob⋀Node
             write(f, "$(node_cache[n]) [label=\"*$(node_cache[n])\"]\n")
         elseif n isa Prob⋁
             write(f, "$(node_cache[n]) [label=\"+$(node_cache[n])\"]\n")
-        elseif n isa ProbLiteral && ispositive(n)
+        elseif n isa ProbLiteralNode && ispositive(n)
             write(f, "$(node_cache[n]) [label=\"+$(variable(n.origin))\"]\n")
-        elseif n isa ProbLiteral && isnegative(n)
+        elseif n isa ProbLiteralNode && isnegative(n)
             write(f, "$(node_cache[n]) [label=\"-$(variable(n.origin))\"]\n")
         else
             throw("unknown ProbNode type")
diff --git a/src/Probabilistic/ProbCircuits.jl b/src/Probabilistic/ProbCircuits.jl
deleted file mode 100644
index 85a6e9b4..00000000
--- a/src/Probabilistic/ProbCircuits.jl
+++ /dev/null
@@ -1,515 +0,0 @@
-#####################
-# Probabilistic circuits
-#####################
-abstract type ProbNode{O} <: DecoratorNode{O} end
-abstract type ProbLeafNode{O} <: ProbNode{O} end
-abstract type ProbInnerNode{O} <: ProbNode{O} end
-
-mutable struct ProbLiteral{O} <: ProbLeafNode{O}
-    origin::O
-    data
-    counter::UInt32
-    ProbLiteral(n) = new{node_type_deprecated(n)}(n, nothing, 0)
-end
-
-mutable struct Prob⋀{O} <: ProbInnerNode{O}
-    origin::O
-    children::Vector{<:ProbNode{<:O}}
-    data
-    counter::UInt32
-    Prob⋀(n, children) = begin
-        new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), nothing, 0)
-    end
-end
-
-mutable struct Prob⋁{O} <: ProbInnerNode{O}
-    origin::O
-    children::Vector{<:ProbNode{<:O}}
-    log_thetas::Vector{Float64}
-    data
-    counter::UInt32
-    Prob⋁(n, children) = new{node_type_deprecated(n)}(n, convert(Vector{ProbNode{node_type_deprecated(n)}},children), init_array(Float64, length(children)), nothing, 0)
-end
-
-const ProbΔ{O} = AbstractVector{<:ProbNode{<:O}}
-
-Base.eltype(::Type{ProbΔ{O}}) where {O} = ProbNode{<:O}
-
-#####################
-# traits
-#####################
-
-import LogicCircuits.GateType # make available for extension
-import LogicCircuits.node_type_deprecated
-
-@inline GateType(::Type{<:ProbLiteral}) = LiteralGate()
-@inline GateType(::Type{<:Prob⋀}) = ⋀Gate()
-@inline GateType(::Type{<:Prob⋁}) = ⋁Gate()
-
-@inline node_type_deprecated(::ProbNode) = ProbNode
-
-#####################
-# constructors and conversions
-#####################
-
-const ProbCache = Dict{Node, ProbNode}
-
-function ProbΔ2(circuit::Δ)::ProbΔ
-    linearize(ProbΔ2(circuit[end]))
-end
-
-function ProbΔ2(circuit::LogicCircuit)::ProbNode
-    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = ProbLiteral(n)
-    f_a(n, cn) = Prob⋀(n, cn)
-    f_o(n, cn) = Prob⋁(n, cn)
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbNode{node_type_deprecated(circuit)})
-end
-
-function ProbΔ(circuit::Δ, cache::ProbCache = ProbCache())
-
-    sizehint!(cache, length(circuit)*4÷3)
-
-    pc_node(::LiteralGate, n::LogicCircuit) = ProbLiteral(n)
-    pc_node(::ConstantGate, n::LogicCircuit) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-
-    pc_node(::⋀Gate, n::LogicCircuit) = begin
-        children = map(c -> cache[c], n.children)
-        Prob⋀(n, children)
-    end
-
-    pc_node(::⋁Gate, n::LogicCircuit) = begin
-        children = map(c -> cache[c], n.children)
-        Prob⋁(n, children)
-    end
-
-    map(circuit) do node
-        pcn = pc_node(GateType(node), node)
-        cache[node] = pcn
-        pcn
-    end
-end
-
-#####################
-# methods
-#####################
-
-import LogicCircuits: literal, children # make available for extension
-
-@inline literal(n::ProbLiteral)::Lit  = literal(n.origin)
-@inline children(n::ProbInnerNode) = n.children
-
-num_parameters(n::Prob⋁) = num_children(n)
-num_parameters(c::ProbΔ) = sum(n -> num_parameters(n), ⋁_nodes(c))
-
-"Return the first origin that is a probabilistic circuit node"
-prob_origin(n::DecoratorNode)::ProbNode = origin(n, ProbNode)
-
-"Return the first origin that is a probabilistic circuit"
-prob_origin(c::DecoratorΔ)::ProbΔ = origin(c, ProbNode)
-
-function estimate_parameters2(pc::ProbΔ, data::XData{Bool}; pseudocount::Float64)
-    Logic.pass_up_down2(pc, data)
-    w = (data isa PlainXData) ? nothing : weights(data)
-    estimate_parameters_cached2(pc, w; pseudocount=pseudocount)
-end
-
-function estimate_parameters_cached2(pc::ProbΔ, w; pseudocount::Float64)
-    flow(n) = Float64(sum(sum(n.data)))
-    children_flows(n) = sum.(map(c -> c.data[1] .& n.data[1], children(n)))
-
-    if issomething(w)
-        flow_w(n) = sum(Float64.(n.data[1]) .* w)
-        children_flows_w(n) = sum.(map(c -> Float64.(c.data[1] .& n.data[1]) .* w, children(n)))
-        flow = flow_w
-        children_flows = children_flows_w
-    end
-
-    estimate_parameters_node2(n::ProbNode) = ()
-    function estimate_parameters_node2(n::Prob⋁)
-        if num_children(n) == 1
-            n.log_thetas .= 0.0
-        else
-            smoothed_flow = flow(n) + pseudocount
-            uniform_pseudocount = pseudocount / num_children(n)
-            n.log_thetas .= log.((children_flows(n) .+ uniform_pseudocount) ./ smoothed_flow)
-            @assert isapprox(sum(exp.(n.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
-            # normalize away any leftover error
-            n.log_thetas .- logsumexp(n.log_thetas)
-        end
-    end
-
-    foreach(estimate_parameters_node2, pc)
-end
-
-function log_likelihood_per_instance2(pc::ProbΔ, data::XData{Bool})
-    Logic.pass_up_down2(pc, data)
-    log_likelihood_per_instance_cached(pc, data)
-end
-
-function log_likelihood_per_instance_cached(pc::ProbΔ, data::XData{Bool})
-    log_likelihoods = zeros(num_examples(data))
-    indices = init_array(Bool, num_examples(data))::BitVector
-    for n in pc
-         if n isa Prob⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
-            foreach(n.children, n.log_thetas) do c, log_theta
-                indices = n.data[1] .& c.data[1]
-                view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
-            end
-         end
-    end
-    log_likelihoods
-end
-
-import LogicCircuits: conjoin_like, disjoin_like, literal_like, copy_node, normalize, replace_node # make available for extension
-
-"Conjoin nodes in the same way as the example"
-@inline function conjoin_like(example::ProbNode, arguments::Vector)
-    if isempty(arguments)
-        # @assert false "Probabilistic circuit does not have anonymous true node"
-        nothing
-    elseif example isa Prob⋀ && children(example) == arguments
-        example
-    else
-        n = conjoin_like(origin(example), origin.(arguments))
-        Prob⋀(n, arguments)
-    end
-end
-
-"Disjoin nodes in the same way as the example"
-@inline function disjoin_like(example::ProbNode, arguments::Vector)
-    if isempty(arguments)
-        # @assert false "Probabilistic circuit does not have false node"
-        nothing
-    elseif example isa Prob⋁ && children(example) == arguments
-        example
-    else
-        n = disjoin_like(origin(example), origin.(arguments))
-        # normalize parameters
-        thetas = zeros(Float64, length(arguments))
-        flag = falses(length(arguments))
-        for (i, c) in enumerate(arguments)
-            ind = findfirst(x -> x == c, children(example))
-            if issomething(ind)
-                thetas[i] = exp(example.log_thetas[ind])
-                flag[i] = true
-            end
-        end
-        if all(flag)
-            thetas = thetas / sum(thetas)
-        end
-        p = Prob⋁(n, arguments)
-        p.log_thetas .= log.(thetas)
-        p
-    end
-end
-
-"Construct a new literal node like the given node's type"
-@inline literal_like(::ProbNode, lit::Lit) = ProbLiteral(lit)
-
-@inline copy_node(n::Prob⋁, cns) = begin
-    orig = copy_node(origin(n), origin.(cns))
-    p = Prob⋁(orig, cns)
-    p.log_thetas .= copy(n.log_thetas)
-    p
-end
-
-@inline copy_node(n::Prob⋀, cns) = begin
-    orig = copy_node(origin(n), origin.(cns))
-    Prob⋀(orig, cns)
-end
-
-import LogicCircuits.normalize
-
-@inline normalize(n::Prob⋁, old_n::Prob⋁, kept::Union{Vector{Bool}, BitArray}) = begin
-     thetas = exp.(old_n.log_thetas[kept])
-     n.log_thetas .= log.(thetas / sum(thetas))
-end
-
-function estimate_parameters(pc::ProbΔ, data::XBatches{Bool}; pseudocount::Float64)
-    estimate_parameters(AggregateFlowΔ(pc, aggr_weight_type(data)), data; pseudocount=pseudocount)
-end
-
-function estimate_parameters(afc::AggregateFlowΔ, data::XBatches{Bool}; pseudocount::Float64)
-    @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
-    @assert (afc[end].origin isa ProbNode) "AggregateFlowΔ must originate in a ProbΔ"
-    collect_aggr_flows(afc, data)
-    estimate_parameters_cached(afc; pseudocount=pseudocount)
-    afc
-end
-
-function estimate_parameters(fc::FlowΔ, data::XBatches{Bool}; pseudocount::Float64)
-    @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
-    @assert (prob_origin(afc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
-    collect_aggr_flows(fc, data)
-    estimate_parameters_cached(origin(fc); pseudocount=pseudocount)
-end
-
- # turns aggregate statistics into theta parameters
-function estimate_parameters_cached(afc::AggregateFlowΔ; pseudocount::Float64)
-    foreach(n -> estimate_parameters_node(n; pseudocount=pseudocount), afc)
-end
-
-estimate_parameters_node(::AggregateFlowNode; pseudocount::Float64) = () # do nothing
-function estimate_parameters_node(n::AggregateFlow⋁; pseudocount)
-    origin = n.origin::Prob⋁
-    if num_children(n) == 1
-        origin.log_thetas .= 0.0
-    else
-        smoothed_aggr_flow = (n.aggr_flow + pseudocount)
-        uniform_pseudocount = pseudocount / num_children(n)
-        origin.log_thetas .= log.( (n.aggr_flow_children .+ uniform_pseudocount) ./ smoothed_aggr_flow )
-        @assert isapprox(sum(exp.(origin.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally: $(exp.(origin.log_thetas)), estimated from $(n.aggr_flow) and $(n.aggr_flow_children). Did you actually compute the aggregate flows?"
-        #normalize away any leftover error
-        origin.log_thetas .- logsumexp(origin.log_thetas)
-    end
-end
-
-# compute log likelihood
-function compute_log_likelihood(pc::ProbΔ, data::XBatches{Bool})
-    compute_log_likelihood(AggregateFlowΔ(pc, aggr_weight_type(data)))
-end
-
-# compute log likelihood, reusing AggregateFlowΔ but ignoring its current aggregate values
-function compute_log_likelihood(afc::AggregateFlowΔ, data::XBatches{Bool})
-    @assert feature_type(data) == Bool "Can only test probabilistic circuits on Bool data"
-    collect_aggr_flows(afc, data)
-    ll = log_likelihood(afc)
-    (afc, ll)
-end
-
-# return likelihoods given current aggregate flows.
-function log_likelihood(afc::AggregateFlowΔ)
-    sum(n -> log_likelihood(n), afc)
-end
-
-log_likelihood(::AggregateFlowNode) = 0.0
-log_likelihood(n::AggregateFlow⋁) = sum(n.origin.log_thetas .* n.aggr_flow_children)
-
-"""
-Calculates log likelihood for a batch of fully observed samples.
-(Also retures the generated FlowΔ)
-"""
-function log_likelihood_per_instance(pc::ProbΔ, batch::PlainXData{Bool})
-    fc = FlowΔ(pc, num_examples(batch), Bool)
-    (fc, log_likelihood_per_instance(fc, batch))
-end
-
-function log_proba(pc::ProbΔ, batch::PlainXData{Bool})
-    log_likelihood_per_instance(pc, batch)[2]
-end
-
-function log_proba(pc::ProbΔ, batch::PlainXData{Int8})
-    marginal_log_likelihood_per_instance(pc, batch)[2]
-end
-
-"""
-Calculate log likelihood per instance for batches of samples.
-"""
-function log_likelihood_per_instance(pc::ProbΔ, batches::XBatches{Bool})::Vector{Float64}
-    mapreduce(b -> log_likelihood_per_instance(pc, b)[2], vcat, batches)
-end
-
-"""
-Calculate log likelihood for a batch of fully observed samples.
-(This is for when you already have a FlowΔ)
-"""
-function log_likelihood_per_instance(fc::FlowΔ, batch::PlainXData{Bool})
-    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
-    pass_up_down(fc, batch)
-    log_likelihoods = zeros(num_examples(batch))
-    indices = init_array(Bool, flow_length(fc))::BitVector
-    for n in fc
-         if n isa DownFlow⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
-            origin = prob_origin(n)::Prob⋁
-            foreach(n.children, origin.log_thetas) do c, log_theta
-                #  be careful here to allow for the Boolean multiplication to be done using & before switching to float arithmetic, or risk losing a lot of runtime!
-                # log_likelihoods .+= prod_fast(downflow(n), pr_factors(c)) .* log_theta
-                assign_prod(indices, downflow(n), pr_factors(c))
-                view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
-                # TODO put the lines above in Utils in order to ensure we have specialized types
-            end
-         end
-    end
-    log_likelihoods
-end
-
-"""
-Calculate log likelihood for a batch of samples with partial evidence P(e).
-(Also returns the generated FlowΔ)
-
-To indicate a variable is not observed, pass -1 for that variable.
-"""
-function marginal_log_likelihood_per_instance(pc::ProbΔ, batch::PlainXData{Int8})
-    opts = (flow_opts★..., el_type=Float64, compact⋀=false, compact⋁=false)
-    fc = UpFlowΔ(pc, num_examples(batch), Float64, opts)
-    (fc, marginal_log_likelihood_per_instance(fc, batch))
-end
-
-"""
-Calculate log likelihood for a batch of samples with partial evidence P(e).
-(If you already have a FlowΔ)
-
-To indicate a variable is not observed, pass -1 for that variable.
-"""
-function marginal_log_likelihood_per_instance(fc::UpFlowΔ, batch::PlainXData{Int8})
-    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
-    marginal_pass_up(fc, batch)
-    pr(fc[end])
-end
-
-function check_parameter_integrity(circuit::ProbΔ)
-    for node in filter(n -> GateType(n) isa Prob⋁, circuit)
-        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
-    end
-    true
-end
-
-##################
-# Sampling from a psdd
-##################
-
-"""
-Sample from a PSDD without any evidence
-"""
-function sample(circuit::ProbΔ)::AbstractVector{Bool}
-    inst = Dict{Var,Int64}()
-    simulate(circuit[end], inst)
-    len = length(keys(inst))
-    ans = Vector{Bool}()
-    for i = 1:len
-        push!(ans, inst[i])
-    end
-    ans
-end
-
-# Uniformly sample based on the probability of the items
-# and return the selected index
-function sample(probs::AbstractVector{<:Number})::Int32
-    z = sum(probs)
-    q = rand() * z
-    cur = 0.0
-    for i = 1:length(probs)
-        cur += probs[i]
-        if q <= cur
-            return i
-        end
-    end
-    return length(probs)
-end
-
-function simulate(node::ProbLiteral, inst::Dict{Var,Int64})
-    if ispositive(node)
-        inst[variable(node.origin)] = 1
-    else
-        inst[variable(node.origin)] = 0
-    end
-end
-
-function simulate(node::Prob⋁, inst::Dict{Var,Int64})
-    idx = sample(exp.(node.log_thetas))
-    simulate(node.children[idx], inst)
-end
-function simulate(node::Prob⋀, inst::Dict{Var,Int64})
-    for child in node.children
-        simulate(child, inst)
-    end
-end
-
-"""
-Sampling with Evidence from a psdd.
-Internally would call marginal pass up on a newly generated flow circuit.
-"""
-function sample(circuit::ProbΔ, evidence::PlainXData{Int8})::AbstractVector{Bool}
-    opts= (compact⋀=false, compact⋁=false)
-    flow_circuit = UpFlowΔ(circuit, 1, Float64, opts)
-    marginal_pass_up(flow_circuit, evidence)
-    sample(flow_circuit)
-end
-
-"""
-Sampling with Evidence from a psdd.
-Assuming already marginal pass up has been done on the flow circuit.
-"""
-function sample(circuit::UpFlowΔ)::AbstractVector{Bool}
-    inst = Dict{Var,Int64}()
-    simulate2(circuit[end], inst)
-    len = length(keys(inst))
-    ans = Vector{Bool}()
-    for i = 1:len
-        push!(ans, inst[i])
-    end
-    ans
-end
-
-function simulate2(node::UpFlowLiteral, inst::Dict{Var,Int64})
-    if ispositive(node)
-        #TODO I don't think we need these 'grand_origin' parts below
-        inst[variable(grand_origin(node))] = 1
-    else
-        inst[variable(grand_origin(node))] = 0
-    end
-end
-
-function simulate2(node::UpFlow⋁, inst::Dict{Var,Int64})
-    prs = [ pr(ch)[1] for ch in children(node) ]
-    idx = sample(exp.(node.origin.log_thetas .+ prs))
-    simulate2(children(node)[idx], inst)
-end
-
-function simulate2(node::UpFlow⋀, inst::Dict{Var,Int64})
-    for child in children(node)
-        simulate2(child, inst)
-    end
-end
-
-
-
-##################
-# Most Probable Explanation MPE of a psdd
-#   aka MAP
-##################
-
-@inline function MAP(circuit::ProbΔ, evidence::PlainXData{Int8})::Matrix{Bool}
-    MPE(circuit, evidence)
-end
-
-function MPE(circuit::ProbΔ, evidence::PlainXData{Int8})::Matrix{Bool}
-    # Computing Marginal Likelihood for each node
-    fc, lls = marginal_log_likelihood_per_instance(circuit, evidence)
-
-    ans = Matrix{Bool}(zeros(size(evidence.x)))
-    active_samples = Array{Bool}(ones( num_examples(evidence) ))
-
-    mpe_simulate(fc[end], active_samples, ans)
-    ans
-end
-
-"""
-active_samples: bool vector indicating which samples are active for this node during mpe
-result: Matrix (num_samples, num_variables) indicating the final result of mpe
-"""
-function mpe_simulate(node::UpFlowLiteral, active_samples::Vector{Bool}, result::Matrix{Bool})
-    if ispositive(node)
-        result[active_samples, variable(node)] .= 1
-    else
-        result[active_samples, variable(node)] .= 0
-    end
-end
-function mpe_simulate(node::UpFlow⋁, active_samples::Vector{Bool}, result::Matrix{Bool})
-    prs = zeros( length(node.children), size(active_samples)[1] )
-    @simd  for i=1:length(node.children)
-        prs[i,:] .= pr(node.children[i]) .+ (node.origin.log_thetas[i])
-    end
-
-    max_child_ids = [a[1] for a in argmax(prs, dims = 1) ]
-    @simd for i=1:length(node.children)
-        ids = Vector{Bool}( active_samples .* (max_child_ids .== i)[1,:] )  # Only active for this child if it was the max for that sample
-        mpe_simulate(node.children[i], ids, result)
-    end
-end
-function mpe_simulate(node::UpFlow⋀, active_samples::Vector{Bool}, result::Matrix{Bool})
-    for child in node.children
-        mpe_simulate(child, active_samples, result)
-    end    
-end
diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index 9dd95e70..d67d1493 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -45,14 +45,14 @@ clustering,
 # Queries
 pr_constraint, psdd_entropy, psdd_kl_divergence
 
-include("Clustering.jl")
-include("ProbCircuits.jl")
-include("ProbFlowCircuits.jl")
-include("MutualInformation.jl")
-include("Mixtures.jl")
-include("Bagging.jl")
-include("EMLearner.jl")
-include("VtreeLearner.jl")
-include("Queries.jl")
+# include("Clustering.jl")
+include("prob_nodes.jl")
+# include("ProbFlowCircuits.jl")
+# include("MutualInformation.jl")
+# include("Mixtures.jl")
+# include("Bagging.jl")
+# include("EMLearner.jl")
+# include("VtreeLearner.jl")
+# include("Queries.jl")
 
 end
diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index cf059b4a..47cc1d30 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -1,230 +1,91 @@
-using DataStructures
+export log_prob
 
-# Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
-# spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
-"Calculate the probability of the logic formula given by sdd for the psdd"
-function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit})
-    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
-
-    return pr_constraint(psdd_node, sdd_node, cache)
+function log_likelihood_per_instance(pc::ProbCircuit, data::DataFrame)
+end
+function log_likelihood_per_instance2(pc::ProbΔ, data::XData{Bool})
+    Logic.pass_up_down2(pc, data)
+    log_likelihood_per_instance_cached(pc, data)
 end
-function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit},
-                       cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})::Float64
-    if (psdd_node, sdd_node) in keys(cache) # Cache hit
-        return cache[psdd_node, sdd_node]
-    elseif psdd_node isa ProbLiteral # Boundary cases
-        if sdd_node isa Union{ProbLiteral, PlainStructLiteralNode} # Both are literals, just check whether they agrees with each other
-            if literal(psdd_node) == literal(sdd_node)
-                return get!(cache, (psdd_node, sdd_node), 1.0)
-            else
-                return get!(cache, (psdd_node, sdd_node), 0.0)
-            end
-        else
-            pr_constraint(psdd_node, sdd_node.children[1], cache)
-            if length(sdd_node.children) > 1
-                pr_constraint(psdd_node, sdd_node.children[2], cache)
-                return get!(cache, (psdd_node, sdd_node), 1.0)
-            else
-                return get!(cache, (psdd_node, sdd_node),
-                    literal(sdd_node.children[1]) == literal(psdd_node) ? 1.0 : 0.0
-                )
-            end
-        end
-    elseif psdd_node.children[1] isa ProbLiteral # The psdd is true
-        theta = exp(psdd_node.log_thetas[1])
-        return get!(cache, (psdd_node, sdd_node),
-            theta * pr_constraint(psdd_node.children[1], sdd_node, cache) +
-            (1.0 - theta) * pr_constraint(psdd_node.children[2], sdd_node, cache)
-        )
-    else # Both psdds are not trivial
-        prob = 0.0
-        for (prob⋀_node, log_theta) in zip(psdd_node.children, psdd_node.log_thetas)
-            p = prob⋀_node.children[1]
-            s = prob⋀_node.children[2]
 
-            theta = exp(log_theta)
-            for sdd⋀_node in sdd_node.children
-                r = sdd⋀_node.children[1]
-                t = sdd⋀_node.children[2]
-                prob += theta * pr_constraint(p, r, cache) * pr_constraint(s, t, cache)
+function log_likelihood_per_instance_cached(pc::ProbΔ, data::XData{Bool})
+    log_likelihoods = zeros(num_examples(data))
+    indices = init_array(Bool, num_examples(data))::BitVector
+    for n in pc
+         if n isa Prob⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
+            foreach(n.children, n.log_thetas) do c, log_theta
+                indices = n.data[1] .& c.data[1]
+                view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
             end
-        end
-        return get!(cache, (psdd_node, sdd_node), prob)
+         end
     end
+    log_likelihoods
 end
 
-
-"Entropy of the distribution of the input psdd."
-function psdd_entropy(psdd_node::ProbNode)::Float64
-    psdd_entropy_cache = Dict{ProbNode, Float64}()
-
-    return psdd_entropy(psdd_node, psdd_entropy_cache)
-end
-function psdd_entropy(psdd_node::Prob⋁, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
-    if psdd_node in keys(psdd_entropy_cache)
-        return psdd_entropy_cache[psdd_node]
-    elseif psdd_node.children[1] isa ProbLiteral
-        return get!(psdd_entropy_cache, psdd_node,
-            - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
-            exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2]
-        )
-    else
-        local_entropy = 0.0
-        for (prob⋀_node, log_prob) in zip(psdd_node.children, psdd_node.log_thetas)
-            p = prob⋀_node.children[1]
-            s = prob⋀_node.children[2]
-
-            local_entropy += exp(log_prob) * (psdd_entropy(p, psdd_entropy_cache) +
-                psdd_entropy(s, psdd_entropy_cache) - log_prob)
-        end
-        return get!(psdd_entropy_cache, psdd_node, local_entropy)
-    end
-end
-function psdd_entropy(psdd_node::Prob⋀, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
-    return get!(psdd_entropy_cache, psdd_node.children[1], psdd_entropy(psdd_node.children[1], psdd_entropy_cache)) +
-        get!(psdd_entropy_cache, psdd_node.children[2], psdd_entropy(psdd_node.children[2], psdd_entropy_cache))
-end
-function psdd_entropy(psdd_node::ProbLiteral, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
-    return get!(psdd_entropy_cache, psdd_node, 0.0)
+# compute log likelihood
+function compute_log_likelihood(pc::ProbΔ, data::XBatches{Bool})
+    compute_log_likelihood(AggregateFlowΔ(pc, aggr_weight_type(data)))
 end
 
-
-"KL divergence calculation for psdds that are not necessarily identical"
-function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode)::Float64
-    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
-
-    return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
+# compute log likelihood, reusing AggregateFlowΔ but ignoring its current aggregate values
+function compute_log_likelihood(afc::AggregateFlowΔ, data::XBatches{Bool})
+    @assert feature_type(data) == Bool "Can only test probabilistic circuits on Bool data"
+    collect_aggr_flows(afc, data)
+    ll = log_likelihood(afc)
+    (afc, ll)
 end
-function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64})::Float64
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
 
-    return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
+# return likelihoods given current aggregate flows.
+function log_likelihood(afc::AggregateFlowΔ)
+    sum(n -> log_likelihood(n), afc)
 end
-function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
-    @assert !(psdd_node1 isa Prob⋀ || psdd_node2 isa Prob⋀) "Prob⋀ not a valid PSDD node for KL-Divergence"
-
-    # Check if both nodes are normalized for same vtree node
-    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[(psdd_node1, psdd_node2)]
-    elseif psdd_node1.children[1] isa ProbLiteral
-        if psdd_node2 isa ProbLiteral
-            psdd_kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-            if literal(psdd_node1.children[1]) == literal(psdd_node2)
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
-                )
-            else
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    psdd_node1.log_thetas[2] * exp(psdd_node1.log_thetas[2])
-                )
-            end
-        else
-            # The below four lines actually assign zero, but still we need to
-            # call it.
-            psdd_kl_divergence(psdd_node1.children[1], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[1], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[2], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[2], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
-            # There are two possible matches
-            if literal(psdd_node1.children[1]) == literal(psdd_node2.children[1])
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    exp(psdd_node1.log_thetas[1]) * (psdd_node1.log_thetas[1] - psdd_node2.log_thetas[1]) +
-                    exp(psdd_node1.log_thetas[2]) * (psdd_node1.log_thetas[2] - psdd_node2.log_thetas[2])
-                )
-            else
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    exp(psdd_node1.log_thetas[1]) * (psdd_node1.log_thetas[1] - psdd_node2.log_thetas[2]) +
-                    exp(psdd_node1.log_thetas[2]) * (psdd_node1.log_thetas[2] - psdd_node2.log_thetas[1])
-                )
-            end
-        end
-    else # the normal case
-        kl_divergence = 0.0
-
-        # loop through every combination of prim and sub
-        for (prob⋀_node1, log_theta1) in zip(psdd_node1.children, psdd_node1.log_thetas)
-            for (prob⋀_node2, log_theta2) in zip(psdd_node2.children, psdd_node2.log_thetas)
-                p = prob⋀_node1.children[1]
-                s = prob⋀_node1.children[2]
-
-                r = prob⋀_node2.children[1]
-                t = prob⋀_node2.children[2]
-
-                theta1 = exp(log_theta1)
-
-                p11 = pr_constraint(s, t, pr_constraint_cache)
-                p12 = pr_constraint(p, r, pr_constraint_cache)
-
-                p13 = theta1 * (log_theta1 - log_theta2)
+log_likelihood(::AggregateFlowNode) = 0.0
+log_likelihood(n::AggregateFlow⋁) = sum(n.origin.log_thetas .* n.aggr_flow_children)
 
-                p21 = psdd_kl_divergence(p, r, kl_divergence_cache, pr_constraint_cache)
-                p31 = psdd_kl_divergence(s, t, kl_divergence_cache, pr_constraint_cache)
+"""
+Calculates log likelihood for a batch of fully observed samples.
+(Also retures the generated FlowΔ)
+"""
+function log_likelihood_per_instance(pc::ProbΔ, batch::PlainXData{Bool})
+    fc = FlowΔ(pc, num_examples(batch), Bool)
+    (fc, log_likelihood_per_instance(fc, batch))
+end
 
-                kl_divergence += p11 * p12 * p13 + theta1 * (p11 * p21 + p12 * p31)
-            end
-        end
-        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), kl_divergence)
-    end
+function log_proba(pc::ProbΔ, batch::PlainXData{Bool})
+    log_likelihood_per_instance(pc, batch)[2]
 end
-function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
-    # Check if literals are over same variables in vtree
-   @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[psdd_node1, psdd_node2]
-    else
-        # In this case probability is 1, kl divergence is 0
-        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), 0.0)
-    end
+function log_proba(pc::ProbΔ, batch::PlainXData{Int8})
+    marginal_log_likelihood_per_instance(pc, batch)[2]
 end
-function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
-    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[psdd_node1, psdd_node2]
-    else
-        psdd_kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-        psdd_kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-        if literal(psdd_node1.children[1]) == literal(psdd_node2)
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
-            )
-        else
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                psdd_node1.log_thetas[2] * exp(psdd_node1.log_thetas[2])
-            )
-        end
-    end
+"""
+Calculate log likelihood per instance for batches of samples.
+"""
+function log_likelihood_per_instance(pc::ProbΔ, batches::XBatches{Bool})::Vector{Float64}
+    mapreduce(b -> log_likelihood_per_instance(pc, b)[2], vcat, batches)
 end
-function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::Prob⋁,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
-    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[psdd_node1, psdd_node2]
-    else
-        psdd_kl_divergence(psdd_node1, psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-        psdd_kl_divergence(psdd_node1, psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
-        if literal(psdd_node1) == literal(psdd_node2.children[1])
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                -psdd_node2.log_thetas[1]
-            )
-        else
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                -psdd_node2.log_thetas[2]
-            )
-        end
+"""
+Calculate log likelihood for a batch of fully observed samples.
+(This is for when you already have a FlowΔ)
+"""
+function log_likelihood_per_instance(fc::FlowΔ, batch::PlainXData{Bool})
+    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
+    pass_up_down(fc, batch)
+    log_likelihoods = zeros(num_examples(batch))
+    indices = init_array(Bool, flow_length(fc))::BitVector
+    for n in fc
+         if n isa DownFlow⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
+            origin = prob_origin(n)::Prob⋁
+            foreach(n.children, origin.log_thetas) do c, log_theta
+                #  be careful here to allow for the Boolean multiplication to be done using & before switching to float arithmetic, or risk losing a lot of runtime!
+                # log_likelihoods .+= prod_fast(downflow(n), pr_factors(c)) .* log_theta
+                assign_prod(indices, downflow(n), pr_factors(c))
+                view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
+                # TODO put the lines above in Utils in order to ensure we have specialized types
+            end
+         end
     end
-end
+    log_likelihoods
+end
\ No newline at end of file
diff --git a/src/Probabilistic/flows.jl b/src/Probabilistic/flows.jl
new file mode 100644
index 00000000..e69de29b
diff --git a/src/Probabilistic/kld.jl b/src/Probabilistic/kld.jl
new file mode 100644
index 00000000..cf059b4a
--- /dev/null
+++ b/src/Probabilistic/kld.jl
@@ -0,0 +1,230 @@
+using DataStructures
+
+# Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
+# spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
+"Calculate the probability of the logic formula given by sdd for the psdd"
+function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit})
+    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
+
+    return pr_constraint(psdd_node, sdd_node, cache)
+end
+function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit},
+                       cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})::Float64
+    if (psdd_node, sdd_node) in keys(cache) # Cache hit
+        return cache[psdd_node, sdd_node]
+    elseif psdd_node isa ProbLiteral # Boundary cases
+        if sdd_node isa Union{ProbLiteral, PlainStructLiteralNode} # Both are literals, just check whether they agrees with each other
+            if literal(psdd_node) == literal(sdd_node)
+                return get!(cache, (psdd_node, sdd_node), 1.0)
+            else
+                return get!(cache, (psdd_node, sdd_node), 0.0)
+            end
+        else
+            pr_constraint(psdd_node, sdd_node.children[1], cache)
+            if length(sdd_node.children) > 1
+                pr_constraint(psdd_node, sdd_node.children[2], cache)
+                return get!(cache, (psdd_node, sdd_node), 1.0)
+            else
+                return get!(cache, (psdd_node, sdd_node),
+                    literal(sdd_node.children[1]) == literal(psdd_node) ? 1.0 : 0.0
+                )
+            end
+        end
+    elseif psdd_node.children[1] isa ProbLiteral # The psdd is true
+        theta = exp(psdd_node.log_thetas[1])
+        return get!(cache, (psdd_node, sdd_node),
+            theta * pr_constraint(psdd_node.children[1], sdd_node, cache) +
+            (1.0 - theta) * pr_constraint(psdd_node.children[2], sdd_node, cache)
+        )
+    else # Both psdds are not trivial
+        prob = 0.0
+        for (prob⋀_node, log_theta) in zip(psdd_node.children, psdd_node.log_thetas)
+            p = prob⋀_node.children[1]
+            s = prob⋀_node.children[2]
+
+            theta = exp(log_theta)
+            for sdd⋀_node in sdd_node.children
+                r = sdd⋀_node.children[1]
+                t = sdd⋀_node.children[2]
+                prob += theta * pr_constraint(p, r, cache) * pr_constraint(s, t, cache)
+            end
+        end
+        return get!(cache, (psdd_node, sdd_node), prob)
+    end
+end
+
+
+"Entropy of the distribution of the input psdd."
+function psdd_entropy(psdd_node::ProbNode)::Float64
+    psdd_entropy_cache = Dict{ProbNode, Float64}()
+
+    return psdd_entropy(psdd_node, psdd_entropy_cache)
+end
+function psdd_entropy(psdd_node::Prob⋁, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
+    if psdd_node in keys(psdd_entropy_cache)
+        return psdd_entropy_cache[psdd_node]
+    elseif psdd_node.children[1] isa ProbLiteral
+        return get!(psdd_entropy_cache, psdd_node,
+            - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
+            exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2]
+        )
+    else
+        local_entropy = 0.0
+        for (prob⋀_node, log_prob) in zip(psdd_node.children, psdd_node.log_thetas)
+            p = prob⋀_node.children[1]
+            s = prob⋀_node.children[2]
+
+            local_entropy += exp(log_prob) * (psdd_entropy(p, psdd_entropy_cache) +
+                psdd_entropy(s, psdd_entropy_cache) - log_prob)
+        end
+        return get!(psdd_entropy_cache, psdd_node, local_entropy)
+    end
+end
+function psdd_entropy(psdd_node::Prob⋀, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
+    return get!(psdd_entropy_cache, psdd_node.children[1], psdd_entropy(psdd_node.children[1], psdd_entropy_cache)) +
+        get!(psdd_entropy_cache, psdd_node.children[2], psdd_entropy(psdd_node.children[2], psdd_entropy_cache))
+end
+function psdd_entropy(psdd_node::ProbLiteral, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
+    return get!(psdd_entropy_cache, psdd_node, 0.0)
+end
+
+
+"KL divergence calculation for psdds that are not necessarily identical"
+function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode)::Float64
+    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
+
+    return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
+end
+function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64})::Float64
+    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
+
+    return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
+end
+function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
+    @assert !(psdd_node1 isa Prob⋀ || psdd_node2 isa Prob⋀) "Prob⋀ not a valid PSDD node for KL-Divergence"
+
+    # Check if both nodes are normalized for same vtree node
+    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+
+    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[(psdd_node1, psdd_node2)]
+    elseif psdd_node1.children[1] isa ProbLiteral
+        if psdd_node2 isa ProbLiteral
+            psdd_kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+            psdd_kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+            if literal(psdd_node1.children[1]) == literal(psdd_node2)
+                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                    psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
+                )
+            else
+                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                    psdd_node1.log_thetas[2] * exp(psdd_node1.log_thetas[2])
+                )
+            end
+        else
+            # The below four lines actually assign zero, but still we need to
+            # call it.
+            psdd_kl_divergence(psdd_node1.children[1], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
+            psdd_kl_divergence(psdd_node1.children[1], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
+            psdd_kl_divergence(psdd_node1.children[2], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
+            psdd_kl_divergence(psdd_node1.children[2], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
+            # There are two possible matches
+            if literal(psdd_node1.children[1]) == literal(psdd_node2.children[1])
+                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                    exp(psdd_node1.log_thetas[1]) * (psdd_node1.log_thetas[1] - psdd_node2.log_thetas[1]) +
+                    exp(psdd_node1.log_thetas[2]) * (psdd_node1.log_thetas[2] - psdd_node2.log_thetas[2])
+                )
+            else
+                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                    exp(psdd_node1.log_thetas[1]) * (psdd_node1.log_thetas[1] - psdd_node2.log_thetas[2]) +
+                    exp(psdd_node1.log_thetas[2]) * (psdd_node1.log_thetas[2] - psdd_node2.log_thetas[1])
+                )
+            end
+        end
+    else # the normal case
+        kl_divergence = 0.0
+
+        # loop through every combination of prim and sub
+        for (prob⋀_node1, log_theta1) in zip(psdd_node1.children, psdd_node1.log_thetas)
+            for (prob⋀_node2, log_theta2) in zip(psdd_node2.children, psdd_node2.log_thetas)
+                p = prob⋀_node1.children[1]
+                s = prob⋀_node1.children[2]
+
+                r = prob⋀_node2.children[1]
+                t = prob⋀_node2.children[2]
+
+                theta1 = exp(log_theta1)
+
+                p11 = pr_constraint(s, t, pr_constraint_cache)
+                p12 = pr_constraint(p, r, pr_constraint_cache)
+
+                p13 = theta1 * (log_theta1 - log_theta2)
+
+                p21 = psdd_kl_divergence(p, r, kl_divergence_cache, pr_constraint_cache)
+                p31 = psdd_kl_divergence(s, t, kl_divergence_cache, pr_constraint_cache)
+
+                kl_divergence += p11 * p12 * p13 + theta1 * (p11 * p21 + p12 * p31)
+            end
+        end
+        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), kl_divergence)
+    end
+end
+function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
+    # Check if literals are over same variables in vtree
+   @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+
+    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[psdd_node1, psdd_node2]
+    else
+        # In this case probability is 1, kl divergence is 0
+        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), 0.0)
+    end
+end
+function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
+    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+
+    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[psdd_node1, psdd_node2]
+    else
+        psdd_kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+        psdd_kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+        if literal(psdd_node1.children[1]) == literal(psdd_node2)
+            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
+            )
+        else
+            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                psdd_node1.log_thetas[2] * exp(psdd_node1.log_thetas[2])
+            )
+        end
+    end
+end
+function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::Prob⋁,
+        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
+        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
+    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+
+    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[psdd_node1, psdd_node2]
+    else
+        psdd_kl_divergence(psdd_node1, psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
+        psdd_kl_divergence(psdd_node1, psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
+        if literal(psdd_node1) == literal(psdd_node2.children[1])
+            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                -psdd_node2.log_thetas[1]
+            )
+        else
+            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
+                -psdd_node2.log_thetas[2]
+            )
+        end
+    end
+end
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
new file mode 100644
index 00000000..e13950c6
--- /dev/null
+++ b/src/Probabilistic/parameters.jl
@@ -0,0 +1,257 @@
+function normalize_parameters(pc::ProbCircuit)
+    for or in or_nodes(pc)
+        or.log_thetas .= 1 ./ length(or.log_thetas)
+    end
+end
+
+
+function estimate_parameters2(pc::ProbΔ, data::XData{Bool}; pseudocount::Float64)
+    Logic.pass_up_down2(pc, data)
+    w = (data isa PlainXData) ? nothing : weights(data)
+    estimate_parameters_cached2(pc, w; pseudocount=pseudocount)
+end
+
+function estimate_parameters_cached2(pc::ProbΔ, w; pseudocount::Float64)
+    flow(n) = Float64(sum(sum(n.data)))
+    children_flows(n) = sum.(map(c -> c.data[1] .& n.data[1], children(n)))
+
+    if issomething(w)
+        flow_w(n) = sum(Float64.(n.data[1]) .* w)
+        children_flows_w(n) = sum.(map(c -> Float64.(c.data[1] .& n.data[1]) .* w, children(n)))
+        flow = flow_w
+        children_flows = children_flows_w
+    end
+
+    estimate_parameters_node2(n::ProbNode) = ()
+    function estimate_parameters_node2(n::Prob⋁)
+        if num_children(n) == 1
+            n.log_thetas .= 0.0
+        else
+            smoothed_flow = flow(n) + pseudocount
+            uniform_pseudocount = pseudocount / num_children(n)
+            n.log_thetas .= log.((children_flows(n) .+ uniform_pseudocount) ./ smoothed_flow)
+            @assert isapprox(sum(exp.(n.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
+            # normalize away any leftover error
+            n.log_thetas .- logsumexp(n.log_thetas)
+        end
+    end
+
+    foreach(estimate_parameters_node2, pc)
+end
+
+
+
+
+function estimate_parameters(pc::ProbΔ, data::XBatches{Bool}; pseudocount::Float64)
+    estimate_parameters(AggregateFlowΔ(pc, aggr_weight_type(data)), data; pseudocount=pseudocount)
+end
+
+function estimate_parameters(afc::AggregateFlowΔ, data::XBatches{Bool}; pseudocount::Float64)
+    @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
+    @assert (afc[end].origin isa ProbNode) "AggregateFlowΔ must originate in a ProbΔ"
+    collect_aggr_flows(afc, data)
+    estimate_parameters_cached(afc; pseudocount=pseudocount)
+    afc
+end
+
+function estimate_parameters(fc::FlowΔ, data::XBatches{Bool}; pseudocount::Float64)
+    @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
+    @assert (prob_origin(afc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
+    collect_aggr_flows(fc, data)
+    estimate_parameters_cached(origin(fc); pseudocount=pseudocount)
+end
+
+ # turns aggregate statistics into theta parameters
+function estimate_parameters_cached(afc::AggregateFlowΔ; pseudocount::Float64)
+    foreach(n -> estimate_parameters_node(n; pseudocount=pseudocount), afc)
+end
+
+estimate_parameters_node(::AggregateFlowNode; pseudocount::Float64) = () # do nothing
+function estimate_parameters_node(n::AggregateFlow⋁; pseudocount)
+    origin = n.origin::Prob⋁
+    if num_children(n) == 1
+        origin.log_thetas .= 0.0
+    else
+        smoothed_aggr_flow = (n.aggr_flow + pseudocount)
+        uniform_pseudocount = pseudocount / num_children(n)
+        origin.log_thetas .= log.( (n.aggr_flow_children .+ uniform_pseudocount) ./ smoothed_aggr_flow )
+        @assert isapprox(sum(exp.(origin.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally: $(exp.(origin.log_thetas)), estimated from $(n.aggr_flow) and $(n.aggr_flow_children). Did you actually compute the aggregate flows?"
+        #normalize away any leftover error
+        origin.log_thetas .- logsumexp(origin.log_thetas)
+    end
+end
+
+
+
+"""
+Calculate log likelihood for a batch of samples with partial evidence P(e).
+(Also returns the generated FlowΔ)
+
+To indicate a variable is not observed, pass -1 for that variable.
+"""
+function marginal_log_likelihood_per_instance(pc::ProbΔ, batch::PlainXData{Int8})
+    opts = (flow_opts★..., el_type=Float64, compact⋀=false, compact⋁=false)
+    fc = UpFlowΔ(pc, num_examples(batch), Float64, opts)
+    (fc, marginal_log_likelihood_per_instance(fc, batch))
+end
+
+"""
+Calculate log likelihood for a batch of samples with partial evidence P(e).
+(If you already have a FlowΔ)
+
+To indicate a variable is not observed, pass -1 for that variable.
+"""
+function marginal_log_likelihood_per_instance(fc::UpFlowΔ, batch::PlainXData{Int8})
+    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
+    marginal_pass_up(fc, batch)
+    pr(fc[end])
+end
+
+##################
+# Sampling from a psdd
+##################
+
+"""
+Sample from a PSDD without any evidence
+"""
+function sample(circuit::ProbΔ)::AbstractVector{Bool}
+    inst = Dict{Var,Int64}()
+    simulate(circuit[end], inst)
+    len = length(keys(inst))
+    ans = Vector{Bool}()
+    for i = 1:len
+        push!(ans, inst[i])
+    end
+    ans
+end
+
+# Uniformly sample based on the probability of the items
+# and return the selected index
+function sample(probs::AbstractVector{<:Number})::Int32
+    z = sum(probs)
+    q = rand() * z
+    cur = 0.0
+    for i = 1:length(probs)
+        cur += probs[i]
+        if q <= cur
+            return i
+        end
+    end
+    return length(probs)
+end
+
+function simulate(node::ProbLiteral, inst::Dict{Var,Int64})
+    if ispositive(node)
+        inst[variable(node.origin)] = 1
+    else
+        inst[variable(node.origin)] = 0
+    end
+end
+
+function simulate(node::Prob⋁, inst::Dict{Var,Int64})
+    idx = sample(exp.(node.log_thetas))
+    simulate(node.children[idx], inst)
+end
+function simulate(node::Prob⋀, inst::Dict{Var,Int64})
+    for child in node.children
+        simulate(child, inst)
+    end
+end
+
+"""
+Sampling with Evidence from a psdd.
+Internally would call marginal pass up on a newly generated flow circuit.
+"""
+function sample(circuit::ProbΔ, evidence::PlainXData{Int8})::AbstractVector{Bool}
+    opts= (compact⋀=false, compact⋁=false)
+    flow_circuit = UpFlowΔ(circuit, 1, Float64, opts)
+    marginal_pass_up(flow_circuit, evidence)
+    sample(flow_circuit)
+end
+
+"""
+Sampling with Evidence from a psdd.
+Assuming already marginal pass up has been done on the flow circuit.
+"""
+function sample(circuit::UpFlowΔ)::AbstractVector{Bool}
+    inst = Dict{Var,Int64}()
+    simulate2(circuit[end], inst)
+    len = length(keys(inst))
+    ans = Vector{Bool}()
+    for i = 1:len
+        push!(ans, inst[i])
+    end
+    ans
+end
+
+function simulate2(node::UpFlowLiteral, inst::Dict{Var,Int64})
+    if ispositive(node)
+        #TODO I don't think we need these 'grand_origin' parts below
+        inst[variable(grand_origin(node))] = 1
+    else
+        inst[variable(grand_origin(node))] = 0
+    end
+end
+
+function simulate2(node::UpFlow⋁, inst::Dict{Var,Int64})
+    prs = [ pr(ch)[1] for ch in children(node) ]
+    idx = sample(exp.(node.origin.log_thetas .+ prs))
+    simulate2(children(node)[idx], inst)
+end
+
+function simulate2(node::UpFlow⋀, inst::Dict{Var,Int64})
+    for child in children(node)
+        simulate2(child, inst)
+    end
+end
+
+
+
+##################
+# Most Probable Explanation MPE of a psdd
+#   aka MAP
+##################
+
+@inline function MAP(circuit::ProbΔ, evidence::PlainXData{Int8})::Matrix{Bool}
+    MPE(circuit, evidence)
+end
+
+function MPE(circuit::ProbΔ, evidence::PlainXData{Int8})::Matrix{Bool}
+    # Computing Marginal Likelihood for each node
+    fc, lls = marginal_log_likelihood_per_instance(circuit, evidence)
+
+    ans = Matrix{Bool}(zeros(size(evidence.x)))
+    active_samples = Array{Bool}(ones( num_examples(evidence) ))
+
+    mpe_simulate(fc[end], active_samples, ans)
+    ans
+end
+
+"""
+active_samples: bool vector indicating which samples are active for this node during mpe
+result: Matrix (num_samples, num_variables) indicating the final result of mpe
+"""
+function mpe_simulate(node::UpFlowLiteral, active_samples::Vector{Bool}, result::Matrix{Bool})
+    if ispositive(node)
+        result[active_samples, variable(node)] .= 1
+    else
+        result[active_samples, variable(node)] .= 0
+    end
+end
+function mpe_simulate(node::UpFlow⋁, active_samples::Vector{Bool}, result::Matrix{Bool})
+    prs = zeros( length(node.children), size(active_samples)[1] )
+    @simd  for i=1:length(node.children)
+        prs[i,:] .= pr(node.children[i]) .+ (node.origin.log_thetas[i])
+    end
+
+    max_child_ids = [a[1] for a in argmax(prs, dims = 1) ]
+    @simd for i=1:length(node.children)
+        ids = Vector{Bool}( active_samples .* (max_child_ids .== i)[1,:] )  # Only active for this child if it was the max for that sample
+        mpe_simulate(node.children[i], ids, result)
+    end
+end
+function mpe_simulate(node::UpFlow⋀, active_samples::Vector{Bool}, result::Matrix{Bool})
+    for child in node.children
+        mpe_simulate(child, active_samples, result)
+    end    
+end
diff --git a/src/Probabilistic/prob_nodes.jl b/src/Probabilistic/prob_nodes.jl
new file mode 100644
index 00000000..886323c2
--- /dev/null
+++ b/src/Probabilistic/prob_nodes.jl
@@ -0,0 +1,104 @@
+export ProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
+Prob⋁Node, num_parameters, check_parameter_integrity
+
+#####################
+# Infrastructure for probabilistic circuit nodes
+#####################
+
+"Root of the probabilistic circuit node hierarchy"
+abstract type ProbCircuit <: DecoratorCircuit end
+
+"""
+A probabilistic leaf node
+"""
+abstract type ProbLeafNode <: ProbCircuit end
+
+"""
+A probabilistic inner node
+"""
+abstract type ProbInnerNode <: ProbCircuit end
+
+"""
+A probabilistic literal node
+"""
+mutable struct ProbLiteralNode <: ProbLeafNode
+    origin::LogicCircuit
+    data
+    counter::UInt32
+    ProbLiteralNode(n) = begin 
+        @assert GateType(n) isa LiteralGate
+        new(n, nothing, 0)
+    end
+end
+
+"""
+A probabilistic conjunction node (And node)
+"""
+mutable struct Prob⋀Node <: ProbInnerNode
+    origin::LogicCircuit
+    children::Vector{<:ProbCircuit}
+    data
+    counter::UInt32
+    Prob⋀Node(n, children) = begin
+        @assert GateType(n) isa ⋀Gate
+        new(n, convert(Vector{ProbCircuit}, children), nothing, 0)
+    end
+end
+
+"""
+A probabilistic disjunction node (Or node)
+"""
+mutable struct Prob⋁Node <: ProbInnerNode
+    origin::LogicCircuit
+    children::Vector{<:ProbCircuit}
+    log_thetas::Vector{Float64}
+    data
+    counter::UInt32
+    Prob⋁Node(n, children) = begin
+        @assert GateType(n) isa ⋁Gate
+        new(n, convert(Vector{ProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
+    end
+end
+
+#####################
+# traits
+#####################
+
+import LogicCircuits.GateType # make available for extension
+
+@inline GateType(::Type{<:ProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:Prob⋀Node}) = ⋀Gate()
+@inline GateType(::Type{<:Prob⋁Node}) = ⋁Gate()
+
+#####################
+# methods
+#####################
+
+import ..Utils.origin
+@inline origin(c::ProbCircuit) = c.origin
+
+import LogicCircuits: children # make available for extension
+@inline children(n::ProbInnerNode) = n.children
+@inline num_parameters(c::ProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
+
+#####################
+# constructors and conversions
+#####################
+
+function ProbCircuit(circuit::LogicCircuit)::ProbCircuit
+    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = ProbLiteralNode(n)
+    f_a(n, cn) = Prob⋀Node(n, cn)
+    f_o(n, cn) = Prob⋁Node(n, cn)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbCircuit)
+end
+
+# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
+
+
+function check_parameter_integrity(circuit::ProbCircuit)
+    for node in or_nodes(circuit)
+        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
+    end
+    true
+end
\ No newline at end of file
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 6ed05250..af0f8802 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -5,24 +5,25 @@ module ProbabilisticCircuits
 # USE EXTERNAL MODULES
 
 using Reexport
+using LogicCircuits
 
 include("Utils/Utils.jl")
-
 @reexport using .Utils
 
+
 # INCLUDE CHILD MODULES
 include("Probabilistic/Probabilistic.jl")
-include("Logistic/Logistic.jl")
-include("IO/IO.jl")
-include("StructureLearner/StructureLearner.jl")
-include("Reasoning/Reasoning.jl")
+# include("Logistic/Logistic.jl")
+include("LoadSave/LoadSave.jl")
+# include("StructureLearner/StructureLearner.jl")
+# include("Reasoning/Reasoning.jl")
 
 
 # USE CHILD MODULES (in order to re-export some functions)
 @reexport using .Probabilistic
-@reexport using .Logistic
-@reexport using .IO
-@reexport using .StructureLearner
-@reexport using .Reasoning
+# @reexport using .Logistic
+@reexport using .LoadSave
+# @reexport using .StructureLearner
+# @reexport using .Reasoning
 
 end
diff --git a/src/Utils/Utils.jl b/src/Utils/Utils.jl
index d863c9bc..24729879 100644
--- a/src/Utils/Utils.jl
+++ b/src/Utils/Utils.jl
@@ -1,74 +1,10 @@
 """
-Module with general utilities and missing standard library features that could be useful in any Julia project
+Module with general utilities and missing standard library features 
+that could be useful in any Julia project
 """
 module Utils
 
-export to_long_mi,
-    generate_all, generate_data_all
-
-
-###################
-# Misc.
-####################
-
-
-function to_long_mi(m::Matrix{Float64}, min_int, max_int)::Matrix{Int64}
-    δmi = maximum(m) - minimum(m)
-    δint = max_int - min_int
-    return @. round(Int64, m * δint / δmi + min_int)
-end
-
-###################
-# One-Hot Encoding
-####################
-"""
-One-hot encode data (2-D Array) based on categories (1-D Array)
-Each row of the return value is a concatenation of one-hot encoding of elements of the same row in data
-Assumption: both input arrays have elements of same type
-"""
-function one_hot_encode(X::Array{T, 2}, categories::Array{T,1}) where {T<:Any}
-    X_dash = zeros(Bool, size(X)[1], length(categories)*size(X)[2])
-    for i = 1:size(X)[1], j = 1:size(X)[2]
-            X_dash[i, (j-1)*length(categories) + findfirst(==(X[i,j]), categories)] = 1
-    end  
-    X_dash
-end
-
-###################
-# Testing Utils
-####################
-
-"""
-Given some missing values generates all possible fillings
-"""
-function generate_all(row::Array{Int8})
-    miss_count = count(row .== -1)
-    lits = length(row)
-    result = Bool.(zeros(1 << miss_count, lits))
-
-    if miss_count == 0
-        result[1, :] = copy(row)
-    else
-        for mask = 0: (1<<miss_count) - 1
-            cur = copy(row)
-            cur[row .== -1] = transpose(parse.(Bool, split(bitstring(mask)[end-miss_count+1:end], "")))
-            result[mask+1,:] = cur
-        end
-    end
-    result
-end
-
-"""
-Generates all possible binary configurations of size N
-"""
-function generate_data_all(N::Int)
-    data_all = transpose(parse.(Bool, split(bitstring(0)[end-N+1:end], "")));
-    for mask = 1: (1<<N) - 1
-        data_all = vcat(data_all,
-            transpose(parse.(Bool, split(bitstring(mask)[end-N+1:end], "")))
-        );
-    end
-    data_all
-end
+include("misc.jl")
+include("decorators.jl")
 
 end #module
diff --git a/src/Utils/decorators.jl b/src/Utils/decorators.jl
new file mode 100644
index 00000000..27c0ec68
--- /dev/null
+++ b/src/Utils/decorators.jl
@@ -0,0 +1,65 @@
+export DecoratorCircuit, literal, origin, and_nodes, or_nodes, ⋀_nodes, ⋁_nodes,
+GateType, NodeType, variable, ispositive, isnegative, origin
+
+using LogicCircuits
+
+"Root of the decorator circuit node hierarchy"
+abstract type DecoratorCircuit <: Dag end
+
+#####################
+# functions that need to be implemented for each type of decorator circuit
+#####################
+"""
+Get the origin node/circuit in a given decorator node/circuit
+"""
+function origin end
+
+#####################
+# Abstract infrastructure for decorator circuit nodes
+#####################
+
+import LogicCircuits: GateType, NodeType
+
+"Get the gate type trait of the given `DecoratorCircuit`"
+@inline GateType(instance::DecoratorCircuit) = GateType(typeof(instance))
+
+"Map gate type traits to graph node traits"
+@inline NodeType(::Type{N}) where {N<:DecoratorCircuit} = NodeType(GateType(N))
+
+#####################
+# node functions
+#####################
+
+import LogicCircuits: literal, and_nodes, or_nodes, ⋀_nodes, ⋁_nodes
+
+"Get the logical literal in a given node"
+literal(n::DecoratorCircuit)::Lit = literal(origin(n))
+
+"Get the list of conjunction nodes in a given circuit"
+⋀_nodes(c::DecoratorCircuit) = filter(is⋀gate, c)
+
+"Get the list of And nodes in a given circuit"
+@inline and_nodes(c::DecoratorCircuit) = ⋀_nodes(c)
+
+"Get the list of disjunction nodes in a given circuit"
+⋁_nodes(c::DecoratorCircuit) = filter(is⋁gate, c)
+
+"Get the list of or nodes in a given circuit"
+@inline or_nodes(c::DecoratorCircuit) = ⋁_nodes(c)
+
+#####################
+# derived node functions
+#####################
+
+import LogicCircuits: variable, ispositive, isnegative
+
+"Get the logical variable in a given literal leaf node"
+@inline variable(n::DecoratorCircuit)::Var = variable(GateType(n), origin(n))
+
+"Get the sign of the literal leaf node"
+@inline ispositive(n::DecoratorCircuit)::Bool = ispositive(GateType(n), origin(n))
+@inline isnegative(n::DecoratorCircuit)::Bool = !ispositive(n)
+
+# TODO
+# istrue
+# isfalse
\ No newline at end of file
diff --git a/src/Utils/misc.jl b/src/Utils/misc.jl
new file mode 100644
index 00000000..7b1c39f7
--- /dev/null
+++ b/src/Utils/misc.jl
@@ -0,0 +1,67 @@
+export to_long_mi,
+    generate_all, generate_data_all
+
+
+###################
+# Misc.
+####################
+
+
+function to_long_mi(m::Matrix{Float64}, min_int, max_int)::Matrix{Int64}
+    δmi = maximum(m) - minimum(m)
+    δint = max_int - min_int
+    return @. round(Int64, m * δint / δmi + min_int)
+end
+
+###################
+# One-Hot Encoding
+####################
+"""
+One-hot encode data (2-D Array) based on categories (1-D Array)
+Each row of the return value is a concatenation of one-hot encoding of elements of the same row in data
+Assumption: both input arrays have elements of same type
+"""
+function one_hot_encode(X::Array{T, 2}, categories::Array{T,1}) where {T<:Any}
+    X_dash = zeros(Bool, size(X)[1], length(categories)*size(X)[2])
+    for i = 1:size(X)[1], j = 1:size(X)[2]
+            X_dash[i, (j-1)*length(categories) + findfirst(==(X[i,j]), categories)] = 1
+    end  
+    X_dash
+end
+
+###################
+# Testing Utils
+####################
+
+"""
+Given some missing values generates all possible fillings
+"""
+function generate_all(row::Array{Int8})
+    miss_count = count(row .== -1)
+    lits = length(row)
+    result = Bool.(zeros(1 << miss_count, lits))
+
+    if miss_count == 0
+        result[1, :] = copy(row)
+    else
+        for mask = 0: (1<<miss_count) - 1
+            cur = copy(row)
+            cur[row .== -1] = transpose(parse.(Bool, split(bitstring(mask)[end-miss_count+1:end], "")))
+            result[mask+1,:] = cur
+        end
+    end
+    result
+end
+
+"""
+Generates all possible binary configurations of size N
+"""
+function generate_data_all(N::Int)
+    data_all = transpose(parse.(Bool, split(bitstring(0)[end-N+1:end], "")));
+    for mask = 1: (1<<N) - 1
+        data_all = vcat(data_all,
+            transpose(parse.(Bool, split(bitstring(mask)[end-N+1:end], "")))
+        );
+    end
+    data_all
+end
diff --git a/test/IO/PSDDParserTest.jl b/test/LoadSave/circuit_loaders_tests.jl
similarity index 61%
rename from test/IO/PSDDParserTest.jl
rename to test/LoadSave/circuit_loaders_tests.jl
index d880024a..0ad98a0f 100644
--- a/test/IO/PSDDParserTest.jl
+++ b/test/LoadSave/circuit_loaders_tests.jl
@@ -5,25 +5,27 @@ using ProbabilisticCircuits
 @testset "Load a small PSDD and test methods" begin
    file = zoo_psdd_file("little_4var.psdd")
    prob_circuit = load_prob_circuit(file);
-   @test prob_circuit isa ProbΔ
+   @test prob_circuit isa ProbCircuit
 
    # Testing number of nodes and parameters
    @test  9 == num_parameters(prob_circuit)
-   @test 20 == size(prob_circuit)[1]
+   @test 20 == num_nodes(prob_circuit)
    
    # Testing Read Parameters
    EPS = 1e-7
-   @test abs(prob_circuit[13].log_thetas[1] - (-1.6094379124341003)) < EPS
-   @test abs(prob_circuit[13].log_thetas[2] - (-1.2039728043259361)) < EPS
-   @test abs(prob_circuit[13].log_thetas[3] - (-0.916290731874155)) < EPS
-   @test abs(prob_circuit[13].log_thetas[4] - (-2.3025850929940455)) < EPS
+   or1 = prob_circuit.children[1].children[2]
+   @test abs(or1.log_thetas[1] - (-1.6094379124341003)) < EPS
+   @test abs(or1.log_thetas[2] - (-1.2039728043259361)) < EPS
+   @test abs(or1.log_thetas[3] - (-0.916290731874155)) < EPS
+   @test abs(or1.log_thetas[4] - (-2.3025850929940455)) < EPS
 
-   @test abs(prob_circuit[18].log_thetas[1] - (-2.3025850929940455)) < EPS
-   @test abs(prob_circuit[18].log_thetas[2] - (-2.3025850929940455)) < EPS
-   @test abs(prob_circuit[18].log_thetas[3] - (-2.3025850929940455)) < EPS
-   @test abs(prob_circuit[18].log_thetas[4] - (-0.35667494393873245)) < EPS
+   or2 = prob_circuit.children[1].children[1]
+   @test abs(or2.log_thetas[1] - (-2.3025850929940455)) < EPS
+   @test abs(or2.log_thetas[2] - (-2.3025850929940455)) < EPS
+   @test abs(or2.log_thetas[3] - (-2.3025850929940455)) < EPS
+   @test abs(or2.log_thetas[4] - (-0.35667494393873245)) < EPS
 
-   @test abs(prob_circuit[20].log_thetas[1] - (0.0)) < EPS
+   @test abs(prob_circuit.log_thetas[1] - (0.0)) < EPS
 end
 
 psdd_files = ["little_4var.psdd", "msnbc-yitao-a.psdd", "msnbc-yitao-b.psdd", "msnbc-yitao-c.psdd", "msnbc-yitao-d.psdd", "msnbc-yitao-e.psdd", "mnist-antonio.psdd"]
diff --git a/test/IO/CircuitSaverTest.jl b/test/LoadSave/circuit_savers_test.jl
similarity index 78%
rename from test/IO/CircuitSaverTest.jl
rename to test/LoadSave/circuit_savers_test.jl
index 7ce513e5..286cfba0 100644
--- a/test/IO/CircuitSaverTest.jl
+++ b/test/LoadSave/circuit_savers_test.jl
@@ -10,12 +10,12 @@ using ProbabilisticCircuits
 
         # load, save, and load as .psdd
         save_circuit("$tmp/temp.psdd", circuit, vtree)
-        save(vtree, "$tmp/temp.vtree");
+        save_vtree(vtree, "$tmp/temp.vtree");
         load_struct_prob_circuit("$tmp/temp.psdd", "$tmp/temp.vtree")
         
         # save and load as .sdd
-        save_circuit("$tmp/temp.sdd", circuit, vtree)
-        save(vtree, "$tmp/temp.vtree")
+        save_circuit("$tmp/temp.sdd", origin(circuit), vtree)
+        save_vtree(vtree, "$tmp/temp.vtree")
 
     end
     
diff --git a/test/Probabilistic/prob_nodes_tests.jl b/test/Probabilistic/prob_nodes_tests.jl
new file mode 100644
index 00000000..1d9c83fa
--- /dev/null
+++ b/test/Probabilistic/prob_nodes_tests.jl
@@ -0,0 +1,37 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+include("../helper/plain_logic_circuits.jl")
+
+@testset "probabilistic circuit nodes" begin
+    c1 = little_3var()
+    p1 = ProbCircuit(c1)
+    lit3 = children(p1)[1].children[1]
+    @test isempty(intersect(linearize(ProbCircuit(c1)), linearize(ProbCircuit(c1))))
+    
+    # traits
+    @test p1 isa ProbCircuit
+    @test p1 isa Prob⋁Node
+    @test children(p1)[1] isa Prob⋀Node
+    @test lit3 isa ProbLiteralNode
+    @test GateType(p1) isa ⋁Gate
+    @test GateType(children(p1)[1]) isa ⋀Gate
+    @test GateType(lit3) isa LiteralGate
+
+    # methods
+    @test origin(p1) === c1
+    @test all(origin.(children(p1)) .=== c1.children)
+    @test num_parameters(p1) == 10
+
+    # extension methods
+    @test literal(lit3) === literal(children(c1)[1].children[1])
+    @test all(origin.(and_nodes(p1)) .=== and_nodes(c1))
+    @test all(origin.(or_nodes(p1)) .=== or_nodes(c1))
+    @test variable(left_most_descendent(p1)) == Var(3)
+    @test ispositive(left_most_descendent(p1))
+    @test !isnegative(left_most_descendent(p1))
+    @test num_nodes(p1) == 15
+    @test num_edges(p1) == 18
+
+end
\ No newline at end of file
diff --git a/test/Probabilistic/CircuitQueriesTest.jl b/test/Probabilistic/queries_tests.jl
similarity index 96%
rename from test/Probabilistic/CircuitQueriesTest.jl
rename to test/Probabilistic/queries_tests.jl
index 4b1bd1f4..40d16d06 100644
--- a/test/Probabilistic/CircuitQueriesTest.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -8,7 +8,8 @@ using ProbabilisticCircuits
     # match with python. Also tests all probabilities sum up to 1.
 
     EPS = 1e-7;
-    prob_circuit = zoo_psdd("little_4var.psdd");
+    # prob_circuit = zoo_psdd("little_4var.psdd");
+    prob_circuit = load_logic_circuit(zoo_lc_file("little_4var.circuit"))
     @test prob_circuit isa Vector{<:ProbNode};
 
     flow_circuit = FlowΔ(prob_circuit, 16, Bool)
@@ -16,7 +17,7 @@ using ProbabilisticCircuits
 
 
     # Step 1. Check Probabilities for 3 samples
-    data = XData(Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]));
+    data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
     true_prob = [0.07; 0.03; 0.13999999999999999]
 
     calc_prob = log_likelihood_per_instance(flow_circuit, data)
diff --git a/test/helper/plain_logic_circuits.jl b/test/helper/plain_logic_circuits.jl
new file mode 100644
index 00000000..f2a66f95
--- /dev/null
+++ b/test/helper/plain_logic_circuits.jl
@@ -0,0 +1,68 @@
+function little_2var()
+    v = Var(2)
+    pos = compile(PlainLogicCircuit, var2lit(v))
+    neg = compile(PlainLogicCircuit, -var2lit(v))
+    or1 = pos | neg
+    or2 = pos | neg
+
+    v = Var(1)
+    pos = compile(PlainLogicCircuit, var2lit(v))
+    neg = compile(PlainLogicCircuit, -var2lit(v))
+    
+    and1 = pos & or1
+    and2 = neg & or2
+    and1 | and2
+end
+
+function little_3var()
+    or1 = little_2var()
+    v = Var(3)
+
+    pos = compile(PlainLogicCircuit,  var2lit(v))
+    neg = compile(PlainLogicCircuit, -var2lit(v))
+    
+    or2 = disjoin(children(or1))
+    
+    and1 = pos & or1
+    and2 = neg & or2
+    and1 | and2
+end
+
+function little_3var_constants()
+    or1 = little_2var()
+    v = Var(3)
+
+    t = compile(PlainLogicCircuit, true)
+    f = compile(PlainLogicCircuit, false)
+
+    pos = compile(PlainLogicCircuit,  var2lit(v)) & t
+    neg = compile(PlainLogicCircuit, -var2lit(v)) & f
+    
+    or2 = disjoin(children(or1))
+    
+    and1 = pos & or1
+    and2 = neg & or2
+    and1 | and2
+end
+
+function little_4var()
+    ors = map(1:4) do v
+        v = Var(v)
+        pos = compile(PlainLogicCircuit, var2lit(v))
+        neg = compile(PlainLogicCircuit, - var2lit(v))
+        or = pos | neg
+    end
+    and1 = ors[1] & ors[2]
+    and2 = ors[3] & ors[4]
+    or = and1 | and2
+end
+
+function little_5var()
+    c_4var = little_4var()
+    v = Var(5)
+    pos = compile(PlainLogicCircuit, var2lit(v))
+    neg = compile(PlainLogicCircuit, - var2lit(v))
+    or = pos | neg
+    and = c_4var & or
+    Plain⋁Node([and])
+end

From 722cf214c387dfe1e1872af7180e98085aa6d394 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Thu, 23 Jul 2020 15:58:06 -0700
Subject: [PATCH 007/131] logistic node methods

---
 src/LoadSave/LoadSave.jl              |   2 +-
 src/LoadSave/circuit_line_compiler.jl | 100 ++++++++----------
 src/LoadSave/circuit_loaders.jl       |  29 +++--
 src/LoadSave/circuit_savers.jl        |  37 +++----
 src/Logistic/Logistic.jl              |  19 +---
 src/Logistic/LogisticCircuits.jl      | 139 ------------------------
 src/Logistic/logistic_nodes.jl        | 146 ++++++++++++++++++++++++++
 src/Probabilistic/prob_nodes.jl       |   4 +-
 src/ProbabilisticCircuits.jl          |   4 +-
 src/Reasoning/ExpFlowCircuits.jl      |  14 +--
 src/Reasoning/Expectation.jl          |  28 ++---
 src/Utils/decorators.jl               |   7 +-
 test/Logistic/LogisticCircuitTest.jl  |  46 --------
 test/Logistic/logistic_tests.jl       |  46 ++++++++
 14 files changed, 308 insertions(+), 313 deletions(-)
 delete mode 100644 src/Logistic/LogisticCircuits.jl
 create mode 100644 src/Logistic/logistic_nodes.jl
 delete mode 100644 test/Logistic/LogisticCircuitTest.jl
 create mode 100644 test/Logistic/logistic_tests.jl

diff --git a/src/LoadSave/LoadSave.jl b/src/LoadSave/LoadSave.jl
index defd7f35..e5b72dee 100644
--- a/src/LoadSave/LoadSave.jl
+++ b/src/LoadSave/LoadSave.jl
@@ -3,7 +3,7 @@ module LoadSave
 using LogicCircuits
 using ..Utils
 using ..Probabilistic
-# using ..Logistic
+using ..Logistic
 
 include("circuit_line_compiler.jl")
 include("circuit_loaders.jl")
diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index 3e148c23..b20b6fde 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -20,12 +20,11 @@ end
 """
 Compile lines into a logistic circuit.
 """
-# TODO
-# function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticΔ
-#     # first compile a logical circuit
-#     logic_circuit, id2lognode = compile_smooth_logical_m(lines)
-#     decorate_logistic(lines, logic_circuit, classes, id2lognode)
-# end
+function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticCircuit
+    # first compile a logical circuit
+    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
+    decorate_logistic(lines, logic_circuit, classes, id2lognode)
+end
 
 """
 Compile circuit and vtree lines into a structured probabilistic circuit (one whose logical circuit origin is structured).
@@ -37,7 +36,6 @@ function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::Vtr
 end
 
 function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, id2lognode::Dict{ID,<:LogicCircuit})::ProbCircuit
-    
     # set up cache mapping logical circuit nodes to their probabilistic decorator
     prob_circuit = ProbCircuit(logic_circuit)
     lognode2probnode = Dict{LogicCircuit, ProbCircuit}()
@@ -71,51 +69,45 @@ function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, i
     root
 end
 
-# TODO
-# function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicΔ, 
-#                             classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticΔ
+function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicCircuit,
+                            classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticCircuit
                         
-#     # set up cache mapping logical circuit nodes to their logistic decorator
-#     log2logistic = LogisticCache()
-#     # build a corresponding probabilistic circuit
-#     logistic_circuit = LogisticΔ(logic_circuit, classes, log2logistic)
-#     # map from line node ids to probabilistic circuit nodes
-#     id2logisticnode(id) = log2logistic[id2lognode[id]]
-
-#     # go through lines again and update the probabilistic circuit node parameters
-
-#     function compile(ln::CircuitFormatLine)
-#         error("Compilation of line $ln into logistic circuit is not supported")
-#     end
-#     function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
-#         # do nothing
-#     end
-
-#     function compile(ln::CircuitHeaderLine)
-#         # do nothing
-#     end
-
-#     function compile(ln::WeightedLiteralLine)
-#         node = id2logisticnode(ln.node_id)::Logistic⋁
-#         node.thetas[1, :] .= ln.weights
-#     end
-
-#     function compile(ln::DecisionLine{<:LCElement})
-#         node = id2logisticnode(ln.node_id)::Logistic⋁
-#         for (ind, elem) in enumerate(ln.elements)
-#             node.thetas[ind, :] .= elem.weights
-#         end
-#     end
-
-#     function compile(ln::BiasLine)
-#         node = id2logisticnode(ln.node_id)::Logistic⋁
-#         # @assert length(node.thetas) == 1
-#         node.thetas[1,:] .= ln.weights
-#     end
-
-#     for ln in lines
-#         compile(ln)
-#     end
-
-#     logistic_circuit
-# end
\ No newline at end of file
+    # set up cache mapping logical circuit nodes to their logistic decorator
+    logistic_circuit = LogisticCircuit(logic_circuit, classes)
+    log2logistic = Dict{LogicCircuit, LogisticCircuit}()
+    foreach(ln -> (log2logistic[origin(ln)] = ln), logistic_circuit) 
+    id2logisticnode(id) = log2logistic[id2lognode[id]]
+
+    root = nothing
+    # go through lines again and update the probabilistic circuit node parameters
+
+    function compile(ln::CircuitFormatLine)
+        error("Compilation of line $ln into logistic circuit is not supported")
+    end
+
+    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
+        # do nothing
+    end
+
+    function compile(ln::WeightedLiteralLine)
+        root = id2logisticnode(ln.node_id)::Logistic⋁Node
+        root.thetas[1, :] .= ln.weights
+    end
+
+    function compile(ln::DecisionLine{<:LCElement})
+        root = id2logisticnode(ln.node_id)::Logistic⋁Node
+        for (ind, elem) in enumerate(ln.elements)
+            root.thetas[ind, :] .= elem.weights
+        end
+    end
+
+    function compile(ln::BiasLine)
+        root = id2logisticnode(ln.node_id)::Logistic⋁Node
+        # @assert length(node.thetas) == 1
+        root.thetas[1,:] .= ln.weights
+    end
+
+    foreach(compile, lines)
+
+    root
+end
\ No newline at end of file
diff --git a/src/LoadSave/circuit_loaders.jl b/src/LoadSave/circuit_loaders.jl
index b7ec85a1..90f1237b 100644
--- a/src/LoadSave/circuit_loaders.jl
+++ b/src/LoadSave/circuit_loaders.jl
@@ -1,5 +1,5 @@
 export zoo_clt, zoo_clt_file, zoo_psdd, zoo_lc, zoo_lc_file,
-    load_prob_circuit, load_struct_prob_circuit
+    load_prob_circuit, load_struct_prob_circuit, load_logistic_circuit
 
 using LogicCircuits
 using Pkg.Artifacts
@@ -9,9 +9,11 @@ using LogicCircuits.LoadSave: parse_psdd_file, parse_circuit_file, parse_vtree_f
 # circuit loaders from module zoo
 #####################
 
-# TODO
-# zoo_lc(name, num_classes) = 
-#     load_logistic_circuit(zoo_lc_file(name), num_classes)
+zoo_lc_file(name) = 
+    artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/lcs/$name"
+
+zoo_lc(name, num_classes) = 
+    load_logistic_circuit(zoo_lc_file(name), num_classes)
 
 zoo_clt_file(name) = 
     artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/clts/$name"
@@ -56,13 +58,18 @@ function load_struct_prob_circuit(circuit_file::String, vtree_file::String)::Tup
     compile_struct_prob(circuit_lines, vtree_lines)
 end
 
-# TODO
-# function load_logistic_circuit(circuit_file::String, classes::Int)::LogisticΔ
-#     @assert endswith(circuit_file,".circuit")
-#     circuit_lines = parse_circuit_file(circuit_file)
-#     compile_logistic(circuit_lines, classes)
-# end
-
+"""
+Load a logistic circuit from file.
+Support circuit file formats:
+    * ".circuit" for logistic files
+Supported vtree file formats:
+    * ".vtree" for Vtree files
+"""
+function load_logistic_circuit(circuit_file::String, classes::Int)::LogisticCircuit
+    @assert endswith(circuit_file,".circuit")
+    circuit_lines = parse_circuit_file(circuit_file)
+    compile_logistic(circuit_lines, classes)
+end
 
 #####################
 # parse based on file extension
diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 2ca61d00..3177920b 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -1,4 +1,4 @@
-export save_circuit, save_as_dot, save_as_psdd
+export save_circuit, save_as_dot, save_as_psdd, save_as_logistic
 
 using LogicCircuits.LoadSave: SDDElement, 
     PSDDElement, 
@@ -40,7 +40,7 @@ end
 
 import LogicCircuits.LoadSave: get_node2id
 
-function get_node2id(circuit::ProbCircuit, T::Type) 
+function get_node2id(circuit::DecoratorCircuit, T::Type) 
     node2id = Dict{T, ID}()
     outnodes = filter(n -> !is⋀gate(n), circuit)
     sizehint!(node2id, length(outnodes))
@@ -109,19 +109,21 @@ function lc_header()
     c"""
 end
     
-# function save_lc_file(name::String, ln::LogisticΔ, vtree)
-#     @assert ln[end].origin isa StructLogicCircuit "LC should decorate on StructLogicΔ"
-#     @assert endswith(name, ".circuit")
-#     node2id = get_node2id(ln, ProbNode)
-#     vtree2id = get_vtree2id(vtree)
-#     formatlines = Vector{CircuitFormatLine}()
-#     append!(formatlines, parse_lc_file(IOBuffer(lc_header())))
-#     push!(formatlines, LcHeaderLine())
-#     for n in filter(n -> !(GateType(n) isa ⋀Gate), ln)
-#         push!(formatlines, decompile(n, node2id, vtree2id))
-#     end
-#     save_lines(name, formatlines)
-# end
+function save_as_logistic(name::String, circuit::LogisticCircuit, vtree)
+    @assert circuit.origin isa StructLogicCircuit "LC should decorate on StructLogicΔ"
+    @assert endswith(name, ".circuit")
+    node2id = get_node2id(circuit, LogisticCircuit)
+    vtree2id = get_vtree2id(vtree)
+    formatlines = Vector{CircuitFormatLine}()
+    append!(formatlines, parse_lc_file(IOBuffer(lc_header())))
+    push!(formatlines, LcHeaderLine())
+    for n in filter(n -> !is⋀gate(n), circuit)
+        push!(formatlines, decompile(n, node2id, vtree2id))
+    end
+    save_lines(name, formatlines)
+end
+
+# TODO add Decompile for logistic circuit
 
 import LogicCircuits.LoadSave: save_circuit, save_as_dot # make available for extension
 
@@ -129,9 +131,8 @@ import LogicCircuits.LoadSave: save_circuit, save_as_dot # make available for ex
 save_circuit(name::String, circuit::ProbCircuit, vtree::PlainVtree) =
     save_as_psdd(name, circuit, vtree)
 
-# TODO
-# save_circuit(name::String, circuit::LogicCircuit) =
-#     save_as_psdd(name, circuit, vtree)
+save_circuit(name::String, circuit::LogicCircuit, vtree::PlainVtree) =
+    save_as_logistic(name, circuit, vtree)
 
 using Printf: @sprintf
 "Save prob circuits to .dot file"
diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index e5871408..1923d8ea 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -3,23 +3,6 @@ module Logistic
 using LogicCircuits
 using ..Utils
 
-export 
-    LogisticNode, 
-    LogisticLeafNode, 
-    LogisticInnerNode, 
-    LogisticLiteral,
-    Logistic⋀,
-    Logistic⋁,
-    LogisticΔ,
-    LogisticΔ,
-    LogisticCache,
-    num_parameters_perclass,
-    logistic_origin,
-    class_conditional_likelihood_per_instance,
-    classes
-
-
-
-include("LogisticCircuits.jl")
+include("logistic_nodes.jl")
 
 end
\ No newline at end of file
diff --git a/src/Logistic/LogisticCircuits.jl b/src/Logistic/LogisticCircuits.jl
deleted file mode 100644
index 98239895..00000000
--- a/src/Logistic/LogisticCircuits.jl
+++ /dev/null
@@ -1,139 +0,0 @@
-#######################
-## Logistic Circuits
-#######################
-
-
-abstract type LogisticNode{O} <: DecoratorNode{O} end
-abstract type LogisticLeafNode{O} <: LogisticNode{O} end
-abstract type LogisticInnerNode{O} <: LogisticNode{O} end
-
-struct LogisticLiteral{O} <: LogisticLeafNode{O}
-    origin::O
-end
-
-struct Logistic⋀{O} <: LogisticInnerNode{O}
-    origin::O
-    children::Vector{<:LogisticNode{<:O}}
-end
-
-mutable struct Logistic⋁{O} <: LogisticInnerNode{O}
-    origin::O
-    children::Vector{<:LogisticNode{<:O}}
-    thetas::Array{Float64, 2}
-end
-
-
-
-const LogisticΔ{O} = AbstractVector{<:LogisticNode{O}}
-
-#####################
-# traits
-#####################
-
-import LogicCircuits.GateType # make available for extension
-
-@inline GateType(::Type{<:LogisticLiteral}) = LiteralGate()
-@inline GateType(::Type{<:Logistic⋀}) = ⋀Gate()
-@inline GateType(::Type{<:Logistic⋁}) = ⋁Gate()
-
-
-
-#####################
-# constructors and conversions
-#####################
-
-function Logistic⋁(::Type{O}, origin, children, classes::Int) where {O}
-    Logistic⋁{O}(origin, children, Array{Float64, 2}(undef, (length(children), classes)))
-end
-
-
-const LogisticCache = Dict{Node, LogisticNode}
-
-function LogisticΔ(circuit::Δ, classes::Int, cache::LogisticCache = LogisticCache())
-
-    sizehint!(cache, length(circuit)*4÷3)
-    
-    O = grapheltype(circuit) # type of node in the origin
-
-    pc_node(::LiteralGate, n::LogicCircuit) = LogisticLiteral{O}(n)
-    pc_node(::ConstantGate, n::LogicCircuit) = error("Cannot construct a logistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-
-    pc_node(::⋀Gate, n::LogicCircuit) = begin
-        children = map(c -> cache[c], n.children)
-        Logistic⋀{O}(n, children)
-    end
-
-    pc_node(::⋁Gate, n::LogicCircuit) = begin
-        children = map(c -> cache[c], n.children)
-        Logistic⋁(O, n, children, classes)
-    end
-        
-    map(circuit) do node
-        pcn = pc_node(GateType(node), node)
-        cache[node] = pcn
-        pcn
-    end
-end
-
-
-#####################
-# methods
-#####################
-
-import LogicCircuits: literal, children # make available for extension
-
-@inline literal(n::LogisticLiteral)::Lit  = literal(n.origin)
-@inline children(n::LogisticInnerNode) = n.children
-@inline classes(n::Logistic⋁) = size(n.thetas)[2]
-
-num_parameters(n::Logistic⋁) = num_children(n) * classes(n)
-num_parameters(c::LogisticΔ) = sum(n -> num_parameters(n), ⋁_nodes(c))
-
-num_parameters_perclass(n::Logistic⋁) = num_children(n)
-num_parameters_perclass(c::LogisticΔ) = sum(n -> num_parameters_perclass(n), ⋁_nodes(c))
-
-"Return the first origin that is a Logistic circuit node"
-logistic_origin(n::DecoratorNode)::LogisticNode = origin(n,LogisticNode)
-
-"Return the first origin that is a Logistic circuit"
-logistic_origin(c::DecoratorΔ)::LogisticΔ = origin(c, LogisticNode)
-
-
-# TODO Learning
-
-
-
-# Class Conditional Probability
-function class_conditional_likelihood_per_instance(fc::FlowΔ, 
-                                                    classes::Int, 
-                                                    batch::PlainXData{Bool})
-    lc = origin(origin(fc))
-    @assert(lc isa LogisticΔ)
-    pass_up_down(fc, batch)
-    likelihoods = zeros(num_examples(batch), classes)
-    for n in fc
-        orig = logistic_origin(n)
-        if orig isa Logistic⋁
-            # For each class. orig.thetas is 2D so used eachcol
-            for (idx, thetaC) in enumerate(eachcol(orig.thetas))
-                foreach(n.children, thetaC) do c, theta
-                    likelihoods[:, idx] .+= prod_fast(downflow(n), pr_factors(origin(c))) .* theta
-                end
-            end
-        end
-    end
-    likelihoods
-end
-
-"""
-Calculate conditional log likelihood for a batch of samples with evidence P(c | x).
-(Also returns the generated FlowΔ)
-"""
-function class_conditional_likelihood_per_instance(lc::LogisticΔ, 
-                                                    classes::Int, 
-                                                    batch::PlainXData{Bool})
-    opts = (max_factors = 2, compact⋀=false, compact⋁=false)
-    fc = FlowΔ(lc, num_examples(batch), Float64, opts)
-    (fc, class_conditional_likelihood_per_instance(fc, classes, batch))
-end
-
diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
new file mode 100644
index 00000000..b0cd6ba7
--- /dev/null
+++ b/src/Logistic/logistic_nodes.jl
@@ -0,0 +1,146 @@
+export 
+    LogisticCircuit, 
+    LogisticLeafNode, 
+    LogisticInnerNode, 
+    LogisticLiteral,
+    Logistic⋀Node,
+    Logistic⋁Node,
+    classes,
+    num_parameters_perclass
+    # class_conditional_likelihood_per_instance,
+    
+#####################
+# Infrastructure for logistic circuit nodes
+#####################
+
+"Root of the logistic circuit node hierarchy"
+abstract type LogisticCircuit <: DecoratorCircuit end
+
+"""
+A logistic leaf node
+"""
+abstract type LogisticLeafNode <: LogisticCircuit end
+
+"""
+A logistic inner node
+"""
+abstract type LogisticInnerNode <: LogisticCircuit end
+
+"""
+A logistic literal node
+"""
+mutable struct LogisticLiteral <: LogisticLeafNode
+    origin::LogicCircuit
+    data
+    counter::UInt32
+    LogisticLiteral(n) = begin 
+        @assert GateType(n) isa LiteralGate
+        new(n, nothing, 0)
+    end
+end
+
+"""
+A logistic conjunction node (And node)
+"""
+mutable struct Logistic⋀Node <: LogisticInnerNode
+    origin::LogicCircuit
+    children::Vector{<:LogisticCircuit}
+    data
+    counter::UInt32
+    Logistic⋀Node(n, children) = begin
+        @assert GateType(n) isa ⋀Gate
+        new(n, convert(Vector{LogisticCircuit}, children), nothing, 0)
+    end
+end
+
+"""
+A logistic disjunction node (Or node)
+"""
+mutable struct Logistic⋁Node <: LogisticInnerNode
+    origin::LogicCircuit
+    children::Vector{<:LogisticCircuit}
+    thetas::Array{Float64, 2}
+    data
+    counter::UInt32
+    Logistic⋁Node(n, children, class::Int) = begin
+        @assert GateType(n) isa ⋁Gate
+        new(n, convert(Vector{LogisticCircuit}, children), init_array(Float64, length(children), class), nothing, 0)
+    end
+end
+
+#####################
+# traits
+#####################
+
+import LogicCircuits.GateType # make available for extension
+
+@inline GateType(::Type{<:LogisticLiteral}) = LiteralGate()
+@inline GateType(::Type{<:Logistic⋀Node}) = ⋀Gate()
+@inline GateType(::Type{<:Logistic⋁Node}) = ⋁Gate()
+
+#####################
+# methods
+#####################
+
+import ..Utils: origin, num_parameters
+@inline origin(c::LogisticCircuit) = c.origin
+@inline num_parameters(c::LogisticCircuit) = sum(n -> num_children(n) * classes(n), ⋁_nodes(c))
+
+import LogicCircuits: children # make available for extension
+@inline children(n::LogisticInnerNode) = n.children
+@inline classes(n::Logistic⋁Node) = size(n.thetas)[2]
+
+@inline num_parameters_perclass(c::LogisticCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
+
+#####################
+# constructors and conversions
+#####################
+
+function LogisticCircuit(circuit::LogicCircuit, classes::Int)
+    f_con(n) = error("Cannot construct a logistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = LogisticLiteral(n)
+    f_a(n, cn) = Logistic⋀Node(n, cn)
+    f_o(n, cn) = Logistic⋁Node(n, cn, classes)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, LogisticCircuit)
+
+end
+
+#####################
+# methods
+#####################
+# TODO Learning
+# TODO queries
+# Class Conditional Probability
+# function class_conditional_likelihood_per_instance(fc::FlowΔ, 
+#                                                     classes::Int, 
+#                                                     batch::PlainXData{Bool})
+#     lc = origin(origin(fc))
+#     @assert(lc isa LogisticΔ)
+#     pass_up_down(fc, batch)
+#     likelihoods = zeros(num_examples(batch), classes)
+#     for n in fc
+#         orig = logistic_origin(n)
+#         if orig isa Logistic⋀Node
+#             # For each class. orig.thetas is 2D so used eachcol
+#             for (idx, thetaC) in enumerate(eachcol(orig.thetas))
+#                 foreach(n.children, thetaC) do c, theta
+#                     likelihoods[:, idx] .+= prod_fast(downflow(n), pr_factors(origin(c))) .* theta
+#                 end
+#             end
+#         end
+#     end
+#     likelihoods
+# end
+
+# """
+# Calculate conditional log likelihood for a batch of samples with evidence P(c | x).
+# (Also returns the generated FlowΔ)
+# """
+# function class_conditional_likelihood_per_instance(lc::LogisticΔ, 
+#                                                     classes::Int, 
+#                                                     batch::PlainXData{Bool})
+#     opts = (max_factors = 2, compact⋀=false, compact⋁=false)
+#     fc = FlowΔ(lc, num_examples(batch), Float64, opts)
+#     (fc, class_conditional_likelihood_per_instance(fc, classes, batch))
+# end
+
diff --git a/src/Probabilistic/prob_nodes.jl b/src/Probabilistic/prob_nodes.jl
index 886323c2..2bf43383 100644
--- a/src/Probabilistic/prob_nodes.jl
+++ b/src/Probabilistic/prob_nodes.jl
@@ -1,5 +1,5 @@
 export ProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
-Prob⋁Node, num_parameters, check_parameter_integrity
+Prob⋁Node, check_parameter_integrity
 
 #####################
 # Infrastructure for probabilistic circuit nodes
@@ -74,7 +74,7 @@ import LogicCircuits.GateType # make available for extension
 # methods
 #####################
 
-import ..Utils.origin
+import ..Utils: origin, num_parameters
 @inline origin(c::ProbCircuit) = c.origin
 
 import LogicCircuits: children # make available for extension
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index af0f8802..dea10633 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -13,7 +13,7 @@ include("Utils/Utils.jl")
 
 # INCLUDE CHILD MODULES
 include("Probabilistic/Probabilistic.jl")
-# include("Logistic/Logistic.jl")
+include("Logistic/Logistic.jl")
 include("LoadSave/LoadSave.jl")
 # include("StructureLearner/StructureLearner.jl")
 # include("Reasoning/Reasoning.jl")
@@ -21,7 +21,7 @@ include("LoadSave/LoadSave.jl")
 
 # USE CHILD MODULES (in order to re-export some functions)
 @reexport using .Probabilistic
-# @reexport using .Logistic
+@reexport using .Logistic
 @reexport using .LoadSave
 # @reexport using .StructureLearner
 # @reexport using .Reasoning
diff --git a/src/Reasoning/ExpFlowCircuits.jl b/src/Reasoning/ExpFlowCircuits.jl
index 8c3011ea..314423b7 100644
--- a/src/Reasoning/ExpFlowCircuits.jl
+++ b/src/Reasoning/ExpFlowCircuits.jl
@@ -41,7 +41,7 @@ function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) wher
     sizehint!(cache, (length(pc) + length(lc))*4÷3)
     expFlowCircuit = Vector{ExpFlowNode}()
 
-    function ExpflowTraverse(n::Prob⋁, m::Logistic⋁) 
+    function ExpflowTraverse(n::Prob⋁, m::Logistic⋀Node) 
         get!(cache, Pair(n, m)) do
             children = [ ExpflowTraverse(i, j) for i in n.children for j in m.children]
             node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
@@ -49,7 +49,7 @@ function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) wher
             return node
         end
     end
-    function ExpflowTraverse(n::Prob⋀, m::Logistic⋀) 
+    function ExpflowTraverse(n::Prob⋀, m::Logistic⋀Node) 
         get!(cache, Pair(n, m)) do
             children = [ ExpflowTraverse(z[1], z[2]) for z in zip(n.children, m.children) ]
             node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
@@ -57,7 +57,7 @@ function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) wher
             return node
         end
     end
-    function ExpflowTraverse(n::ProbLiteral, m::Logistic⋁) 
+    function ExpflowTraverse(n::ProbLiteral, m::Logistic⋀Node) 
         get!(cache, Pair(n, m)) do
             children = Vector{ExpFlowNode{pc_type,lc_type, F}}() # TODO
             node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
@@ -99,7 +99,7 @@ function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <:
     pType = typeof(node.p_origin)
     fType = typeof(node.f_origin)
 
-    if node.p_origin isa Prob⋁ && node.f_origin isa Logistic⋁
+    if node.p_origin isa Prob⋁ && node.f_origin isa Logistic⋀Node
         #todo this ordering might be different than the ExpFlowNode children
         pthetas = [exp(node.p_origin.log_thetas[i])
                     for i in 1:length(node.p_origin.children) for j in 1:length(node.f_origin.children)]
@@ -113,13 +113,13 @@ function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <:
             node.fg .+= (pthetas[z] .* fthetas[z]) .* node.children[z].f
             node.fg .+= pthetas[z] .* node.children[z].fg
         end
-    elseif node.p_origin isa Prob⋀ && node.f_origin isa Logistic⋀
+    elseif node.p_origin isa Prob⋀ && node.f_origin isa Logistic⋀Node
         node.f .= node.children[1].f .* node.children[2].f # assume 2 children
         node.fg .= (node.children[1].f .* node.children[2].fg) .+
                    (node.children[2].f .* node.children[1].fg)
 
     elseif node.p_origin isa ProbLiteral 
-        if node.f_origin isa Logistic⋁
+        if node.f_origin isa Logistic⋀Node
             m = node.f_origin.children[1]
         elseif node.f_origin isa LogisticLiteral
             m = node.f_origin
@@ -139,7 +139,7 @@ function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <:
             node.f .= 0.0
         end
 
-        if node.f_origin isa Logistic⋁
+        if node.f_origin isa Logistic⋀Node
             node.fg .= node.f .* transpose(node.f_origin.thetas)
         else
             node.fg .= 0.0
diff --git a/src/Reasoning/Expectation.jl b/src/Reasoning/Expectation.jl
index 43a410b6..f1246a58 100644
--- a/src/Reasoning/Expectation.jl
+++ b/src/Reasoning/Expectation.jl
@@ -92,7 +92,7 @@ end
 # exp_f (pr-constraint) is originally from:
 #   Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
 
-function exp_f(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
         pthetas = [exp(n.log_thetas[i]) for i in 1:length(n.children)]
@@ -105,7 +105,7 @@ function exp_f(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, cache::Union{Expec
     end
 end
 
-function exp_f(n::Prob⋀, m::Logistic⋀, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = ones(1 , num_examples(data) )
         @fastmath for (i,j) in zip(n.children, m.children)
@@ -136,9 +136,9 @@ end
 end
 
 """
-Has to be a Logistic⋁ with only one child, which is a leaf node 
+Has to be a Logistic⋀Node with only one child, which is a leaf node 
 """
-@inline function exp_f(n::ProbLiteral, m::Logistic⋁, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
+@inline function exp_f(n::ProbLiteral, m::Logistic⋀Node, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         exp_f(n, m.children[1], data, cache)
     end
@@ -148,11 +148,11 @@ end
 ######## exp_g, exp_fg
 ########################################################################
 
-@inline function exp_g(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, cache::ExpectationCache)
+@inline function exp_g(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
     exp_fg(n, m, data, cache) # exp_fg and exp_g are the same for OR nodes
 end
 
-# function exp_g(n::Prob⋀, m::Logistic⋀, data::XData{Int8}, cache::ExpectationCache)
+# function exp_g(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
 #     value = zeros(classes(m) , num_examples(data))
 #     @fastmath for (i,j) in zip(n.children, m.children)
 #         value .+= exp_fg(i, j, data, cache)
@@ -162,7 +162,7 @@ end
 # end
 
 
-function exp_fg(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, cache::ExpectationCache)
+function exp_fg(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         value = zeros(classes(m) , num_examples(data) )
         pthetas = [exp(n.log_thetas[i]) for i in 1:length(n.children)]
@@ -176,7 +176,7 @@ function exp_fg(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, cache::Expectatio
     end
 end
 
-function exp_fg(n::Prob⋀, m::Logistic⋀, data::XData{Int8}, cache::ExpectationCache)
+function exp_fg(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         # Assuming 2 children
         value = exp_f(n.children[1], m.children[1], data, cache) .* exp_fg(n.children[2], m.children[2], data, cache)
@@ -187,9 +187,9 @@ end
 
 
 """
-Has to be a Logistic⋁ with only one child, which is a leaf node 
+Has to be a Logistic⋀Node with only one child, which is a leaf node 
 """
-@inline function exp_fg(n::ProbLiteral, m::Logistic⋁, data::XData{Int8}, cache::ExpectationCache)
+@inline function exp_fg(n::ProbLiteral, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         m.thetas[1,:] .* exp_f(n, m, data, cache)
     end
@@ -204,7 +204,7 @@ end
 ######## moment_g, moment_fg
 ########################################################################
 
-@inline function moment_g(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, moment::Int, cache::MomentCache)
+@inline function moment_g(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         moment_fg(n, m, data, moment, cache)
     end
@@ -213,7 +213,7 @@ end
 """
 Calculating  E[g^k * f]
 """
-function moment_fg(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, moment::Int, cache::MomentCache)
+function moment_fg(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
@@ -232,7 +232,7 @@ function moment_fg(n::Prob⋁, m::Logistic⋁, data::XData{Int8}, moment::Int, c
     end
 end
 
-@inline function moment_fg(n::ProbLiteral, m::Logistic⋁, data::XData{Int8}, moment::Int, cache::MomentCache)
+@inline function moment_fg(n::ProbLiteral, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         m.thetas[1,:].^(moment) .* exp_f(n, m, data, cache)
     end
@@ -247,7 +247,7 @@ end
     end
 end
 
-function moment_fg(n::Prob⋀, m::Logistic⋀, data::XData{Int8}, moment::Int, cache::MomentCache)
+function moment_fg(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
diff --git a/src/Utils/decorators.jl b/src/Utils/decorators.jl
index 27c0ec68..38097da4 100644
--- a/src/Utils/decorators.jl
+++ b/src/Utils/decorators.jl
@@ -1,5 +1,5 @@
 export DecoratorCircuit, literal, origin, and_nodes, or_nodes, ⋀_nodes, ⋁_nodes,
-GateType, NodeType, variable, ispositive, isnegative, origin
+GateType, NodeType, variable, ispositive, isnegative, origin, num_parameters
 
 using LogicCircuits
 
@@ -14,6 +14,11 @@ Get the origin node/circuit in a given decorator node/circuit
 """
 function origin end
 
+"""
+Get the number of parameters of a given decorator node/circuit
+"""
+function num_parameters end
+
 #####################
 # Abstract infrastructure for decorator circuit nodes
 #####################
diff --git a/test/Logistic/LogisticCircuitTest.jl b/test/Logistic/LogisticCircuitTest.jl
deleted file mode 100644
index 7802c012..00000000
--- a/test/Logistic/LogisticCircuitTest.jl
+++ /dev/null
@@ -1,46 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-# This tests are supposed to test queries on the circuits
-@testset "Logistic Circuit Class Conditional" begin
-    # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
-    # match with python version.
-
-    EPS = 1e-7;
-    my_opts = (max_factors= 2,
-            compact⋀=false,
-            compact⋁=false)
-        
-    logistic_circuit = zoo_lc("little_4var.circuit", 2);
-    @test logistic_circuit isa Vector{<:LogisticNode};
-
-    flow_circuit = FlowΔ(logistic_circuit, 16, Float64, my_opts)
-    @test flow_circuit isa Vector{<:FlowNode};
-
-    # Step 1. Check Probabilities for 3 samples
-    data = XData(Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]));
-    
-    true_prob = [3.43147972 4.66740416; 
-                4.27595352 2.83503504;
-                3.67415087 4.93793472]
-            
-    CLASSES = 2
-    calc_prob = class_conditional_likelihood_per_instance(flow_circuit, CLASSES, data)
-    
-    for i = 1:3
-        for j = 1:2
-            @test true_prob[i,j] ≈ calc_prob[i,j] atol= EPS;
-        end
-    end
-
-    # 2. Testing different API
-    fc2, calc_prob2 = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
-    for i = 1:3
-        for j = 1:2
-            @test true_prob[i,j] ≈ calc_prob2[i,j] atol= EPS;
-        end
-    end
-
-
-end
\ No newline at end of file
diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
new file mode 100644
index 00000000..4337e0c5
--- /dev/null
+++ b/test/Logistic/logistic_tests.jl
@@ -0,0 +1,46 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+# This tests are supposed to test queries on the circuits
+@testset "Logistic Circuit Class Conditional" begin
+    # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
+    # match with python version.
+
+    EPS = 1e-7;
+    my_opts = (max_factors= 2,
+            compact⋀=false,
+            compact⋁=false)
+        
+    logistic_circuit = zoo_lc("little_4var.circuit", 2);
+    @test logistic_circuit isa LogisticCircuit;
+
+    # flow_circuit = FlowΔ(logistic_circuit, 16, Float64, my_opts)
+    # @test flow_circuit isa Vector{<:FlowNode};
+
+    # Step 1. Check Probabilities for 3 samples
+    data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
+    
+    true_prob = [3.43147972 4.66740416; 
+                4.27595352 2.83503504;
+                3.67415087 4.93793472]
+            
+    CLASSES = 2
+    # calc_prob = class_conditional_likelihood_per_instance(flow_circuit, CLASSES, data)
+    
+    # for i = 1:3
+    #     for j = 1:2
+    #         @test true_prob[i,j] ≈ calc_prob[i,j] atol= EPS;
+    #     end
+    # end
+
+    # # 2. Testing different API
+    # fc2, calc_prob2 = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    # for i = 1:3
+    #     for j = 1:2
+    #         @test true_prob[i,j] ≈ calc_prob2[i,j] atol= EPS;
+    #     end
+    # end
+
+
+end
\ No newline at end of file

From 55ff3254d20617c5babc318868ca97f3c7bf5547 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Thu, 23 Jul 2020 16:03:30 -0700
Subject: [PATCH 008/131] mv files

---
 src/LoadSave/circuit_savers.jl                |  2 +-
 src/Logistic/Logistic.jl                      |  1 +
 src/Logistic/logistic_nodes.jl                | 40 -------------------
 src/Logistic/queries.jl                       | 35 ++++++++++++++++
 src/Probabilistic/{ => deprecated}/Bagging.jl |  0
 .../{ => deprecated}/Clustering.jl            |  0
 .../MutualInformation.jl                      |  0
 7 files changed, 37 insertions(+), 41 deletions(-)
 create mode 100644 src/Logistic/queries.jl
 rename src/Probabilistic/{ => deprecated}/Bagging.jl (100%)
 rename src/Probabilistic/{ => deprecated}/Clustering.jl (100%)
 rename src/{Probabilistic => Utils}/MutualInformation.jl (100%)

diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 3177920b..22acd3a6 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -10,7 +10,7 @@ using LogicCircuits.LoadSave: SDDElement,
     get_nodes_level
 
 #####################
-# decompile for nodes
+# decompile for probabilistic nodes
 #####################
 
 "Decompile for psdd circuit, used during saving of circuits to file" 
diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index 1923d8ea..c6a73c93 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -4,5 +4,6 @@ using LogicCircuits
 using ..Utils
 
 include("logistic_nodes.jl")
+include("queries.jl")
 
 end
\ No newline at end of file
diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index b0cd6ba7..9b7a364a 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -104,43 +104,3 @@ function LogisticCircuit(circuit::LogicCircuit, classes::Int)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, LogisticCircuit)
 
 end
-
-#####################
-# methods
-#####################
-# TODO Learning
-# TODO queries
-# Class Conditional Probability
-# function class_conditional_likelihood_per_instance(fc::FlowΔ, 
-#                                                     classes::Int, 
-#                                                     batch::PlainXData{Bool})
-#     lc = origin(origin(fc))
-#     @assert(lc isa LogisticΔ)
-#     pass_up_down(fc, batch)
-#     likelihoods = zeros(num_examples(batch), classes)
-#     for n in fc
-#         orig = logistic_origin(n)
-#         if orig isa Logistic⋀Node
-#             # For each class. orig.thetas is 2D so used eachcol
-#             for (idx, thetaC) in enumerate(eachcol(orig.thetas))
-#                 foreach(n.children, thetaC) do c, theta
-#                     likelihoods[:, idx] .+= prod_fast(downflow(n), pr_factors(origin(c))) .* theta
-#                 end
-#             end
-#         end
-#     end
-#     likelihoods
-# end
-
-# """
-# Calculate conditional log likelihood for a batch of samples with evidence P(c | x).
-# (Also returns the generated FlowΔ)
-# """
-# function class_conditional_likelihood_per_instance(lc::LogisticΔ, 
-#                                                     classes::Int, 
-#                                                     batch::PlainXData{Bool})
-#     opts = (max_factors = 2, compact⋀=false, compact⋁=false)
-#     fc = FlowΔ(lc, num_examples(batch), Float64, opts)
-#     (fc, class_conditional_likelihood_per_instance(fc, classes, batch))
-# end
-
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
new file mode 100644
index 00000000..9865be43
--- /dev/null
+++ b/src/Logistic/queries.jl
@@ -0,0 +1,35 @@
+# export class_conditional_likelihood_per_instance
+# # Class Conditional Probability
+# function class_conditional_likelihood_per_instance(fc::FlowΔ, 
+#                                                     classes::Int, 
+#                                                     batch::PlainXData{Bool})
+#     lc = origin(origin(fc))
+#     @assert(lc isa LogisticΔ)
+#     pass_up_down(fc, batch)
+#     likelihoods = zeros(num_examples(batch), classes)
+#     for n in fc
+#         orig = logistic_origin(n)
+#         if orig isa Logistic⋀Node
+#             # For each class. orig.thetas is 2D so used eachcol
+#             for (idx, thetaC) in enumerate(eachcol(orig.thetas))
+#                 foreach(n.children, thetaC) do c, theta
+#                     likelihoods[:, idx] .+= prod_fast(downflow(n), pr_factors(origin(c))) .* theta
+#                 end
+#             end
+#         end
+#     end
+#     likelihoods
+# end
+
+# """
+# Calculate conditional log likelihood for a batch of samples with evidence P(c | x).
+# (Also returns the generated FlowΔ)
+# """
+# function class_conditional_likelihood_per_instance(lc::LogisticΔ, 
+#                                                     classes::Int, 
+#                                                     batch::PlainXData{Bool})
+#     opts = (max_factors = 2, compact⋀=false, compact⋁=false)
+#     fc = FlowΔ(lc, num_examples(batch), Float64, opts)
+#     (fc, class_conditional_likelihood_per_instance(fc, classes, batch))
+# end
+
diff --git a/src/Probabilistic/Bagging.jl b/src/Probabilistic/deprecated/Bagging.jl
similarity index 100%
rename from src/Probabilistic/Bagging.jl
rename to src/Probabilistic/deprecated/Bagging.jl
diff --git a/src/Probabilistic/Clustering.jl b/src/Probabilistic/deprecated/Clustering.jl
similarity index 100%
rename from src/Probabilistic/Clustering.jl
rename to src/Probabilistic/deprecated/Clustering.jl
diff --git a/src/Probabilistic/MutualInformation.jl b/src/Utils/MutualInformation.jl
similarity index 100%
rename from src/Probabilistic/MutualInformation.jl
rename to src/Utils/MutualInformation.jl

From ca922c7e7a5ec4792f9a84781e2a2cac0894fd41 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Thu, 23 Jul 2020 16:17:07 -0700
Subject: [PATCH 009/131] todo

---
 src/Probabilistic/{ => todo}/EMLearner.jl        | 0
 src/Probabilistic/{ => todo}/Mixtures.jl         | 0
 src/Probabilistic/{ => todo}/ProbFlowCircuits.jl | 0
 src/Probabilistic/{ => todo}/VtreeLearner.jl     | 0
 src/Probabilistic/{ => todo}/flows.jl            | 0
 src/Probabilistic/{ => todo}/kld.jl              | 0
 src/Probabilistic/{ => todo}/parameters.jl       | 0
 7 files changed, 0 insertions(+), 0 deletions(-)
 rename src/Probabilistic/{ => todo}/EMLearner.jl (100%)
 rename src/Probabilistic/{ => todo}/Mixtures.jl (100%)
 rename src/Probabilistic/{ => todo}/ProbFlowCircuits.jl (100%)
 rename src/Probabilistic/{ => todo}/VtreeLearner.jl (100%)
 rename src/Probabilistic/{ => todo}/flows.jl (100%)
 rename src/Probabilistic/{ => todo}/kld.jl (100%)
 rename src/Probabilistic/{ => todo}/parameters.jl (100%)

diff --git a/src/Probabilistic/EMLearner.jl b/src/Probabilistic/todo/EMLearner.jl
similarity index 100%
rename from src/Probabilistic/EMLearner.jl
rename to src/Probabilistic/todo/EMLearner.jl
diff --git a/src/Probabilistic/Mixtures.jl b/src/Probabilistic/todo/Mixtures.jl
similarity index 100%
rename from src/Probabilistic/Mixtures.jl
rename to src/Probabilistic/todo/Mixtures.jl
diff --git a/src/Probabilistic/ProbFlowCircuits.jl b/src/Probabilistic/todo/ProbFlowCircuits.jl
similarity index 100%
rename from src/Probabilistic/ProbFlowCircuits.jl
rename to src/Probabilistic/todo/ProbFlowCircuits.jl
diff --git a/src/Probabilistic/VtreeLearner.jl b/src/Probabilistic/todo/VtreeLearner.jl
similarity index 100%
rename from src/Probabilistic/VtreeLearner.jl
rename to src/Probabilistic/todo/VtreeLearner.jl
diff --git a/src/Probabilistic/flows.jl b/src/Probabilistic/todo/flows.jl
similarity index 100%
rename from src/Probabilistic/flows.jl
rename to src/Probabilistic/todo/flows.jl
diff --git a/src/Probabilistic/kld.jl b/src/Probabilistic/todo/kld.jl
similarity index 100%
rename from src/Probabilistic/kld.jl
rename to src/Probabilistic/todo/kld.jl
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/todo/parameters.jl
similarity index 100%
rename from src/Probabilistic/parameters.jl
rename to src/Probabilistic/todo/parameters.jl

From 9e77d6cfc6ebcb53af5ed5045ab189ad92e9d180 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Thu, 23 Jul 2020 17:28:32 -0700
Subject: [PATCH 010/131] EVI

---
 src/Probabilistic/Probabilistic.jl  |   3 +-
 src/Probabilistic/Queries.jl        | 110 +++++++++-------------------
 test/Probabilistic/queries_tests.jl |  20 ++---
 3 files changed, 47 insertions(+), 86 deletions(-)

diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index d67d1493..1082b4d8 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -47,12 +47,13 @@ pr_constraint, psdd_entropy, psdd_kl_divergence
 
 # include("Clustering.jl")
 include("prob_nodes.jl")
+include("queries.jl")
 # include("ProbFlowCircuits.jl")
 # include("MutualInformation.jl")
 # include("Mixtures.jl")
 # include("Bagging.jl")
 # include("EMLearner.jl")
 # include("VtreeLearner.jl")
-# include("Queries.jl")
+
 
 end
diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index 47cc1d30..e5691b8a 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -1,91 +1,51 @@
-export log_prob
+export EVI, log_proba, log_likelihood_per_instance
 
-function log_likelihood_per_instance(pc::ProbCircuit, data::DataFrame)
-end
-function log_likelihood_per_instance2(pc::ProbΔ, data::XData{Bool})
-    Logic.pass_up_down2(pc, data)
-    log_likelihood_per_instance_cached(pc, data)
+using DataFrames
+using LogicCircuits: UpDownFlow, UpDownFlow2
+
+"""
+Get the edge flow from logic circuit
+"""
+# TODO move to LogicCircuits
+@inline isfactorized(n) = n.data::UpDownFlow isa UpDownFlow2
+function get_edge_flow(n, c)::BitVector
+    @assert !is⋁gate(c) && is⋁gate(n)
+    df = copy(n.data.downflow)
+    if isfactorized(c)
+        return df .&= c.data.prime_flow .& c.data.sub_flow
+    else
+        return df .&= c.data.downflow
+    end
 end
 
-function log_likelihood_per_instance_cached(pc::ProbΔ, data::XData{Bool})
-    log_likelihoods = zeros(num_examples(data))
+"""
+Complete evidence queries
+"""
+function log_likelihood_per_instance(pc::ProbCircuit, data::Union{DataFrame, AbstractMatrix})
+    @assert isbinarydata(data) "Can only calculate EVI on Bool data"
+    
+    compute_flows(origin(pc), data)
+    log_likelihoods = zeros(Float64, num_examples(data))
     indices = init_array(Bool, num_examples(data))::BitVector
-    for n in pc
-         if n isa Prob⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
-            foreach(n.children, n.log_thetas) do c, log_theta
-                indices = n.data[1] .& c.data[1]
+    
+    ll(n::ProbCircuit) = ()
+    ll(n::Prob⋁Node) = begin
+        if num_children(n) != 1 # other nodes have no effect on likelihood
+            foreach(children(origin(n)), n.log_thetas) do c, log_theta
+                indices = get_edge_flow(origin(n), c)
                 view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
             end
          end
     end
-    log_likelihoods
-end
-
-# compute log likelihood
-function compute_log_likelihood(pc::ProbΔ, data::XBatches{Bool})
-    compute_log_likelihood(AggregateFlowΔ(pc, aggr_weight_type(data)))
-end
 
-# compute log likelihood, reusing AggregateFlowΔ but ignoring its current aggregate values
-function compute_log_likelihood(afc::AggregateFlowΔ, data::XBatches{Bool})
-    @assert feature_type(data) == Bool "Can only test probabilistic circuits on Bool data"
-    collect_aggr_flows(afc, data)
-    ll = log_likelihood(afc)
-    (afc, ll)
-end
-
-# return likelihoods given current aggregate flows.
-function log_likelihood(afc::AggregateFlowΔ)
-    sum(n -> log_likelihood(n), afc)
+    foreach(ll, pc)
+    log_likelihoods
 end
 
-log_likelihood(::AggregateFlowNode) = 0.0
-log_likelihood(n::AggregateFlow⋁) = sum(n.origin.log_thetas .* n.aggr_flow_children)
+EVI = log_proba = log_likelihood_per_instance
 
 """
-Calculates log likelihood for a batch of fully observed samples.
-(Also retures the generated FlowΔ)
+Complete evidence queries
 """
-function log_likelihood_per_instance(pc::ProbΔ, batch::PlainXData{Bool})
-    fc = FlowΔ(pc, num_examples(batch), Bool)
-    (fc, log_likelihood_per_instance(fc, batch))
-end
 
-function log_proba(pc::ProbΔ, batch::PlainXData{Bool})
-    log_likelihood_per_instance(pc, batch)[2]
-end
-
-function log_proba(pc::ProbΔ, batch::PlainXData{Int8})
-    marginal_log_likelihood_per_instance(pc, batch)[2]
-end
-
-"""
-Calculate log likelihood per instance for batches of samples.
-"""
-function log_likelihood_per_instance(pc::ProbΔ, batches::XBatches{Bool})::Vector{Float64}
-    mapreduce(b -> log_likelihood_per_instance(pc, b)[2], vcat, batches)
-end
 
-"""
-Calculate log likelihood for a batch of fully observed samples.
-(This is for when you already have a FlowΔ)
-"""
-function log_likelihood_per_instance(fc::FlowΔ, batch::PlainXData{Bool})
-    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
-    pass_up_down(fc, batch)
-    log_likelihoods = zeros(num_examples(batch))
-    indices = init_array(Bool, flow_length(fc))::BitVector
-    for n in fc
-         if n isa DownFlow⋁ && num_children(n) != 1 # other nodes have no effect on likelihood
-            origin = prob_origin(n)::Prob⋁
-            foreach(n.children, origin.log_thetas) do c, log_theta
-                #  be careful here to allow for the Boolean multiplication to be done using & before switching to float arithmetic, or risk losing a lot of runtime!
-                # log_likelihoods .+= prod_fast(downflow(n), pr_factors(c)) .* log_theta
-                assign_prod(indices, downflow(n), pr_factors(c))
-                view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
-                # TODO put the lines above in Utils in order to ensure we have specialized types
-            end
-         end
-    end
-    log_likelihoods
-end
\ No newline at end of file
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index 40d16d06..3b45f6a4 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -8,19 +8,14 @@ using ProbabilisticCircuits
     # match with python. Also tests all probabilities sum up to 1.
 
     EPS = 1e-7;
-    # prob_circuit = zoo_psdd("little_4var.psdd");
-    prob_circuit = load_logic_circuit(zoo_lc_file("little_4var.circuit"))
-    @test prob_circuit isa Vector{<:ProbNode};
-
-    flow_circuit = FlowΔ(prob_circuit, 16, Bool)
-    @test flow_circuit isa Vector{<:FlowNode};
-
+    prob_circuit = zoo_psdd("little_4var.psdd");
+    @test prob_circuit isa ProbCircuit;
 
     # Step 1. Check Probabilities for 3 samples
     data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
     true_prob = [0.07; 0.03; 0.13999999999999999]
 
-    calc_prob = log_likelihood_per_instance(flow_circuit, data)
+    calc_prob = log_likelihood_per_instance(prob_circuit, data)
     calc_prob = exp.(calc_prob)
 
     for i = 1:3
@@ -29,9 +24,9 @@ using ProbabilisticCircuits
 
     # Step 2. Add up all probabilities and see if they add up to one
     N = 4;
-    data_all = XData(generate_data_all(N))
+    data_all = generate_data_all(N)
 
-    calc_prob_all = log_likelihood_per_instance(flow_circuit, data_all)
+    calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all)
     calc_prob_all = exp.(calc_prob_all)
     sum_prob_all = sum(calc_prob_all)
 
@@ -161,3 +156,8 @@ end
 
     test_mpe_brute_force(prob_circuit, evidence)
 end
+
+
+@testset "EVI" begin
+    pc = zoo_psdd("nltcs.psdd")
+end

From e759aa763344a16dcb0e49832de976ec2749f139 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Thu, 23 Jul 2020 21:46:26 -0700
Subject: [PATCH 011/131] MAR

---
 src/Probabilistic/Probabilistic.jl         |  1 +
 src/Probabilistic/Queries.jl               | 17 +++-
 src/Probabilistic/flows.jl                 | 99 ++++++++++++++++++++++
 src/Probabilistic/todo/ProbFlowCircuits.jl | 49 -----------
 src/Probabilistic/todo/flows.jl            |  0
 test/Probabilistic/queries_tests.jl        | 16 +---
 6 files changed, 116 insertions(+), 66 deletions(-)
 create mode 100644 src/Probabilistic/flows.jl
 delete mode 100644 src/Probabilistic/todo/flows.jl

diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index 1082b4d8..81773590 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -47,6 +47,7 @@ pr_constraint, psdd_entropy, psdd_kl_divergence
 
 # include("Clustering.jl")
 include("prob_nodes.jl")
+include("flows.jl")
 include("queries.jl")
 # include("ProbFlowCircuits.jl")
 # include("MutualInformation.jl")
diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index e5691b8a..0a102ec5 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -1,4 +1,5 @@
-export EVI, log_proba, log_likelihood_per_instance
+export EVI, log_proba, log_likelihood_per_instance,
+MAR, marginal_log_likelihood_per_instance
 
 using DataFrames
 using LogicCircuits: UpDownFlow, UpDownFlow2
@@ -18,10 +19,15 @@ function get_edge_flow(n, c)::BitVector
     end
 end
 
+"""
+Data 
+"""
+const Data = Union{DataFrame, AbstractMatrix}
+
 """
 Complete evidence queries
 """
-function log_likelihood_per_instance(pc::ProbCircuit, data::Union{DataFrame, AbstractMatrix})
+function log_likelihood_per_instance(pc::ProbCircuit, data::Data)
     @assert isbinarydata(data) "Can only calculate EVI on Bool data"
     
     compute_flows(origin(pc), data)
@@ -45,7 +51,12 @@ end
 EVI = log_proba = log_likelihood_per_instance
 
 """
-Complete evidence queries
+marginal queries
 """
+function marginal_log_likelihood_per_instance(pc::ProbCircuit, data)
+    evaluate(pc, data)
+end
+MAR = marginal_log_likelihood_per_instance
+
 
 
diff --git a/src/Probabilistic/flows.jl b/src/Probabilistic/flows.jl
new file mode 100644
index 00000000..a880fcc9
--- /dev/null
+++ b/src/Probabilistic/flows.jl
@@ -0,0 +1,99 @@
+import LogicCircuits: evaluate
+using StatsFuns: logsumexp
+
+# evaluate a circuit as a function
+function (root::ProbCircuit)(data)
+    evaluate(root, data)
+end
+
+"Container for circuit flows represented as a float vector"
+const UpFlow1 = Vector{Float64}
+
+
+"Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
+struct UpFlow2
+    prime_flow::Vector{Float64}
+    sub_flow::Vector{Float64}
+end
+
+const UpFlow = Union{UpFlow1,UpFlow2}
+
+@inline UpFlow(elems::UpFlow1) = elems
+
+@inline UpFlow(elems::UpFlow2) =
+    elems.prime_flow .+ elems.sub_flow
+
+import Base.length
+length(elems::UpFlow2) = length(UpFlow(elems))
+
+function evaluate(root::ProbCircuit, data;
+                   nload = nload, nsave = nsave, reset=true)::Vector{Float64}
+    n_ex::Int = num_examples(data)
+    ϵ = 1e-300
+
+    @inline f_lit(n) = begin
+        uf = convert(Vector{Int8}, feature_values(data, variable(n)))
+        if ispositive(origin(n))
+            uf[uf.==-1] .= 1
+        else
+            uf .= 1 .- uf
+            uf[uf.==2] .= 1
+        end
+        uf = convert(Vector{Float64}, uf)
+        uf .= log.(uf .+ ϵ)
+    end
+    
+    @inline f_con(n) = begin
+        uf = istrue(origin(n)) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
+        uf .= log.(uf .+ ϵ)
+    end
+    
+    @inline fa(n, call) = begin
+        if num_children(n) == 1
+            return UpFlow1(call(@inbounds children(n)[1]))
+        else
+            c1 = call(@inbounds children(n)[1])::UpFlow
+            c2 = call(@inbounds children(n)[2])::UpFlow
+            if num_children(n) == 2 && c1 isa UpFlow1 && c2 isa UpFlow1 
+                UpFlow2(c1, c2) # no need to allocate a new BitVector
+            end
+            x = flowop(c1, c2, +)
+            for c in children(n)[3:end]
+                accumulate(x, call(c), +)
+            end
+            return x
+        end
+    end
+    
+    @inline fo(n, call) = begin
+        if num_children(n) == 1
+            return UpFlow1(call(@inbounds children(n)[1]))
+        else
+            log_thetas = n.log_thetas
+            c1 = call(@inbounds children(n)[1])::UpFlow
+            c2 = call(@inbounds children(n)[2])::UpFlow
+            x = flowop(c1, log_thetas[1], c2, log_thetas[2], logsumexp)
+            for (i, c) in enumerate(children(n)[3:end])
+                accumulate(x, call(c), log_thetas[i+2], logsumexp)
+            end
+            return x
+        end
+    end
+    
+    # ensure flow us Flow1 at the root, even when it's a conjunction
+    root_flow = UpFlow1(foldup(root, f_con, f_lit, fa, fo, UpFlow; nload, nsave, reset))
+    return nsave(root, root_flow)
+end
+
+@inline flowop(x::UpFlow, y::UpFlow, op)::UpFlow1 =
+    op.(UpFlow(x), UpFlow(y))
+
+@inline flowop(x::UpFlow, w1::Float64, y::UpFlow, w2::Float64, op)::UpFlow1 =
+    op.(UpFlow(x) .+ w1, UpFlow(y) .+ w2)
+
+import Base.accumulate
+@inline accumulate(x::UpFlow, v::UpFlow, op) = 
+    @inbounds @. x = op($UpFlow(x), $UpFlow(v)); nothing
+
+@inline accumulate(x::UpFlow, v::UpFlow, w::Float64, op) = 
+    @inbounds @. x = op($UpFlow(x), $UpFlow(v) + w); nothing
diff --git a/src/Probabilistic/todo/ProbFlowCircuits.jl b/src/Probabilistic/todo/ProbFlowCircuits.jl
index 00916954..e2c6bbf1 100644
--- a/src/Probabilistic/todo/ProbFlowCircuits.jl
+++ b/src/Probabilistic/todo/ProbFlowCircuits.jl
@@ -1,52 +1,3 @@
-#####################
-
-#TODO This code seems to assume logspace flows as floating point numbers. if so, enforca that on type F
-function marginal_pass_up(circuit::UpFlowΔ{O,F}, data::XData{E}) where {E <: eltype(F)} where {O,F}
-    resize_flows(circuit, num_examples(data))
-    cache = zeros(Float64, num_examples(data)) #TODO: fix type later
-    marginal_pass_up_node(n::UpFlowNode, ::PlainXData) = ()
-
-    function marginal_pass_up_node(n::UpFlowLiteral{O,F}, cache::Array{Float64}, data::PlainXData{E}) where {E <: eltype(F)} where {O,F}
-        pass_up_node(n, data)
-        # now override missing values by 1
-        npr = pr(n)
-        npr[feature_matrix(data)[:,variable(n)] .< zero(eltype(F))] .= 1
-        npr .= log.( npr .+ 1e-300 )
-        return nothing
-    end
-
-    function marginal_pass_up_node(n::UpFlow⋀Cached, cache::Array{Float64}, ::PlainXData)
-        pr(n) .= 0
-        for i=1:length(n.children)
-            # pr(n) .+= pr(n.children[i])
-            broadcast!(+, pr(n), pr(n), pr(n.children[i]))
-        end
-        return nothing
-    end
-
-    function marginal_pass_up_node(n::UpFlow⋁Cached, cache::Array{Float64}, ::PlainXData)
-        pr(n) .= 1e-300
-        for i=1:length(n.children)    
-            cache .= 0
-            # broadcast reduced memory allocation, though accessing prob_origin(n).log_thetas[i] still allocates lots of extra memory, 
-            # it is proabably due to derefrencing the pointer
-            broadcast!(+, cache, pr(n.children[i]), prob_origin(n).log_thetas[i])
-            broadcast!(exp, cache, cache)
-            broadcast!(+, pr(n), pr(n), cache)
-        end
-        broadcast!(log, pr(n), pr(n));
-        return nothing
-    end
-
-    ## Pass Up on every node in order
-    for n in circuit
-        marginal_pass_up_node(n, cache, data)
-    end
-    return nothing
-end
-
-
-
 ##### marginal_pass_down
 
 function marginal_pass_down(circuit::DownFlowΔ{O,F}) where {O,F}
diff --git a/src/Probabilistic/todo/flows.jl b/src/Probabilistic/todo/flows.jl
deleted file mode 100644
index e69de29b..00000000
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index 3b45f6a4..e2d02eb1 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -37,29 +37,17 @@ end
     EPS = 1e-7;
     prob_circuit = zoo_psdd("little_4var.psdd");
 
-    data = XData(
-        Int8.([0 0 0 0; 0 1 1 0; 0 0 1 1;
+    data = Int8.([0 0 0 0; 0 1 1 0; 0 0 1 1;
                 0 0 0 -1; -1 1 0 -1; -1 -1 -1 -1; 0 -1 -1 -1])
-    );
     true_prob = [0.07; 0.03; 0.13999999999999999;
                     0.3499999999999; 0.1; 1.0; 0.8]
 
-    opts = (compact⋀=false, compact⋁=false)
-    flow_circuit = UpFlowΔ(prob_circuit, 16, Float64, opts)
-    calc_prob = marginal_log_likelihood_per_instance(flow_circuit, data)
+    calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data)
     calc_prob = exp.(calc_prob)
 
     for i = 1:length(true_prob)
         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
     end
-
-    # Now trying the other api without instantiating a flow circuit
-    fc2, calc_prob2 = marginal_log_likelihood_per_instance(prob_circuit, data)
-    calc_prob2 = exp.(calc_prob2)
-    for i = 1:length(true_prob)
-        @test true_prob[i] ≈ calc_prob2[i] atol= EPS;
-    end
-
 end
 
 @testset "Marginal Pass Down" begin

From c08297855637b423b6ec678ce2863863c29668c7 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 01:10:58 -0700
Subject: [PATCH 012/131] marginal pass down

---
 src/Probabilistic/Queries.jl               |  29 +--
 src/Probabilistic/flows.jl                 | 195 ++++++++++++++++++---
 src/Probabilistic/todo/ProbFlowCircuits.jl |  56 ------
 test/Probabilistic/queries_tests.jl        |  58 +++---
 4 files changed, 195 insertions(+), 143 deletions(-)
 delete mode 100644 src/Probabilistic/todo/ProbFlowCircuits.jl

diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index 0a102ec5..ed4934d7 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -1,33 +1,10 @@
-export EVI, log_proba, log_likelihood_per_instance,
+export EVI, log_likelihood_per_instance,
 MAR, marginal_log_likelihood_per_instance
 
-using DataFrames
-using LogicCircuits: UpDownFlow, UpDownFlow2
-
-"""
-Get the edge flow from logic circuit
-"""
-# TODO move to LogicCircuits
-@inline isfactorized(n) = n.data::UpDownFlow isa UpDownFlow2
-function get_edge_flow(n, c)::BitVector
-    @assert !is⋁gate(c) && is⋁gate(n)
-    df = copy(n.data.downflow)
-    if isfactorized(c)
-        return df .&= c.data.prime_flow .& c.data.sub_flow
-    else
-        return df .&= c.data.downflow
-    end
-end
-
-"""
-Data 
-"""
-const Data = Union{DataFrame, AbstractMatrix}
-
 """
 Complete evidence queries
 """
-function log_likelihood_per_instance(pc::ProbCircuit, data::Data)
+function log_likelihood_per_instance(pc::ProbCircuit, data)
     @assert isbinarydata(data) "Can only calculate EVI on Bool data"
     
     compute_flows(origin(pc), data)
@@ -38,7 +15,7 @@ function log_likelihood_per_instance(pc::ProbCircuit, data::Data)
     ll(n::Prob⋁Node) = begin
         if num_children(n) != 1 # other nodes have no effect on likelihood
             foreach(children(origin(n)), n.log_thetas) do c, log_theta
-                indices = get_edge_flow(origin(n), c)
+                indices = get_downflow(origin(n), c)
                 view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
             end
          end
diff --git a/src/Probabilistic/flows.jl b/src/Probabilistic/flows.jl
index a880fcc9..e9516572 100644
--- a/src/Probabilistic/flows.jl
+++ b/src/Probabilistic/flows.jl
@@ -1,30 +1,78 @@
-import LogicCircuits: evaluate
+export get_downflow, get_upflow
+
+import LogicCircuits: evaluate, compute_flows
 using StatsFuns: logsumexp
 
+# TODO move to LogicCircuits
+# TODO clean up and better API
+using LogicCircuits: UpFlow, UpFlow1, UpDownFlow, UpDownFlow1, UpDownFlow2
+
+"""
+Get upflow from logic circuit
+"""
+@inline get_upflow(elems::UpDownFlow1) = elems.upflow
+@inline get_upflow(elems::UpDownFlow2) = UpFlow1(elems)
+@inline get_upflow(elems::UpFlow) = UpFlow1(elems)
+@inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
+
+"""
+Get the node/edge flow from logic circuit
+"""
+function get_downflow(n::LogicCircuit; root=nothing)::BitVector
+    downflow(x::UpDownFlow1) = x.downflow
+    downflow(x::UpDownFlow2) = begin
+        ors = or_nodes(root)
+        p = findall(p -> n in children(p), ors)
+        @assert length(p) == 1
+        get_downflow(ors[p[1]], n)
+    end
+    downflow(n.data)
+end
+
+function get_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
+    downflow(x::ExpUpDownFlow1) = x.downflow
+    downflow(x::ExpUpDownFlow2) = begin
+        ors = or_nodes(root)
+        p = findall(p -> n in children(p), ors)
+        @assert length(p) == 1
+        get_downflow(ors[p[1]], n)
+    end
+    downflow(n.data)
+end
+
+@inline isfactorized(n::LogicCircuit) = n.data::UpDownFlow isa UpDownFlow2
+function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
+    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+    df = copy(n.data.downflow)
+    if isfactorized(c)
+        return df .&= c.data.prime_flow .& c.data.sub_flow
+    else
+        return df .&= c.data.downflow
+    end
+end
+
+#####################
+# performance-critical queries related to circuit flows
+#####################
+
 # evaluate a circuit as a function
 function (root::ProbCircuit)(data)
     evaluate(root, data)
 end
 
 "Container for circuit flows represented as a float vector"
-const UpFlow1 = Vector{Float64}
-
+const ExpUpFlow1 = Vector{Float64}
 
 "Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
-struct UpFlow2
+struct ExpUpFlow2
     prime_flow::Vector{Float64}
     sub_flow::Vector{Float64}
 end
 
-const UpFlow = Union{UpFlow1,UpFlow2}
-
-@inline UpFlow(elems::UpFlow1) = elems
-
-@inline UpFlow(elems::UpFlow2) =
-    elems.prime_flow .+ elems.sub_flow
+const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
 
-import Base.length
-length(elems::UpFlow2) = length(UpFlow(elems))
+@inline ExpUpFlow1(elems::ExpUpFlow1) = elems
+@inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
 
 function evaluate(root::ProbCircuit, data;
                    nload = nload, nsave = nsave, reset=true)::Vector{Float64}
@@ -50,12 +98,12 @@ function evaluate(root::ProbCircuit, data;
     
     @inline fa(n, call) = begin
         if num_children(n) == 1
-            return UpFlow1(call(@inbounds children(n)[1]))
+            return ExpUpFlow1(call(@inbounds children(n)[1]))
         else
-            c1 = call(@inbounds children(n)[1])::UpFlow
-            c2 = call(@inbounds children(n)[2])::UpFlow
-            if num_children(n) == 2 && c1 isa UpFlow1 && c2 isa UpFlow1 
-                UpFlow2(c1, c2) # no need to allocate a new BitVector
+            c1 = call(@inbounds children(n)[1])::ExpUpFlow
+            c2 = call(@inbounds children(n)[2])::ExpUpFlow
+            if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
+                return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
             end
             x = flowop(c1, c2, +)
             for c in children(n)[3:end]
@@ -67,11 +115,11 @@ function evaluate(root::ProbCircuit, data;
     
     @inline fo(n, call) = begin
         if num_children(n) == 1
-            return UpFlow1(call(@inbounds children(n)[1]))
+            return ExpUpFlow1(call(@inbounds children(n)[1]))
         else
             log_thetas = n.log_thetas
-            c1 = call(@inbounds children(n)[1])::UpFlow
-            c2 = call(@inbounds children(n)[2])::UpFlow
+            c1 = call(@inbounds children(n)[1])::ExpUpFlow
+            c2 = call(@inbounds children(n)[2])::ExpUpFlow
             x = flowop(c1, log_thetas[1], c2, log_thetas[2], logsumexp)
             for (i, c) in enumerate(children(n)[3:end])
                 accumulate(x, call(c), log_thetas[i+2], logsumexp)
@@ -81,19 +129,108 @@ function evaluate(root::ProbCircuit, data;
     end
     
     # ensure flow us Flow1 at the root, even when it's a conjunction
-    root_flow = UpFlow1(foldup(root, f_con, f_lit, fa, fo, UpFlow; nload, nsave, reset))
+    root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
     return nsave(root, root_flow)
 end
 
-@inline flowop(x::UpFlow, y::UpFlow, op)::UpFlow1 =
-    op.(UpFlow(x), UpFlow(y))
+@inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
+    op.(ExpUpFlow1(x), ExpUpFlow1(y))
 
-@inline flowop(x::UpFlow, w1::Float64, y::UpFlow, w2::Float64, op)::UpFlow1 =
-    op.(UpFlow(x) .+ w1, UpFlow(y) .+ w2)
+@inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
+    op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
 
 import Base.accumulate
-@inline accumulate(x::UpFlow, v::UpFlow, op) = 
-    @inbounds @. x = op($UpFlow(x), $UpFlow(v)); nothing
+@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
+    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
+
+@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
+    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
+
+
+#####################
+# downward pass
+#####################
+
+struct ExpUpDownFlow1
+    upflow::ExpUpFlow1
+    downflow::Vector{Float64}
+    ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
+end
+
+const ExpUpDownFlow2 = ExpUpFlow2
+
+const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
+
+@inline get_upflow(elems::ExpUpDownFlow1) = elems.upflow
+@inline get_upflow(elems::ExpUpDownFlow2) = ExpUpFlow1(elems)
+
+function compute_flows(circuit::ProbCircuit, data)
+
+    # upward pass
+    @inline upflow!(n, v) = begin
+        n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
+        v
+    end
+
+    @inline upflow(n) = begin
+        d = n.data::ExpUpDownFlow
+        (d isa ExpUpDownFlow1) ? d.upflow : d
+    end
+
+    evaluate(circuit, data; nload=upflow, nsave=upflow!, reset=false)
+    
+    # downward pass
+
+    @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
+    @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
+
+    downflow(circuit) .= 0.0
+
+    foreach_down(circuit; setcounter=false) do n
+        if isinner(n) && !isfactorized(n)
+            downflow_n = downflow(n)
+            upflow_n = upflow(n)
+            for ite in 1 : num_children(n)
+                c = children(n)[ite]
+                log_theta = is⋀gate(n) ? 0.0 : n.log_thetas[ite]
+                if isfactorized(c)
+                    upflow2_c = c.data::ExpUpDownFlow2
+                    # propagate one level further down
+                    for i = 1:2
+                        downflow_c = downflow(@inbounds children(c)[i])
+                        downflow_c .= logsumexp.(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow .+ upflow2_c.sub_flow .- upflow_n)
+                    end
+                else
+                    upflow1_c = (c.data::ExpUpDownFlow1).upflow
+                    downflow_c = downflow(c)
+                    downflow_c .= logsumexp.(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n)
+                end
+            end 
+        end
+        nothing
+    end
+    nothing
+end
+
+"""
+Get the node/edge downflow from probabilistic circuit
+"""
+function get_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
+    downflow(x::ExpUpDownFlow1) = x.downflow
+    downflow(x::ExpUpDownFlow2) = begin
+        ors = or_nodes(root)
+        p = findall(p -> n in children(p), ors)
+        @assert length(p) == 1
+        get_downflow(ors[p[1]], n)
+    end
+    downflow(n.data)
+end
+
+function get_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
+    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+    df = copy(get_downflow(n))
+    log_theta = n.log_thetas[findfirst(x -> x == c, children(n))]
+    return df .+ log_theta .+ get_upflow(c.data) .- get_upflow(n.data)
+end
 
-@inline accumulate(x::UpFlow, v::UpFlow, w::Float64, op) = 
-    @inbounds @. x = op($UpFlow(x), $UpFlow(v) + w); nothing
+@inline isfactorized(n::ProbCircuit) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
\ No newline at end of file
diff --git a/src/Probabilistic/todo/ProbFlowCircuits.jl b/src/Probabilistic/todo/ProbFlowCircuits.jl
deleted file mode 100644
index e2c6bbf1..00000000
--- a/src/Probabilistic/todo/ProbFlowCircuits.jl
+++ /dev/null
@@ -1,56 +0,0 @@
-##### marginal_pass_down
-
-function marginal_pass_down(circuit::DownFlowΔ{O,F}) where {O,F}
-    resize_flows(circuit, flow_length(origin(circuit)))
-    for n in circuit
-        reset_downflow_in_progress(n)
-    end
-    for downflow in downflow_sinks(circuit[end])
-        # initialize root flows to 1
-        downflow.downflow .= one(eltype(F))
-    end
-    for n in Iterators.reverse(circuit)
-        marginal_pass_down_node(n)
-    end
-end
-
-marginal_pass_down_node(n::DownFlowNode) = () # do nothing
-marginal_pass_down_node(n::DownFlowLeaf) = ()
-
-function marginal_pass_down_node(n::DownFlow⋀Cached)
-    # todo(pashak) might need some changes, not tested, also to convert to logexpsum later
-     # downflow(n) = EF_n(e), the EF for edges or leaves are note stored
-    for c in n.children
-        for sink in downflow_sinks(c)
-            if !sink.in_progress
-                sink.downflow .= downflow(n)
-                sink.in_progress = true
-            else
-                sink.downflow .+= downflow(n)
-            end
-        end
-    end
-end
-
-function marginal_pass_down_node(n::DownFlow⋁Cached)
-    # todo(pashak) might need some changes, not tested, also to convert to logexpsum later
-    # downflow(n) = EF_n(e), the EF for edges or leaves are note stored
-    for (ind, c) in enumerate(n.children)
-        for sink in downflow_sinks(c)
-            if !sink.in_progress
-                sink.downflow .= downflow(n) .* exp.(prob_origin(n).log_thetas[ind] .+ pr(origin(c)) .- pr(origin(n)) )
-                sink.in_progress = true
-            else
-                sink.downflow .+= downflow(n) .* exp.(prob_origin(n).log_thetas[ind] .+ pr(origin(c)) .- pr(origin(n)))
-            end
-        end
-    end
-end
-
-#### marginal_pass_up_down
-
-function marginal_pass_up_down(circuit::DownFlowΔ{O,F}, data::XData{E}) where {E <: eltype(F)} where {O,F}
-    @assert !(E isa Bool)
-    marginal_pass_up(origin(circuit), data)
-    marginal_pass_down(circuit)
-end
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index e2d02eb1..19ff068e 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -53,57 +53,51 @@ end
 @testset "Marginal Pass Down" begin
     EPS = 1e-7;
     prob_circuit = zoo_psdd("little_4var.psdd");
+    logic_circuit = origin(prob_circuit)
 
     N = 4
-    data_full = XData(Int8.(generate_data_all(N)))
-    opts= (compact⋀=false, compact⋁=false)
-
-    flow_circuit   = FlowΔ(prob_circuit, 16, Float64, opts)
-    flow_circuit_marg = FlowΔ(prob_circuit, 16, Float64, opts)
-
+    data_full = Bool.(generate_data_all(N))
 
     # Comparing with down pass with fully obeserved data
-    pass_up_down(flow_circuit, data_full)
-    marginal_pass_up_down(flow_circuit_marg, data_full)
+    compute_flows(logic_circuit, data_full)
+    compute_flows(prob_circuit, data_full)
 
-    for (ind, node) in enumerate(flow_circuit)
-        if node isa HasDownFlow
-            @test all(  isapprox.(downflow(flow_circuit[ind]), downflow(flow_circuit_marg[ind]), atol = EPS) )
-        end
+    for pn in linearize(prob_circuit)
+        @test all(isapprox.(exp.(get_downflow(pn; root=prob_circuit)), 
+            get_downflow(pn.origin; root=logic_circuit), atol=EPS))
     end
 
-
     # Validating one example with missing features done by hand
-    data_partial = XData(Int8.([-1 1 -1 1]))
-    flow_circuit_part  = FlowΔ(prob_circuit, 16, Float64, opts)
-    ProbabilisticCircuits.marginal_pass_up_down(flow_circuit_part, data_partial)
+    data_partial = Int8.([-1 1 -1 1])
+    prob_circuit = zoo_psdd("little_4var.psdd");
+    compute_flows(prob_circuit, data_partial)
 
     # (node index, correct down_flow_value)
     true_vals = [(1, 0.5),
                 (2, 1.0),
-                (3, 1/3),
-                (4, 1.0),
-                (5, 0.5),
-                (6, 0.0),
-                (7, 2/3),
+                (3, 0.5),
+                (4, 0.0),
+                (5, 0.0),
+                (6, 0.5),
+                (7, 0.5),
                 (8, 0.0),
-                (9, 0.3333333333333),
-                (10, 0.0),
-                (11, 0.6666666666666),
-                (12, 0.0),
-                (13, 1.0),
-                (14, 0.5),
-                (15, 0.0),
-                (16, 0.5),
+                (9, 1.0),
+                (10, 1/3),
+                (11, 1),
+                (12, 1/3),
+                (13, 0.0),
+                (14, 0.0),
+                (15, 2/3),
+                (16, 2/3),
                 (17, 0.0),
                 (18, 1.0),
                 (19, 1.0),
                 (20, 1.0)]
-
+    lin = linearize(prob_circuit)
+    
     for ind_val in true_vals
-        @test downflow(flow_circuit_part[ind_val[1]])[1] ≈ ind_val[2] atol= EPS
+        @test exp(get_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
     end
-
 end
 
 function test_mpe_brute_force(prob_circuit, evidence)

From 4f5c09bf29520433ebf63ade141fd2785780f56e Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 11:16:08 -0700
Subject: [PATCH 013/131] MPE

---
 src/LoadSave/circuit_line_compiler.jl |  4 +-
 src/LoadSave/circuit_savers.jl        |  8 +--
 src/Probabilistic/Queries.jl          | 53 +++++++++++++++++-
 src/Probabilistic/flows.jl            | 46 ++++++----------
 src/Probabilistic/todo/parameters.jl  | 79 +--------------------------
 test/Probabilistic/queries_tests.jl   | 23 +++-----
 6 files changed, 82 insertions(+), 131 deletions(-)

diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index b20b6fde..24058656 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -3,7 +3,7 @@
 #####################
 
 # reuse some internal infrastructure of LogicCircuits' LoadSave module
-using LogicCircuits.LoadSave: CircuitFormatLines, CircuitFormatLine, constant,
+using LogicCircuits.LoadSave: CircuitFormatLines, CircuitFormatLine, lnconstant,
 VtreeFormatLines, CircuitHeaderLine, UnweightedLiteralLine, WeightedLiteralLine, 
 DecisionLine, LCElement, BiasLine, WeightedNamedConstantLine, PSDDElement, 
 CircuitCommentLine, ID, compile_smooth_struct_logical_m, compile_smooth_logical_m
@@ -55,7 +55,7 @@ function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, i
         # do nothing
     end
     function compile(ln::WeightedNamedConstantLine)
-        @assert constant(ln) == true
+        @assert lnconstant(ln) == true
         root = id2probnode(ln.node_id)::Prob⋁Node
         root.log_thetas .= [ln.weight, log1p(-exp(ln.weight))]
     end
diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 22acd3a6..ab23580c 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -40,8 +40,8 @@ end
 
 import LogicCircuits.LoadSave: get_node2id
 
-function get_node2id(circuit::DecoratorCircuit, T::Type) 
-    node2id = Dict{T, ID}()
+function get_node2id(circuit::DecoratorCircuit) 
+    node2id = Dict{DecoratorCircuit, ID}()
     outnodes = filter(n -> !is⋀gate(n), circuit)
     sizehint!(node2id, length(outnodes))
     index = ID(0) # node id start from 0
@@ -76,7 +76,7 @@ function save_as_psdd(name::String, circuit::ProbCircuit, vtree::PlainVtree)
     # TODO add method isstructured
     @assert circuit.origin isa StructLogicCircuit "PSDD should decorate on StructLogicΔ"
     @assert endswith(name, ".psdd")
-    node2id = get_node2id(circuit, ProbCircuit)
+    node2id = get_node2id(circuit)
     vtree2id = get_vtree2id(vtree)
     formatlines = Vector{CircuitFormatLine}()
     append!(formatlines, parse_psdd_file(IOBuffer(psdd_header())))
@@ -112,7 +112,7 @@ end
 function save_as_logistic(name::String, circuit::LogisticCircuit, vtree)
     @assert circuit.origin isa StructLogicCircuit "LC should decorate on StructLogicΔ"
     @assert endswith(name, ".circuit")
-    node2id = get_node2id(circuit, LogisticCircuit)
+    node2id = get_node2id(circuit)
     vtree2id = get_vtree2id(vtree)
     formatlines = Vector{CircuitFormatLine}()
     append!(formatlines, parse_lc_file(IOBuffer(lc_header())))
diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index ed4934d7..351459fb 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -1,5 +1,6 @@
 export EVI, log_likelihood_per_instance,
-MAR, marginal_log_likelihood_per_instance
+MAR, marginal_log_likelihood_per_instance,
+MPE, MAP
 
 """
 Complete evidence queries
@@ -25,10 +26,10 @@ function log_likelihood_per_instance(pc::ProbCircuit, data)
     log_likelihoods
 end
 
-EVI = log_proba = log_likelihood_per_instance
+EVI = log_likelihood_per_instance
 
 """
-marginal queries
+Marginal queries
 """
 function marginal_log_likelihood_per_instance(pc::ProbCircuit, data)
     evaluate(pc, data)
@@ -36,4 +37,50 @@ end
 MAR = marginal_log_likelihood_per_instance
 
 
+"""
+Most Probable Explanation (MPE), aka MAP
+"""
+@inline function MAP(pc::ProbCircuit, evidence)::BitMatrix
+    MPE(pc, evidence)
+end
+
+function MPE(pc::ProbCircuit, evidence)::BitMatrix
+    mlls = marginal_log_likelihood_per_instance(pc, evidence)
+    
+    ans = falses(num_examples(evidence), num_features(evidence))
+    active_samples = trues(num_examples(evidence))
+
+    function mpe_simulate(node::ProbLiteralNode, active_samples::BitVector, result::BitMatrix)
+        if ispositive(node)
+            result[active_samples, variable(node)] .= 1
+        else
+            result[active_samples, variable(node)] .= 0
+        end
+    end
+    
+    function mpe_simulate(node::Prob⋁Node, active_samples::BitVector, result::BitMatrix)
+        prs = zeros(length(node.children), size(active_samples)[1] )
+        @simd  for i=1:length(node.children)
+            prs[i,:] .= get_upflow(node.children[i]) .+ (node.log_thetas[i])
+        end
+    
+        max_child_ids = [a[1] for a in argmax(prs, dims = 1) ]
+        @simd for i=1:length(node.children)
+            # Only active for this child if it was the max for that sample
+            ids = convert(BitVector, active_samples .* (max_child_ids .== i)[1,:])
+            mpe_simulate(node.children[i], ids, result)
+        end
+    end
+    
+    function mpe_simulate(node::Prob⋀Node, active_samples::BitVector, result::BitMatrix)
+        for child in children(node)
+            mpe_simulate(child, active_samples, result)
+        end
+    end
+
+    mpe_simulate(pc, active_samples, ans)
+    ans
+end
+
+
 
diff --git a/src/Probabilistic/flows.jl b/src/Probabilistic/flows.jl
index e9516572..337ab65f 100644
--- a/src/Probabilistic/flows.jl
+++ b/src/Probabilistic/flows.jl
@@ -4,16 +4,15 @@ import LogicCircuits: evaluate, compute_flows
 using StatsFuns: logsumexp
 
 # TODO move to LogicCircuits
-# TODO clean up and better API
+# TODO downflow struct
 using LogicCircuits: UpFlow, UpFlow1, UpDownFlow, UpDownFlow1, UpDownFlow2
 
 """
 Get upflow from logic circuit
 """
+@inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
 @inline get_upflow(elems::UpDownFlow1) = elems.upflow
-@inline get_upflow(elems::UpDownFlow2) = UpFlow1(elems)
 @inline get_upflow(elems::UpFlow) = UpFlow1(elems)
-@inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
 
 """
 Get the node/edge flow from logic circuit
@@ -29,26 +28,9 @@ function get_downflow(n::LogicCircuit; root=nothing)::BitVector
     downflow(n.data)
 end
 
-function get_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
-    downflow(x::ExpUpDownFlow1) = x.downflow
-    downflow(x::ExpUpDownFlow2) = begin
-        ors = or_nodes(root)
-        p = findall(p -> n in children(p), ors)
-        @assert length(p) == 1
-        get_downflow(ors[p[1]], n)
-    end
-    downflow(n.data)
-end
-
-@inline isfactorized(n::LogicCircuit) = n.data::UpDownFlow isa UpDownFlow2
 function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-    df = copy(n.data.downflow)
-    if isfactorized(c)
-        return df .&= c.data.prime_flow .& c.data.sub_flow
-    else
-        return df .&= c.data.downflow
-    end
+    get_downflow(n) .& get_upflow(c)
 end
 
 #####################
@@ -161,8 +143,6 @@ const ExpUpDownFlow2 = ExpUpFlow2
 
 const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
 
-@inline get_upflow(elems::ExpUpDownFlow1) = elems.upflow
-@inline get_upflow(elems::ExpUpDownFlow2) = ExpUpFlow1(elems)
 
 function compute_flows(circuit::ProbCircuit, data)
 
@@ -198,12 +178,13 @@ function compute_flows(circuit::ProbCircuit, data)
                     # propagate one level further down
                     for i = 1:2
                         downflow_c = downflow(@inbounds children(c)[i])
-                        downflow_c .= logsumexp.(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow .+ upflow2_c.sub_flow .- upflow_n)
+                        accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
+                        .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
                     end
                 else
                     upflow1_c = (c.data::ExpUpDownFlow1).upflow
                     downflow_c = downflow(c)
-                    downflow_c .= logsumexp.(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n)
+                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
                 end
             end 
         end
@@ -212,6 +193,14 @@ function compute_flows(circuit::ProbCircuit, data)
     nothing
 end
 
+
+"""
+Get upflow of a probabilistic circuit
+"""
+@inline get_upflow(pc::ProbCircuit) = get_upflow(pc.data)
+@inline get_upflow(elems::ExpUpDownFlow1) = elems.upflow
+@inline get_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
+
 """
 Get the node/edge downflow from probabilistic circuit
 """
@@ -228,9 +217,6 @@ end
 
 function get_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-    df = copy(get_downflow(n))
     log_theta = n.log_thetas[findfirst(x -> x == c, children(n))]
-    return df .+ log_theta .+ get_upflow(c.data) .- get_upflow(n.data)
-end
-
-@inline isfactorized(n::ProbCircuit) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
\ No newline at end of file
+    return get_downflow(n) .+ log_theta .+ get_upflow(c) .- get_upflow(n)
+end
\ No newline at end of file
diff --git a/src/Probabilistic/todo/parameters.jl b/src/Probabilistic/todo/parameters.jl
index e13950c6..3e21b75d 100644
--- a/src/Probabilistic/todo/parameters.jl
+++ b/src/Probabilistic/todo/parameters.jl
@@ -81,32 +81,6 @@ function estimate_parameters_node(n::AggregateFlow⋁; pseudocount)
     end
 end
 
-
-
-"""
-Calculate log likelihood for a batch of samples with partial evidence P(e).
-(Also returns the generated FlowΔ)
-
-To indicate a variable is not observed, pass -1 for that variable.
-"""
-function marginal_log_likelihood_per_instance(pc::ProbΔ, batch::PlainXData{Int8})
-    opts = (flow_opts★..., el_type=Float64, compact⋀=false, compact⋁=false)
-    fc = UpFlowΔ(pc, num_examples(batch), Float64, opts)
-    (fc, marginal_log_likelihood_per_instance(fc, batch))
-end
-
-"""
-Calculate log likelihood for a batch of samples with partial evidence P(e).
-(If you already have a FlowΔ)
-
-To indicate a variable is not observed, pass -1 for that variable.
-"""
-function marginal_log_likelihood_per_instance(fc::UpFlowΔ, batch::PlainXData{Int8})
-    @assert (prob_origin(fc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
-    marginal_pass_up(fc, batch)
-    pr(fc[end])
-end
-
 ##################
 # Sampling from a psdd
 ##################
@@ -203,55 +177,4 @@ function simulate2(node::UpFlow⋀, inst::Dict{Var,Int64})
     for child in children(node)
         simulate2(child, inst)
     end
-end
-
-
-
-##################
-# Most Probable Explanation MPE of a psdd
-#   aka MAP
-##################
-
-@inline function MAP(circuit::ProbΔ, evidence::PlainXData{Int8})::Matrix{Bool}
-    MPE(circuit, evidence)
-end
-
-function MPE(circuit::ProbΔ, evidence::PlainXData{Int8})::Matrix{Bool}
-    # Computing Marginal Likelihood for each node
-    fc, lls = marginal_log_likelihood_per_instance(circuit, evidence)
-
-    ans = Matrix{Bool}(zeros(size(evidence.x)))
-    active_samples = Array{Bool}(ones( num_examples(evidence) ))
-
-    mpe_simulate(fc[end], active_samples, ans)
-    ans
-end
-
-"""
-active_samples: bool vector indicating which samples are active for this node during mpe
-result: Matrix (num_samples, num_variables) indicating the final result of mpe
-"""
-function mpe_simulate(node::UpFlowLiteral, active_samples::Vector{Bool}, result::Matrix{Bool})
-    if ispositive(node)
-        result[active_samples, variable(node)] .= 1
-    else
-        result[active_samples, variable(node)] .= 0
-    end
-end
-function mpe_simulate(node::UpFlow⋁, active_samples::Vector{Bool}, result::Matrix{Bool})
-    prs = zeros( length(node.children), size(active_samples)[1] )
-    @simd  for i=1:length(node.children)
-        prs[i,:] .= pr(node.children[i]) .+ (node.origin.log_thetas[i])
-    end
-
-    max_child_ids = [a[1] for a in argmax(prs, dims = 1) ]
-    @simd for i=1:length(node.children)
-        ids = Vector{Bool}( active_samples .* (max_child_ids .== i)[1,:] )  # Only active for this child if it was the max for that sample
-        mpe_simulate(node.children[i], ids, result)
-    end
-end
-function mpe_simulate(node::UpFlow⋀, active_samples::Vector{Bool}, result::Matrix{Bool})
-    for child in node.children
-        mpe_simulate(child, active_samples, result)
-    end    
-end
+end
\ No newline at end of file
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index 19ff068e..88263b58 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -104,13 +104,13 @@ function test_mpe_brute_force(prob_circuit, evidence)
     EPS = 1e-9;
     result = MPE(prob_circuit, evidence);
     for idx = 1 : num_examples(evidence)
-        marg = XData(generate_all(evidence.x[idx,:]));
-        fc, lls = log_likelihood_per_instance(prob_circuit, marg);
-        brute_mpe = marg.x[argmax(lls), :]
+        marg = generate_all(evidence[idx,:])
+        lls = log_likelihood_per_instance(prob_circuit, marg);
+        brute_mpe = marg[argmax(lls), :]
 
         # Compare and validate p(result[idx]) == p(brute_mpe)
-        comp_data = XData(vcat(result[idx,:]',  brute_mpe'))
-        fc2, lls2 = log_likelihood_per_instance(prob_circuit, comp_data);
+        comp_data = vcat(result[idx,:]',  brute_mpe')
+        lls2 = log_likelihood_per_instance(prob_circuit, comp_data);
 
         @test lls2[1] ≈ lls2[2] atol= EPS
     end
@@ -118,12 +118,12 @@ end
 
 @testset "MPE Brute Force Test Small (4 var)" begin
     prob_circuit = zoo_psdd("little_4var.psdd");
-    evidence = XData( Int8.( [-1 0 0 0;
+    evidence = Int8.( [-1 0 0 0;
                                 0 -1 -1 0;
                                 1 1 1 -1;
                                 1 0 1 0;
                                 -1 -1 -1 1;
-                                -1 -1 -1 -1] ))
+                                -1 -1 -1 -1] )
 
     test_mpe_brute_force(prob_circuit, evidence)
 
@@ -134,12 +134,7 @@ end
     COUNT = 10
 
     prob_circuit = zoo_psdd("exp-D15-N1000-C4.psdd");
-    evidence = XData(Int8.(rand( (-1,0,1), (COUNT, N) )))
+    evidence = Int8.(rand( (-1,0,1), (COUNT, N)))
 
     test_mpe_brute_force(prob_circuit, evidence)
-end
-
-
-@testset "EVI" begin
-    pc = zoo_psdd("nltcs.psdd")
-end
+end
\ No newline at end of file

From 41acbda1d8a62875e198caa32b7d882c44a57d26 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 11:18:50 -0700
Subject: [PATCH 014/131] mv file and clean up

---
 src/Probabilistic/Probabilistic.jl            | 41 +------------------
 .../{todo/kld.jl => information.jl}           |  0
 2 files changed, 1 insertion(+), 40 deletions(-)
 rename src/Probabilistic/{todo/kld.jl => information.jl} (100%)

diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index 81773590..9ea2bb33 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -5,50 +5,11 @@ using ..Utils
 
 export
 
-# ProbCircuits
-ProbNode, ProbΔ, ProbΔ, ProbLeafNode, ProbInnerNode,
-ProbLiteral, Prob⋀, Prob⋁, ProbCache, variable, num_parameters, compute_log_likelihood,
-log_proba,
-log_likelihood, estimate_parameters, log_likelihood_per_instance, marginal_log_likelihood_per_instance,
-initial_mixture_model, estimate_parameters_from_aggregates, compute_ensemble_log_likelihood,
-expectation_step, maximization_step, expectation_step_batch, train_mixture_with_structure, check_parameter_integrity,
-ll_per_instance_per_component, ll_per_instance_for_ensemble,estimate_parameters_cached,
-sample,
-MPE, MAP,prob_origin, copy_node, conjoin_like, disjoin_like, literal_like, normalize, replace_node,
-
-# ProbFlowCircuits
-marginal_pass_up, marginal_pass_down, marginal_pass_up_down,
-
-# Mixtures
-Mixture, AbstractFlatMixture, FlatMixture, FlatMixtureWithFlow,component_weights,FlatMixtureWithFlows,
-log_likelihood, log_likelihood_per_instance, log_likelihood_per_instance_component,
-init_mixture_with_flows, reset_mixture_aggregate_flows, aggregate_flows, estimate_parameters,
-AbstractMetaMixture, MetaMixture,AbstractFlatMixture,AbstractMixture, components, num_components,
-
-# EM Learner
-train_mixture,
-
-# Bagging
-bootstrap_samples_ids, learn_mixture_bagging, learn_mixture_bagging2,
-init_bagging_samples, train_bagging,
-
-# VtreeLearner
-MetisContext, metis_top_down, BlossomContext, blossom_bottom_up!,
-test_top_down, test_bottom_up!,learn_vtree_bottom_up,
-
-# MutualInformation
-mutual_information, DisCache, conditional_entropy, sum_entropy_given_x,
-
-# Clustering
-clustering,
-
-# Queries
-pr_constraint, psdd_entropy, psdd_kl_divergence
-
 # include("Clustering.jl")
 include("prob_nodes.jl")
 include("flows.jl")
 include("queries.jl")
+include("information.jl")
 # include("ProbFlowCircuits.jl")
 # include("MutualInformation.jl")
 # include("Mixtures.jl")
diff --git a/src/Probabilistic/todo/kld.jl b/src/Probabilistic/information.jl
similarity index 100%
rename from src/Probabilistic/todo/kld.jl
rename to src/Probabilistic/information.jl

From 0e3ba4f1af07d3bbe0a7a42417cf85813fb14539 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 11:20:19 -0700
Subject: [PATCH 015/131] mv file and clean up

---
 src/Probabilistic/{information.jl => informations.jl}           | 1 +
 test/Probabilistic/{EntropyKLDTest.jl => informations_tests.jl} | 0
 2 files changed, 1 insertion(+)
 rename src/Probabilistic/{information.jl => informations.jl} (99%)
 rename test/Probabilistic/{EntropyKLDTest.jl => informations_tests.jl} (100%)

diff --git a/src/Probabilistic/information.jl b/src/Probabilistic/informations.jl
similarity index 99%
rename from src/Probabilistic/information.jl
rename to src/Probabilistic/informations.jl
index cf059b4a..7a8fdcf2 100644
--- a/src/Probabilistic/information.jl
+++ b/src/Probabilistic/informations.jl
@@ -1,3 +1,4 @@
+export psdd_kl_divergence
 using DataStructures
 
 # Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
diff --git a/test/Probabilistic/EntropyKLDTest.jl b/test/Probabilistic/informations_tests.jl
similarity index 100%
rename from test/Probabilistic/EntropyKLDTest.jl
rename to test/Probabilistic/informations_tests.jl

From 36546861a47e1500b7cf38659cfe7a5f4009ded5 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 12:26:06 -0700
Subject: [PATCH 016/131] kld

---
 src/Probabilistic/Probabilistic.jl       |   4 +-
 src/Probabilistic/informations.jl        | 148 +++++++++++------------
 test/Probabilistic/informations_tests.jl |  54 +++++----
 3 files changed, 99 insertions(+), 107 deletions(-)

diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index 9ea2bb33..de1de6c8 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -3,13 +3,11 @@ module Probabilistic
 using LogicCircuits
 using ..Utils
 
-export
-
 # include("Clustering.jl")
 include("prob_nodes.jl")
 include("flows.jl")
 include("queries.jl")
-include("information.jl")
+include("informations.jl")
 # include("ProbFlowCircuits.jl")
 # include("MutualInformation.jl")
 # include("Mixtures.jl")
diff --git a/src/Probabilistic/informations.jl b/src/Probabilistic/informations.jl
index 7a8fdcf2..04ad7531 100644
--- a/src/Probabilistic/informations.jl
+++ b/src/Probabilistic/informations.jl
@@ -1,20 +1,26 @@
-export psdd_kl_divergence
-using DataStructures
+export pr_constraint, kl_divergence, entropy
+
+const StrutCircuit = Union{ProbCircuit, StructLogicCircuit}
+const KLDCache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}
+const PRCache = Dict{Tuple{ProbCircuit, StrutCircuit}, Float64}
 
 # Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
 # spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
-"Calculate the probability of the logic formula given by sdd for the psdd"
-function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit})
-    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
 
-    return pr_constraint(psdd_node, sdd_node, cache)
-end
-function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogicCircuit},
-                       cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})::Float64
-    if (psdd_node, sdd_node) in keys(cache) # Cache hit
+"""
+Calculate the probability of the logic formula given by sdd for the psdd
+"""
+function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
+    cache::PRCache=PRCache())::Float64
+    
+    # Cache hit
+    if (psdd_node, sdd_node) in keys(cache) 
         return cache[psdd_node, sdd_node]
-    elseif psdd_node isa ProbLiteral # Boundary cases
-        if sdd_node isa Union{ProbLiteral, PlainStructLiteralNode} # Both are literals, just check whether they agrees with each other
+    
+    # Boundary cases
+    elseif psdd_node isa ProbLiteralNode
+        # Both are literals, just check whether they agrees with each other 
+        if isliteralgate(sdd_node)
             if literal(psdd_node) == literal(sdd_node)
                 return get!(cache, (psdd_node, sdd_node), 1.0)
             else
@@ -27,17 +33,19 @@ function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogi
                 return get!(cache, (psdd_node, sdd_node), 1.0)
             else
                 return get!(cache, (psdd_node, sdd_node),
-                    literal(sdd_node.children[1]) == literal(psdd_node) ? 1.0 : 0.0
-                )
+                    literal(sdd_node.children[1]) == literal(psdd_node) ? 1.0 : 0.0)
             end
         end
-    elseif psdd_node.children[1] isa ProbLiteral # The psdd is true
+    
+    # The psdd is true
+    elseif psdd_node.children[1] isa ProbLiteralNode 
         theta = exp(psdd_node.log_thetas[1])
         return get!(cache, (psdd_node, sdd_node),
             theta * pr_constraint(psdd_node.children[1], sdd_node, cache) +
-            (1.0 - theta) * pr_constraint(psdd_node.children[2], sdd_node, cache)
-        )
-    else # Both psdds are not trivial
+            (1.0 - theta) * pr_constraint(psdd_node.children[2], sdd_node, cache))
+    
+    # Both psdds are not trivial
+    else 
         prob = 0.0
         for (prob⋀_node, log_theta) in zip(psdd_node.children, psdd_node.log_thetas)
             p = prob⋀_node.children[1]
@@ -55,68 +63,52 @@ function pr_constraint(psdd_node::ProbNode, sdd_node::Union{ProbNode, StructLogi
 end
 
 
-"Entropy of the distribution of the input psdd."
-function psdd_entropy(psdd_node::ProbNode)::Float64
-    psdd_entropy_cache = Dict{ProbNode, Float64}()
-
-    return psdd_entropy(psdd_node, psdd_entropy_cache)
-end
-function psdd_entropy(psdd_node::Prob⋁, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
+""""
+Calculate entropy of the distribution of the input psdd."
+"""
+function entropy(psdd_node::Prob⋁Node, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
-    elseif psdd_node.children[1] isa ProbLiteral
+    elseif psdd_node.children[1] isa ProbLiteralNode
         return get!(psdd_entropy_cache, psdd_node,
             - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
-            exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2]
-        )
+            exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2])
     else
         local_entropy = 0.0
         for (prob⋀_node, log_prob) in zip(psdd_node.children, psdd_node.log_thetas)
             p = prob⋀_node.children[1]
             s = prob⋀_node.children[2]
 
-            local_entropy += exp(log_prob) * (psdd_entropy(p, psdd_entropy_cache) +
-                psdd_entropy(s, psdd_entropy_cache) - log_prob)
+            local_entropy += exp(log_prob) * (entropy(p, psdd_entropy_cache) +
+                entropy(s, psdd_entropy_cache) - log_prob)
         end
         return get!(psdd_entropy_cache, psdd_node, local_entropy)
     end
 end
-function psdd_entropy(psdd_node::Prob⋀, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
-    return get!(psdd_entropy_cache, psdd_node.children[1], psdd_entropy(psdd_node.children[1], psdd_entropy_cache)) +
-        get!(psdd_entropy_cache, psdd_node.children[2], psdd_entropy(psdd_node.children[2], psdd_entropy_cache))
-end
-function psdd_entropy(psdd_node::ProbLiteral, psdd_entropy_cache::Dict{ProbNode, Float64})::Float64
-    return get!(psdd_entropy_cache, psdd_node, 0.0)
-end
 
-
-"KL divergence calculation for psdds that are not necessarily identical"
-function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode)::Float64
-    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
-
-    return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
+function entropy(psdd_node::Prob⋀Node, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+    return get!(psdd_entropy_cache, psdd_node.children[1], entropy(psdd_node.children[1], psdd_entropy_cache)) +
+        get!(psdd_entropy_cache, psdd_node.children[2], entropy(psdd_node.children[2], psdd_entropy_cache))
 end
-function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64})::Float64
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
 
-    return psdd_kl_divergence(psdd_node1, psdd_node2, kl_divergence_cache, pr_constraint_cache)
+function entropy(psdd_node::ProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+    return get!(psdd_entropy_cache, psdd_node, 0.0)
 end
-function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
-    @assert !(psdd_node1 isa Prob⋀ || psdd_node2 isa Prob⋀) "Prob⋀ not a valid PSDD node for KL-Divergence"
+
+"Calculate KL divergence calculation for psdds that are not necessarily identical"
+function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::Prob⋁Node,
+        kl_divergence_cache::KLDCache=KLDCache(), pr_constraint_cache::PRCache=PRCache())
+    @assert !(psdd_node1 isa Prob⋀Node || psdd_node2 isa Prob⋀Node) "Prob⋀ not a valid PSDD node for KL-Divergence"
 
     # Check if both nodes are normalized for same vtree node
     @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[(psdd_node1, psdd_node2)]
-    elseif psdd_node1.children[1] isa ProbLiteral
-        if psdd_node2 isa ProbLiteral
-            psdd_kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+    elseif psdd_node1.children[1] isa ProbLiteralNode
+        if psdd_node2 isa ProbLiteralNode
+            kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             if literal(psdd_node1.children[1]) == literal(psdd_node2)
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
                     psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
@@ -129,10 +121,10 @@ function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
         else
             # The below four lines actually assign zero, but still we need to
             # call it.
-            psdd_kl_divergence(psdd_node1.children[1], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[1], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[2], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-            psdd_kl_divergence(psdd_node1.children[2], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(psdd_node1.children[1], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(psdd_node1.children[1], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(psdd_node1.children[2], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(psdd_node1.children[2], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
             # There are two possible matches
             if literal(psdd_node1.children[1]) == literal(psdd_node2.children[1])
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
@@ -147,7 +139,7 @@ function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
             end
         end
     else # the normal case
-        kl_divergence = 0.0
+        kld = 0.0
 
         # loop through every combination of prim and sub
         for (prob⋀_node1, log_theta1) in zip(psdd_node1.children, psdd_node1.log_thetas)
@@ -165,18 +157,18 @@ function psdd_kl_divergence(psdd_node1::ProbNode, psdd_node2::ProbNode,
 
                 p13 = theta1 * (log_theta1 - log_theta2)
 
-                p21 = psdd_kl_divergence(p, r, kl_divergence_cache, pr_constraint_cache)
-                p31 = psdd_kl_divergence(s, t, kl_divergence_cache, pr_constraint_cache)
+                p21 = kl_divergence(p, r, kl_divergence_cache, pr_constraint_cache)
+                p31 = kl_divergence(s, t, kl_divergence_cache, pr_constraint_cache)
 
-                kl_divergence += p11 * p12 * p13 + theta1 * (p11 * p21 + p12 * p31)
+                kld += p11 * p12 * p13 + theta1 * (p11 * p21 + p12 * p31)
             end
         end
-        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), kl_divergence)
+        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), kld)
     end
 end
-function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
+
+function kl_divergence(psdd_node1::ProbLiteralNode, psdd_node2::ProbLiteralNode,
+        kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     # Check if literals are over same variables in vtree
    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
@@ -187,16 +179,16 @@ function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::ProbLiteral,
         return get!(kl_divergence_cache, (psdd_node1, psdd_node2), 0.0)
     end
 end
-function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
+
+function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::ProbLiteralNode,
+        kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[psdd_node1, psdd_node2]
     else
-        psdd_kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-        psdd_kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
         if literal(psdd_node1.children[1]) == literal(psdd_node2)
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
                 psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
@@ -208,16 +200,16 @@ function psdd_kl_divergence(psdd_node1::Prob⋁, psdd_node2::ProbLiteral,
         end
     end
 end
-function psdd_kl_divergence(psdd_node1::ProbLiteral, psdd_node2::Prob⋁,
-        kl_divergence_cache::Dict{Tuple{ProbNode, ProbNode}, Float64},
-        pr_constraint_cache::Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64})
+
+function kl_divergence(psdd_node1::ProbLiteralNode, psdd_node2::Prob⋁Node,
+        kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[psdd_node1, psdd_node2]
     else
-        psdd_kl_divergence(psdd_node1, psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-        psdd_kl_divergence(psdd_node1, psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(psdd_node1, psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(psdd_node1, psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
         if literal(psdd_node1) == literal(psdd_node2.children[1])
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
                 -psdd_node2.log_thetas[1]
diff --git a/test/Probabilistic/informations_tests.jl b/test/Probabilistic/informations_tests.jl
index aebd67ca..64e30164 100644
--- a/test/Probabilistic/informations_tests.jl
+++ b/test/Probabilistic/informations_tests.jl
@@ -2,6 +2,8 @@ using Test
 using LogicCircuits
 using ProbabilisticCircuits
 
+# TODO reinstate after fix tests by replacing indexing circuit node
+
 @testset "Entropy and KLD" begin
     pc1, vtree = load_struct_prob_circuit(
                     zoo_psdd_file("simple2.1.psdd"), zoo_vtree_file("simple2.vtree"))
@@ -11,38 +13,38 @@ using ProbabilisticCircuits
                     zoo_psdd_file("simple2.3.psdd"), zoo_vtree_file("simple2.vtree"))
    
     # Entropy calculation test
-    @test abs(psdd_entropy(pc1[end]) - 1.2899219826090118) < 1e-8
-    @test abs(psdd_entropy(pc2[end]) - 0.9359472745536583) < 1e-8
+    @test abs(entropy(pc1) - 1.2899219826090118) < 1e-8
+    @test abs(entropy(pc2) - 0.9359472745536583) < 1e-8
 
     # KLD Tests #
     # KLD base tests
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
-    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
+    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
 
-    @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
-    @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
-    @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[1], pc1[4], kl_divergence_cache, pr_constraint_cache)
-    @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[1], pc1[5], kl_divergence_cache, pr_constraint_cache)
-    @test_throws AssertionError("Both nodes not normalized for same vtree node") psdd_kl_divergence(pc1[2], pc1[5], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[4], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[5], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[5], kl_divergence_cache, pr_constraint_cache)
 
-    @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") psdd_kl_divergence(pc1[1], pc1[6], kl_divergence_cache, pr_constraint_cache)
-    @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") psdd_kl_divergence(pc1[7], pc1[2], kl_divergence_cache, pr_constraint_cache)
-    @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") psdd_kl_divergence(pc1[6], pc2[7], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[1], pc1[6], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[7], pc1[2], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[6], pc2[7], kl_divergence_cache, pr_constraint_cache)
 
     # KLD calculation test
-    @test abs(psdd_kl_divergence(pc1[1], pc2[1], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    @test abs(psdd_kl_divergence(pc1[1], pc1[2], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    @test abs(psdd_kl_divergence(pc1[1], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.9)) < 1e-8
-    @test abs(psdd_kl_divergence(pc1[2], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.1)) < 1e-8
-    @test abs(psdd_kl_divergence(pc1[5], pc2[4], kl_divergence_cache, pr_constraint_cache) - 0.2 * log(0.2)) < 1e-8
-    @test abs(psdd_kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-    @test abs(psdd_kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-    @test abs(psdd_kl_divergence(pc1[end], pc2[end]) - 0.5672800167911778) < 1e-8
-
-    kl_divergence_cache = Dict{Tuple{ProbNode, ProbNode}, Float64}()
-    @test abs(psdd_kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    @test abs(psdd_kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    @test abs(psdd_kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
-    @test abs(psdd_kl_divergence(pc2[end], pc3[end]) - 0.38966506) < 1e-8
+    # @test abs(kl_divergence(pc1[1], pc2[1], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc1[1], pc1[2], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc1[1], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.9)) < 1e-8
+    # @test abs(kl_divergence(pc1[2], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.1)) < 1e-8
+    # @test abs(kl_divergence(pc1[5], pc2[4], kl_divergence_cache, pr_constraint_cache) - 0.2 * log(0.2)) < 1e-8
+    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
+    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
+    @test abs(kl_divergence(pc1, pc2) - 0.5672800167911778) < 1e-8
+
+    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
+    # @test abs(kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
+    @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
 
 end

From 8d152620506d953a9abdd2bbefd5d8873e073552 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 12:55:28 -0700
Subject: [PATCH 017/131] logistic circuits

---
 src/Logistic/Logistic.jl        |  2 ++
 src/Logistic/queries.jl         | 53 +++++++++++++--------------------
 test/Logistic/logistic_tests.jl | 29 ++++--------------
 3 files changed, 28 insertions(+), 56 deletions(-)

diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index c6a73c93..c657449f 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -6,4 +6,6 @@ using ..Utils
 include("logistic_nodes.jl")
 include("queries.jl")
 
+# TODO learning
+
 end
\ No newline at end of file
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 9865be43..b96f631c 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -1,35 +1,22 @@
-# export class_conditional_likelihood_per_instance
-# # Class Conditional Probability
-# function class_conditional_likelihood_per_instance(fc::FlowΔ, 
-#                                                     classes::Int, 
-#                                                     batch::PlainXData{Bool})
-#     lc = origin(origin(fc))
-#     @assert(lc isa LogisticΔ)
-#     pass_up_down(fc, batch)
-#     likelihoods = zeros(num_examples(batch), classes)
-#     for n in fc
-#         orig = logistic_origin(n)
-#         if orig isa Logistic⋀Node
-#             # For each class. orig.thetas is 2D so used eachcol
-#             for (idx, thetaC) in enumerate(eachcol(orig.thetas))
-#                 foreach(n.children, thetaC) do c, theta
-#                     likelihoods[:, idx] .+= prod_fast(downflow(n), pr_factors(origin(c))) .* theta
-#                 end
-#             end
-#         end
-#     end
-#     likelihoods
-# end
+export class_conditional_likelihood_per_instance
 
-# """
-# Calculate conditional log likelihood for a batch of samples with evidence P(c | x).
-# (Also returns the generated FlowΔ)
-# """
-# function class_conditional_likelihood_per_instance(lc::LogisticΔ, 
-#                                                     classes::Int, 
-#                                                     batch::PlainXData{Bool})
-#     opts = (max_factors = 2, compact⋀=false, compact⋁=false)
-#     fc = FlowΔ(lc, num_examples(batch), Float64, opts)
-#     (fc, class_conditional_likelihood_per_instance(fc, classes, batch))
-# end
+using ..Probabilistic: get_downflow, get_upflow
+"""
+Class Conditional Probability
+"""
+function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
+    compute_flows(lc.origin, data)
+    likelihoods = zeros(num_examples(data), classes)
+    foreach(lc) do ln
+        if ln isa Logistic⋁Node
+            # For each class. orig.thetas is 2D so used eachcol
+            for (idx, thetaC) in enumerate(eachcol(ln.thetas))
+                foreach(ln.children, thetaC) do c, theta
+                    likelihoods[:, idx] .+= Float64.(get_downflow(ln.origin) .& get_upflow(c.origin)) .* theta
+                end
+            end
+        end
+    end
+    likelihoods
+end
 
diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
index 4337e0c5..3461a064 100644
--- a/test/Logistic/logistic_tests.jl
+++ b/test/Logistic/logistic_tests.jl
@@ -8,16 +8,9 @@ using ProbabilisticCircuits
     # match with python version.
 
     EPS = 1e-7;
-    my_opts = (max_factors= 2,
-            compact⋀=false,
-            compact⋁=false)
-        
     logistic_circuit = zoo_lc("little_4var.circuit", 2);
     @test logistic_circuit isa LogisticCircuit;
 
-    # flow_circuit = FlowΔ(logistic_circuit, 16, Float64, my_opts)
-    # @test flow_circuit isa Vector{<:FlowNode};
-
     # Step 1. Check Probabilities for 3 samples
     data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
     
@@ -26,21 +19,11 @@ using ProbabilisticCircuits
                 3.67415087 4.93793472]
             
     CLASSES = 2
-    # calc_prob = class_conditional_likelihood_per_instance(flow_circuit, CLASSES, data)
+    calc_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
     
-    # for i = 1:3
-    #     for j = 1:2
-    #         @test true_prob[i,j] ≈ calc_prob[i,j] atol= EPS;
-    #     end
-    # end
-
-    # # 2. Testing different API
-    # fc2, calc_prob2 = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
-    # for i = 1:3
-    #     for j = 1:2
-    #         @test true_prob[i,j] ≈ calc_prob2[i,j] atol= EPS;
-    #     end
-    # end
-
-
+    for i = 1:3
+        for j = 1:2
+            @test true_prob[i,j] ≈ calc_prob[i,j] atol= EPS;
+        end
+    end
 end
\ No newline at end of file

From 8606d02f2b9205f00a935733ceb35736d307a68f Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 14:03:17 -0700
Subject: [PATCH 018/131] minor fix

---
 src/Utils/Utils.jl                                  | 1 +
 src/Utils/{MutualInformation.jl => informations.jl} | 1 +
 test/Utils/informations_tests.jl                    | 0
 3 files changed, 2 insertions(+)
 rename src/Utils/{MutualInformation.jl => informations.jl} (98%)
 create mode 100644 test/Utils/informations_tests.jl

diff --git a/src/Utils/Utils.jl b/src/Utils/Utils.jl
index 24729879..24c120b6 100644
--- a/src/Utils/Utils.jl
+++ b/src/Utils/Utils.jl
@@ -6,5 +6,6 @@ module Utils
 
 include("misc.jl")
 include("decorators.jl")
+# include("informations.jl")
 
 end #module
diff --git a/src/Utils/MutualInformation.jl b/src/Utils/informations.jl
similarity index 98%
rename from src/Utils/MutualInformation.jl
rename to src/Utils/informations.jl
index 2e13330c..9787b237 100644
--- a/src/Utils/MutualInformation.jl
+++ b/src/Utils/informations.jl
@@ -1,3 +1,4 @@
+export entropy, conditional_entropy, mutual_information
 using Statistics
 using StatsFuns: xlogx, xlogy
 
diff --git a/test/Utils/informations_tests.jl b/test/Utils/informations_tests.jl
new file mode 100644
index 00000000..e69de29b

From d3964d0a2e6fb3bfbe7aaa4afdbe610281df6389 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 15:16:51 -0700
Subject: [PATCH 019/131] sample from psdd

---
 src/Probabilistic/Probabilistic.jl     |   1 +
 src/Probabilistic/Queries.jl           |  83 +++++++++++-
 src/Probabilistic/parameters.jl        |  25 ++++
 src/Probabilistic/todo/parameters.jl   | 180 -------------------------
 test/Probabilistic/SamplingTest.jl     |  79 -----------
 test/Probabilistic/parameters_tests.jl |   8 ++
 test/Probabilistic/queries_tests.jl    |  69 +++++++++-
 7 files changed, 182 insertions(+), 263 deletions(-)
 create mode 100644 src/Probabilistic/parameters.jl
 delete mode 100644 src/Probabilistic/todo/parameters.jl
 delete mode 100644 test/Probabilistic/SamplingTest.jl
 create mode 100644 test/Probabilistic/parameters_tests.jl

diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index de1de6c8..abfbebd0 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -8,6 +8,7 @@ include("prob_nodes.jl")
 include("flows.jl")
 include("queries.jl")
 include("informations.jl")
+include("parameters.jl")
 # include("ProbFlowCircuits.jl")
 # include("MutualInformation.jl")
 # include("Mixtures.jl")
diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/Queries.jl
index 351459fb..441cc292 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/Queries.jl
@@ -1,6 +1,5 @@
-export EVI, log_likelihood_per_instance,
-MAR, marginal_log_likelihood_per_instance,
-MPE, MAP
+export EVI, log_likelihood_per_instance, MAR, marginal_log_likelihood_per_instance, 
+MPE, MAP, sample
 
 """
 Complete evidence queries
@@ -28,6 +27,7 @@ end
 
 EVI = log_likelihood_per_instance
 
+
 """
 Marginal queries
 """
@@ -83,4 +83,81 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
 end
 
 
+##################
+# Sampling from a psdd
+##################
+
+"""
+Sample from a PSDD without any evidence
+"""
+function sample(circuit::ProbCircuit)::AbstractVector{Bool}
+
+    simulate(node::ProbLiteralNode) = begin
+        inst[variable(node.origin)] = ispositive(node) ? 1 : 0
+    end
+    
+    simulate(node::Prob⋁Node) = begin
+        idx = sample(exp.(node.log_thetas))
+        simulate(node.children[idx])
+    end
+
+    simulate(node::Prob⋀Node) = foreach(simulate, children(node))
+
+    inst = Dict{Var,Int64}()
+    simulate(circuit)
+    len = length(keys(inst))
+    ans = Vector{Bool}()
+    for i = 1:len
+        push!(ans, inst[i])
+    end
+    ans
+end
+
+
+"""
+Sampling with Evidence from a psdd.
+"""
+function sample(circuit::ProbCircuit, evidence)::AbstractVector{Bool}
 
+    @assert num_examples(evidence) == 1 "evidence have to be one example"
+    
+    simulate(node::ProbLiteralNode) = begin
+        inst[variable(node.origin)] = ispositive(node) ? 1 : 0
+    end
+    
+    function simulate(node::Prob⋁Node)
+        prs = [get_upflow(ch)[1] for ch in children(node)] # #evidence == 1
+        idx = sample(exp.(node.log_thetas .+ prs))
+        simulate(children(node)[idx])
+    end
+    
+    simulate(node::Prob⋀Node) = foreach(simulate, children(node))
+
+    evaluate(circuit, evidence)
+
+    inst = Dict{Var,Int64}()
+    simulate(circuit)
+    len = length(keys(inst))
+    ans = Vector{Bool}()
+    for i = 1:len
+        push!(ans, inst[i])
+    end
+    ans
+end
+
+
+"""
+Uniformly sample based on the probability of the items and return the selected index
+"""
+function sample(probs::AbstractVector{<:Number})::Int32
+    z = sum(probs)
+    q = rand() * z
+    cur = 0.0
+    for i = 1:length(probs)
+        cur += probs[i]
+        if q <= cur
+            return i
+        end
+    end
+    return length(probs)
+end
\ No newline at end of file
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
new file mode 100644
index 00000000..60047fae
--- /dev/null
+++ b/src/Probabilistic/parameters.jl
@@ -0,0 +1,25 @@
+export estimate_parameters
+
+"""
+Maximum likilihood estimation of parameters given data
+"""
+function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
+    @assert isbinarydata(data)
+    compute_flows(pc.origin, data)
+    foreach(pc) do pn
+        if pn isa Prob⋁Node
+            if num_children(pn) == 1
+                pn.log_thetas .= 0.0
+            else
+                smoothed_flow = Float64(sum(get_downflow(pn.origin))) + pseudocount
+                uniform_pseudocount = pseudocount / num_children(pn)
+                children_flows = map(c -> sum(get_downflow(pn.origin, c)), children(pn.origin))
+                @. pn.log_thetas = log((children_flows + uniform_pseudocount) / smoothed_flow)
+                @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
+                # normalize away any leftover error
+                pn.log_thetas .-= logsumexp(pn.log_thetas)
+            end
+        end
+    end
+end
+
diff --git a/src/Probabilistic/todo/parameters.jl b/src/Probabilistic/todo/parameters.jl
deleted file mode 100644
index 3e21b75d..00000000
--- a/src/Probabilistic/todo/parameters.jl
+++ /dev/null
@@ -1,180 +0,0 @@
-function normalize_parameters(pc::ProbCircuit)
-    for or in or_nodes(pc)
-        or.log_thetas .= 1 ./ length(or.log_thetas)
-    end
-end
-
-
-function estimate_parameters2(pc::ProbΔ, data::XData{Bool}; pseudocount::Float64)
-    Logic.pass_up_down2(pc, data)
-    w = (data isa PlainXData) ? nothing : weights(data)
-    estimate_parameters_cached2(pc, w; pseudocount=pseudocount)
-end
-
-function estimate_parameters_cached2(pc::ProbΔ, w; pseudocount::Float64)
-    flow(n) = Float64(sum(sum(n.data)))
-    children_flows(n) = sum.(map(c -> c.data[1] .& n.data[1], children(n)))
-
-    if issomething(w)
-        flow_w(n) = sum(Float64.(n.data[1]) .* w)
-        children_flows_w(n) = sum.(map(c -> Float64.(c.data[1] .& n.data[1]) .* w, children(n)))
-        flow = flow_w
-        children_flows = children_flows_w
-    end
-
-    estimate_parameters_node2(n::ProbNode) = ()
-    function estimate_parameters_node2(n::Prob⋁)
-        if num_children(n) == 1
-            n.log_thetas .= 0.0
-        else
-            smoothed_flow = flow(n) + pseudocount
-            uniform_pseudocount = pseudocount / num_children(n)
-            n.log_thetas .= log.((children_flows(n) .+ uniform_pseudocount) ./ smoothed_flow)
-            @assert isapprox(sum(exp.(n.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
-            # normalize away any leftover error
-            n.log_thetas .- logsumexp(n.log_thetas)
-        end
-    end
-
-    foreach(estimate_parameters_node2, pc)
-end
-
-
-
-
-function estimate_parameters(pc::ProbΔ, data::XBatches{Bool}; pseudocount::Float64)
-    estimate_parameters(AggregateFlowΔ(pc, aggr_weight_type(data)), data; pseudocount=pseudocount)
-end
-
-function estimate_parameters(afc::AggregateFlowΔ, data::XBatches{Bool}; pseudocount::Float64)
-    @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
-    @assert (afc[end].origin isa ProbNode) "AggregateFlowΔ must originate in a ProbΔ"
-    collect_aggr_flows(afc, data)
-    estimate_parameters_cached(afc; pseudocount=pseudocount)
-    afc
-end
-
-function estimate_parameters(fc::FlowΔ, data::XBatches{Bool}; pseudocount::Float64)
-    @assert feature_type(data) == Bool "Can only learn probabilistic circuits on Bool data"
-    @assert (prob_origin(afc[end]) isa ProbNode) "FlowΔ must originate in a ProbΔ"
-    collect_aggr_flows(fc, data)
-    estimate_parameters_cached(origin(fc); pseudocount=pseudocount)
-end
-
- # turns aggregate statistics into theta parameters
-function estimate_parameters_cached(afc::AggregateFlowΔ; pseudocount::Float64)
-    foreach(n -> estimate_parameters_node(n; pseudocount=pseudocount), afc)
-end
-
-estimate_parameters_node(::AggregateFlowNode; pseudocount::Float64) = () # do nothing
-function estimate_parameters_node(n::AggregateFlow⋁; pseudocount)
-    origin = n.origin::Prob⋁
-    if num_children(n) == 1
-        origin.log_thetas .= 0.0
-    else
-        smoothed_aggr_flow = (n.aggr_flow + pseudocount)
-        uniform_pseudocount = pseudocount / num_children(n)
-        origin.log_thetas .= log.( (n.aggr_flow_children .+ uniform_pseudocount) ./ smoothed_aggr_flow )
-        @assert isapprox(sum(exp.(origin.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally: $(exp.(origin.log_thetas)), estimated from $(n.aggr_flow) and $(n.aggr_flow_children). Did you actually compute the aggregate flows?"
-        #normalize away any leftover error
-        origin.log_thetas .- logsumexp(origin.log_thetas)
-    end
-end
-
-##################
-# Sampling from a psdd
-##################
-
-"""
-Sample from a PSDD without any evidence
-"""
-function sample(circuit::ProbΔ)::AbstractVector{Bool}
-    inst = Dict{Var,Int64}()
-    simulate(circuit[end], inst)
-    len = length(keys(inst))
-    ans = Vector{Bool}()
-    for i = 1:len
-        push!(ans, inst[i])
-    end
-    ans
-end
-
-# Uniformly sample based on the probability of the items
-# and return the selected index
-function sample(probs::AbstractVector{<:Number})::Int32
-    z = sum(probs)
-    q = rand() * z
-    cur = 0.0
-    for i = 1:length(probs)
-        cur += probs[i]
-        if q <= cur
-            return i
-        end
-    end
-    return length(probs)
-end
-
-function simulate(node::ProbLiteral, inst::Dict{Var,Int64})
-    if ispositive(node)
-        inst[variable(node.origin)] = 1
-    else
-        inst[variable(node.origin)] = 0
-    end
-end
-
-function simulate(node::Prob⋁, inst::Dict{Var,Int64})
-    idx = sample(exp.(node.log_thetas))
-    simulate(node.children[idx], inst)
-end
-function simulate(node::Prob⋀, inst::Dict{Var,Int64})
-    for child in node.children
-        simulate(child, inst)
-    end
-end
-
-"""
-Sampling with Evidence from a psdd.
-Internally would call marginal pass up on a newly generated flow circuit.
-"""
-function sample(circuit::ProbΔ, evidence::PlainXData{Int8})::AbstractVector{Bool}
-    opts= (compact⋀=false, compact⋁=false)
-    flow_circuit = UpFlowΔ(circuit, 1, Float64, opts)
-    marginal_pass_up(flow_circuit, evidence)
-    sample(flow_circuit)
-end
-
-"""
-Sampling with Evidence from a psdd.
-Assuming already marginal pass up has been done on the flow circuit.
-"""
-function sample(circuit::UpFlowΔ)::AbstractVector{Bool}
-    inst = Dict{Var,Int64}()
-    simulate2(circuit[end], inst)
-    len = length(keys(inst))
-    ans = Vector{Bool}()
-    for i = 1:len
-        push!(ans, inst[i])
-    end
-    ans
-end
-
-function simulate2(node::UpFlowLiteral, inst::Dict{Var,Int64})
-    if ispositive(node)
-        #TODO I don't think we need these 'grand_origin' parts below
-        inst[variable(grand_origin(node))] = 1
-    else
-        inst[variable(grand_origin(node))] = 0
-    end
-end
-
-function simulate2(node::UpFlow⋁, inst::Dict{Var,Int64})
-    prs = [ pr(ch)[1] for ch in children(node) ]
-    idx = sample(exp.(node.origin.log_thetas .+ prs))
-    simulate2(children(node)[idx], inst)
-end
-
-function simulate2(node::UpFlow⋀, inst::Dict{Var,Int64})
-    for child in children(node)
-        simulate2(child, inst)
-    end
-end
\ No newline at end of file
diff --git a/test/Probabilistic/SamplingTest.jl b/test/Probabilistic/SamplingTest.jl
deleted file mode 100644
index 0e1afd5c..00000000
--- a/test/Probabilistic/SamplingTest.jl
+++ /dev/null
@@ -1,79 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-using DataStructures
-
-@testset "Sampling Test" begin
-    EPS = 1e-2;
-    prob_circuit = zoo_psdd("little_4var.psdd");
-    flow_circuit = FlowΔ(prob_circuit, 16, Bool);
-
-    N = 4;
-    data_all = XData(generate_data_all(N));
-
-    calc_prob_all = log_likelihood_per_instance(flow_circuit, data_all);
-    calc_prob_all = exp.(calc_prob_all);
-
-    using DataStructures
-    hist = DefaultDict{AbstractString,Float64}(0.0)
-
-    Nsamples = 1000 * 1000
-    for i = 1:Nsamples
-        cur = join(Int.(sample(prob_circuit)))
-        hist[cur] += 1
-    end
-
-    for k in keys(hist)
-        hist[k] /= Nsamples
-    end
-
-    for k in keys(hist)
-        cur = parse(Int32, k, base=2) + 1 # cause Julia arrays start at 1 :(
-        @test calc_prob_all[cur] ≈ hist[k] atol= EPS;
-    end
-
-
-end
-
-@testset "Sampling With Evidence" begin
-    # TODO (pashak) this test should be improved by adding few more cases
-    EPS = 1e-3;
-    prob_circuit = zoo_psdd("little_4var.psdd");
-
-    opts= (compact⋀=false, compact⋁=false)
-    flow_circuit = UpFlowΔ(prob_circuit, 1, Float64, opts);
-
-    N = 4;
-    data = XData(Int8.([0 -1 0 -1]));
-    calc_prob = marginal_log_likelihood_per_instance(flow_circuit, data);
-    calc_prob = exp.(calc_prob);
-
-    flow_circuit_all = UpFlowΔ(prob_circuit, 4, Float64, opts);
-    data_all = XData(Int8.([
-                            0 0 0 0;
-                            0 0 0 1;
-                            0 1 0 0;
-                            0 1 0 1;
-                        ]));
-    calc_prob_all = marginal_log_likelihood_per_instance(flow_circuit_all, data_all);
-    calc_prob_all = exp.(calc_prob_all);
-
-    calc_prob_all ./= calc_prob[1]
-
-    hist = DefaultDict{AbstractString,Float64}(0.0)
-
-    Nsamples = 1000 * 1000
-    for i = 1:Nsamples
-        cur = join(Int.(sample(flow_circuit)))
-        hist[cur] += 1
-    end
-
-    for k in keys(hist)
-        hist[k] /= Nsamples
-    end
-
-    for ind = 1:4
-        cur = join(data_all.x[ind, :])
-        @test calc_prob_all[ind] ≈ hist[cur] atol= EPS;
-    end
-end
\ No newline at end of file
diff --git a/test/Probabilistic/parameters_tests.jl b/test/Probabilistic/parameters_tests.jl
new file mode 100644
index 00000000..0f953904
--- /dev/null
+++ b/test/Probabilistic/parameters_tests.jl
@@ -0,0 +1,8 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+# TODO add tests
+@testset "MLE tests" begin
+    @test true
+end
\ No newline at end of file
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index 88263b58..24e57c08 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -2,7 +2,6 @@ using Test
 using LogicCircuits
 using ProbabilisticCircuits
 
-# This tests are supposed to test queries on the circuits
 @testset "Probability of Full Evidence" begin
     # Uses a PSDD with 4 variables, and tests 3 of the configurations to
     # match with python. Also tests all probabilities sum up to 1.
@@ -137,4 +136,72 @@ end
     evidence = Int8.(rand( (-1,0,1), (COUNT, N)))
 
     test_mpe_brute_force(prob_circuit, evidence)
+end
+
+@testset "Sampling Test" begin
+    EPS = 1e-2;
+    prob_circuit = zoo_psdd("little_4var.psdd");
+
+    N = 4;
+    data_all = generate_data_all(N);
+
+    calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all);
+    calc_prob_all = exp.(calc_prob_all);
+
+    using DataStructures
+    hist = DefaultDict{AbstractString,Float64}(0.0)
+
+    Nsamples = 1000 * 1000
+    for i = 1:Nsamples
+        cur = join(Int.(sample(prob_circuit)))
+        hist[cur] += 1
+    end
+
+    for k in keys(hist)
+        hist[k] /= Nsamples
+    end
+
+    for k in keys(hist)
+        cur = parse(Int32, k, base=2) + 1 # cause Julia arrays start at 1 :(
+        @test calc_prob_all[cur] ≈ hist[k] atol= EPS;
+    end
+
+
+end
+
+@testset "Sampling With Evidence" begin
+    # TODO (pashak) this test should be improved by adding few more cases
+    EPS = 1e-3;
+    prob_circuit = zoo_psdd("little_4var.psdd");
+
+    N = 4;
+    data = Int8.([0 -1 0 -1])
+    calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data);
+    calc_prob = exp.(calc_prob);
+
+    data_all = Int8.([0 0 0 0;
+                    0 0 0 1;
+                    0 1 0 0;
+                    0 1 0 1;]);
+    calc_prob_all = marginal_log_likelihood_per_instance(prob_circuit, data_all);
+    calc_prob_all = exp.(calc_prob_all);
+
+    calc_prob_all ./= calc_prob[1]
+
+    hist = DefaultDict{AbstractString,Float64}(0.0)
+
+    Nsamples = 1000 * 1000
+    for i = 1:Nsamples
+        cur = join(Int.(sample(prob_circuit, data)))
+        hist[cur] += 1
+    end
+
+    for k in keys(hist)
+        hist[k] /= Nsamples
+    end
+
+    for ind = 1:4
+        cur = join(data_all[ind, :])
+        @test calc_prob_all[ind] ≈ hist[cur] atol= EPS;
+    end
 end
\ No newline at end of file

From 1e46155b867a3a4c537bd4bc42f3d35e1eae31cd Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 16:04:37 -0700
Subject: [PATCH 020/131] fix tests

---
 src/LoadSave/circuit_loaders.jl               | 10 +--
 src/LoadSave/circuit_savers.jl                |  2 +-
 .../deprecated/Bagging.jl                     |  0
 .../deprecated/Clustering.jl                  |  0
 .../todo/EMLearner.jl                         |  0
 .../todo/Mixtures.jl                          |  0
 src/Probabilistic/informations.jl             | 80 +++++++++----------
 .../todo => StructureLearner}/VtreeLearner.jl |  0
 .../EMLearnerTest.jl                          |  0
 test/Probabilistic/MutualInformationTest.jl   | 30 -------
 test/Probabilistic/PrConstraintTest.jl        | 41 ----------
 test/Probabilistic/informations_tests.jl      | 37 +++++++++
 .../VtreeLearnerTest.jl                       |  0
 test/Utils/informations_tests.jl              | 30 +++++++
 test/runtests.jl                              |  3 +-
 15 files changed, 112 insertions(+), 121 deletions(-)
 rename src/{Probabilistic => Mixtures}/deprecated/Bagging.jl (100%)
 rename src/{Probabilistic => Mixtures}/deprecated/Clustering.jl (100%)
 rename src/{Probabilistic => Mixtures}/todo/EMLearner.jl (100%)
 rename src/{Probabilistic => Mixtures}/todo/Mixtures.jl (100%)
 rename src/{Probabilistic/todo => StructureLearner}/VtreeLearner.jl (100%)
 rename test/{Probabilistic => Mixtures}/EMLearnerTest.jl (100%)
 delete mode 100644 test/Probabilistic/MutualInformationTest.jl
 delete mode 100644 test/Probabilistic/PrConstraintTest.jl
 rename test/{Probabilistic => StructureLearner}/VtreeLearnerTest.jl (100%)

diff --git a/src/LoadSave/circuit_loaders.jl b/src/LoadSave/circuit_loaders.jl
index 90f1237b..d3ffec67 100644
--- a/src/LoadSave/circuit_loaders.jl
+++ b/src/LoadSave/circuit_loaders.jl
@@ -1,5 +1,5 @@
-export zoo_clt, zoo_clt_file, zoo_psdd, zoo_lc, zoo_lc_file,
-    load_prob_circuit, load_struct_prob_circuit, load_logistic_circuit
+export zoo_clt, zoo_clt_file, zoo_psdd, zoo_lc, load_prob_circuit, 
+load_struct_prob_circuit, load_logistic_circuit
 
 using LogicCircuits
 using Pkg.Artifacts
@@ -9,9 +9,6 @@ using LogicCircuits.LoadSave: parse_psdd_file, parse_circuit_file, parse_vtree_f
 # circuit loaders from module zoo
 #####################
 
-zoo_lc_file(name) = 
-    artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/lcs/$name"
-
 zoo_lc(name, num_classes) = 
     load_logistic_circuit(zoo_lc_file(name), num_classes)
 
@@ -21,9 +18,6 @@ zoo_clt_file(name) =
 zoo_clt(name) = 
     parse_clt(zoo_clt_file(name))
 
-zoo_psdd_file(name) = 
-    artifact"circuit_model_zoo" * "/Circuit-Model-Zoo-0.1.2/psdds/$name"
-
 zoo_psdd(name) = 
     load_prob_circuit(zoo_psdd_file(name))
 
diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index ab23580c..aa138a9e 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -131,7 +131,7 @@ import LogicCircuits.LoadSave: save_circuit, save_as_dot # make available for ex
 save_circuit(name::String, circuit::ProbCircuit, vtree::PlainVtree) =
     save_as_psdd(name, circuit, vtree)
 
-save_circuit(name::String, circuit::LogicCircuit, vtree::PlainVtree) =
+save_circuit(name::String, circuit::LogisticCircuit, vtree::PlainVtree) =
     save_as_logistic(name, circuit, vtree)
 
 using Printf: @sprintf
diff --git a/src/Probabilistic/deprecated/Bagging.jl b/src/Mixtures/deprecated/Bagging.jl
similarity index 100%
rename from src/Probabilistic/deprecated/Bagging.jl
rename to src/Mixtures/deprecated/Bagging.jl
diff --git a/src/Probabilistic/deprecated/Clustering.jl b/src/Mixtures/deprecated/Clustering.jl
similarity index 100%
rename from src/Probabilistic/deprecated/Clustering.jl
rename to src/Mixtures/deprecated/Clustering.jl
diff --git a/src/Probabilistic/todo/EMLearner.jl b/src/Mixtures/todo/EMLearner.jl
similarity index 100%
rename from src/Probabilistic/todo/EMLearner.jl
rename to src/Mixtures/todo/EMLearner.jl
diff --git a/src/Probabilistic/todo/Mixtures.jl b/src/Mixtures/todo/Mixtures.jl
similarity index 100%
rename from src/Probabilistic/todo/Mixtures.jl
rename to src/Mixtures/todo/Mixtures.jl
diff --git a/src/Probabilistic/informations.jl b/src/Probabilistic/informations.jl
index 04ad7531..57aeda1b 100644
--- a/src/Probabilistic/informations.jl
+++ b/src/Probabilistic/informations.jl
@@ -27,34 +27,34 @@ function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
                 return get!(cache, (psdd_node, sdd_node), 0.0)
             end
         else
-            pr_constraint(psdd_node, sdd_node.children[1], cache)
-            if length(sdd_node.children) > 1
-                pr_constraint(psdd_node, sdd_node.children[2], cache)
+            pr_constraint(psdd_node, children(sdd_node)[1], cache)
+            if length(children(sdd_node)) > 1
+                pr_constraint(psdd_node, children(sdd_node)[2], cache)
                 return get!(cache, (psdd_node, sdd_node), 1.0)
             else
                 return get!(cache, (psdd_node, sdd_node),
-                    literal(sdd_node.children[1]) == literal(psdd_node) ? 1.0 : 0.0)
+                    literal(children(sdd_node)[1]) == literal(psdd_node) ? 1.0 : 0.0)
             end
         end
     
     # The psdd is true
-    elseif psdd_node.children[1] isa ProbLiteralNode 
+    elseif children(psdd_node)[1] isa ProbLiteralNode 
         theta = exp(psdd_node.log_thetas[1])
         return get!(cache, (psdd_node, sdd_node),
-            theta * pr_constraint(psdd_node.children[1], sdd_node, cache) +
-            (1.0 - theta) * pr_constraint(psdd_node.children[2], sdd_node, cache))
+            theta * pr_constraint(children(psdd_node)[1], sdd_node, cache) +
+            (1.0 - theta) * pr_constraint(children(psdd_node)[2], sdd_node, cache))
     
     # Both psdds are not trivial
     else 
         prob = 0.0
-        for (prob⋀_node, log_theta) in zip(psdd_node.children, psdd_node.log_thetas)
-            p = prob⋀_node.children[1]
-            s = prob⋀_node.children[2]
+        for (prob⋀_node, log_theta) in zip(children(psdd_node), psdd_node.log_thetas)
+            p = children(prob⋀_node)[1]
+            s = children(prob⋀_node)[2]
 
             theta = exp(log_theta)
-            for sdd⋀_node in sdd_node.children
-                r = sdd⋀_node.children[1]
-                t = sdd⋀_node.children[2]
+            for sdd⋀_node in children(sdd_node)
+                r = children(sdd⋀_node)[1]
+                t = children(sdd⋀_node)[2]
                 prob += theta * pr_constraint(p, r, cache) * pr_constraint(s, t, cache)
             end
         end
@@ -69,15 +69,15 @@ Calculate entropy of the distribution of the input psdd."
 function entropy(psdd_node::Prob⋁Node, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
-    elseif psdd_node.children[1] isa ProbLiteralNode
+    elseif children(psdd_node)[1] isa ProbLiteralNode
         return get!(psdd_entropy_cache, psdd_node,
             - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
             exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2])
     else
         local_entropy = 0.0
-        for (prob⋀_node, log_prob) in zip(psdd_node.children, psdd_node.log_thetas)
-            p = prob⋀_node.children[1]
-            s = prob⋀_node.children[2]
+        for (prob⋀_node, log_prob) in zip(children(psdd_node), psdd_node.log_thetas)
+            p = children(prob⋀_node)[1]
+            s = children(prob⋀_node)[2]
 
             local_entropy += exp(log_prob) * (entropy(p, psdd_entropy_cache) +
                 entropy(s, psdd_entropy_cache) - log_prob)
@@ -87,8 +87,8 @@ function entropy(psdd_node::Prob⋁Node, psdd_entropy_cache::Dict{ProbCircuit, F
 end
 
 function entropy(psdd_node::Prob⋀Node, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
-    return get!(psdd_entropy_cache, psdd_node.children[1], entropy(psdd_node.children[1], psdd_entropy_cache)) +
-        get!(psdd_entropy_cache, psdd_node.children[2], entropy(psdd_node.children[2], psdd_entropy_cache))
+    return get!(psdd_entropy_cache, children(psdd_node)[1], entropy(children(psdd_node)[1], psdd_entropy_cache)) +
+        get!(psdd_entropy_cache, children(psdd_node)[2], entropy(children(psdd_node)[2], psdd_entropy_cache))
 end
 
 function entropy(psdd_node::ProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
@@ -105,11 +105,11 @@ function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::Prob⋁Node,
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[(psdd_node1, psdd_node2)]
-    elseif psdd_node1.children[1] isa ProbLiteralNode
+    elseif children(psdd_node1)[1] isa ProbLiteralNode
         if psdd_node2 isa ProbLiteralNode
-            kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-            if literal(psdd_node1.children[1]) == literal(psdd_node2)
+            kl_divergence(children(psdd_node1)[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+            if literal(children(psdd_node1)[1]) == literal(psdd_node2)
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
                     psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
                 )
@@ -121,12 +121,12 @@ function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::Prob⋁Node,
         else
             # The below four lines actually assign zero, but still we need to
             # call it.
-            kl_divergence(psdd_node1.children[1], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(psdd_node1.children[1], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(psdd_node1.children[2], psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(psdd_node1.children[2], psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(psdd_node1)[1], children(psdd_node2)[1], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(psdd_node1)[1], children(psdd_node2)[2], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(psdd_node1)[2], children(psdd_node2)[1], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(psdd_node1)[2], children(psdd_node2)[2], kl_divergence_cache, pr_constraint_cache)
             # There are two possible matches
-            if literal(psdd_node1.children[1]) == literal(psdd_node2.children[1])
+            if literal(children(psdd_node1)[1]) == literal(children(psdd_node2)[1])
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
                     exp(psdd_node1.log_thetas[1]) * (psdd_node1.log_thetas[1] - psdd_node2.log_thetas[1]) +
                     exp(psdd_node1.log_thetas[2]) * (psdd_node1.log_thetas[2] - psdd_node2.log_thetas[2])
@@ -142,13 +142,13 @@ function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::Prob⋁Node,
         kld = 0.0
 
         # loop through every combination of prim and sub
-        for (prob⋀_node1, log_theta1) in zip(psdd_node1.children, psdd_node1.log_thetas)
-            for (prob⋀_node2, log_theta2) in zip(psdd_node2.children, psdd_node2.log_thetas)
-                p = prob⋀_node1.children[1]
-                s = prob⋀_node1.children[2]
+        for (prob⋀_node1, log_theta1) in zip(children(psdd_node1), psdd_node1.log_thetas)
+            for (prob⋀_node2, log_theta2) in zip(children(psdd_node2), psdd_node2.log_thetas)
+                p = children(prob⋀_node1)[1]
+                s = children(prob⋀_node1)[2]
 
-                r = prob⋀_node2.children[1]
-                t = prob⋀_node2.children[2]
+                r = children(prob⋀_node2)[1]
+                t = children(prob⋀_node2)[2]
 
                 theta1 = exp(log_theta1)
 
@@ -187,9 +187,9 @@ function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::ProbLiteralNode,
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[psdd_node1, psdd_node2]
     else
-        kl_divergence(psdd_node1.children[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-        kl_divergence(psdd_node1.children[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-        if literal(psdd_node1.children[1]) == literal(psdd_node2)
+        kl_divergence(children(psdd_node1)[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
+        if literal(children(psdd_node1)[1]) == literal(psdd_node2)
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
                 psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
             )
@@ -208,9 +208,9 @@ function kl_divergence(psdd_node1::ProbLiteralNode, psdd_node2::Prob⋁Node,
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[psdd_node1, psdd_node2]
     else
-        kl_divergence(psdd_node1, psdd_node2.children[1], kl_divergence_cache, pr_constraint_cache)
-        kl_divergence(psdd_node1, psdd_node2.children[2], kl_divergence_cache, pr_constraint_cache)
-        if literal(psdd_node1) == literal(psdd_node2.children[1])
+        kl_divergence(psdd_node1, children(psdd_node2)[1], kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(psdd_node1, children(psdd_node2)[2], kl_divergence_cache, pr_constraint_cache)
+        if literal(psdd_node1) == literal(children(psdd_node2)[1])
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
                 -psdd_node2.log_thetas[1]
             )
diff --git a/src/Probabilistic/todo/VtreeLearner.jl b/src/StructureLearner/VtreeLearner.jl
similarity index 100%
rename from src/Probabilistic/todo/VtreeLearner.jl
rename to src/StructureLearner/VtreeLearner.jl
diff --git a/test/Probabilistic/EMLearnerTest.jl b/test/Mixtures/EMLearnerTest.jl
similarity index 100%
rename from test/Probabilistic/EMLearnerTest.jl
rename to test/Mixtures/EMLearnerTest.jl
diff --git a/test/Probabilistic/MutualInformationTest.jl b/test/Probabilistic/MutualInformationTest.jl
deleted file mode 100644
index 12fd4ab7..00000000
--- a/test/Probabilistic/MutualInformationTest.jl
+++ /dev/null
@@ -1,30 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-function conditional_entropy_test()
-    N = 10
-    D = 5
-
-    b = rand(Bool, N, D)
-    dis_cache, hy_given_x = conditional_entropy(b, nothing; α=0)
-    p = dis_cache.pairwise
-    m = dis_cache.marginal
-
-    for x in 1 : D, y in 1 : D
-        h_y_x = p[x, y, 1] * log(p[x, y, 1] / m[x, 1]) +
-                    p[x, y, 2] * log(p[x, y, 2] / m[x, 1]) +
-                    p[x, y, 3] * log(p[x, y, 3] / m[x, 2]) +
-                    p[x, y, 4] * log(p[x, y, 4] / m[x, 2])
-        if x == y
-            @test hy_given_x[x, y] == 0.0
-        elseif !isnan(h_y_x)
-            @test hy_given_x[x, y] ≈ - h_y_x atol=1e-12
-        end
-    end
-end
-
-@testset "Information Theory Test" begin
-    conditional_entropy_test()
-end
-
diff --git a/test/Probabilistic/PrConstraintTest.jl b/test/Probabilistic/PrConstraintTest.jl
deleted file mode 100644
index e4554b8c..00000000
--- a/test/Probabilistic/PrConstraintTest.jl
+++ /dev/null
@@ -1,41 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-
-@testset "pr_constraint Query" begin
-    # two nodes
-    simplevtree = zoo_vtree_file("simple2.vtree")
-    pc, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.4.psdd"), simplevtree)
-
-    cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
-
-    @test abs(pr_constraint(pc[end], pc[end], cache) - 1.0) < 1e-8
-    @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
-    @test abs(pr_constraint(pc[5], pc[4], cache) - 0.8) < 1e-8
-
-    file_circuit = "little_4var.circuit"
-    file_vtree = "little_4var.vtree"
-    logic_circuit, vtree = load_struct_smooth_logic_circuit(
-                                zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
-
-    pc = zoo_psdd("little_4var.psdd")
-
-    @test abs(pr_constraint(pc[end], logic_circuit[end - 1], cache) - 1.0) < 1e-8
-
-    # Test with two psdds
-    pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
-    pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
-
-    pr_constraint_cache = Dict{Tuple{ProbNode, Union{ProbNode, StructLogicCircuit}}, Float64}()
-    pr_constraint(pc1[end], pc2[end], pr_constraint_cache)
-    @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
-    @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
-    @test abs(pr_constraint_cache[pc1[3], pc2[4]] - 1.0) < 1e-8
-    @test abs(pr_constraint_cache[pc1[3], pc2[5]] - 0.0) < 1e-8
-    @test abs(pr_constraint_cache[pc1[9], pc2[8]] - 1.0) < 1e-8
-    @test abs(pr_constraint_cache[pc1[5], pc2[4]] - 0.2) < 1e-8
-    @test abs(pr_constraint_cache[pc1[5], pc2[5]] - 0.8) < 1e-8
-    @test abs(pr_constraint_cache[pc1[2], pc2[3]] - 1.0) < 1e-8
-end
\ No newline at end of file
diff --git a/test/Probabilistic/informations_tests.jl b/test/Probabilistic/informations_tests.jl
index 64e30164..91a23973 100644
--- a/test/Probabilistic/informations_tests.jl
+++ b/test/Probabilistic/informations_tests.jl
@@ -48,3 +48,40 @@ using ProbabilisticCircuits
     @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
 
 end
+
+@testset "Pr constraint Query" begin
+    # two nodes
+    simplevtree = zoo_vtree_file("simple2.vtree")
+    pc, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.4.psdd"), simplevtree)
+
+    cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
+
+    @test abs(pr_constraint(pc, pc, cache) - 1.0) < 1e-8
+    # @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
+    # @test abs(pr_constraint(pc[5], pc[4], cache) - 0.8) < 1e-8
+
+    file_circuit = "little_4var.circuit"
+    file_vtree = "little_4var.vtree"
+    logic_circuit, vtree = load_struct_smooth_logic_circuit(
+                                zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
+
+    pc = zoo_psdd("little_4var.psdd")
+
+    @test abs(pr_constraint(pc, children(logic_circuit)[1], cache) - 1.0) < 1e-8
+
+    # Test with two psdds
+    pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
+    pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
+
+    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
+    pr_constraint(pc1, pc2, pr_constraint_cache)
+    # @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[3], pc2[4]] - 1.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[3], pc2[5]] - 0.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[9], pc2[8]] - 1.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[5], pc2[4]] - 0.2) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[5], pc2[5]] - 0.8) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[2], pc2[3]] - 1.0) < 1e-8
+end
diff --git a/test/Probabilistic/VtreeLearnerTest.jl b/test/StructureLearner/VtreeLearnerTest.jl
similarity index 100%
rename from test/Probabilistic/VtreeLearnerTest.jl
rename to test/StructureLearner/VtreeLearnerTest.jl
diff --git a/test/Utils/informations_tests.jl b/test/Utils/informations_tests.jl
index e69de29b..12fd4ab7 100644
--- a/test/Utils/informations_tests.jl
+++ b/test/Utils/informations_tests.jl
@@ -0,0 +1,30 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+function conditional_entropy_test()
+    N = 10
+    D = 5
+
+    b = rand(Bool, N, D)
+    dis_cache, hy_given_x = conditional_entropy(b, nothing; α=0)
+    p = dis_cache.pairwise
+    m = dis_cache.marginal
+
+    for x in 1 : D, y in 1 : D
+        h_y_x = p[x, y, 1] * log(p[x, y, 1] / m[x, 1]) +
+                    p[x, y, 2] * log(p[x, y, 2] / m[x, 1]) +
+                    p[x, y, 3] * log(p[x, y, 3] / m[x, 2]) +
+                    p[x, y, 4] * log(p[x, y, 4] / m[x, 2])
+        if x == y
+            @test hy_given_x[x, y] == 0.0
+        elseif !isnan(h_y_x)
+            @test hy_given_x[x, y] ≈ - h_y_x atol=1e-12
+        end
+    end
+end
+
+@testset "Information Theory Test" begin
+    conditional_entropy_test()
+end
+
diff --git a/test/runtests.jl b/test/runtests.jl
index b9e58d89..769e66dd 100644
--- a/test/runtests.jl
+++ b/test/runtests.jl
@@ -11,4 +11,5 @@ end
 
 using Jive
 
-runtests(@__DIR__, skip=["runtests.jl", "helper"])
+# TODO reinstate after refactoring all modules
+runtests(@__DIR__, skip=["runtests.jl", "helper", "Reasoning", "StructureLearner", "Mixtures", "Utils"])

From ff710bdc934df296550497ae0bf7905be7f515e8 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 16:13:07 -0700
Subject: [PATCH 021/131] fix

---
 .travis.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.travis.yml b/.travis.yml
index 1c3624fc..5aa78bc7 100644
--- a/.travis.yml
+++ b/.travis.yml
@@ -12,7 +12,7 @@ jobs:
   include:
     - stage: "Unit Tests"      
       os: linux
-      julia: 1.3
+      julia: 1.5
       install:
         - julia -e 'using Pkg; Pkg.activate("."); Pkg.add(PackageSpec(url="https://github.com/Juice-jl/LogicCircuits.jl")); Pkg.instantiate(); Pkg.precompile()'
         - julia -e 'using Pkg; Pkg.activate("./test"); Pkg.add(PackageSpec(url="https://github.com/Juice-jl/LogicCircuits.jl")); Pkg.develop(PackageSpec(path = pwd())); Pkg.instantiate(); Pkg.precompile();'
@@ -25,7 +25,7 @@ jobs:
 
     - stage: "Deploy Documentation"      
       os: linux
-      julia: 1.3
+      julia: 1.5
       script:
         - julia --project=docs/ -e 'using Pkg; Pkg.develop(PackageSpec(path=pwd())); Pkg.instantiate()'
         - julia --project=docs/ docs/make.jl

From a816a5ac8efcc2aa1e1d3ac1b09573a04e628b50 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 16:23:52 -0700
Subject: [PATCH 022/131] fix

---
 Project.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Project.toml b/Project.toml
index 3dd5e37d..cc639b0c 100644
--- a/Project.toml
+++ b/Project.toml
@@ -32,4 +32,4 @@ Reexport = "0.2"
 SimpleWeightedGraphs = "1.1"
 StatsBase = "0.33"
 StatsFuns = "0.9"
-julia = "1.3"
+julia = "1.5"

From a953244dbfd18fef6f05ad15278779657780eef9 Mon Sep 17 00:00:00 2001
From: meihua <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 17:27:09 -0700
Subject: [PATCH 023/131] Rename Queries.jl to queries.jl

---
 src/Probabilistic/{Queries.jl => queries.jl} | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
 rename src/Probabilistic/{Queries.jl => queries.jl} (99%)

diff --git a/src/Probabilistic/Queries.jl b/src/Probabilistic/queries.jl
similarity index 99%
rename from src/Probabilistic/Queries.jl
rename to src/Probabilistic/queries.jl
index 441cc292..15f23419 100644
--- a/src/Probabilistic/Queries.jl
+++ b/src/Probabilistic/queries.jl
@@ -160,4 +160,4 @@ function sample(probs::AbstractVector{<:Number})::Int32
         end
     end
     return length(probs)
-end
\ No newline at end of file
+end

From 60198a6e5d277f79ad00159621a0e11090708724 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 19:21:42 -0700
Subject: [PATCH 024/131] reasoning

---
 src/LoadSave/circuit_savers.jl                |  2 +-
 src/Mixtures/deprecated/Bagging.jl            |  2 +-
 src/Mixtures/todo/EMLearner.jl                |  2 +-
 src/Mixtures/todo/Mixtures.jl                 |  8 +-
 src/ProbabilisticCircuits.jl                  |  5 +-
 src/Reasoning/Expectation.jl                  | 91 ++++++++++---------
 src/Reasoning/Reasoning.jl                    | 15 +--
 ...xpFlowCircuits.jl => exp_flow_circuits.jl} | 77 +++++++---------
 src/StructureLearner/CircuitBuilder.jl        | 14 +--
 src/StructureLearner/PSDDInitializer.jl       | 26 +++---
 src/Utils/decorators.jl                       |  3 +-
 test/Probabilistic/queries_tests.jl           |  3 +-
 ...ExpectationTest.jl => expectation_test.jl} | 34 +++----
 test/StructureLearner/CircuitBuilderTest.jl   |  2 +-
 test/StructureLearner/PSDDInitializerTest.jl  |  2 +-
 test/StructureLearner/VtreeLearnerTest.jl     |  2 +-
 test/runtests.jl                              |  2 +-
 17 files changed, 140 insertions(+), 150 deletions(-)
 rename src/Reasoning/{ExpFlowCircuits.jl => exp_flow_circuits.jl} (61%)
 rename test/Reasoning/{ExpectationTest.jl => expectation_test.jl} (78%)

diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index aa138a9e..0027ef1b 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -169,7 +169,7 @@ function save_as_dot(circuit::ProbCircuit, file::String)
         elseif n isa ProbLiteralNode && isnegative(n)
             write(f, "$(node_cache[n]) [label=\"-$(variable(n.origin))\"]\n")
         else
-            throw("unknown ProbNode type")
+            throw("unknown ProbCircuit type")
         end
     end
 
diff --git a/src/Mixtures/deprecated/Bagging.jl b/src/Mixtures/deprecated/Bagging.jl
index 42e60515..980fa4e2 100644
--- a/src/Mixtures/deprecated/Bagging.jl
+++ b/src/Mixtures/deprecated/Bagging.jl
@@ -10,7 +10,7 @@ function bootstrap_samples_ids(train_x::PlainXData, n_samples::Int
         ids, n_instances, replace=true) for i in 1:n_samples]
 end
     
-function train_bagging(# pcs::Vector{<:ProbΔ},
+function train_bagging(# pcs::Vector{<:ProbCircuit},
                         train_x::XBatches{Bool},
                         n_components::Int64;
                         init_models=nothing,
diff --git a/src/Mixtures/todo/EMLearner.jl b/src/Mixtures/todo/EMLearner.jl
index e16b6f7f..8ad45ce7 100644
--- a/src/Mixtures/todo/EMLearner.jl
+++ b/src/Mixtures/todo/EMLearner.jl
@@ -1,7 +1,7 @@
 """
 Train a mixture of probabilistic circuits from data, starting with random example weights.
 """
-function train_mixture( pcs::Vector{<:ProbΔ},
+function train_mixture( pcs::Vector{<:ProbCircuit},
                         train_x::XBatches{Bool},
                         pseudocount, num_iters;
                         structure_learner=nothing, learnstruct_step = num_iters + 1, # structure learning
diff --git a/src/Mixtures/todo/Mixtures.jl b/src/Mixtures/todo/Mixtures.jl
index 68041988..88d3498d 100644
--- a/src/Mixtures/todo/Mixtures.jl
+++ b/src/Mixtures/todo/Mixtures.jl
@@ -14,7 +14,7 @@ abstract type AbstractMetaMixture <: AbstractMixture end
 "A probabilistic mixture model of probabilistic circuits"
 struct FlatMixture <: AbstractFlatMixture
     weights::Vector{Float64}
-    components::Vector{<:ProbΔ}
+    components::Vector{<:ProbCircuit}
     FlatMixture(w,c) = begin
         @assert length(w) == length(c)
         @assert sum(w) ≈ 1.0
@@ -24,7 +24,7 @@ end
 
 FlatMixture(c) = FlatMixture(uniform(length(c)),c)
 
-"A mixture with cached flow circuits for each component (which are assumed to be ProbΔs)"
+"A mixture with cached flow circuits for each component (which are assumed to be ProbCircuits)"
 struct FlatMixtureWithFlow <: AbstractFlatMixture
     origin::FlatMixture
     flowcircuits::Vector{<:FlowΔ}
@@ -53,7 +53,7 @@ end
 MetaMixture(c) = MetaMixture(uniform(length(c)),c)
 
 Mixture(w, c::Vector{<:AbstractMixture}) = MetaMixture(w, c)
-Mixture(w, c::Vector{<:ProbΔ}) = FlatMixture(w, c)
+Mixture(w, c::Vector{<:ProbCircuit}) = FlatMixture(w, c)
 
 #####################
 # Functions
@@ -79,7 +79,7 @@ ensure_with_flows(m::FlatMixture, size_hint::Int)::FlatMixtureWithFlow = begin
 end
 ensure_with_flows(m::FlatMixtureWithFlow, ::Int)::FlatMixtureWithFlow = m
 
-replace_prob_circuits(m::FlatMixture, pcs::Vector{ProbΔ}) =
+replace_prob_circuits(m::FlatMixture, pcs::Vector{ProbCircuit}) =
     FlatMixture(component_weights(m), pcs)
 
 # log_likelihood
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index dea10633..6f62186d 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -15,15 +15,16 @@ include("Utils/Utils.jl")
 include("Probabilistic/Probabilistic.jl")
 include("Logistic/Logistic.jl")
 include("LoadSave/LoadSave.jl")
+include("Reasoning/Reasoning.jl")
+
 # include("StructureLearner/StructureLearner.jl")
-# include("Reasoning/Reasoning.jl")
 
 
 # USE CHILD MODULES (in order to re-export some functions)
 @reexport using .Probabilistic
 @reexport using .Logistic
 @reexport using .LoadSave
+@reexport using .Reasoning
 # @reexport using .StructureLearner
-# @reexport using .Reasoning
 
 end
diff --git a/src/Reasoning/Expectation.jl b/src/Reasoning/Expectation.jl
index f1246a58..0d397648 100644
--- a/src/Reasoning/Expectation.jl
+++ b/src/Reasoning/Expectation.jl
@@ -1,10 +1,13 @@
-ExpCacheDict = Dict{Pair{ProbNode, LogisticNode}, Array{Float64, 2}}
-MomentCacheDict = Dict{Tuple{ProbNode, LogisticNode, Int64}, Array{Float64, 2}}
+export Expectation, ExpectationUpward, Moment
+
+ExpCacheDict = Dict{Pair{ProbCircuit, LogisticCircuit}, Array{Float64, 2}}
+MomentCacheDict = Dict{Tuple{ProbCircuit, LogisticCircuit, Int64}, Array{Float64, 2}}
 
 struct ExpectationCache 
     f::ExpCacheDict
     fg::ExpCacheDict
 end
+
 ExpectationCache() = ExpectationCache(ExpCacheDict(), ExpCacheDict())
 
 struct MomentCache 
@@ -26,37 +29,37 @@ end
 """
 Missing values should be denoted by -1
 """
-function Expectation(pc::ProbΔ, lc::LogisticΔ, data::XData{Int8})
+function Expectation(pc::ProbCircuit, lc::LogisticCircuit, data)
     # 1. Get probability of each observation
-    fc, log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
+    log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
     p_observed = exp.( log_likelihoods )
     
     # 2. Expectation w.r.t. P(x_m, x_o)
     cache = ExpectationCache()
-    results_unnormalized = exp_g(pc[end], lc[end-1], data, cache) # skipping the bias node of lc
+    results_unnormalized = exp_g(pc, lc.children[1], data, cache) # skipping the bias node of lc
 
     # 3. Expectation w.r.t P(x_m | x_o)
     results = transpose(results_unnormalized) ./ p_observed
 
     # 4. Add Bias terms
-    biases = lc[end].thetas
+    biases = lc.thetas
     results .+= biases
     
     results, cache
 end
 
-function Moment(pc::ProbΔ, lc::LogisticΔ, data::XData{Int8}, moment::Int)
+function Moment(pc::ProbCircuit, lc::LogisticCircuit, data, moment::Int)
     # 1. Get probability of each observation
-    fc, log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
+    log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
     p_observed = exp.( log_likelihoods )
     
     # 2. Moment w.r.t. P(x_m, x_o)
     cache = MomentCache()
-    biases = lc[end].thetas
-    results_unnormalized = zeros(num_examples(data), classes(lc[end]))
+    biases = lc.thetas
+    results_unnormalized = zeros(num_examples(data), classes(lc))
     
     for z = 0:moment-1  
-        results_unnormalized .+= choose(moment, z) .* (biases .^ (z)) .* transpose(moment_g(pc[end], lc[end-1], data, moment - z, cache))
+        results_unnormalized .+= choose(moment, z) .* (biases .^ (z)) .* transpose(moment_g(pc, lc.children[1], data, moment - z, cache))
     end
     
     # 3. Moment w.r.t P(x_m | x_o)
@@ -69,30 +72,30 @@ function Moment(pc::ProbΔ, lc::LogisticΔ, data::XData{Int8}, moment::Int)
 end
 
 
-function ExpectationUpward(pc::ProbΔ, lc::LogisticΔ, data::XData{Int8})
-        # 1. Get probability of each observation
-        fc, log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
-        p_observed = exp.( log_likelihoods )
-        
-        # 2. Expectation w.r.t. P(x_m, x_o)
-        exps_flow = exp_pass_up(pc, lc, data)
-        results_unnormalized = exps_flow[end].fg
+function ExpectationUpward(pc::ProbCircuit, lc::LogisticCircuit, data)
+    # 1. Get probability of each observation
+    log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
+    p_observed = exp.( log_likelihoods )
     
-        # 3. Expectation w.r.t P(x_m | x_o)
-        results = transpose(results_unnormalized) ./ p_observed
+    # 2. Expectation w.r.t. P(x_m, x_o)
+    exps_flow = exp_pass_up(pc, lc, data)
+    results_unnormalized = exps_flow[end].fg
+
+    # 3. Expectation w.r.t P(x_m | x_o)
+    results = transpose(results_unnormalized) ./ p_observed
+
+    # 4. Add Bias terms
+    biases = lc.thetas
+    results .+= biases
     
-        # 4. Add Bias terms
-        biases = lc[end].thetas
-        results .+= biases
-        
-        results, exps_flow
+    results, exps_flow
 end
 
 
 # exp_f (pr-constraint) is originally from:
 #   Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
 
-function exp_f(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::Prob⋁Node, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
         pthetas = [exp(n.log_thetas[i]) for i in 1:length(n.children)]
@@ -105,7 +108,7 @@ function exp_f(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::Union{E
     end
 end
 
-function exp_f(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::Prob⋀Node, m::Logistic⋀Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = ones(1 , num_examples(data) )
         @fastmath for (i,j) in zip(n.children, m.children)
@@ -117,11 +120,11 @@ function exp_f(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, cache::Union{E
 end
 
 
-@inline function exp_f(n::ProbLiteral, m::LogisticLiteral, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
+@inline function exp_f(n::ProbLiteralNode, m::LogisticLiteral, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
         var = lit2var(literal(m))
-        X = feature_matrix(data)
+        X = data
         if ispositive(n) && ispositive(m) 
             # value[1, X[:, var] .== -1 ] .= 1.0  # missing observation always agrees
             # value[1, X[:, var] .== 1 ] .= 1.0 # positive observations
@@ -136,9 +139,9 @@ end
 end
 
 """
-Has to be a Logistic⋀Node with only one child, which is a leaf node 
+Has to be a Logistic⋁Node with only one child, which is a leaf node 
 """
-@inline function exp_f(n::ProbLiteral, m::Logistic⋀Node, data::XData{Int8}, cache::Union{ExpectationCache, MomentCache})
+@inline function exp_f(n::ProbLiteralNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         exp_f(n, m.children[1], data, cache)
     end
@@ -148,11 +151,11 @@ end
 ######## exp_g, exp_fg
 ########################################################################
 
-@inline function exp_g(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
+@inline function exp_g(n::Prob⋁Node, m::Logistic⋁Node, data, cache::ExpectationCache)
     exp_fg(n, m, data, cache) # exp_fg and exp_g are the same for OR nodes
 end
 
-# function exp_g(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
+# function exp_g(n::Prob⋀, m::Logistic⋀Node, data, cache::ExpectationCache)
 #     value = zeros(classes(m) , num_examples(data))
 #     @fastmath for (i,j) in zip(n.children, m.children)
 #         value .+= exp_fg(i, j, data, cache)
@@ -162,7 +165,7 @@ end
 # end
 
 
-function exp_fg(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
+function exp_fg(n::Prob⋁Node, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         value = zeros(classes(m) , num_examples(data) )
         pthetas = [exp(n.log_thetas[i]) for i in 1:length(n.children)]
@@ -176,7 +179,7 @@ function exp_fg(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, cache::Expect
     end
 end
 
-function exp_fg(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
+function exp_fg(n::Prob⋀Node, m::Logistic⋀Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         # Assuming 2 children
         value = exp_f(n.children[1], m.children[1], data, cache) .* exp_fg(n.children[2], m.children[2], data, cache)
@@ -187,15 +190,15 @@ end
 
 
 """
-Has to be a Logistic⋀Node with only one child, which is a leaf node 
+Has to be a Logistic⋁Node with only one child, which is a leaf node 
 """
-@inline function exp_fg(n::ProbLiteral, m::Logistic⋀Node, data::XData{Int8}, cache::ExpectationCache)
+@inline function exp_fg(n::ProbLiteralNode, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         m.thetas[1,:] .* exp_f(n, m, data, cache)
     end
 end
 
-@inline function exp_fg(n::ProbLiteral, m::LogisticLiteral, data::XData{Int8}, cache::ExpectationCache)
+@inline function exp_fg(n::ProbLiteralNode, m::LogisticLiteral, data, cache::ExpectationCache)
     #dont know how many classes, boradcasting does the job
     zeros(1 , num_examples(data)) 
 end
@@ -204,7 +207,7 @@ end
 ######## moment_g, moment_fg
 ########################################################################
 
-@inline function moment_g(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
+@inline function moment_g(n::Prob⋁Node, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         moment_fg(n, m, data, moment, cache)
     end
@@ -213,7 +216,7 @@ end
 """
 Calculating  E[g^k * f]
 """
-function moment_fg(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
+function moment_fg(n::Prob⋁Node, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
@@ -232,13 +235,13 @@ function moment_fg(n::Prob⋁, m::Logistic⋀Node, data::XData{Int8}, moment::In
     end
 end
 
-@inline function moment_fg(n::ProbLiteral, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
+@inline function moment_fg(n::ProbLiteralNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         m.thetas[1,:].^(moment) .* exp_f(n, m, data, cache)
     end
 end
 
-@inline function moment_fg(n::ProbLiteral, m::LogisticLiteral, data::XData{Int8}, moment::Int, cache::MomentCache)
+@inline function moment_fg(n::ProbLiteralNode, m::LogisticLiteral, data, moment::Int, cache::MomentCache)
     #dont know how many classes, boradcasting does the job
     if moment == 0
         exp_f(n, m, data, cache)
@@ -247,7 +250,7 @@ end
     end
 end
 
-function moment_fg(n::Prob⋀, m::Logistic⋀Node, data::XData{Int8}, moment::Int, cache::MomentCache)
+function moment_fg(n::Prob⋀Node, m::Logistic⋀Node, data, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
diff --git a/src/Reasoning/Reasoning.jl b/src/Reasoning/Reasoning.jl
index ce486ff4..a87f0145 100644
--- a/src/Reasoning/Reasoning.jl
+++ b/src/Reasoning/Reasoning.jl
@@ -1,20 +1,11 @@
 module Reasoning
 
 using LogicCircuits
+using ..Utils
 using ..Probabilistic
 using ..Logistic
-using ..Utils
-
-export 
-    UpExpFlow,
-    ExpFlowΔ,
-    exp_pass_up,
-    Expectation,
-    ExpectationUpward,
-    Moment
-
-include("Expectation.jl")
-include("ExpFlowCircuits.jl")
 
+include("expectation.jl")
+include("exp_flow_circuits.jl")
 
 end
\ No newline at end of file
diff --git a/src/Reasoning/ExpFlowCircuits.jl b/src/Reasoning/exp_flow_circuits.jl
similarity index 61%
rename from src/Reasoning/ExpFlowCircuits.jl
rename to src/Reasoning/exp_flow_circuits.jl
index 314423b7..7722fe5d 100644
--- a/src/Reasoning/ExpFlowCircuits.jl
+++ b/src/Reasoning/exp_flow_circuits.jl
@@ -1,74 +1,67 @@
-########################
-# Do not use for now
-######################
+export UpExpFlow, ExpFlowCircuit, exp_pass_up
+
 #####################
 # Expectation Flow circuits
 # For use of algorithms depending on pairs of nodes of two circuits
 #####################
 
 "A expectation circuit node that has pair of origins of type PC and type LC"
-abstract type DecoratorNodePair{PC<:Node, LC<:Node} <: Node end
-
-abstract type ExpFlowNode{PC, LC, F} <: DecoratorNodePair{PC, LC} end
+abstract type ExpFlowNode{F} end
 
-const ExpFlowΔ{O} = AbstractVector{<:ExpFlowNode{<:O}}
+const ExpFlowCircuit{O} = Vector{<:ExpFlowNode{<:O}}
 
-struct UpExpFlow{PC, LC, F} <: ExpFlowNode{PC, LC, F}
-    p_origin::PC
-    f_origin::LC
-    children::Vector{<:ExpFlowNode{<:PC, <:LC, <:F}}
+struct UpExpFlow{F} <: ExpFlowNode{F}
+    p_origin::ProbCircuit
+    f_origin::LogisticCircuit
+    children::Vector{<:ExpFlowNode{<:F}}
     f::F
     fg::F
 end
 
-
 """
 Construct a upward expectation flow circuit from a given pair of PC and LC circuits
 Note that its assuming the two circuits share the same vtree
 """
-function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) where El
-    pc_type = grapheltype(pc)
-    lc_type = grapheltype(lc)
-
+function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, ::Type{El}) where El
     F = Array{El, 2}
     fmem = () -> zeros(1, batch_size) #Vector{El}(undef, batch_size)  #init_array(El, batch_size) # note: fmem's return type will determine type of all UpFlows in the circuit (should be El)
-    fgmem = () -> zeros(classes(lc[end]), batch_size)
+    fgmem = () -> zeros(classes(lc), batch_size)
 
-    root_pc = pc[end]
-    root_lc = lc[end- 1]
+    root_pc = pc
+    root_lc = lc.children[1]
     
     cache = Dict{Pair{Node, Node}, ExpFlowNode}()
-    sizehint!(cache, (length(pc) + length(lc))*4÷3)
+    sizehint!(cache, (num_nodes(pc) + num_nodes(lc))*4÷3)
     expFlowCircuit = Vector{ExpFlowNode}()
 
-    function ExpflowTraverse(n::Prob⋁, m::Logistic⋀Node) 
+    function ExpflowTraverse(n::Prob⋁Node, m::Logistic⋁Node) 
         get!(cache, Pair(n, m)) do
             children = [ ExpflowTraverse(i, j) for i in n.children for j in m.children]
-            node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
+            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
     end
-    function ExpflowTraverse(n::Prob⋀, m::Logistic⋀Node) 
+    function ExpflowTraverse(n::Prob⋀Node, m::Logistic⋀Node) 
         get!(cache, Pair(n, m)) do
             children = [ ExpflowTraverse(z[1], z[2]) for z in zip(n.children, m.children) ]
-            node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
+            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
     end
-    function ExpflowTraverse(n::ProbLiteral, m::Logistic⋀Node) 
+    function ExpflowTraverse(n::ProbLiteralNode, m::Logistic⋁Node) 
         get!(cache, Pair(n, m)) do
-            children = Vector{ExpFlowNode{pc_type,lc_type, F}}() # TODO
-            node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
+            children = Vector{ExpFlowNode{F}}() # TODO
+            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
     end
-    function ExpflowTraverse(n::ProbLiteral, m::LogisticLiteral) 
+    function ExpflowTraverse(n::ProbLiteralNode, m::LogisticLiteral) 
         get!(cache, Pair(n, m)) do
-            children = Vector{ExpFlowNode{pc_type,lc_type, F}}() # TODO
-            node = UpExpFlow{pc_type,lc_type, F}(n, m, children, fmem(), fgmem())
+            children = Vector{ExpFlowNode{F}}() # TODO
+            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
@@ -78,28 +71,28 @@ function ExpFlowΔ(pc::ProbΔ, lc::LogisticΔ, batch_size::Int, ::Type{El}) wher
     expFlowCircuit
 end
 
-function exp_pass_up(pc::ProbΔ, lc::LogisticΔ, data::XData{E}) where{E <: eltype(F)} where{PC, LC, F}
-    expFlowCircuit = ExpFlowΔ(pc, lc, num_examples(data), Float64);
+function exp_pass_up(pc::ProbCircuit, lc::LogisticCircuit, data)
+    expFlowCircuit = ExpFlowCircuit(pc, lc, num_examples(data), Float64);
     for n in expFlowCircuit
         exp_pass_up_node(n, data)
     end 
     expFlowCircuit
 end
 
-function exp_pass_up(fc::ExpFlowΔ, data::XData{E}) where{E <: eltype(F)} where{PC, LC, F}
+function exp_pass_up(fc::ExpFlowCircuit, data)
     #TODO write resize_flows similar to flow_circuits
     #     and give as input the expFlowCircuit instead
-    #expFlowCircuit = ExpFlowΔ(pc, lc, num_examples(data), Float64);
+    #expFlowCircuit = ExpFlowCircuit(pc, lc, num_examples(data), Float64);
     for n in fc
         exp_pass_up_node(n, data)
     end
 end
 
-function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <: eltype(F)} where{PC, LC, F}
+function exp_pass_up_node(node::ExpFlowNode{E}, data) where E
     pType = typeof(node.p_origin)
     fType = typeof(node.f_origin)
 
-    if node.p_origin isa Prob⋁ && node.f_origin isa Logistic⋀Node
+    if node.p_origin isa Prob⋁Node && node.f_origin isa Logistic⋁Node
         #todo this ordering might be different than the ExpFlowNode children
         pthetas = [exp(node.p_origin.log_thetas[i])
                     for i in 1:length(node.p_origin.children) for j in 1:length(node.f_origin.children)]
@@ -113,13 +106,13 @@ function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <:
             node.fg .+= (pthetas[z] .* fthetas[z]) .* node.children[z].f
             node.fg .+= pthetas[z] .* node.children[z].fg
         end
-    elseif node.p_origin isa Prob⋀ && node.f_origin isa Logistic⋀Node
+    elseif node.p_origin isa Prob⋀Node && node.f_origin isa Logistic⋀Node
         node.f .= node.children[1].f .* node.children[2].f # assume 2 children
         node.fg .= (node.children[1].f .* node.children[2].fg) .+
                    (node.children[2].f .* node.children[1].fg)
 
-    elseif node.p_origin isa ProbLiteral 
-        if node.f_origin isa Logistic⋀Node
+    elseif node.p_origin isa ProbLiteralNode 
+        if node.f_origin isa Logistic⋁Node
             m = node.f_origin.children[1]
         elseif node.f_origin isa LogisticLiteral
             m = node.f_origin
@@ -127,8 +120,8 @@ function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <:
             error("Invalid Types of pairs {$pType} - {$fType}")
         end
 
-        var = lit2var(literal(m))
-        X = feature_matrix(data)
+        var = variable(m)
+        X = data
         if ispositive(node.p_origin) && ispositive(m)
             node.f[:, X[:, var] .!= 0 ] .= 1.0 # positive and missing observations
             node.f[:, X[:, var] .== 0 ] .= 0.0
@@ -139,7 +132,7 @@ function exp_pass_up_node(node::ExpFlowNode{PC,LC,F}, data::XData{E}) where{E <:
             node.f .= 0.0
         end
 
-        if node.f_origin isa Logistic⋀Node
+        if node.f_origin isa Logistic⋁Node
             node.fg .= node.f .* transpose(node.f_origin.thetas)
         else
             node.fg .= 0.0
diff --git a/src/StructureLearner/CircuitBuilder.jl b/src/StructureLearner/CircuitBuilder.jl
index cfdefccb..758b3b1f 100644
--- a/src/StructureLearner/CircuitBuilder.jl
+++ b/src/StructureLearner/CircuitBuilder.jl
@@ -9,7 +9,7 @@ using MetaGraphs: get_prop
 Learning from data a circuit with several structure learning algorithms
 """
 function learn_probabilistic_circuit(data::Union{XData, WXData}; 
-        pseudocount = 1.0, algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"))::ProbΔ
+        pseudocount = 1.0, algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"))::ProbCircuit
     if algo == "chow-liu"
         clt = learn_chow_liu_tree(data; algo_kwargs...)
         pc = compile_prob_circuit_from_clt(clt)
@@ -21,15 +21,15 @@ function learn_probabilistic_circuit(data::Union{XData, WXData};
 end
 
 "Build decomposable probability circuits from Chow-Liu tree"
-function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
+function compile_prob_circuit_from_clt(clt::CLT)::ProbCircuit
     topo_order = Var.(reverse(topological_sort_by_dfs(clt::CLT))) #order to parse the node
-    lin = Vector{ProbNode}()
+    lin = Vector{ProbCircuit}()
     node_cache = Dict{Lit, LogicCircuit}()
     prob_cache = ProbCache()
     parent = parent_vector(clt)
 
-    prob_children(n)::Vector{<:ProbNode{<:node_type_deprecated(n)}} =  
-        collect(ProbNode{<:node_type_deprecated(n)}, map(c -> prob_cache[c], n.children))
+    prob_children(n)::Vector{<:ProbCircuit{<:node_type_deprecated(n)}} =  
+        collect(ProbCircuit{<:node_type_deprecated(n)}, map(c -> prob_cache[c], n.children))
 
     "default order of circuit node, from left to right: +/1 -/0"
 
@@ -100,7 +100,7 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
         return n
     end
 
-    function compile_independent_roots(roots::Vector{ProbNode})
+    function compile_independent_roots(roots::Vector{ProbCircuit})
         temp = Plain⋀Node([c.origin for c in roots])
         n = Prob⋀(temp, prob_children(temp))
         prob_cache[temp] = n
@@ -112,7 +112,7 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbΔ
         push!(lin, n)
     end
 
-    roots = Vector{ProbNode}()
+    roots = Vector{ProbCircuit}()
     for id in topo_order
         children = Var.(outneighbors(clt, id))
         if isequal(children, [])
diff --git a/src/StructureLearner/PSDDInitializer.jl b/src/StructureLearner/PSDDInitializer.jl
index a394dac6..7a086875 100644
--- a/src/StructureLearner/PSDDInitializer.jl
+++ b/src/StructureLearner/PSDDInitializer.jl
@@ -97,14 +97,14 @@ function compile_psdd_from_clt(clt::MetaDiGraph, vtree::PlainVtree)
     order = linearize(vtree[end])
     parent_clt = Var.(parent_vector(clt))
 
-    lin = Vector{ProbNode}()
+    lin = Vector{ProbCircuit}()
     prob_cache = ProbCache()
     lit_cache = LitCache()
-    v2p = Dict{PlainVtree, ProbΔ}()
+    v2p = Dict{PlainVtree, ProbCircuit}()
 
     get_params(cpt::Dict) = length(cpt) == 2 ? [cpt[1], cpt[0]] : [cpt[(1,1)], cpt[(0,1)], cpt[(1,0)], cpt[(0,0)]]
-    function add_mapping!(v::PlainVtree, circuits::ProbΔ)
-        if !haskey(v2p, v); v2p[v] = Vector{ProbNode}(); end
+    function add_mapping!(v::PlainVtree, circuits::ProbCircuit)
+        if !haskey(v2p, v); v2p[v] = Vector{ProbCircuit}(); end
         foreach(c -> if !(c in v2p[v]) push!(v2p[v], c);end, circuits)
     end
 
@@ -149,7 +149,7 @@ end
 #####################
 
 prob_children(n, prob_cache) =  
-    collect(ProbNode{<:StructLogicCircuit}, map(c -> prob_cache[c], n.children))
+    collect(ProbCircuit{<:StructLogicCircuit}, map(c -> prob_cache[c], n.children))
 
 "Add leaf nodes to circuit `lin`"
 function add_prob_leaf_node(var::Var, vtree::PlainVtreeLeafNode, lit_cache::LitCache, prob_cache::ProbCache, lin)
@@ -167,7 +167,7 @@ function add_prob_leaf_node(var::Var, vtree::PlainVtreeLeafNode, lit_cache::LitC
 end
 
 "Add prob⋀ node to circuit `lin`"
-function add_prob⋀_node(children::ProbΔ, vtree::PlainVtreeInnerNode, prob_cache::ProbCache, lin)::Prob⋀
+function add_prob⋀_node(children::ProbCircuit, vtree::PlainVtreeInnerNode, prob_cache::ProbCache, lin)::Prob⋀
     logic = PlainStruct⋀Node{PlainVtree}([c.origin for c in children], vtree)
     prob = Prob⋀(logic, prob_children(logic, prob_cache))
     prob_cache[logic] = prob
@@ -176,7 +176,7 @@ function add_prob⋀_node(children::ProbΔ, vtree::PlainVtreeInnerNode, prob_cac
 end
 
 "Add prob⋁ node to circuit `lin`"
-function add_prob⋁_node(children::ProbΔ, vtree::PlainVtree, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
+function add_prob⋁_node(children::ProbCircuit, vtree::PlainVtree, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
     logic = PlainStruct⋁Node{PlainVtree}([c.origin for c in children], vtree)
     prob = Prob⋁(logic, prob_children(logic, prob_cache))
     prob.log_thetas = log.(thetas)
@@ -186,7 +186,7 @@ function add_prob⋁_node(children::ProbΔ, vtree::PlainVtree, thetas::Vector{Fl
 end
 
 "Construct decision nodes given `primes` and `subs`"
-function compile_decision_node(primes::ProbΔ, subs::ProbΔ, vtree::PlainVtreeInnerNode, params::Vector{Float64}, prob_cache::ProbCache, lin)
+function compile_decision_node(primes::ProbCircuit, subs::ProbCircuit, vtree::PlainVtreeInnerNode, params::Vector{Float64}, prob_cache::ProbCache, lin)
     elements = [add_prob⋀_node([prime, sub], vtree, prob_cache, lin) for (prime, sub) in zip(primes, subs)]
     return add_prob⋁_node(elements, vtree, params, prob_cache, lin)
 end
@@ -204,7 +204,7 @@ function compile_true_nodes(var::Var, vtree::PlainVtreeLeafNode, probs::Vector{F
 end
 
 "Construct decision nodes conditiond on different distribution"
-function compile_decision_nodes(primes::ProbΔ, subs::ProbΔ, vtree::PlainVtreeInnerNode, params::Vector{Float64}, prob_cache::ProbCache, lin)
+function compile_decision_nodes(primes::ProbCircuit, subs::ProbCircuit, vtree::PlainVtreeInnerNode, params::Vector{Float64}, prob_cache::ProbCache, lin)
     return [compile_decision_node(primes, subs, vtree, params[i:i+1], prob_cache, lin) for i in 1:2:length(params)]
 end
 
@@ -230,7 +230,7 @@ function set_base(index, n::PlainStruct⋀Node, bases)
     bases[n] = sum([bases[c] for c in n.children])
 end
 
-function calculate_all_bases(circuit::ProbΔ)::BaseCache
+function calculate_all_bases(circuit::ProbCircuit)::BaseCache
     num_var = num_variables(circuit[end].origin.vtree)
     bases = BaseCache()
     foreach(n -> bases[n.origin] = fill(⊤, num_var), circuit)
@@ -243,7 +243,7 @@ end
 # Compile fully factorized PSDD from vtree, all variables are independent initially
 #####################
 
-function compile_fully_factorized_psdd_from_vtree(vtree::PlainVtree)::ProbΔ
+function compile_fully_factorized_psdd_from_vtree(vtree::PlainVtree)::ProbCircuit
 
     function ful_factor_node(v::PlainVtreeLeafNode, lit_cache::LitCache, prob_cache::ProbCache, v2n, lin)
         var = variables(v)[1]
@@ -262,10 +262,10 @@ function compile_fully_factorized_psdd_from_vtree(vtree::PlainVtree)::ProbΔ
         nothing
     end
 
-    lin = Vector{ProbNode}()
+    lin = Vector{ProbCircuit}()
     prob_cache = ProbCache()
     lit_cache = LitCache()
-    v2n = Dict{PlainVtree, ProbNode}()
+    v2n = Dict{PlainVtree, ProbCircuit}()
 
     for v in vtree
         ful_factor_node(v, lit_cache, prob_cache, v2n, lin)
diff --git a/src/Utils/decorators.jl b/src/Utils/decorators.jl
index 38097da4..b5611870 100644
--- a/src/Utils/decorators.jl
+++ b/src/Utils/decorators.jl
@@ -4,7 +4,8 @@ GateType, NodeType, variable, ispositive, isnegative, origin, num_parameters
 using LogicCircuits
 
 "Root of the decorator circuit node hierarchy"
-abstract type DecoratorCircuit <: Dag end
+# TODO rm DecoratorCircuit Type 
+abstract type DecoratorCircuit <: LogicCircuit end
 
 #####################
 # functions that need to be implemented for each type of decorator circuit
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index 24e57c08..b87cd359 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -169,9 +169,10 @@ end
 
 end
 
+using DataStructures
 @testset "Sampling With Evidence" begin
     # TODO (pashak) this test should be improved by adding few more cases
-    EPS = 1e-3;
+    EPS = 1e-2;
     prob_circuit = zoo_psdd("little_4var.psdd");
 
     N = 4;
diff --git a/test/Reasoning/ExpectationTest.jl b/test/Reasoning/expectation_test.jl
similarity index 78%
rename from test/Reasoning/ExpectationTest.jl
rename to test/Reasoning/expectation_test.jl
index b0b59a71..c8aafc50 100644
--- a/test/Reasoning/ExpectationTest.jl
+++ b/test/Reasoning/expectation_test.jl
@@ -2,19 +2,19 @@ using Test
 using LogicCircuits
 using ProbabilisticCircuits
 
-function test_expectation_brute_force(pc::ProbΔ, lc::LogisticΔ, data::XData, CLASSES::Int)
+function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int)
     EPS = 1e-7;
-    COUNT = size(data.x)[1]
+    COUNT = size(data)[1]
     # Compute True expectation brute force
     true_exp = zeros(COUNT, CLASSES)
     for i in 1:COUNT
-        row = data.x[i, :]
-        cur_data_all = XData(generate_all(row))
+        row = data[i, :]
+        cur_data_all = generate_all(row)
 
-        fc1, calc_p = log_likelihood_per_instance(pc, cur_data_all)
+        calc_p = log_likelihood_per_instance(pc, cur_data_all)
         calc_p = exp.(calc_p)
 
-        fc2, calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
         true_exp[i, :] = sum(calc_p .* calc_f, dims=1)
         true_exp[i, :] ./= sum(calc_p) #p_observed
     end
@@ -35,19 +35,19 @@ function test_expectation_brute_force(pc::ProbΔ, lc::LogisticΔ, data::XData, C
     end
 end
 
-function test_moment_brute_force(pc::ProbΔ, lc::LogisticΔ, data::XData, CLASSES::Int, moment::Int)
+function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int, moment::Int)
     EPS = 1e-7;
-    COUNT = size(data.x)[1]
+    COUNT = size(data)[1]
     # Compute True moment brute force
     true_mom = zeros(COUNT, CLASSES)
     for i in 1:COUNT
-        row = data.x[i, :]
-        cur_data_all = XData(generate_all(row))
+        row = data[i, :]
+        cur_data_all = generate_all(row)
 
-        fc1, calc_p = log_likelihood_per_instance(pc, cur_data_all)
+        calc_p = log_likelihood_per_instance(pc, cur_data_all)
         calc_p = exp.(calc_p)
 
-        fc2, calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
         true_mom[i, :] = sum(calc_p .* (calc_f .^ moment), dims=1)
         true_mom[i, :] ./= sum(calc_p) #p_observed
     end
@@ -70,7 +70,7 @@ end
 
     pc = zoo_psdd(psdd_file);
     lc = zoo_lc(logistic_file, CLASSES);
-    data = XData(Int8.([
+    data = Int8.([
                         0 0 0 0; 
                         0 1 1 0; 
                         0 0 1 1;
@@ -82,7 +82,7 @@ end
                         -1 -1 0 1;
                         -1 -1 -1 1;
                         -1 -1 -1 0;
-                        ]));
+                        ]);
 
     test_expectation_brute_force(pc, lc, data, CLASSES)
 end
@@ -97,7 +97,7 @@ end
 
     pc = zoo_psdd(psdd_file);
     lc = zoo_lc(logistic_file, CLASSES);
-    data = XData(Int8.(rand( (-1,0,1), (COUNT, N) )))
+    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
     
     test_expectation_brute_force(pc, lc, data, CLASSES)
 end
@@ -112,7 +112,7 @@ end
 
     pc = zoo_psdd(psdd_file);
     lc = zoo_lc(logistic_file, CLASSES);
-    data = XData(Int8.(rand( (-1,0,1), (COUNT, N) )))
+    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
 
     test_moment_brute_force(pc, lc, data, CLASSES, 1)
     test_moment_brute_force(pc, lc, data, CLASSES, 2)
@@ -131,7 +131,7 @@ end
 
     pc = zoo_psdd(psdd_file);
     lc = zoo_lc(logistic_file, CLASSES);
-    data = XData(Int8.(rand( (-1,0,1), (COUNT, N) )))
+    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
 
     test_moment_brute_force(pc, lc, data, CLASSES, 1)
     test_moment_brute_force(pc, lc, data, CLASSES, 2)
diff --git a/test/StructureLearner/CircuitBuilderTest.jl b/test/StructureLearner/CircuitBuilderTest.jl
index 48415a53..40c38db5 100644
--- a/test/StructureLearner/CircuitBuilderTest.jl
+++ b/test/StructureLearner/CircuitBuilderTest.jl
@@ -8,7 +8,7 @@ using ProbabilisticCircuits
     pc = learn_probabilistic_circuit(train_x; pseudocount = 1.0, algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"))
     
     # simple test
-    @test pc isa ProbΔ
+    @test pc isa ProbCircuit
     @test check_parameter_integrity(pc)
     @test num_parameters(pc) == 62 
     @test pc[26].log_thetas[1] ≈ -0.023528423773273476 atol=1.0e-7
diff --git a/test/StructureLearner/PSDDInitializerTest.jl b/test/StructureLearner/PSDDInitializerTest.jl
index 2065e894..cd8b51a3 100644
--- a/test/StructureLearner/PSDDInitializerTest.jl
+++ b/test/StructureLearner/PSDDInitializerTest.jl
@@ -9,7 +9,7 @@ using ProbabilisticCircuits
             vtree = "chow-liu", vtree_kwargs=(vtree_mode="balanced",))
     
     # simple test
-    @test pc isa ProbΔ
+    @test pc isa ProbCircuit
     @test vtree isa PlainVtree
     @test num_variables(vtree) == num_features(data)
     @test check_parameter_integrity(pc)
diff --git a/test/StructureLearner/VtreeLearnerTest.jl b/test/StructureLearner/VtreeLearnerTest.jl
index 146929fb..a9dac98a 100644
--- a/test/StructureLearner/VtreeLearnerTest.jl
+++ b/test/StructureLearner/VtreeLearnerTest.jl
@@ -13,7 +13,7 @@ using ProbabilisticCircuits
     mktempdir() do tmp
         save(vtree, "$tmp/test.vtree.dot")        
         psdd = compile_psdd_from_clt(clt, vtree);
-        @test psdd isa ProbΔ
+        @test psdd isa ProbCircuit
         save_as_dot(psdd, "$tmp/test.psdd.dot")
     end
     
diff --git a/test/runtests.jl b/test/runtests.jl
index 769e66dd..bddbc3e2 100644
--- a/test/runtests.jl
+++ b/test/runtests.jl
@@ -12,4 +12,4 @@ end
 using Jive
 
 # TODO reinstate after refactoring all modules
-runtests(@__DIR__, skip=["runtests.jl", "helper", "Reasoning", "StructureLearner", "Mixtures", "Utils"])
+runtests(@__DIR__, skip=["runtests.jl", "helper", "StructureLearner", "Mixtures", "Utils"])

From c3bb754f753a825dcd5a0cead3b514616c6dc3e2 Mon Sep 17 00:00:00 2001
From: meihua <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 19:31:41 -0700
Subject: [PATCH 025/131] Rename Expectation.jl to expectation.jl

---
 src/Reasoning/{Expectation.jl => expectation.jl} | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
 rename src/Reasoning/{Expectation.jl => expectation.jl} (99%)

diff --git a/src/Reasoning/Expectation.jl b/src/Reasoning/expectation.jl
similarity index 99%
rename from src/Reasoning/Expectation.jl
rename to src/Reasoning/expectation.jl
index 0d397648..92f25309 100644
--- a/src/Reasoning/Expectation.jl
+++ b/src/Reasoning/expectation.jl
@@ -262,4 +262,4 @@ function moment_fg(n::Prob⋀Node, m::Logistic⋀Node, data, moment::Int, cache:
         end
         return value
     end
-end
\ No newline at end of file
+end

From a445f96de2b240f2551f9bf4ec14d2427573b238 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 24 Jul 2020 19:37:12 -0700
Subject: [PATCH 026/131] add todo

---
 src/Probabilistic/parameters.jl | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 60047fae..cd53ae5b 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -23,3 +23,5 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     end
 end
 
+
+# TODO add em paramaters learning 

From afb1460560bbace9da9c5b4abc547780b5243a79 Mon Sep 17 00:00:00 2001
From: Pasha Khosravi <khosravipasha@users.noreply.github.com>
Date: Sat, 25 Jul 2020 02:06:21 -0700
Subject: [PATCH 027/131] fix doc build issue

Doc build uses the latest release of LogicCircuits instead of lastest commit, changing it to use the latest commit.
---
 .travis.yml | 9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/.travis.yml b/.travis.yml
index 5aa78bc7..753ff389 100644
--- a/.travis.yml
+++ b/.travis.yml
@@ -14,20 +14,21 @@ jobs:
       os: linux
       julia: 1.5
       install:
-        - julia -e 'using Pkg; Pkg.activate("."); Pkg.add(PackageSpec(url="https://github.com/Juice-jl/LogicCircuits.jl")); Pkg.instantiate(); Pkg.precompile()'
+        - julia -e 'using Pkg; Pkg.activate("."); Pkg.add(PackageSpec(url="https://github.com/Juice-jl/LogicCircuits.jl")); Pkg.instantiate(); Pkg.precompile();'
         - julia -e 'using Pkg; Pkg.activate("./test"); Pkg.add(PackageSpec(url="https://github.com/Juice-jl/LogicCircuits.jl")); Pkg.develop(PackageSpec(path = pwd())); Pkg.instantiate(); Pkg.precompile();'
 
       script:
         - julia --code-coverage --color=yes -p2 test/runtests.jl
 
       after_success:
-        - julia -e 'using Pkg; Pkg.add("Coverage"); using Coverage; Codecov.submit(process_folder())'
+        - julia -e 'using Pkg; Pkg.add("Coverage"); using Coverage; Codecov.submit(process_folder());'
 
     - stage: "Deploy Documentation"      
       os: linux
       julia: 1.5
       script:
-        - julia --project=docs/ -e 'using Pkg; Pkg.develop(PackageSpec(path=pwd())); Pkg.instantiate()'
+        - julia --project=docs/ -e 'using Pkg; Pkg.develop(PackageSpec(url="https://github.com/Juice-jl/LogicCircuits.jl")); Pkg.instantiate(); Pkg.precompile();'
+        - julia --project=docs/ -e 'using Pkg; Pkg.develop(PackageSpec(path=pwd())); Pkg.instantiate();'
         - julia --project=docs/ docs/make.jl
       after_success: skip
 
@@ -38,4 +39,4 @@ notifications:
     on_start: always
     on_error: always
     rooms:
-      - secure: VMXOgM9g758gZiU06/Gaahns6CFpoSuDYMnl9g0LMv165HEe7tZPlF1IFbTEXk6svr+tAuSEd3oxs/kAyK7onI3hIpP0PSc+Y7/+rnOMk8zU+z7R6JEzQKHHb1M6pQ6MjzOia9BM7SfcfVqedPREVXZx+XJPmVuR4BgTOxUnnyfltZzW0ldSbyeJ37FdDSd9SDRRf7Q4UzbEMN33GfVsTKMZoRqASrZXhvqAVp7deXMdGp1kNlvIbbwVkeICLYTIYrm5zd0HkH2yEhk0AtgeTpyx/kkR1T0Fs2+PCDsLRPhP1EEJs7FdsdQJuP0SueJ92GpPd7yLYZVVWWQkGWudNb6H3iYp2xtbZCoeCBLEUgusrawwdxp0OlNOgP/aeJDc+zNy59ikraluI0sNCV1Pl8dIXu8Ihu6e7W6hoiTQ8K9PjwcXSmBgUsR+kXD8NcCx73RTxynokv+24Xk0M1pkJhu6mjNjZBDIegXVM/CnNew1LSMoMjdi43asuDiDbkZg2uCxfHwaMxlgWuM/M38r662FbOjEfgr13fhCyuUQZRFOKvvqU17HbA+ewC/J40C2g0sBDGPu/uOJsDJaQGPXDpXsh4G+8R7uZRNunhwNPK4OnVdY+uVnYlD+9TG9T1IothaDSRJvYU8HwAcUOJhMNYDDQosWOy+01NQtX0IYRgk=
\ No newline at end of file
+      - secure: VMXOgM9g758gZiU06/Gaahns6CFpoSuDYMnl9g0LMv165HEe7tZPlF1IFbTEXk6svr+tAuSEd3oxs/kAyK7onI3hIpP0PSc+Y7/+rnOMk8zU+z7R6JEzQKHHb1M6pQ6MjzOia9BM7SfcfVqedPREVXZx+XJPmVuR4BgTOxUnnyfltZzW0ldSbyeJ37FdDSd9SDRRf7Q4UzbEMN33GfVsTKMZoRqASrZXhvqAVp7deXMdGp1kNlvIbbwVkeICLYTIYrm5zd0HkH2yEhk0AtgeTpyx/kkR1T0Fs2+PCDsLRPhP1EEJs7FdsdQJuP0SueJ92GpPd7yLYZVVWWQkGWudNb6H3iYp2xtbZCoeCBLEUgusrawwdxp0OlNOgP/aeJDc+zNy59ikraluI0sNCV1Pl8dIXu8Ihu6e7W6hoiTQ8K9PjwcXSmBgUsR+kXD8NcCx73RTxynokv+24Xk0M1pkJhu6mjNjZBDIegXVM/CnNew1LSMoMjdi43asuDiDbkZg2uCxfHwaMxlgWuM/M38r662FbOjEfgr13fhCyuUQZRFOKvvqU17HbA+ewC/J40C2g0sBDGPu/uOJsDJaQGPXDpXsh4G+8R7uZRNunhwNPK4OnVdY+uVnYlD+9TG9T1IothaDSRJvYU8HwAcUOJhMNYDDQosWOy+01NQtX0IYRgk=

From 6e8e0032e6de22b8204ee9782918d58a1394b1ad Mon Sep 17 00:00:00 2001
From: Pasha Khosravi <khosravipasha@gmail.com>
Date: Sat, 25 Jul 2020 02:41:22 -0700
Subject: [PATCH 028/131] fix docs - renamed IO module to LoadSave

---
 docs/src/api/internals/io.md               | 6 ------
 docs/src/api/internals/loadsave.md         | 6 ++++++
 docs/src/api/internals/probabilistic.md    | 2 +-
 docs/src/api/internals/reasoning.md        | 2 +-
 docs/src/api/internals/structureLearner.md | 2 +-
 docs/src/api/internals/utils.md            | 2 +-
 6 files changed, 10 insertions(+), 10 deletions(-)
 delete mode 100644 docs/src/api/internals/io.md
 create mode 100644 docs/src/api/internals/loadsave.md

diff --git a/docs/src/api/internals/io.md b/docs/src/api/internals/io.md
deleted file mode 100644
index 972aa218..00000000
--- a/docs/src/api/internals/io.md
+++ /dev/null
@@ -1,6 +0,0 @@
-
-# IO
-
-```@autodocs
-Modules = [ProbabilisticCircuits.IO]
-```
\ No newline at end of file
diff --git a/docs/src/api/internals/loadsave.md b/docs/src/api/internals/loadsave.md
new file mode 100644
index 00000000..3f74274e
--- /dev/null
+++ b/docs/src/api/internals/loadsave.md
@@ -0,0 +1,6 @@
+
+# LoadSave
+
+```@autodocs
+Modules = [ProbabilisticCircuits.LoadSave]
+```
\ No newline at end of file
diff --git a/docs/src/api/internals/probabilistic.md b/docs/src/api/internals/probabilistic.md
index 2d862da9..8d045097 100644
--- a/docs/src/api/internals/probabilistic.md
+++ b/docs/src/api/internals/probabilistic.md
@@ -1,5 +1,5 @@
 # Probabilistic
 
 ```@autodocs
-Modules = [Probabilistic]
+Modules = [ProbabilisticCircuits.Probabilistic]
 ```
\ No newline at end of file
diff --git a/docs/src/api/internals/reasoning.md b/docs/src/api/internals/reasoning.md
index 65d5400a..e8428ba2 100644
--- a/docs/src/api/internals/reasoning.md
+++ b/docs/src/api/internals/reasoning.md
@@ -1,5 +1,5 @@
 # Reasoning
 
 ```@autodocs
-Modules = [Reasoning]
+Modules = [ProbabilisticCircuits.Reasoning]
 ```
diff --git a/docs/src/api/internals/structureLearner.md b/docs/src/api/internals/structureLearner.md
index 72719021..78ab902f 100644
--- a/docs/src/api/internals/structureLearner.md
+++ b/docs/src/api/internals/structureLearner.md
@@ -1,5 +1,5 @@
 # StructureLearner
 
 ```@autodocs
-Modules = [StructureLearner]
+Modules = [ProbabilisticCircuits.StructureLearner]
 ```
diff --git a/docs/src/api/internals/utils.md b/docs/src/api/internals/utils.md
index c8dae019..57998984 100644
--- a/docs/src/api/internals/utils.md
+++ b/docs/src/api/internals/utils.md
@@ -1,5 +1,5 @@
 # Utils
 
 ```@autodocs
-Modules = [Utils]
+Modules = [ProbabilisticCircuits.Utils]
 ```

From 83b8d96ce437416a6b7b6ba1ef52b5d477e1ee97 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 25 Jul 2020 21:37:12 -0700
Subject: [PATCH 029/131] logical -> logic

---
 src/IO/CircuitLineCompiler.jl         | 115 ++++++++++++++++++++++++++
 src/LoadSave/circuit_line_compiler.jl |  10 +--
 2 files changed, 120 insertions(+), 5 deletions(-)
 create mode 100644 src/IO/CircuitLineCompiler.jl

diff --git a/src/IO/CircuitLineCompiler.jl b/src/IO/CircuitLineCompiler.jl
new file mode 100644
index 00000000..604a2e5e
--- /dev/null
+++ b/src/IO/CircuitLineCompiler.jl
@@ -0,0 +1,115 @@
+#####################
+# Compilers to ProbabilisticCircuits data structures starting from already parsed line objects
+#####################
+
+# reuse some internal infrastructure of LogicCircuits' IO module
+using LogicCircuits.IO: CircuitFormatLines, CircuitFormatLine, VtreeFormatLines, CircuitHeaderLine, UnweightedLiteralLine, WeightedLiteralLine, DecisionLine, LCElement, BiasLine, WeightedNamedConstantLine, PSDDElement, CircuitCommentLine, ID,
+compile_smooth_struct_logical_m, compile_smooth_logical_m
+
+"""
+Compile lines into a probabilistic circuit.
+"""
+function compile_prob(lines::CircuitFormatLines)::ProbΔ
+    # first compile a logic circuit
+    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
+    decorate_prob(lines, logic_circuit, id2lognode)
+end
+
+"""
+Compile lines into a logistic circuit.
+"""
+function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticΔ
+    # first compile a logic circuit
+    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
+    decorate_logistic(lines, logic_circuit, classes, id2lognode)
+end
+
+"""
+Compile circuit and vtree lines into a structured probabilistic circuit (one whose logic circuit origin is structured).
+"""
+function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::VtreeFormatLines)
+    logic_circuit, vtree, id2vtree, id2lognode = compile_smooth_struct_logical_m(circuit_lines, vtree_lines)
+    prob_circuit = decorate_prob(circuit_lines, logic_circuit, id2lognode)
+    return prob_circuit, vtree
+end
+
+function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicCircuit})::ProbΔ
+    # set up cache mapping logic circuit nodes to their probabilistic decorator
+    lognode2probnode = ProbCache()
+    # build a corresponding probabilistic circuit
+    prob_circuit = ProbΔ(logic_circuit,lognode2probnode)
+    # map from line node ids to probabilistic circuit nodes
+    id2probnode(id) = lognode2probnode[id2lognode[id]]
+
+    # go through lines again and update the probabilistic circuit node parameters
+
+    function compile(ln::CircuitFormatLine)
+        error("Compilation of line $ln into probabilistic circuit is not supported")
+    end
+    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
+        # do nothing
+    end
+    function compile(ln::WeightedNamedConstantLine)
+        @assert lnconstant(ln) == true
+        node = id2probnode(ln.node_id)::Prob⋁
+        node.log_thetas .= [ln.weight, log1p(-exp(ln.weight)) ]
+    end
+    function compile(ln::DecisionLine{<:PSDDElement})
+        node = id2probnode(ln.node_id)::Prob⋁
+        node.log_thetas .= [x.weight for x in ln.elements]
+    end
+    for ln in lines
+        compile(ln)
+    end
+
+    prob_circuit
+end
+
+
+function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicΔ, 
+                            classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticΔ
+                        
+    # set up cache mapping logic circuit nodes to their logistic decorator
+    log2logistic = LogisticCache()
+    # build a corresponding probabilistic circuit
+    logistic_circuit = LogisticΔ(logic_circuit, classes, log2logistic)
+    # map from line node ids to probabilistic circuit nodes
+    id2logisticnode(id) = log2logistic[id2lognode[id]]
+
+    # go through lines again and update the probabilistic circuit node parameters
+
+    function compile(ln::CircuitFormatLine)
+        error("Compilation of line $ln into logistic circuit is not supported")
+    end
+    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
+        # do nothing
+    end
+
+    function compile(ln::CircuitHeaderLine)
+        # do nothing
+    end
+
+    function compile(ln::WeightedLiteralLine)
+        node = id2logisticnode(ln.node_id)::Logistic⋁
+        node.thetas[1, :] .= ln.weights
+    end
+
+    function compile(ln::DecisionLine{<:LCElement})
+        node = id2logisticnode(ln.node_id)::Logistic⋁
+        for (ind, elem) in enumerate(ln.elements)
+            node.thetas[ind, :] .= elem.weights
+        end
+    end
+
+    function compile(ln::BiasLine)
+        node = id2logisticnode(ln.node_id)::Logistic⋁
+        # @assert length(node.thetas) == 1
+        node.thetas[1,:] .= ln.weights
+    end
+
+    for ln in lines
+        compile(ln)
+    end
+
+    logistic_circuit
+end
\ No newline at end of file
diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index 24058656..eb72a8a2 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -12,7 +12,7 @@ CircuitCommentLine, ID, compile_smooth_struct_logical_m, compile_smooth_logical_
 Compile lines into a probabilistic circuit
 """
 function compile_prob(lines::CircuitFormatLines)::ProbCircuit
-    # first compile a logical circuit
+    # first compile a logic circuit
     logic_circuit, id2lognode = compile_smooth_logical_m(lines)
     decorate_prob(lines, logic_circuit, id2lognode)
 end
@@ -21,13 +21,13 @@ end
 Compile lines into a logistic circuit.
 """
 function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticCircuit
-    # first compile a logical circuit
+    # first compile a logic circuit
     logic_circuit, id2lognode = compile_smooth_logical_m(lines)
     decorate_logistic(lines, logic_circuit, classes, id2lognode)
 end
 
 """
-Compile circuit and vtree lines into a structured probabilistic circuit (one whose logical circuit origin is structured).
+Compile circuit and vtree lines into a structured probabilistic circuit (one whose logic circuit origin is structured).
 """
 function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::VtreeFormatLines)
     logic_circuit, vtree, id2lognode, id2vtree = compile_smooth_struct_logical_m(circuit_lines, vtree_lines)
@@ -36,7 +36,7 @@ function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::Vtr
 end
 
 function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, id2lognode::Dict{ID,<:LogicCircuit})::ProbCircuit
-    # set up cache mapping logical circuit nodes to their probabilistic decorator
+    # set up cache mapping logic circuit nodes to their probabilistic decorator
     prob_circuit = ProbCircuit(logic_circuit)
     lognode2probnode = Dict{LogicCircuit, ProbCircuit}()
     foreach(pn -> (lognode2probnode[origin(pn)] = pn), prob_circuit) 
@@ -72,7 +72,7 @@ end
 function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicCircuit,
                             classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticCircuit
                         
-    # set up cache mapping logical circuit nodes to their logistic decorator
+    # set up cache mapping logic circuit nodes to their logistic decorator
     logistic_circuit = LogisticCircuit(logic_circuit, classes)
     log2logistic = Dict{LogicCircuit, LogisticCircuit}()
     foreach(ln -> (log2logistic[origin(ln)] = ln), logistic_circuit) 

From 29fd22889d2ec744195220e1ca4782480c6dfd57 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sat, 25 Jul 2020 22:58:12 -0700
Subject: [PATCH 030/131] rm decorator circuit

---
 src/LoadSave/circuit_line_compiler.jl        |  11 +-
 src/LoadSave/circuit_savers.jl               |  33 +---
 src/Logistic/logistic_nodes.jl               |  36 ++--
 src/Logistic/queries.jl                      |   6 +-
 src/Probabilistic/Probabilistic.jl           |  12 +-
 src/Probabilistic/{flows.jl => exp_flows.jl} |  33 ++--
 src/Probabilistic/parameters.jl              |   8 +-
 src/Probabilistic/prob_nodes.jl              |  41 +++--
 src/Probabilistic/queries.jl                 |  28 ++--
 src/Reasoning/exp_flow_circuits.jl           |  39 +++--
 src/Reasoning/expectation.jl                 |  48 +++---
 src/StructureLearner/CircuitBuilder.jl       |   2 +-
 src/Utils/decorators.jl                      |  67 +-------
 temp.vtree                                   |  17 ++
 test/LoadSave/circuit_loaders_tests.jl       |   4 +-
 test/LoadSave/circuit_savers_test.jl         |  24 +--
 test/Probabilistic/informations_tests.jl     | 163 ++++++++++---------
 test/Probabilistic/prob_nodes_tests.jl       |   8 +-
 test/Probabilistic/queries_tests.jl          |  20 ++-
 19 files changed, 262 insertions(+), 338 deletions(-)
 rename src/Probabilistic/{flows.jl => exp_flows.jl} (87%)
 create mode 100644 temp.vtree

diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index 24058656..efbc9c5c 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -39,7 +39,11 @@ function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, i
     # set up cache mapping logical circuit nodes to their probabilistic decorator
     prob_circuit = ProbCircuit(logic_circuit)
     lognode2probnode = Dict{LogicCircuit, ProbCircuit}()
-    foreach(pn -> (lognode2probnode[origin(pn)] = pn), prob_circuit) 
+
+    prob_lin = linearize(prob_circuit) # TODO better implementation
+    logic_lin = linearize(logic_circuit)
+
+    foreach(i -> lognode2probnode[logic_lin[i]] = prob_lin[i], 1 : num_nodes(logic_circuit)) 
 
     # map from line node ids to probabilistic circuit nodes
     id2probnode(id) = lognode2probnode[id2lognode[id]]
@@ -75,7 +79,10 @@ function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicCircui
     # set up cache mapping logical circuit nodes to their logistic decorator
     logistic_circuit = LogisticCircuit(logic_circuit, classes)
     log2logistic = Dict{LogicCircuit, LogisticCircuit}()
-    foreach(ln -> (log2logistic[origin(ln)] = ln), logistic_circuit) 
+    logistic_lin = linearize(logistic_circuit)
+    logic_lin = linearize(logic_circuit)
+
+    foreach(i -> log2logistic[logic_lin[i]] = logistic_lin[i], 1 : length(logic_lin)) 
     id2logisticnode(id) = log2logistic[id2lognode[id]]
 
     root = nothing
diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 0027ef1b..28789f7f 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -4,6 +4,7 @@ using LogicCircuits.LoadSave: SDDElement,
     PSDDElement, 
     save_lines,
     get_vtree2id,
+    get_node2id,
     parse_psdd_file, 
     PsddHeaderLine, 
     LcHeaderLine, 
@@ -18,40 +19,20 @@ decompile(n::ProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine =
     UnweightedLiteralLine(node2id[n], vtree2id[n.origin.vtree], literal(n), true)
 
 make_element(n::Prob⋀Node, w::AbstractFloat, node2id) = 
-    PSDDElement(node2id[n.children[1]],  node2id[n.children[2]], w)
+    PSDDElement(node2id[children(n)[1]],  node2id[children(n)[2]], w)
 
 istrue_node(n)::Bool = 
-    GateType(n) isa ⋁Gate && num_children(n) == 2 && GateType(children(n)[1]) isa LiteralGate && GateType(children(n)[2]) isa LiteralGate && 
+    is⋁gate(n) && num_children(n) == 2 && GateType(children(n)[1]) isa LiteralGate && GateType(children(n)[2]) isa LiteralGate && 
     ispositive(children(n)[1]) && isnegative(children(n)[2])
 
 function decompile(n::Prob⋁Node, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
     if istrue_node(n)
-        WeightedNamedConstantLine(node2id[n], vtree2id[n.origin.vtree], lit2var(n.children[1].origin.literal), n.log_thetas[1]) # TODO
+        WeightedNamedConstantLine(node2id[n], vtree2id[n.origin.vtree], lit2var(children(n)[1].origin.literal), n.log_thetas[1]) # TODO
     else
         DecisionLine(node2id[n], vtree2id[n.origin.vtree], UInt32(num_children(n)), map(x -> make_element(x[1], x[2], node2id), zip(children(n), n.log_thetas)))
     end
 end
 
-#####################
-# build maping
-#####################
-
-# TODO same implementation, merge ?
-
-import LogicCircuits.LoadSave: get_node2id
-
-function get_node2id(circuit::DecoratorCircuit) 
-    node2id = Dict{DecoratorCircuit, ID}()
-    outnodes = filter(n -> !is⋀gate(n), circuit)
-    sizehint!(node2id, length(outnodes))
-    index = ID(0) # node id start from 0
-    for n in outnodes
-        node2id[n] = index
-        index += ID(1)
-    end
-    node2id
-end
-
 #####################
 # saver for circuits
 #####################
@@ -74,7 +55,6 @@ end
 
 function save_as_psdd(name::String, circuit::ProbCircuit, vtree::PlainVtree)
     # TODO add method isstructured
-    @assert circuit.origin isa StructLogicCircuit "PSDD should decorate on StructLogicΔ"
     @assert endswith(name, ".psdd")
     node2id = get_node2id(circuit)
     vtree2id = get_vtree2id(vtree)
@@ -110,7 +90,6 @@ function lc_header()
 end
     
 function save_as_logistic(name::String, circuit::LogisticCircuit, vtree)
-    @assert circuit.origin isa StructLogicCircuit "LC should decorate on StructLogicΔ"
     @assert endswith(name, ".circuit")
     node2id = get_node2id(circuit)
     vtree2id = get_vtree2id(vtree)
@@ -175,11 +154,11 @@ function save_as_dot(circuit::ProbCircuit, file::String)
 
     for n in reverse(circuit)
         if n isa Prob⋀
-            for c in n.children
+            for c in children(n)
                 write(f, "$(node_cache[n]) -> $(node_cache[c])\n")
             end
         elseif n isa Prob⋁
-            for (c, p) in zip(n.children, exp.(n.log_thetas))
+            for (c, p) in zip(children(n), exp.(n.log_thetas))
                 prob = @sprintf "%0.1f" p
                 write(f, "$(node_cache[n]) -> $(node_cache[c]) [label=\"$prob\"]\n")
             end
diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index 9b7a364a..950dd8c8 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -7,14 +7,13 @@ export
     Logistic⋁Node,
     classes,
     num_parameters_perclass
-    # class_conditional_likelihood_per_instance,
     
 #####################
 # Infrastructure for logistic circuit nodes
 #####################
 
 "Root of the logistic circuit node hierarchy"
-abstract type LogisticCircuit <: DecoratorCircuit end
+abstract type LogisticCircuit <: LogicCircuit end
 
 """
 A logistic leaf node
@@ -30,12 +29,11 @@ abstract type LogisticInnerNode <: LogisticCircuit end
 A logistic literal node
 """
 mutable struct LogisticLiteral <: LogisticLeafNode
-    origin::LogicCircuit
+    literal::Lit
     data
     counter::UInt32
-    LogisticLiteral(n) = begin 
-        @assert GateType(n) isa LiteralGate
-        new(n, nothing, 0)
+    LogisticLiteral(l) = begin 
+        new(l, nothing, 0)
     end
 end
 
@@ -43,13 +41,11 @@ end
 A logistic conjunction node (And node)
 """
 mutable struct Logistic⋀Node <: LogisticInnerNode
-    origin::LogicCircuit
     children::Vector{<:LogisticCircuit}
     data
     counter::UInt32
-    Logistic⋀Node(n, children) = begin
-        @assert GateType(n) isa ⋀Gate
-        new(n, convert(Vector{LogisticCircuit}, children), nothing, 0)
+    Logistic⋀Node(children) = begin
+        new(convert(Vector{LogisticCircuit}, children), nothing, 0)
     end
 end
 
@@ -57,14 +53,12 @@ end
 A logistic disjunction node (Or node)
 """
 mutable struct Logistic⋁Node <: LogisticInnerNode
-    origin::LogicCircuit
     children::Vector{<:LogisticCircuit}
     thetas::Array{Float64, 2}
     data
     counter::UInt32
-    Logistic⋁Node(n, children, class::Int) = begin
-        @assert GateType(n) isa ⋁Gate
-        new(n, convert(Vector{LogisticCircuit}, children), init_array(Float64, length(children), class), nothing, 0)
+    Logistic⋁Node(children, class::Int) = begin
+        new(convert(Vector{LogisticCircuit}, children), init_array(Float64, length(children), class), nothing, 0)
     end
 end
 
@@ -73,7 +67,6 @@ end
 #####################
 
 import LogicCircuits.GateType # make available for extension
-
 @inline GateType(::Type{<:LogisticLiteral}) = LiteralGate()
 @inline GateType(::Type{<:Logistic⋀Node}) = ⋀Gate()
 @inline GateType(::Type{<:Logistic⋁Node}) = ⋁Gate()
@@ -82,14 +75,12 @@ import LogicCircuits.GateType # make available for extension
 # methods
 #####################
 
-import ..Utils: origin, num_parameters
-@inline origin(c::LogisticCircuit) = c.origin
-@inline num_parameters(c::LogisticCircuit) = sum(n -> num_children(n) * classes(n), ⋁_nodes(c))
-
 import LogicCircuits: children # make available for extension
 @inline children(n::LogisticInnerNode) = n.children
 @inline classes(n::Logistic⋁Node) = size(n.thetas)[2]
 
+import ..Utils: num_parameters
+@inline num_parameters(c::LogisticCircuit) = sum(n -> num_children(n) * classes(n), ⋁_nodes(c))
 @inline num_parameters_perclass(c::LogisticCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
 
 #####################
@@ -98,9 +89,8 @@ import LogicCircuits: children # make available for extension
 
 function LogisticCircuit(circuit::LogicCircuit, classes::Int)
     f_con(n) = error("Cannot construct a logistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = LogisticLiteral(n)
-    f_a(n, cn) = Logistic⋀Node(n, cn)
-    f_o(n, cn) = Logistic⋁Node(n, cn, classes)
+    f_lit(n) = LogisticLiteral(literal(n))
+    f_a(n, cn) = Logistic⋀Node(cn)
+    f_o(n, cn) = Logistic⋁Node(cn, classes)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, LogisticCircuit)
-
 end
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index b96f631c..7c80e625 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -5,14 +5,14 @@ using ..Probabilistic: get_downflow, get_upflow
 Class Conditional Probability
 """
 function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
-    compute_flows(lc.origin, data)
+    compute_flows(lc, data)
     likelihoods = zeros(num_examples(data), classes)
     foreach(lc) do ln
         if ln isa Logistic⋁Node
             # For each class. orig.thetas is 2D so used eachcol
             for (idx, thetaC) in enumerate(eachcol(ln.thetas))
-                foreach(ln.children, thetaC) do c, theta
-                    likelihoods[:, idx] .+= Float64.(get_downflow(ln.origin) .& get_upflow(c.origin)) .* theta
+                foreach(children(ln), thetaC) do c, theta
+                    likelihoods[:, idx] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
                 end
             end
         end
diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index abfbebd0..a56d3e1c 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -3,18 +3,10 @@ module Probabilistic
 using LogicCircuits
 using ..Utils
 
-# include("Clustering.jl")
 include("prob_nodes.jl")
-include("flows.jl")
+include("exp_flows.jl")
 include("queries.jl")
-include("informations.jl")
+# include("informations.jl")
 include("parameters.jl")
-# include("ProbFlowCircuits.jl")
-# include("MutualInformation.jl")
-# include("Mixtures.jl")
-# include("Bagging.jl")
-# include("EMLearner.jl")
-# include("VtreeLearner.jl")
-
 
 end
diff --git a/src/Probabilistic/flows.jl b/src/Probabilistic/exp_flows.jl
similarity index 87%
rename from src/Probabilistic/flows.jl
rename to src/Probabilistic/exp_flows.jl
index 337ab65f..204a63c3 100644
--- a/src/Probabilistic/flows.jl
+++ b/src/Probabilistic/exp_flows.jl
@@ -1,6 +1,6 @@
-export get_downflow, get_upflow
+export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
+
 
-import LogicCircuits: evaluate, compute_flows
 using StatsFuns: logsumexp
 
 # TODO move to LogicCircuits
@@ -37,11 +37,6 @@ end
 # performance-critical queries related to circuit flows
 #####################
 
-# evaluate a circuit as a function
-function (root::ProbCircuit)(data)
-    evaluate(root, data)
-end
-
 "Container for circuit flows represented as a float vector"
 const ExpUpFlow1 = Vector{Float64}
 
@@ -56,14 +51,14 @@ const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
 @inline ExpUpFlow1(elems::ExpUpFlow1) = elems
 @inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
 
-function evaluate(root::ProbCircuit, data;
+function evaluate_exp(root::ProbCircuit, data;
                    nload = nload, nsave = nsave, reset=true)::Vector{Float64}
     n_ex::Int = num_examples(data)
     ϵ = 1e-300
 
     @inline f_lit(n) = begin
         uf = convert(Vector{Int8}, feature_values(data, variable(n)))
-        if ispositive(origin(n))
+        if ispositive(n)
             uf[uf.==-1] .= 1
         else
             uf .= 1 .- uf
@@ -74,7 +69,7 @@ function evaluate(root::ProbCircuit, data;
     end
     
     @inline f_con(n) = begin
-        uf = istrue(origin(n)) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
+        uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
         uf .= log.(uf .+ ϵ)
     end
     
@@ -144,7 +139,7 @@ const ExpUpDownFlow2 = ExpUpFlow2
 const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
 
 
-function compute_flows(circuit::ProbCircuit, data)
+function compute_exp_flows(circuit::ProbCircuit, data)
 
     # upward pass
     @inline upflow!(n, v) = begin
@@ -157,7 +152,7 @@ function compute_flows(circuit::ProbCircuit, data)
         (d isa ExpUpDownFlow1) ? d.upflow : d
     end
 
-    evaluate(circuit, data; nload=upflow, nsave=upflow!, reset=false)
+    evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
     
     # downward pass
 
@@ -197,26 +192,26 @@ end
 """
 Get upflow of a probabilistic circuit
 """
-@inline get_upflow(pc::ProbCircuit) = get_upflow(pc.data)
-@inline get_upflow(elems::ExpUpDownFlow1) = elems.upflow
-@inline get_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
+@inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
+@inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
+@inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
 
 """
 Get the node/edge downflow from probabilistic circuit
 """
-function get_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
+function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
     downflow(x::ExpUpDownFlow1) = x.downflow
     downflow(x::ExpUpDownFlow2) = begin
         ors = or_nodes(root)
         p = findall(p -> n in children(p), ors)
         @assert length(p) == 1
-        get_downflow(ors[p[1]], n)
+        get_exp_downflow(ors[p[1]], n)
     end
     downflow(n.data)
 end
 
-function get_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
+function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
     log_theta = n.log_thetas[findfirst(x -> x == c, children(n))]
-    return get_downflow(n) .+ log_theta .+ get_upflow(c) .- get_upflow(n)
+    return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
 end
\ No newline at end of file
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index cd53ae5b..fe3887e6 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -5,15 +5,15 @@ Maximum likilihood estimation of parameters given data
 """
 function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data)
-    compute_flows(pc.origin, data)
+    compute_flows(pc, data)
     foreach(pc) do pn
         if pn isa Prob⋁Node
             if num_children(pn) == 1
                 pn.log_thetas .= 0.0
             else
-                smoothed_flow = Float64(sum(get_downflow(pn.origin))) + pseudocount
+                smoothed_flow = Float64(sum(get_downflow(pn))) + pseudocount
                 uniform_pseudocount = pseudocount / num_children(pn)
-                children_flows = map(c -> sum(get_downflow(pn.origin, c)), children(pn.origin))
+                children_flows = map(c -> sum(get_downflow(pn, c)), children(pn))
                 @. pn.log_thetas = log((children_flows + uniform_pseudocount) / smoothed_flow)
                 @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
                 # normalize away any leftover error
@@ -24,4 +24,4 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
 end
 
 
-# TODO add em paramaters learning 
+# TODO add em paramaters learning 
\ No newline at end of file
diff --git a/src/Probabilistic/prob_nodes.jl b/src/Probabilistic/prob_nodes.jl
index 2bf43383..92dfd3fd 100644
--- a/src/Probabilistic/prob_nodes.jl
+++ b/src/Probabilistic/prob_nodes.jl
@@ -6,7 +6,7 @@ Prob⋁Node, check_parameter_integrity
 #####################
 
 "Root of the probabilistic circuit node hierarchy"
-abstract type ProbCircuit <: DecoratorCircuit end
+abstract type ProbCircuit <: LogicCircuit end
 
 """
 A probabilistic leaf node
@@ -22,26 +22,21 @@ abstract type ProbInnerNode <: ProbCircuit end
 A probabilistic literal node
 """
 mutable struct ProbLiteralNode <: ProbLeafNode
-    origin::LogicCircuit
+    literal::Lit
     data
     counter::UInt32
-    ProbLiteralNode(n) = begin 
-        @assert GateType(n) isa LiteralGate
-        new(n, nothing, 0)
-    end
+    ProbLiteralNode(l) = new(l, nothing, 0)
 end
 
 """
 A probabilistic conjunction node (And node)
 """
 mutable struct Prob⋀Node <: ProbInnerNode
-    origin::LogicCircuit
     children::Vector{<:ProbCircuit}
     data
     counter::UInt32
-    Prob⋀Node(n, children) = begin
-        @assert GateType(n) isa ⋀Gate
-        new(n, convert(Vector{ProbCircuit}, children), nothing, 0)
+    Prob⋀Node(children) = begin
+        new(convert(Vector{ProbCircuit}, children), nothing, 0)
     end
 end
 
@@ -49,14 +44,12 @@ end
 A probabilistic disjunction node (Or node)
 """
 mutable struct Prob⋁Node <: ProbInnerNode
-    origin::LogicCircuit
     children::Vector{<:ProbCircuit}
     log_thetas::Vector{Float64}
     data
     counter::UInt32
-    Prob⋁Node(n, children) = begin
-        @assert GateType(n) isa ⋁Gate
-        new(n, convert(Vector{ProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
+    Prob⋁Node(children) = begin
+        new(convert(Vector{ProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
     end
 end
 
@@ -74,11 +67,10 @@ import LogicCircuits.GateType # make available for extension
 # methods
 #####################
 
-import ..Utils: origin, num_parameters
-@inline origin(c::ProbCircuit) = c.origin
-
 import LogicCircuits: children # make available for extension
 @inline children(n::ProbInnerNode) = n.children
+
+import ..Utils: num_parameters
 @inline num_parameters(c::ProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
 
 #####################
@@ -87,14 +79,21 @@ import LogicCircuits: children # make available for extension
 
 function ProbCircuit(circuit::LogicCircuit)::ProbCircuit
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = ProbLiteralNode(n)
-    f_a(n, cn) = Prob⋀Node(n, cn)
-    f_o(n, cn) = Prob⋁Node(n, cn)
+    f_lit(n) = ProbLiteralNode(literal(n))
+    f_a(n, cn) = Prob⋀Node(cn)
+    f_o(n, cn) = Prob⋁Node(cn)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbCircuit)
 end
 
-# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
+function PlainLogicCircuit(circuit::ProbCircuit)::PlainLogicCircuit
+    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = PlainLiteralNode(literal(n))
+    f_a(n, cn) = Plain⋀Node(cn)
+    f_o(n, cn) = Plain⋁Node(cn)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainLogicCircuit)
+end
 
+# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
 
 function check_parameter_integrity(circuit::ProbCircuit)
     for node in or_nodes(circuit)
diff --git a/src/Probabilistic/queries.jl b/src/Probabilistic/queries.jl
index 15f23419..77650b3a 100644
--- a/src/Probabilistic/queries.jl
+++ b/src/Probabilistic/queries.jl
@@ -7,15 +7,15 @@ Complete evidence queries
 function log_likelihood_per_instance(pc::ProbCircuit, data)
     @assert isbinarydata(data) "Can only calculate EVI on Bool data"
     
-    compute_flows(origin(pc), data)
+    compute_flows(pc, data)
     log_likelihoods = zeros(Float64, num_examples(data))
     indices = init_array(Bool, num_examples(data))::BitVector
     
     ll(n::ProbCircuit) = ()
     ll(n::Prob⋁Node) = begin
         if num_children(n) != 1 # other nodes have no effect on likelihood
-            foreach(children(origin(n)), n.log_thetas) do c, log_theta
-                indices = get_downflow(origin(n), c)
+            foreach(children(n), n.log_thetas) do c, log_theta
+                indices = get_downflow(n, c)
                 view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
             end
          end
@@ -32,7 +32,7 @@ EVI = log_likelihood_per_instance
 Marginal queries
 """
 function marginal_log_likelihood_per_instance(pc::ProbCircuit, data)
-    evaluate(pc, data)
+    evaluate_exp(pc, data)
 end
 MAR = marginal_log_likelihood_per_instance
 
@@ -59,16 +59,16 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
     end
     
     function mpe_simulate(node::Prob⋁Node, active_samples::BitVector, result::BitMatrix)
-        prs = zeros(length(node.children), size(active_samples)[1] )
-        @simd  for i=1:length(node.children)
-            prs[i,:] .= get_upflow(node.children[i]) .+ (node.log_thetas[i])
+        prs = zeros(length(children(node)), size(active_samples)[1] )
+        @simd  for i=1:length(children(node))
+            prs[i,:] .= get_exp_upflow(children(node)[i]) .+ (node.log_thetas[i])
         end
     
         max_child_ids = [a[1] for a in argmax(prs, dims = 1) ]
-        @simd for i=1:length(node.children)
+        @simd for i=1:length(children(node))
             # Only active for this child if it was the max for that sample
             ids = convert(BitVector, active_samples .* (max_child_ids .== i)[1,:])
-            mpe_simulate(node.children[i], ids, result)
+            mpe_simulate(children(node)[i], ids, result)
         end
     end
     
@@ -93,12 +93,12 @@ Sample from a PSDD without any evidence
 function sample(circuit::ProbCircuit)::AbstractVector{Bool}
 
     simulate(node::ProbLiteralNode) = begin
-        inst[variable(node.origin)] = ispositive(node) ? 1 : 0
+        inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
     simulate(node::Prob⋁Node) = begin
         idx = sample(exp.(node.log_thetas))
-        simulate(node.children[idx])
+        simulate(children(node)[idx])
     end
 
     simulate(node::Prob⋀Node) = foreach(simulate, children(node))
@@ -122,18 +122,18 @@ function sample(circuit::ProbCircuit, evidence)::AbstractVector{Bool}
     @assert num_examples(evidence) == 1 "evidence have to be one example"
     
     simulate(node::ProbLiteralNode) = begin
-        inst[variable(node.origin)] = ispositive(node) ? 1 : 0
+        inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
     function simulate(node::Prob⋁Node)
-        prs = [get_upflow(ch)[1] for ch in children(node)] # #evidence == 1
+        prs = [get_exp_upflow(ch)[1] for ch in children(node)] # #evidence == 1
         idx = sample(exp.(node.log_thetas .+ prs))
         simulate(children(node)[idx])
     end
     
     simulate(node::Prob⋀Node) = foreach(simulate, children(node))
 
-    evaluate(circuit, evidence)
+    evaluate_exp(circuit, evidence)
 
     inst = Dict{Var,Int64}()
     simulate(circuit)
diff --git a/src/Reasoning/exp_flow_circuits.jl b/src/Reasoning/exp_flow_circuits.jl
index 7722fe5d..363e7229 100644
--- a/src/Reasoning/exp_flow_circuits.jl
+++ b/src/Reasoning/exp_flow_circuits.jl
@@ -18,6 +18,9 @@ struct UpExpFlow{F} <: ExpFlowNode{F}
     fg::F
 end
 
+import LogicCircuits: children
+children(x::UpExpFlow) = x.children
+
 """
 Construct a upward expectation flow circuit from a given pair of PC and LC circuits
 Note that its assuming the two circuits share the same vtree
@@ -28,7 +31,7 @@ function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, :
     fgmem = () -> zeros(classes(lc), batch_size)
 
     root_pc = pc
-    root_lc = lc.children[1]
+    root_lc = children(lc)[1]
     
     cache = Dict{Pair{Node, Node}, ExpFlowNode}()
     sizehint!(cache, (num_nodes(pc) + num_nodes(lc))*4÷3)
@@ -36,32 +39,32 @@ function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, :
 
     function ExpflowTraverse(n::Prob⋁Node, m::Logistic⋁Node) 
         get!(cache, Pair(n, m)) do
-            children = [ ExpflowTraverse(i, j) for i in n.children for j in m.children]
-            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
+            ch = [ ExpflowTraverse(i, j) for i in children(n) for j in children(m)]
+            node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
     end
     function ExpflowTraverse(n::Prob⋀Node, m::Logistic⋀Node) 
         get!(cache, Pair(n, m)) do
-            children = [ ExpflowTraverse(z[1], z[2]) for z in zip(n.children, m.children) ]
-            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
+            ch = [ ExpflowTraverse(z[1], z[2]) for z in zip(children(n), children(m)) ]
+            node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
     end
     function ExpflowTraverse(n::ProbLiteralNode, m::Logistic⋁Node) 
         get!(cache, Pair(n, m)) do
-            children = Vector{ExpFlowNode{F}}() # TODO
-            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
+            ch = Vector{ExpFlowNode{F}}() # TODO
+            node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
     end
     function ExpflowTraverse(n::ProbLiteralNode, m::LogisticLiteral) 
         get!(cache, Pair(n, m)) do
-            children = Vector{ExpFlowNode{F}}() # TODO
-            node = UpExpFlow{F}(n, m, children, fmem(), fgmem())
+            ch = Vector{ExpFlowNode{F}}() # TODO
+            node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
             push!(expFlowCircuit, node)
             return node
         end
@@ -95,25 +98,25 @@ function exp_pass_up_node(node::ExpFlowNode{E}, data) where E
     if node.p_origin isa Prob⋁Node && node.f_origin isa Logistic⋁Node
         #todo this ordering might be different than the ExpFlowNode children
         pthetas = [exp(node.p_origin.log_thetas[i])
-                    for i in 1:length(node.p_origin.children) for j in 1:length(node.f_origin.children)]
+                    for i in 1:length(children(node.p_origin)) for j in 1:length(children(node.f_origin))]
         fthetas = [node.f_origin.thetas[j,:] # only taking the first class for now
             for i in 1:length(node.p_origin.children) for j in 1:length(node.f_origin.children)]
 
         node.f .= 0.0
         node.fg .= 0.0
-        for z = 1:length(node.children)
-            node.f  .+= pthetas[z] .* node.children[z].f
-            node.fg .+= (pthetas[z] .* fthetas[z]) .* node.children[z].f
-            node.fg .+= pthetas[z] .* node.children[z].fg
+        for z = 1:length(children(node))
+            node.f  .+= pthetas[z] .* children(node)[z].f
+            node.fg .+= (pthetas[z] .* fthetas[z]) .* children(node)[z].f
+            node.fg .+= pthetas[z] .* children(node)[z].fg
         end
     elseif node.p_origin isa Prob⋀Node && node.f_origin isa Logistic⋀Node
-        node.f .= node.children[1].f .* node.children[2].f # assume 2 children
-        node.fg .= (node.children[1].f .* node.children[2].fg) .+
-                   (node.children[2].f .* node.children[1].fg)
+        node.f .= children(node)[1].f .* children(node)[2].f # assume 2 children
+        node.fg .= (children(node)[1].f .* children(node)[2].fg) .+
+                   (children(node)[2].f .* children(node)[1].fg)
 
     elseif node.p_origin isa ProbLiteralNode 
         if node.f_origin isa Logistic⋁Node
-            m = node.f_origin.children[1]
+            m = children(node.f_origin)[1]
         elseif node.f_origin isa LogisticLiteral
             m = node.f_origin
         else
diff --git a/src/Reasoning/expectation.jl b/src/Reasoning/expectation.jl
index 92f25309..85e573c3 100644
--- a/src/Reasoning/expectation.jl
+++ b/src/Reasoning/expectation.jl
@@ -36,7 +36,7 @@ function Expectation(pc::ProbCircuit, lc::LogisticCircuit, data)
     
     # 2. Expectation w.r.t. P(x_m, x_o)
     cache = ExpectationCache()
-    results_unnormalized = exp_g(pc, lc.children[1], data, cache) # skipping the bias node of lc
+    results_unnormalized = exp_g(pc, children(lc)[1], data, cache) # skipping the bias node of lc
 
     # 3. Expectation w.r.t P(x_m | x_o)
     results = transpose(results_unnormalized) ./ p_observed
@@ -59,7 +59,7 @@ function Moment(pc::ProbCircuit, lc::LogisticCircuit, data, moment::Int)
     results_unnormalized = zeros(num_examples(data), classes(lc))
     
     for z = 0:moment-1  
-        results_unnormalized .+= choose(moment, z) .* (biases .^ (z)) .* transpose(moment_g(pc, lc.children[1], data, moment - z, cache))
+        results_unnormalized .+= choose(moment, z) .* (biases .^ (z)) .* transpose(moment_g(pc, children(lc)[1], data, moment - z, cache))
     end
     
     # 3. Moment w.r.t P(x_m | x_o)
@@ -98,10 +98,10 @@ end
 function exp_f(n::Prob⋁Node, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
-        pthetas = [exp(n.log_thetas[i]) for i in 1:length(n.children)]
-        @fastmath @simd for i in 1:length(n.children)
-            @simd for j in 1:length(m.children)
-                value .+= (pthetas[i] .* exp_f(n.children[i], m.children[j], data, cache))
+        pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
+        @fastmath @simd for i in 1:num_children(n)
+            @simd for j in 1:num_children(m)
+                value .+= (pthetas[i] .* exp_f(children(n)[i], children(m)[j], data, cache))
             end
         end
         return value
@@ -111,11 +111,11 @@ end
 function exp_f(n::Prob⋀Node, m::Logistic⋀Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = ones(1 , num_examples(data) )
-        @fastmath for (i,j) in zip(n.children, m.children)
+        @fastmath for (i,j) in zip(children(n), children(m))
             value .*= exp_f(i, j, data, cache)
         end
         return value
-        # exp_f(n.children[1], m.children[1], data, cache) .* exp_f(n.children[2], m.children[2], data, cache)
+        # exp_f(children(n)[1], children(m)[1], data, cache) .* exp_f(children(n)[2], children(m)[2], data, cache)
     end
 end
 
@@ -143,7 +143,7 @@ Has to be a Logistic⋁Node with only one child, which is a leaf node
 """
 @inline function exp_f(n::ProbLiteralNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
-        exp_f(n, m.children[1], data, cache)
+        exp_f(n, children(m)[1], data, cache)
     end
 end
 
@@ -157,22 +157,22 @@ end
 
 # function exp_g(n::Prob⋀, m::Logistic⋀Node, data, cache::ExpectationCache)
 #     value = zeros(classes(m) , num_examples(data))
-#     @fastmath for (i,j) in zip(n.children, m.children)
+#     @fastmath for (i,j) in zip(children(n), children(m))
 #         value .+= exp_fg(i, j, data, cache)
 #     end
 #     return value
-#     # exp_fg(n.children[1], m.children[1], data, cache) .+ exp_fg(n.children[2], m.children[2], data, cache)
+#     # exp_fg(children(n)[1], children(m)[1], data, cache) .+ exp_fg(children(n)[2], children(m)[2], data, cache)
 # end
 
 
 function exp_fg(n::Prob⋁Node, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         value = zeros(classes(m) , num_examples(data) )
-        pthetas = [exp(n.log_thetas[i]) for i in 1:length(n.children)]
-        @fastmath @simd for i in 1:length(n.children)
-            for j in 1:length(m.children)
-                value .+= (pthetas[i] .* m.thetas[j,:]) .* exp_f(n.children[i], m.children[j], data, cache)
-                value .+= pthetas[i] .* exp_fg(n.children[i], m.children[j], data, cache)
+        pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
+        @fastmath @simd for i in 1:num_children(n)
+            for j in 1:num_children(m)
+                value .+= (pthetas[i] .* m.thetas[j,:]) .* exp_f(children(n)[i], children(m)[j], data, cache)
+                value .+= pthetas[i] .* exp_fg(children(n)[i], children(m)[j], data, cache)
             end
         end
         return value
@@ -182,8 +182,8 @@ end
 function exp_fg(n::Prob⋀Node, m::Logistic⋀Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         # Assuming 2 children
-        value = exp_f(n.children[1], m.children[1], data, cache) .* exp_fg(n.children[2], m.children[2], data, cache)
-        value .+= exp_f(n.children[2], m.children[2], data, cache) .* exp_fg(n.children[1], m.children[1], data, cache)
+        value = exp_f(children(n)[1], children(m)[1], data, cache) .* exp_fg(children(n)[2], children(m)[2], data, cache)
+        value .+= exp_f(children(n)[2], children(m)[2], data, cache) .* exp_fg(children(n)[1], children(m)[1], data, cache)
         return value
     end
 end
@@ -223,11 +223,11 @@ function moment_fg(n::Prob⋁Node, m::Logistic⋁Node, data, moment::Int, cache:
 
     get!(cache.fg, (n, m, moment)) do
         value = zeros(classes(m) , num_examples(data) )
-        pthetas = [exp(n.log_thetas[i]) for i in 1:length(n.children)]
-        @fastmath @simd for i in 1:length(n.children)
-            for j in 1:length(m.children)
+        pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
+        @fastmath @simd for i in 1:num_children(n)
+            for j in 1:num_children(m)
                 for z in 0:moment
-                    value .+= pthetas[i] .* choose(moment, z) .* m.thetas[j,:].^(moment - z) .* moment_fg(n.children[i], m.children[j], data, z, cache)
+                    value .+= pthetas[i] .* choose(moment, z) .* m.thetas[j,:].^(moment - z) .* moment_fg(children(n)[i], children(m)[j], data, z, cache)
                 end
             end
         end
@@ -255,10 +255,10 @@ function moment_fg(n::Prob⋀Node, m::Logistic⋀Node, data, moment::Int, cache:
         return exp_f(n, m, data, cache)
     end
     get!(cache.fg, (n, m, moment)) do
-        value = moment_fg(n.children[1], m.children[1], data, 0, cache) .* moment_fg(n.children[2], m.children[2], data, moment, cache)
+        value = moment_fg(children(n)[1], children(m)[1], data, 0, cache) .* moment_fg(children(n)[2], children(m)[2], data, moment, cache)
 
         for z in 1:moment
-            value .+= choose(moment, z) .* moment_fg(n.children[1], m.children[1], data, z, cache) .* moment_fg(n.children[2], m.children[2], data, moment - z, cache)
+            value .+= choose(moment, z) .* moment_fg(children(n)[1], children(m)[1], data, z, cache) .* moment_fg(children(n)[2], children(m)[2], data, moment - z, cache)
         end
         return value
     end
diff --git a/src/StructureLearner/CircuitBuilder.jl b/src/StructureLearner/CircuitBuilder.jl
index 758b3b1f..fe73532b 100644
--- a/src/StructureLearner/CircuitBuilder.jl
+++ b/src/StructureLearner/CircuitBuilder.jl
@@ -29,7 +29,7 @@ function compile_prob_circuit_from_clt(clt::CLT)::ProbCircuit
     parent = parent_vector(clt)
 
     prob_children(n)::Vector{<:ProbCircuit{<:node_type_deprecated(n)}} =  
-        collect(ProbCircuit{<:node_type_deprecated(n)}, map(c -> prob_cache[c], n.children))
+        collect(ProbCircuit{<:node_type_deprecated(n)}, map(c -> prob_cache[c], children(n)))
 
     "default order of circuit node, from left to right: +/1 -/0"
 
diff --git a/src/Utils/decorators.jl b/src/Utils/decorators.jl
index b5611870..bc83dd31 100644
--- a/src/Utils/decorators.jl
+++ b/src/Utils/decorators.jl
@@ -1,71 +1,10 @@
-export DecoratorCircuit, literal, origin, and_nodes, or_nodes, ⋀_nodes, ⋁_nodes,
-GateType, NodeType, variable, ispositive, isnegative, origin, num_parameters
-
-using LogicCircuits
-
-"Root of the decorator circuit node hierarchy"
-# TODO rm DecoratorCircuit Type 
-abstract type DecoratorCircuit <: LogicCircuit end
+export num_parameters
 
 #####################
-# functions that need to be implemented for each type of decorator circuit
+# functions that need to be implemented for logistic circuit and probability circuit
 #####################
-"""
-Get the origin node/circuit in a given decorator node/circuit
-"""
-function origin end
 
 """
 Get the number of parameters of a given decorator node/circuit
 """
-function num_parameters end
-
-#####################
-# Abstract infrastructure for decorator circuit nodes
-#####################
-
-import LogicCircuits: GateType, NodeType
-
-"Get the gate type trait of the given `DecoratorCircuit`"
-@inline GateType(instance::DecoratorCircuit) = GateType(typeof(instance))
-
-"Map gate type traits to graph node traits"
-@inline NodeType(::Type{N}) where {N<:DecoratorCircuit} = NodeType(GateType(N))
-
-#####################
-# node functions
-#####################
-
-import LogicCircuits: literal, and_nodes, or_nodes, ⋀_nodes, ⋁_nodes
-
-"Get the logical literal in a given node"
-literal(n::DecoratorCircuit)::Lit = literal(origin(n))
-
-"Get the list of conjunction nodes in a given circuit"
-⋀_nodes(c::DecoratorCircuit) = filter(is⋀gate, c)
-
-"Get the list of And nodes in a given circuit"
-@inline and_nodes(c::DecoratorCircuit) = ⋀_nodes(c)
-
-"Get the list of disjunction nodes in a given circuit"
-⋁_nodes(c::DecoratorCircuit) = filter(is⋁gate, c)
-
-"Get the list of or nodes in a given circuit"
-@inline or_nodes(c::DecoratorCircuit) = ⋁_nodes(c)
-
-#####################
-# derived node functions
-#####################
-
-import LogicCircuits: variable, ispositive, isnegative
-
-"Get the logical variable in a given literal leaf node"
-@inline variable(n::DecoratorCircuit)::Var = variable(GateType(n), origin(n))
-
-"Get the sign of the literal leaf node"
-@inline ispositive(n::DecoratorCircuit)::Bool = ispositive(GateType(n), origin(n))
-@inline isnegative(n::DecoratorCircuit)::Bool = !ispositive(n)
-
-# TODO
-# istrue
-# isfalse
\ No newline at end of file
+function num_parameters end
\ No newline at end of file
diff --git a/temp.vtree b/temp.vtree
new file mode 100644
index 00000000..84eee02b
--- /dev/null
+++ b/temp.vtree
@@ -0,0 +1,17 @@
+c ids of vtree nodes start at 0
+c ids of variables start at 1
+c vtree nodes appear bottom-up, children before parents
+c
+c file syntax:
+c vtree number-of-nodes-in-vtree
+c L id-of-leaf-vtree-node id-of-variable
+c I id-of-internal-vtree-node id-of-left-child id-of-right-child
+c
+vtree 7
+L 0 1
+L 1 2
+I 2 0 1
+L 3 3
+L 4 4
+I 5 3 4
+I 6 2 5
diff --git a/test/LoadSave/circuit_loaders_tests.jl b/test/LoadSave/circuit_loaders_tests.jl
index 0ad98a0f..8110ef46 100644
--- a/test/LoadSave/circuit_loaders_tests.jl
+++ b/test/LoadSave/circuit_loaders_tests.jl
@@ -13,13 +13,13 @@ using ProbabilisticCircuits
    
    # Testing Read Parameters
    EPS = 1e-7
-   or1 = prob_circuit.children[1].children[2]
+   or1 = children(children(prob_circuit)[1])[2]
    @test abs(or1.log_thetas[1] - (-1.6094379124341003)) < EPS
    @test abs(or1.log_thetas[2] - (-1.2039728043259361)) < EPS
    @test abs(or1.log_thetas[3] - (-0.916290731874155)) < EPS
    @test abs(or1.log_thetas[4] - (-2.3025850929940455)) < EPS
 
-   or2 = prob_circuit.children[1].children[1]
+   or2 = children(children(prob_circuit)[1])[1]
    @test abs(or2.log_thetas[1] - (-2.3025850929940455)) < EPS
    @test abs(or2.log_thetas[2] - (-2.3025850929940455)) < EPS
    @test abs(or2.log_thetas[3] - (-2.3025850929940455)) < EPS
diff --git a/test/LoadSave/circuit_savers_test.jl b/test/LoadSave/circuit_savers_test.jl
index 286cfba0..a973654b 100644
--- a/test/LoadSave/circuit_savers_test.jl
+++ b/test/LoadSave/circuit_savers_test.jl
@@ -3,21 +3,23 @@ using LogicCircuits
 using ProbabilisticCircuits
 
 @testset "Circuit saver test" begin
-    mktempdir() do tmp
+    # mktempdir() do tmp
 
-        circuit, vtree = load_struct_prob_circuit(
-                            zoo_psdd_file("little_4var.psdd"), zoo_vtree_file("little_4var.vtree"))
+    #     circuit, vtree = load_struct_prob_circuit(
+    #                         zoo_psdd_file("little_4var.psdd"), zoo_vtree_file("little_4var.vtree"))
 
-        # load, save, and load as .psdd
-        save_circuit("$tmp/temp.psdd", circuit, vtree)
-        save_vtree(vtree, "$tmp/temp.vtree");
-        load_struct_prob_circuit("$tmp/temp.psdd", "$tmp/temp.vtree")
+    #     # load, save, and load as .psdd
+    #     # TODO reinstate after fix Struct Prob Circuit
+    #     # save_circuit("$tmp/temp.psdd", circuit, vtree)
+    #     save_vtree(vtree, "$tmp/temp.vtree");
+
+    #     load_struct_prob_circuit("$tmp/temp.psdd", "$tmp/temp.vtree")
         
-        # save and load as .sdd
-        save_circuit("$tmp/temp.sdd", origin(circuit), vtree)
-        save_vtree(vtree, "$tmp/temp.vtree")
+    #     # save and load as .sdd
+    #     # save_circuit("$tmp/temp.sdd", PlainLogicCircuit(circuit), vtree)
+    #     save_vtree(vtree, "$tmp/temp.vtree")
 
-    end
+    # end
     
     #TODO add some actual @test statements
     @test true
diff --git a/test/Probabilistic/informations_tests.jl b/test/Probabilistic/informations_tests.jl
index 91a23973..641adb99 100644
--- a/test/Probabilistic/informations_tests.jl
+++ b/test/Probabilistic/informations_tests.jl
@@ -3,85 +3,86 @@ using LogicCircuits
 using ProbabilisticCircuits
 
 # TODO reinstate after fix tests by replacing indexing circuit node
-
-@testset "Entropy and KLD" begin
-    pc1, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.1.psdd"), zoo_vtree_file("simple2.vtree"))
-    pc2, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.2.psdd"), zoo_vtree_file("simple2.vtree"))
-    pc3, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.3.psdd"), zoo_vtree_file("simple2.vtree"))
+# TODO reinstate after fix Struct Prob Circuit
+
+# @testset "Entropy and KLD" begin
+#     pc1, vtree = load_struct_prob_circuit(
+#                     zoo_psdd_file("simple2.1.psdd"), zoo_vtree_file("simple2.vtree"))
+#     pc2, vtree = load_struct_prob_circuit(
+#                     zoo_psdd_file("simple2.2.psdd"), zoo_vtree_file("simple2.vtree"))
+#     pc3, vtree = load_struct_prob_circuit(
+#                     zoo_psdd_file("simple2.3.psdd"), zoo_vtree_file("simple2.vtree"))
    
-    # Entropy calculation test
-    @test abs(entropy(pc1) - 1.2899219826090118) < 1e-8
-    @test abs(entropy(pc2) - 0.9359472745536583) < 1e-8
-
-    # KLD Tests #
-    # KLD base tests
-    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
-
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[4], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[5], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[5], kl_divergence_cache, pr_constraint_cache)
-
-    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[1], pc1[6], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[7], pc1[2], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[6], pc2[7], kl_divergence_cache, pr_constraint_cache)
-
-    # KLD calculation test
-    # @test abs(kl_divergence(pc1[1], pc2[1], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc1[1], pc1[2], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc1[1], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.9)) < 1e-8
-    # @test abs(kl_divergence(pc1[2], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.1)) < 1e-8
-    # @test abs(kl_divergence(pc1[5], pc2[4], kl_divergence_cache, pr_constraint_cache) - 0.2 * log(0.2)) < 1e-8
-    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-    @test abs(kl_divergence(pc1, pc2) - 0.5672800167911778) < 1e-8
-
-    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
-    # @test abs(kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
-    @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
-
-end
-
-@testset "Pr constraint Query" begin
-    # two nodes
-    simplevtree = zoo_vtree_file("simple2.vtree")
-    pc, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.4.psdd"), simplevtree)
-
-    cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-
-    @test abs(pr_constraint(pc, pc, cache) - 1.0) < 1e-8
-    # @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
-    # @test abs(pr_constraint(pc[5], pc[4], cache) - 0.8) < 1e-8
-
-    file_circuit = "little_4var.circuit"
-    file_vtree = "little_4var.vtree"
-    logic_circuit, vtree = load_struct_smooth_logic_circuit(
-                                zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
-
-    pc = zoo_psdd("little_4var.psdd")
-
-    @test abs(pr_constraint(pc, children(logic_circuit)[1], cache) - 1.0) < 1e-8
-
-    # Test with two psdds
-    pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
-    pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
-
-    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-    pr_constraint(pc1, pc2, pr_constraint_cache)
-    # @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[3], pc2[4]] - 1.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[3], pc2[5]] - 0.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[9], pc2[8]] - 1.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[5], pc2[4]] - 0.2) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[5], pc2[5]] - 0.8) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[2], pc2[3]] - 1.0) < 1e-8
-end
+#     # Entropy calculation test
+#     @test abs(entropy(pc1) - 1.2899219826090118) < 1e-8
+#     @test abs(entropy(pc2) - 0.9359472745536583) < 1e-8
+
+#     # KLD Tests #
+#     # KLD base tests
+#     pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
+#     kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
+
+#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
+#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
+#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[4], kl_divergence_cache, pr_constraint_cache)
+#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[5], kl_divergence_cache, pr_constraint_cache)
+#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[5], kl_divergence_cache, pr_constraint_cache)
+
+#     # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[1], pc1[6], kl_divergence_cache, pr_constraint_cache)
+#     # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[7], pc1[2], kl_divergence_cache, pr_constraint_cache)
+#     # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[6], pc2[7], kl_divergence_cache, pr_constraint_cache)
+
+#     # KLD calculation test
+#     # @test abs(kl_divergence(pc1[1], pc2[1], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+#     # @test abs(kl_divergence(pc1[1], pc1[2], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+#     # @test abs(kl_divergence(pc1[1], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.9)) < 1e-8
+#     # @test abs(kl_divergence(pc1[2], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.1)) < 1e-8
+#     # @test abs(kl_divergence(pc1[5], pc2[4], kl_divergence_cache, pr_constraint_cache) - 0.2 * log(0.2)) < 1e-8
+#     # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
+#     # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
+#     @test abs(kl_divergence(pc1, pc2) - 0.5672800167911778) < 1e-8
+
+#     kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
+#     # @test abs(kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+#     # @test abs(kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+#     # @test abs(kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
+#     @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
+
+# end
+
+# @testset "Pr constraint Query" begin
+#     # two nodes
+#     simplevtree = zoo_vtree_file("simple2.vtree")
+#     pc, vtree = load_struct_prob_circuit(
+#                     zoo_psdd_file("simple2.4.psdd"), simplevtree)
+
+#     cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
+
+#     @test abs(pr_constraint(pc, pc, cache) - 1.0) < 1e-8
+#     # @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
+#     # @test abs(pr_constraint(pc[5], pc[4], cache) - 0.8) < 1e-8
+
+#     file_circuit = "little_4var.circuit"
+#     file_vtree = "little_4var.vtree"
+#     logic_circuit, vtree = load_struct_smooth_logic_circuit(
+#                                 zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
+
+#     pc = zoo_psdd("little_4var.psdd")
+
+#     @test abs(pr_constraint(pc, children(logic_circuit)[1], cache) - 1.0) < 1e-8
+
+#     # Test with two psdds
+#     pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
+#     pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
+
+#     pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
+#     pr_constraint(pc1, pc2, pr_constraint_cache)
+#     # @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
+#     # @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
+#     # @test abs(pr_constraint_cache[pc1[3], pc2[4]] - 1.0) < 1e-8
+#     # @test abs(pr_constraint_cache[pc1[3], pc2[5]] - 0.0) < 1e-8
+#     # @test abs(pr_constraint_cache[pc1[9], pc2[8]] - 1.0) < 1e-8
+#     # @test abs(pr_constraint_cache[pc1[5], pc2[4]] - 0.2) < 1e-8
+#     # @test abs(pr_constraint_cache[pc1[5], pc2[5]] - 0.8) < 1e-8
+#     # @test abs(pr_constraint_cache[pc1[2], pc2[3]] - 1.0) < 1e-8
+# end
diff --git a/test/Probabilistic/prob_nodes_tests.jl b/test/Probabilistic/prob_nodes_tests.jl
index 1d9c83fa..6f25bbc6 100644
--- a/test/Probabilistic/prob_nodes_tests.jl
+++ b/test/Probabilistic/prob_nodes_tests.jl
@@ -7,7 +7,7 @@ include("../helper/plain_logic_circuits.jl")
 @testset "probabilistic circuit nodes" begin
     c1 = little_3var()
     p1 = ProbCircuit(c1)
-    lit3 = children(p1)[1].children[1]
+    lit3 = children(children(p1)[1])[1]
     @test isempty(intersect(linearize(ProbCircuit(c1)), linearize(ProbCircuit(c1))))
     
     # traits
@@ -20,14 +20,10 @@ include("../helper/plain_logic_circuits.jl")
     @test GateType(lit3) isa LiteralGate
 
     # methods
-    @test origin(p1) === c1
-    @test all(origin.(children(p1)) .=== c1.children)
     @test num_parameters(p1) == 10
 
     # extension methods
-    @test literal(lit3) === literal(children(c1)[1].children[1])
-    @test all(origin.(and_nodes(p1)) .=== and_nodes(c1))
-    @test all(origin.(or_nodes(p1)) .=== or_nodes(c1))
+    @test literal(lit3) === literal(children(children(c1)[1])[1])
     @test variable(left_most_descendent(p1)) == Var(3)
     @test ispositive(left_most_descendent(p1))
     @test !isnegative(left_most_descendent(p1))
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index b87cd359..d157e63d 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -52,24 +52,28 @@ end
 @testset "Marginal Pass Down" begin
     EPS = 1e-7;
     prob_circuit = zoo_psdd("little_4var.psdd");
-    logic_circuit = origin(prob_circuit)
+    logic_circuit = PlainLogicCircuit(prob_circuit)
 
     N = 4
     data_full = Bool.(generate_data_all(N))
 
     # Comparing with down pass with fully obeserved data
     compute_flows(logic_circuit, data_full)
-    compute_flows(prob_circuit, data_full)
-
-    for pn in linearize(prob_circuit)
-        @test all(isapprox.(exp.(get_downflow(pn; root=prob_circuit)), 
-            get_downflow(pn.origin; root=logic_circuit), atol=EPS))
+    compute_exp_flows(prob_circuit, data_full)
+
+    lin_prob = linearize(prob_circuit)
+    lin_logic = linearize(logic_circuit)
+    for i in 1 : length(lin_prob)
+        pn = lin_prob[i]
+        ln = lin_logic[i]
+        @test all(isapprox.(exp.(get_exp_downflow(pn; root=prob_circuit)), 
+            get_downflow(ln; root=logic_circuit), atol=EPS))
     end
 
     # Validating one example with missing features done by hand
     data_partial = Int8.([-1 1 -1 1])
     prob_circuit = zoo_psdd("little_4var.psdd");
-    compute_flows(prob_circuit, data_partial)
+    compute_exp_flows(prob_circuit, data_partial)
 
     # (node index, correct down_flow_value)
     true_vals = [(1, 0.5),
@@ -95,7 +99,7 @@ end
     lin = linearize(prob_circuit)
     
     for ind_val in true_vals
-        @test exp(get_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
+        @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
     end
 end
 

From 1a8d95b9ec06e0c877f5489ae50e82ac5a2d926d Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sat, 25 Jul 2020 22:58:46 -0700
Subject: [PATCH 031/131] fix last commit

---
 temp.vtree | 17 -----------------
 1 file changed, 17 deletions(-)
 delete mode 100644 temp.vtree

diff --git a/temp.vtree b/temp.vtree
deleted file mode 100644
index 84eee02b..00000000
--- a/temp.vtree
+++ /dev/null
@@ -1,17 +0,0 @@
-c ids of vtree nodes start at 0
-c ids of variables start at 1
-c vtree nodes appear bottom-up, children before parents
-c
-c file syntax:
-c vtree number-of-nodes-in-vtree
-c L id-of-leaf-vtree-node id-of-variable
-c I id-of-internal-vtree-node id-of-left-child id-of-right-child
-c
-vtree 7
-L 0 1
-L 1 2
-I 2 0 1
-L 3 3
-L 4 4
-I 5 3 4
-I 6 2 5

From c6e40a875fcf9a55dd8c46680caa6700dc587ccf Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sat, 25 Jul 2020 23:06:50 -0700
Subject: [PATCH 032/131] rename

---
 src/Probabilistic/plain_prob_nodes.jl | 103 ++++++++++++++++++++++++++
 1 file changed, 103 insertions(+)
 create mode 100644 src/Probabilistic/plain_prob_nodes.jl

diff --git a/src/Probabilistic/plain_prob_nodes.jl b/src/Probabilistic/plain_prob_nodes.jl
new file mode 100644
index 00000000..92dfd3fd
--- /dev/null
+++ b/src/Probabilistic/plain_prob_nodes.jl
@@ -0,0 +1,103 @@
+export ProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
+Prob⋁Node, check_parameter_integrity
+
+#####################
+# Infrastructure for probabilistic circuit nodes
+#####################
+
+"Root of the probabilistic circuit node hierarchy"
+abstract type ProbCircuit <: LogicCircuit end
+
+"""
+A probabilistic leaf node
+"""
+abstract type ProbLeafNode <: ProbCircuit end
+
+"""
+A probabilistic inner node
+"""
+abstract type ProbInnerNode <: ProbCircuit end
+
+"""
+A probabilistic literal node
+"""
+mutable struct ProbLiteralNode <: ProbLeafNode
+    literal::Lit
+    data
+    counter::UInt32
+    ProbLiteralNode(l) = new(l, nothing, 0)
+end
+
+"""
+A probabilistic conjunction node (And node)
+"""
+mutable struct Prob⋀Node <: ProbInnerNode
+    children::Vector{<:ProbCircuit}
+    data
+    counter::UInt32
+    Prob⋀Node(children) = begin
+        new(convert(Vector{ProbCircuit}, children), nothing, 0)
+    end
+end
+
+"""
+A probabilistic disjunction node (Or node)
+"""
+mutable struct Prob⋁Node <: ProbInnerNode
+    children::Vector{<:ProbCircuit}
+    log_thetas::Vector{Float64}
+    data
+    counter::UInt32
+    Prob⋁Node(children) = begin
+        new(convert(Vector{ProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
+    end
+end
+
+#####################
+# traits
+#####################
+
+import LogicCircuits.GateType # make available for extension
+
+@inline GateType(::Type{<:ProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:Prob⋀Node}) = ⋀Gate()
+@inline GateType(::Type{<:Prob⋁Node}) = ⋁Gate()
+
+#####################
+# methods
+#####################
+
+import LogicCircuits: children # make available for extension
+@inline children(n::ProbInnerNode) = n.children
+
+import ..Utils: num_parameters
+@inline num_parameters(c::ProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
+
+#####################
+# constructors and conversions
+#####################
+
+function ProbCircuit(circuit::LogicCircuit)::ProbCircuit
+    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = ProbLiteralNode(literal(n))
+    f_a(n, cn) = Prob⋀Node(cn)
+    f_o(n, cn) = Prob⋁Node(cn)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbCircuit)
+end
+
+function PlainLogicCircuit(circuit::ProbCircuit)::PlainLogicCircuit
+    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = PlainLiteralNode(literal(n))
+    f_a(n, cn) = Plain⋀Node(cn)
+    f_o(n, cn) = Plain⋁Node(cn)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainLogicCircuit)
+end
+
+# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
+
+function check_parameter_integrity(circuit::ProbCircuit)
+    for node in or_nodes(circuit)
+        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
+    end
+    true
+end
\ No newline at end of file

From 72f68cf95854b1e2208694db30b342beef81ef82 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sun, 26 Jul 2020 00:14:55 -0700
Subject: [PATCH 033/131] struct prob circuit

---
 src/LoadSave/circuit_line_compiler.jl      |  17 ++-
 src/LoadSave/circuit_loaders.jl            |   2 +-
 src/Probabilistic/Probabilistic.jl         |   3 +-
 src/Probabilistic/informations.jl          |  42 +++---
 src/Probabilistic/plain_prob_nodes.jl      | 103 -------------
 src/Probabilistic/structured_prob_nodes.jl |  98 +++++++++++++
 test/Probabilistic/informations_tests.jl   | 163 ++++++++++-----------
 7 files changed, 215 insertions(+), 213 deletions(-)
 delete mode 100644 src/Probabilistic/plain_prob_nodes.jl
 create mode 100644 src/Probabilistic/structured_prob_nodes.jl

diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index 53c82c53..c51f64ef 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -35,10 +35,17 @@ function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::Vtr
     return prob_circuit, vtree
 end
 
-function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, id2lognode::Dict{ID,<:LogicCircuit})::ProbCircuit
+function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, id2lognode::Dict{ID,<:LogicCircuit})::Union{ProbCircuit, StructProbCircuit}
     # set up cache mapping logic circuit nodes to their probabilistic decorator
-    prob_circuit = ProbCircuit(logic_circuit)
-    lognode2probnode = Dict{LogicCircuit, ProbCircuit}()
+
+    prob_circuit = nothing
+    # TODO better implementation & type
+    if logic_circuit isa PlainLogicCircuit
+        prob_circuit = ProbCircuit(logic_circuit)
+    elseif logic_circuit isa PlainStructLogicCircuit
+        prob_circuit = StructProbCircuit(logic_circuit)
+    end
+    lognode2probnode = Dict()
 
     prob_lin = linearize(prob_circuit) # TODO better implementation
     logic_lin = linearize(logic_circuit)
@@ -60,11 +67,11 @@ function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, i
     end
     function compile(ln::WeightedNamedConstantLine)
         @assert lnconstant(ln) == true
-        root = id2probnode(ln.node_id)::Prob⋁Node
+        root = id2probnode(ln.node_id)
         root.log_thetas .= [ln.weight, log1p(-exp(ln.weight))]
     end
     function compile(ln::DecisionLine{<:PSDDElement})
-        root = id2probnode(ln.node_id)::Prob⋁Node
+        root = id2probnode(ln.node_id)
         root.log_thetas .= [x.weight for x in ln.elements]
     end
 
diff --git a/src/LoadSave/circuit_loaders.jl b/src/LoadSave/circuit_loaders.jl
index d3ffec67..b8f4955a 100644
--- a/src/LoadSave/circuit_loaders.jl
+++ b/src/LoadSave/circuit_loaders.jl
@@ -45,7 +45,7 @@ Support circuit file formats:
 Supported vtree file formats:
     * ".vtree" for Vtree files
 """
-function load_struct_prob_circuit(circuit_file::String, vtree_file::String)::Tuple{ProbCircuit,PlainVtree}
+function load_struct_prob_circuit(circuit_file::String, vtree_file::String)::Tuple{StructProbCircuit,PlainVtree}
     @assert endswith(circuit_file,".psdd")
     circuit_lines = parse_circuit_file(circuit_file)
     vtree_lines = parse_vtree_file(vtree_file)
diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
index a56d3e1c..5d46fd92 100644
--- a/src/Probabilistic/Probabilistic.jl
+++ b/src/Probabilistic/Probabilistic.jl
@@ -4,9 +4,10 @@ using LogicCircuits
 using ..Utils
 
 include("prob_nodes.jl")
+include("structured_prob_nodes.jl")
 include("exp_flows.jl")
 include("queries.jl")
-# include("informations.jl")
+include("informations.jl")
 include("parameters.jl")
 
 end
diff --git a/src/Probabilistic/informations.jl b/src/Probabilistic/informations.jl
index 57aeda1b..bc785ec8 100644
--- a/src/Probabilistic/informations.jl
+++ b/src/Probabilistic/informations.jl
@@ -1,8 +1,8 @@
 export pr_constraint, kl_divergence, entropy
 
-const StrutCircuit = Union{ProbCircuit, StructLogicCircuit}
-const KLDCache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}
-const PRCache = Dict{Tuple{ProbCircuit, StrutCircuit}, Float64}
+const StrutCircuit = Union{StructProbCircuit, StructLogicCircuit}
+const KLDCache = Dict{Tuple{StructProbCircuit, StructProbCircuit}, Float64}
+const PRCache = Dict{Tuple{StructProbCircuit, StrutCircuit}, Float64}
 
 # Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
 # spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
@@ -10,7 +10,7 @@ const PRCache = Dict{Tuple{ProbCircuit, StrutCircuit}, Float64}
 """
 Calculate the probability of the logic formula given by sdd for the psdd
 """
-function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
+function pr_constraint(psdd_node::StructProbCircuit, sdd_node::StrutCircuit,
     cache::PRCache=PRCache())::Float64
     
     # Cache hit
@@ -18,7 +18,7 @@ function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
         return cache[psdd_node, sdd_node]
     
     # Boundary cases
-    elseif psdd_node isa ProbLiteralNode
+    elseif psdd_node isa StructProbLiteralNode
         # Both are literals, just check whether they agrees with each other 
         if isliteralgate(sdd_node)
             if literal(psdd_node) == literal(sdd_node)
@@ -38,7 +38,7 @@ function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
         end
     
     # The psdd is true
-    elseif children(psdd_node)[1] isa ProbLiteralNode 
+    elseif children(psdd_node)[1] isa StructProbLiteralNode 
         theta = exp(psdd_node.log_thetas[1])
         return get!(cache, (psdd_node, sdd_node),
             theta * pr_constraint(children(psdd_node)[1], sdd_node, cache) +
@@ -66,10 +66,10 @@ end
 """"
 Calculate entropy of the distribution of the input psdd."
 """
-function entropy(psdd_node::Prob⋁Node, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
+function entropy(psdd_node::StructProb⋁Node, psdd_entropy_cache::Dict{StructProbCircuit, Float64}=Dict{StructProbCircuit, Float64}())::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
-    elseif children(psdd_node)[1] isa ProbLiteralNode
+    elseif children(psdd_node)[1] isa StructProbLiteralNode
         return get!(psdd_entropy_cache, psdd_node,
             - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
             exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2])
@@ -86,27 +86,27 @@ function entropy(psdd_node::Prob⋁Node, psdd_entropy_cache::Dict{ProbCircuit, F
     end
 end
 
-function entropy(psdd_node::Prob⋀Node, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructProb⋀Node, psdd_entropy_cache::Dict{StructProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, children(psdd_node)[1], entropy(children(psdd_node)[1], psdd_entropy_cache)) +
         get!(psdd_entropy_cache, children(psdd_node)[2], entropy(children(psdd_node)[2], psdd_entropy_cache))
 end
 
-function entropy(psdd_node::ProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructProbLiteralNode, psdd_entropy_cache::Dict{StructProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, psdd_node, 0.0)
 end
 
 "Calculate KL divergence calculation for psdds that are not necessarily identical"
-function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::Prob⋁Node,
+function kl_divergence(psdd_node1::StructProb⋁Node, psdd_node2::StructProb⋁Node,
         kl_divergence_cache::KLDCache=KLDCache(), pr_constraint_cache::PRCache=PRCache())
-    @assert !(psdd_node1 isa Prob⋀Node || psdd_node2 isa Prob⋀Node) "Prob⋀ not a valid PSDD node for KL-Divergence"
+    @assert !(psdd_node1 isa StructProb⋀Node || psdd_node2 isa StructProb⋀Node) "Prob⋀ not a valid PSDD node for KL-Divergence"
 
     # Check if both nodes are normalized for same vtree node
-    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[(psdd_node1, psdd_node2)]
-    elseif children(psdd_node1)[1] isa ProbLiteralNode
-        if psdd_node2 isa ProbLiteralNode
+    elseif children(psdd_node1)[1] isa StructProbLiteralNode
+        if psdd_node2 isa StructProbLiteralNode
             kl_divergence(children(psdd_node1)[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             if literal(children(psdd_node1)[1]) == literal(psdd_node2)
@@ -167,10 +167,10 @@ function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::Prob⋁Node,
     end
 end
 
-function kl_divergence(psdd_node1::ProbLiteralNode, psdd_node2::ProbLiteralNode,
+function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     # Check if literals are over same variables in vtree
-   @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+   @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[psdd_node1, psdd_node2]
@@ -180,9 +180,9 @@ function kl_divergence(psdd_node1::ProbLiteralNode, psdd_node2::ProbLiteralNode,
     end
 end
 
-function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::ProbLiteralNode,
+function kl_divergence(psdd_node1::StructProb⋁Node, psdd_node2::StructProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
-    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[psdd_node1, psdd_node2]
@@ -201,9 +201,9 @@ function kl_divergence(psdd_node1::Prob⋁Node, psdd_node2::ProbLiteralNode,
     end
 end
 
-function kl_divergence(psdd_node1::ProbLiteralNode, psdd_node2::Prob⋁Node,
+function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructProb⋁Node,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
-    @assert variables(psdd_node1.origin.vtree) == variables(psdd_node2.origin.vtree) "Both nodes not normalized for same vtree node"
+    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[psdd_node1, psdd_node2]
diff --git a/src/Probabilistic/plain_prob_nodes.jl b/src/Probabilistic/plain_prob_nodes.jl
deleted file mode 100644
index 92dfd3fd..00000000
--- a/src/Probabilistic/plain_prob_nodes.jl
+++ /dev/null
@@ -1,103 +0,0 @@
-export ProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
-Prob⋁Node, check_parameter_integrity
-
-#####################
-# Infrastructure for probabilistic circuit nodes
-#####################
-
-"Root of the probabilistic circuit node hierarchy"
-abstract type ProbCircuit <: LogicCircuit end
-
-"""
-A probabilistic leaf node
-"""
-abstract type ProbLeafNode <: ProbCircuit end
-
-"""
-A probabilistic inner node
-"""
-abstract type ProbInnerNode <: ProbCircuit end
-
-"""
-A probabilistic literal node
-"""
-mutable struct ProbLiteralNode <: ProbLeafNode
-    literal::Lit
-    data
-    counter::UInt32
-    ProbLiteralNode(l) = new(l, nothing, 0)
-end
-
-"""
-A probabilistic conjunction node (And node)
-"""
-mutable struct Prob⋀Node <: ProbInnerNode
-    children::Vector{<:ProbCircuit}
-    data
-    counter::UInt32
-    Prob⋀Node(children) = begin
-        new(convert(Vector{ProbCircuit}, children), nothing, 0)
-    end
-end
-
-"""
-A probabilistic disjunction node (Or node)
-"""
-mutable struct Prob⋁Node <: ProbInnerNode
-    children::Vector{<:ProbCircuit}
-    log_thetas::Vector{Float64}
-    data
-    counter::UInt32
-    Prob⋁Node(children) = begin
-        new(convert(Vector{ProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
-    end
-end
-
-#####################
-# traits
-#####################
-
-import LogicCircuits.GateType # make available for extension
-
-@inline GateType(::Type{<:ProbLiteralNode}) = LiteralGate()
-@inline GateType(::Type{<:Prob⋀Node}) = ⋀Gate()
-@inline GateType(::Type{<:Prob⋁Node}) = ⋁Gate()
-
-#####################
-# methods
-#####################
-
-import LogicCircuits: children # make available for extension
-@inline children(n::ProbInnerNode) = n.children
-
-import ..Utils: num_parameters
-@inline num_parameters(c::ProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
-
-#####################
-# constructors and conversions
-#####################
-
-function ProbCircuit(circuit::LogicCircuit)::ProbCircuit
-    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = ProbLiteralNode(literal(n))
-    f_a(n, cn) = Prob⋀Node(cn)
-    f_o(n, cn) = Prob⋁Node(cn)
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbCircuit)
-end
-
-function PlainLogicCircuit(circuit::ProbCircuit)::PlainLogicCircuit
-    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = PlainLiteralNode(literal(n))
-    f_a(n, cn) = Plain⋀Node(cn)
-    f_o(n, cn) = Plain⋁Node(cn)
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainLogicCircuit)
-end
-
-# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
-
-function check_parameter_integrity(circuit::ProbCircuit)
-    for node in or_nodes(circuit)
-        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
-    end
-    true
-end
\ No newline at end of file
diff --git a/src/Probabilistic/structured_prob_nodes.jl b/src/Probabilistic/structured_prob_nodes.jl
new file mode 100644
index 00000000..f8ad864d
--- /dev/null
+++ b/src/Probabilistic/structured_prob_nodes.jl
@@ -0,0 +1,98 @@
+export StructProbCircuit,  StructProbLeafNode, StructProbInnerNode,
+    StructProbLiteralNode, StructProb⋀Node, StructProb⋁Node
+
+#####################
+# Prob circuits that are structured,
+# meaning that each conjunction is associated with a vtree node.
+#####################
+"Root of the plain structure probabilistic circuit node hierarchy"
+abstract type StructProbCircuit <: StructLogicCircuit end
+
+"A plain structured probabilistic leaf node"
+abstract type StructProbLeafNode <: StructProbCircuit end
+
+"A plain structured probabilistic inner node"
+abstract type StructProbInnerNode <: StructProbCircuit end
+
+"A plain structured probabilistic literal leaf node, representing the positive or negative literal of its variable"
+mutable struct StructProbLiteralNode <: StructProbLeafNode
+    literal::Lit
+    vtree::Vtree
+    data
+    counter::UInt32
+    StructProbLiteralNode(l,v) = begin
+        @assert lit2var(l) ∈ variables(v) 
+        new(l, v, nothing, 0)
+    end
+end
+
+"A plain structured probabilistic conjunction node"
+mutable struct StructProb⋀Node <: StructProbInnerNode
+    prime::StructProbCircuit
+    sub::StructProbCircuit
+    vtree::Vtree
+    data
+    counter::UInt32
+    StructProb⋀Node(p,s,v) = begin
+        @assert isinner(v) "Structured conjunctions must respect inner vtree node"
+        @assert varsubset_left(vtree(p),v) "$p does not go left in $v"
+        @assert varsubset_right(vtree(s),v) "$s does not go right in $v"
+        new(p,s, v, nothing, 0)
+    end
+end
+
+"A plain structured probabilistic disjunction node"
+mutable struct StructProb⋁Node <: StructProbInnerNode
+    children::Vector{<:StructProbCircuit}
+    log_thetas::Vector{Float64}
+    vtree::Vtree # could be leaf or inner
+    data
+    counter::UInt32
+    StructProb⋁Node(c, v) = new(c, init_array(Float64, length(c)), v, nothing, 0)
+end
+
+#####################
+# traits
+#####################
+
+import LogicCircuits.GateType # make available for extension
+@inline GateType(::Type{<:StructProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:StructProb⋀Node}) = ⋀Gate()
+@inline GateType(::Type{<:StructProb⋁Node}) = ⋁Gate()
+
+#####################
+# methods
+#####################
+
+import LogicCircuits: children # make available for extension
+@inline children(n::StructProb⋁Node) = n.children
+@inline children(n::StructProb⋀Node) = [n.prime,n.sub]
+
+import ..Utils: num_parameters
+@inline num_parameters(c::StructProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
+
+#####################
+# constructors and conversions
+#####################
+
+function StructProbCircuit(circuit::PlainStructLogicCircuit)::StructProbCircuit
+    f_con(n) = error("Cannot construct a struct probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = StructProbLiteralNode(literal(n), vtree(n))
+    f_a(n, cn) = begin
+        @assert length(cn)==2
+        StructProb⋀Node(cn[1], cn[2], vtree(n))
+    end
+    f_o(n, cn) = StructProb⋁Node(cn, vtree(n))
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, StructProbCircuit)
+end 
+
+function PlainStructLogicCircuit(circuit::StructProbCircuit)::PlainStructLogicCircuit
+    f_con(n) = error("Cannot construct a struct probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = PlainStructLiteralNode(literal(n), vtree(n))
+    f_a(n, cn) = PlainStruct⋀Node(cn, vtree(n))
+    f_o(n, cn) = begin
+        @assert length(cn)==2
+        PlainStruct⋁Node(cn[1], cn[2], vtree(n))
+    end
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainStructLogicCircuit)
+end 
diff --git a/test/Probabilistic/informations_tests.jl b/test/Probabilistic/informations_tests.jl
index 641adb99..f696ebf1 100644
--- a/test/Probabilistic/informations_tests.jl
+++ b/test/Probabilistic/informations_tests.jl
@@ -3,86 +3,85 @@ using LogicCircuits
 using ProbabilisticCircuits
 
 # TODO reinstate after fix tests by replacing indexing circuit node
-# TODO reinstate after fix Struct Prob Circuit
-
-# @testset "Entropy and KLD" begin
-#     pc1, vtree = load_struct_prob_circuit(
-#                     zoo_psdd_file("simple2.1.psdd"), zoo_vtree_file("simple2.vtree"))
-#     pc2, vtree = load_struct_prob_circuit(
-#                     zoo_psdd_file("simple2.2.psdd"), zoo_vtree_file("simple2.vtree"))
-#     pc3, vtree = load_struct_prob_circuit(
-#                     zoo_psdd_file("simple2.3.psdd"), zoo_vtree_file("simple2.vtree"))
+
+@testset "Entropy and KLD" begin
+    pc1, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.1.psdd"), zoo_vtree_file("simple2.vtree"))
+    pc2, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.2.psdd"), zoo_vtree_file("simple2.vtree"))
+    pc3, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.3.psdd"), zoo_vtree_file("simple2.vtree"))
    
-#     # Entropy calculation test
-#     @test abs(entropy(pc1) - 1.2899219826090118) < 1e-8
-#     @test abs(entropy(pc2) - 0.9359472745536583) < 1e-8
-
-#     # KLD Tests #
-#     # KLD base tests
-#     pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-#     kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
-
-#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
-#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
-#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[4], kl_divergence_cache, pr_constraint_cache)
-#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[5], kl_divergence_cache, pr_constraint_cache)
-#     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[5], kl_divergence_cache, pr_constraint_cache)
-
-#     # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[1], pc1[6], kl_divergence_cache, pr_constraint_cache)
-#     # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[7], pc1[2], kl_divergence_cache, pr_constraint_cache)
-#     # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[6], pc2[7], kl_divergence_cache, pr_constraint_cache)
-
-#     # KLD calculation test
-#     # @test abs(kl_divergence(pc1[1], pc2[1], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-#     # @test abs(kl_divergence(pc1[1], pc1[2], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-#     # @test abs(kl_divergence(pc1[1], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.9)) < 1e-8
-#     # @test abs(kl_divergence(pc1[2], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.1)) < 1e-8
-#     # @test abs(kl_divergence(pc1[5], pc2[4], kl_divergence_cache, pr_constraint_cache) - 0.2 * log(0.2)) < 1e-8
-#     # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-#     # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-#     @test abs(kl_divergence(pc1, pc2) - 0.5672800167911778) < 1e-8
-
-#     kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
-#     # @test abs(kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-#     # @test abs(kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-#     # @test abs(kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
-#     @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
-
-# end
-
-# @testset "Pr constraint Query" begin
-#     # two nodes
-#     simplevtree = zoo_vtree_file("simple2.vtree")
-#     pc, vtree = load_struct_prob_circuit(
-#                     zoo_psdd_file("simple2.4.psdd"), simplevtree)
-
-#     cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-
-#     @test abs(pr_constraint(pc, pc, cache) - 1.0) < 1e-8
-#     # @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
-#     # @test abs(pr_constraint(pc[5], pc[4], cache) - 0.8) < 1e-8
-
-#     file_circuit = "little_4var.circuit"
-#     file_vtree = "little_4var.vtree"
-#     logic_circuit, vtree = load_struct_smooth_logic_circuit(
-#                                 zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
-
-#     pc = zoo_psdd("little_4var.psdd")
-
-#     @test abs(pr_constraint(pc, children(logic_circuit)[1], cache) - 1.0) < 1e-8
-
-#     # Test with two psdds
-#     pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
-#     pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
-
-#     pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-#     pr_constraint(pc1, pc2, pr_constraint_cache)
-#     # @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
-#     # @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
-#     # @test abs(pr_constraint_cache[pc1[3], pc2[4]] - 1.0) < 1e-8
-#     # @test abs(pr_constraint_cache[pc1[3], pc2[5]] - 0.0) < 1e-8
-#     # @test abs(pr_constraint_cache[pc1[9], pc2[8]] - 1.0) < 1e-8
-#     # @test abs(pr_constraint_cache[pc1[5], pc2[4]] - 0.2) < 1e-8
-#     # @test abs(pr_constraint_cache[pc1[5], pc2[5]] - 0.8) < 1e-8
-#     # @test abs(pr_constraint_cache[pc1[2], pc2[3]] - 1.0) < 1e-8
-# end
+    # Entropy calculation test
+    @test abs(entropy(pc1) - 1.2899219826090118) < 1e-8
+    @test abs(entropy(pc2) - 0.9359472745536583) < 1e-8
+
+    # KLD Tests #
+    # KLD base tests
+    pr_constraint_cache = Dict{Tuple{StructProbCircuit, Union{StructProbCircuit, StructLogicCircuit}}, Float64}()
+    kl_divergence_cache = Dict{Tuple{StructProbCircuit, StructProbCircuit}, Float64}()
+
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[4], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[5], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[5], kl_divergence_cache, pr_constraint_cache)
+
+    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[1], pc1[6], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[7], pc1[2], kl_divergence_cache, pr_constraint_cache)
+    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[6], pc2[7], kl_divergence_cache, pr_constraint_cache)
+
+    # KLD calculation test
+    # @test abs(kl_divergence(pc1[1], pc2[1], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc1[1], pc1[2], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc1[1], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.9)) < 1e-8
+    # @test abs(kl_divergence(pc1[2], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.1)) < 1e-8
+    # @test abs(kl_divergence(pc1[5], pc2[4], kl_divergence_cache, pr_constraint_cache) - 0.2 * log(0.2)) < 1e-8
+    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
+    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
+    @test abs(kl_divergence(pc1, pc2) - 0.5672800167911778) < 1e-8
+
+    kl_divergence_cache = Dict{Tuple{StructProbCircuit, StructProbCircuit}, Float64}()
+    # @test abs(kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
+    # @test abs(kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
+    @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
+
+end
+
+@testset "Pr constraint Query" begin
+    # two nodes
+    simplevtree = zoo_vtree_file("simple2.vtree")
+    pc, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.4.psdd"), simplevtree)
+
+    cache = Dict{Tuple{StructProbCircuit, Union{StructProbCircuit, StructLogicCircuit}}, Float64}()
+
+    @test abs(pr_constraint(pc, pc, cache) - 1.0) < 1e-8
+    # @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
+    # @test abs(pr_constraint(pc[5], pc[4], cache) - 0.8) < 1e-8
+
+    file_circuit = "little_4var.circuit"
+    file_vtree = "little_4var.vtree"
+    logic_circuit, vtree = load_struct_smooth_logic_circuit(
+                                zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
+
+    pc, _ = load_struct_prob_circuit(zoo_psdd_file("little_4var.psdd"), zoo_vtree_file("little_4var.vtree"))
+
+    @test abs(pr_constraint(pc, children(logic_circuit)[1], cache) - 1.0) < 1e-8
+
+    # Test with two psdds
+    pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
+    pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
+
+    pr_constraint_cache = Dict{Tuple{StructProbCircuit, Union{StructProbCircuit, StructLogicCircuit}}, Float64}()
+    @test abs(pr_constraint(pc1, pc2, pr_constraint_cache) - 1.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[3], pc2[4]] - 1.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[3], pc2[5]] - 0.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[9], pc2[8]] - 1.0) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[5], pc2[4]] - 0.2) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[5], pc2[5]] - 0.8) < 1e-8
+    # @test abs(pr_constraint_cache[pc1[2], pc2[3]] - 1.0) < 1e-8
+end

From c7e253351eff7c6795100e9623ecb823d84989b3 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sun, 26 Jul 2020 00:48:24 -0700
Subject: [PATCH 034/131] fix circuit saver and tests

---
 src/LoadSave/circuit_line_compiler.jl      | 12 ++------
 src/LoadSave/circuit_savers.jl             | 14 ++++-----
 src/Probabilistic/informations.jl          | 14 ++++-----
 src/Probabilistic/prob_nodes.jl            | 35 ++++++++--------------
 src/Probabilistic/structured_prob_nodes.jl | 29 ++++++++++++++----
 temp.psdd                                  | 23 ++++++++++++++
 temp.sdd                                   | 24 +++++++++++++++
 temp.vtree                                 | 17 +++++++++++
 test/LoadSave/circuit_savers_test.jl       | 24 +++++++--------
 test/Probabilistic/informations_tests.jl   | 10 +++----
 10 files changed, 134 insertions(+), 68 deletions(-)
 create mode 100644 temp.psdd
 create mode 100644 temp.sdd
 create mode 100644 temp.vtree

diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index c51f64ef..a0d09d7e 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -35,17 +35,11 @@ function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::Vtr
     return prob_circuit, vtree
 end
 
-function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, id2lognode::Dict{ID,<:LogicCircuit})::Union{ProbCircuit, StructProbCircuit}
+function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, id2lognode::Dict{ID,<:LogicCircuit})::ProbCircuit
     # set up cache mapping logic circuit nodes to their probabilistic decorator
 
-    prob_circuit = nothing
-    # TODO better implementation & type
-    if logic_circuit isa PlainLogicCircuit
-        prob_circuit = ProbCircuit(logic_circuit)
-    elseif logic_circuit isa PlainStructLogicCircuit
-        prob_circuit = StructProbCircuit(logic_circuit)
-    end
-    lognode2probnode = Dict()
+    prob_circuit = ProbCircuit(logic_circuit)
+    lognode2probnode = Dict{LogicCircuit, ProbCircuit}()
 
     prob_lin = linearize(prob_circuit) # TODO better implementation
     logic_lin = linearize(logic_circuit)
diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 28789f7f..2a3788be 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -15,21 +15,21 @@ using LogicCircuits.LoadSave: SDDElement,
 #####################
 
 "Decompile for psdd circuit, used during saving of circuits to file" 
-decompile(n::ProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine = 
-    UnweightedLiteralLine(node2id[n], vtree2id[n.origin.vtree], literal(n), true)
+decompile(n::StructProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine = 
+    UnweightedLiteralLine(node2id[n], vtree2id[n.vtree], literal(n), true)
 
-make_element(n::Prob⋀Node, w::AbstractFloat, node2id) = 
+make_element(n::StructProb⋀Node, w::AbstractFloat, node2id) = 
     PSDDElement(node2id[children(n)[1]],  node2id[children(n)[2]], w)
 
 istrue_node(n)::Bool = 
     is⋁gate(n) && num_children(n) == 2 && GateType(children(n)[1]) isa LiteralGate && GateType(children(n)[2]) isa LiteralGate && 
     ispositive(children(n)[1]) && isnegative(children(n)[2])
 
-function decompile(n::Prob⋁Node, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
+function decompile(n::StructProb⋁Node, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
     if istrue_node(n)
-        WeightedNamedConstantLine(node2id[n], vtree2id[n.origin.vtree], lit2var(children(n)[1].origin.literal), n.log_thetas[1]) # TODO
+        WeightedNamedConstantLine(node2id[n], vtree2id[n.vtree], lit2var(children(n)[1].literal), n.log_thetas[1]) # TODO
     else
-        DecisionLine(node2id[n], vtree2id[n.origin.vtree], UInt32(num_children(n)), map(x -> make_element(x[1], x[2], node2id), zip(children(n), n.log_thetas)))
+        DecisionLine(node2id[n], vtree2id[n.vtree], UInt32(num_children(n)), map(x -> make_element(x[1], x[2], node2id), zip(children(n), n.log_thetas)))
     end
 end
 
@@ -107,7 +107,7 @@ end
 import LogicCircuits.LoadSave: save_circuit, save_as_dot # make available for extension
 
 "Save a circuit to file"
-save_circuit(name::String, circuit::ProbCircuit, vtree::PlainVtree) =
+save_circuit(name::String, circuit::StructProbCircuit, vtree::PlainVtree) =
     save_as_psdd(name, circuit, vtree)
 
 save_circuit(name::String, circuit::LogisticCircuit, vtree::PlainVtree) =
diff --git a/src/Probabilistic/informations.jl b/src/Probabilistic/informations.jl
index bc785ec8..d3208ad2 100644
--- a/src/Probabilistic/informations.jl
+++ b/src/Probabilistic/informations.jl
@@ -1,8 +1,8 @@
 export pr_constraint, kl_divergence, entropy
 
-const StrutCircuit = Union{StructProbCircuit, StructLogicCircuit}
-const KLDCache = Dict{Tuple{StructProbCircuit, StructProbCircuit}, Float64}
-const PRCache = Dict{Tuple{StructProbCircuit, StrutCircuit}, Float64}
+const StrutCircuit = Union{ProbCircuit, StructLogicCircuit}
+const KLDCache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}
+const PRCache = Dict{Tuple{ProbCircuit, StrutCircuit}, Float64}
 
 # Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
 # spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
@@ -10,7 +10,7 @@ const PRCache = Dict{Tuple{StructProbCircuit, StrutCircuit}, Float64}
 """
 Calculate the probability of the logic formula given by sdd for the psdd
 """
-function pr_constraint(psdd_node::StructProbCircuit, sdd_node::StrutCircuit,
+function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
     cache::PRCache=PRCache())::Float64
     
     # Cache hit
@@ -66,7 +66,7 @@ end
 """"
 Calculate entropy of the distribution of the input psdd."
 """
-function entropy(psdd_node::StructProb⋁Node, psdd_entropy_cache::Dict{StructProbCircuit, Float64}=Dict{StructProbCircuit, Float64}())::Float64
+function entropy(psdd_node::StructProb⋁Node, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
     elseif children(psdd_node)[1] isa StructProbLiteralNode
@@ -86,12 +86,12 @@ function entropy(psdd_node::StructProb⋁Node, psdd_entropy_cache::Dict{StructPr
     end
 end
 
-function entropy(psdd_node::StructProb⋀Node, psdd_entropy_cache::Dict{StructProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructProb⋀Node, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, children(psdd_node)[1], entropy(children(psdd_node)[1], psdd_entropy_cache)) +
         get!(psdd_entropy_cache, children(psdd_node)[2], entropy(children(psdd_node)[2], psdd_entropy_cache))
 end
 
-function entropy(psdd_node::StructProbLiteralNode, psdd_entropy_cache::Dict{StructProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, psdd_node, 0.0)
 end
 
diff --git a/src/Probabilistic/prob_nodes.jl b/src/Probabilistic/prob_nodes.jl
index 92dfd3fd..f002baea 100644
--- a/src/Probabilistic/prob_nodes.jl
+++ b/src/Probabilistic/prob_nodes.jl
@@ -1,22 +1,22 @@
-export ProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
-Prob⋁Node, check_parameter_integrity
+export PlainProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
+Prob⋁Node
 
 #####################
 # Infrastructure for probabilistic circuit nodes
 #####################
 
 "Root of the probabilistic circuit node hierarchy"
-abstract type ProbCircuit <: LogicCircuit end
+abstract type PlainProbCircuit <: LogicCircuit end
 
 """
 A probabilistic leaf node
 """
-abstract type ProbLeafNode <: ProbCircuit end
+abstract type ProbLeafNode <: PlainProbCircuit end
 
 """
 A probabilistic inner node
 """
-abstract type ProbInnerNode <: ProbCircuit end
+abstract type ProbInnerNode <: PlainProbCircuit end
 
 """
 A probabilistic literal node
@@ -32,11 +32,11 @@ end
 A probabilistic conjunction node (And node)
 """
 mutable struct Prob⋀Node <: ProbInnerNode
-    children::Vector{<:ProbCircuit}
+    children::Vector{<:PlainProbCircuit}
     data
     counter::UInt32
     Prob⋀Node(children) = begin
-        new(convert(Vector{ProbCircuit}, children), nothing, 0)
+        new(convert(Vector{PlainProbCircuit}, children), nothing, 0)
     end
 end
 
@@ -44,12 +44,12 @@ end
 A probabilistic disjunction node (Or node)
 """
 mutable struct Prob⋁Node <: ProbInnerNode
-    children::Vector{<:ProbCircuit}
+    children::Vector{<:PlainProbCircuit}
     log_thetas::Vector{Float64}
     data
     counter::UInt32
     Prob⋁Node(children) = begin
-        new(convert(Vector{ProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
+        new(convert(Vector{PlainProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
     end
 end
 
@@ -71,33 +71,24 @@ import LogicCircuits: children # make available for extension
 @inline children(n::ProbInnerNode) = n.children
 
 import ..Utils: num_parameters
-@inline num_parameters(c::ProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
+@inline num_parameters(c::PlainProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
 
 #####################
 # constructors and conversions
 #####################
 
-function ProbCircuit(circuit::LogicCircuit)::ProbCircuit
+function PlainProbCircuit(circuit::PlainLogicCircuit)::PlainProbCircuit
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
     f_lit(n) = ProbLiteralNode(literal(n))
     f_a(n, cn) = Prob⋀Node(cn)
     f_o(n, cn) = Prob⋁Node(cn)
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, ProbCircuit)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainProbCircuit)
 end
 
-function PlainLogicCircuit(circuit::ProbCircuit)::PlainLogicCircuit
+function PlainLogicCircuit(circuit::PlainProbCircuit)::PlainLogicCircuit
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
     f_lit(n) = PlainLiteralNode(literal(n))
     f_a(n, cn) = Plain⋀Node(cn)
     f_o(n, cn) = Plain⋁Node(cn)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainLogicCircuit)
 end
-
-# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
-
-function check_parameter_integrity(circuit::ProbCircuit)
-    for node in or_nodes(circuit)
-        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
-    end
-    true
-end
\ No newline at end of file
diff --git a/src/Probabilistic/structured_prob_nodes.jl b/src/Probabilistic/structured_prob_nodes.jl
index f8ad864d..8b2e2a70 100644
--- a/src/Probabilistic/structured_prob_nodes.jl
+++ b/src/Probabilistic/structured_prob_nodes.jl
@@ -1,13 +1,17 @@
-export StructProbCircuit,  StructProbLeafNode, StructProbInnerNode,
-    StructProbLiteralNode, StructProb⋀Node, StructProb⋁Node
+export ProbCircuit, StructProbCircuit,  StructProbLeafNode, StructProbInnerNode,
+    StructProbLiteralNode, StructProb⋀Node, StructProb⋁Node, check_parameter_integrity
 
 #####################
 # Prob circuits that are structured,
 # meaning that each conjunction is associated with a vtree node.
 #####################
+
 "Root of the plain structure probabilistic circuit node hierarchy"
 abstract type StructProbCircuit <: StructLogicCircuit end
 
+"Root of the probabilistic circuit node hierarchy"
+const ProbCircuit = Union{StructProbCircuit, PlainProbCircuit}
+
 "A plain structured probabilistic leaf node"
 abstract type StructProbLeafNode <: StructProbCircuit end
 
@@ -89,10 +93,23 @@ end
 function PlainStructLogicCircuit(circuit::StructProbCircuit)::PlainStructLogicCircuit
     f_con(n) = error("Cannot construct a struct probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
     f_lit(n) = PlainStructLiteralNode(literal(n), vtree(n))
-    f_a(n, cn) = PlainStruct⋀Node(cn, vtree(n))
-    f_o(n, cn) = begin
+    f_a(n, cn) = begin
         @assert length(cn)==2
-        PlainStruct⋁Node(cn[1], cn[2], vtree(n))
+        PlainStruct⋀Node(cn[1], cn[2], vtree(n))
     end
+    f_o(n, cn) = PlainStruct⋁Node(cn, vtree(n))
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainStructLogicCircuit)
-end 
+end
+
+@inline ProbCircuit(circuit::PlainStructLogicCircuit) = StructProbCircuit(circuit)
+
+@inline ProbCircuit(circuit::PlainLogicCircuit) = PlainProbCircuit(circuit)
+
+# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
+
+function check_parameter_integrity(circuit::ProbCircuit)
+    for node in or_nodes(circuit)
+        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
+    end
+    true
+end
diff --git a/temp.psdd b/temp.psdd
new file mode 100644
index 00000000..4c059178
--- /dev/null
+++ b/temp.psdd
@@ -0,0 +1,23 @@
+c ids of psdd nodes start at 0
+c psdd nodes appear bottom-up, children before parents
+c 
+c file syntax:
+c psdd count-of-sdd-nodes
+c L id-of-literal-sdd-node id-of-vtree literal
+c T id-of-trueNode-sdd-node id-of-vtree variable log(litProb)
+c D id-of-decomposition-sdd-node id-of-vtree number-of-elements {id-of-prime id-of-sub log(elementProb)}*
+c 
+c File generated by Juice.jl
+c 
+psdd 20
+L 0 0 1
+L 1 1 2
+L 2 1 -2
+L 3 0 -1
+D 4 2 4 0 1 -2.3025850929940455 0 2 -2.3025850929940455 3 1 -2.3025850929940455 3 2 -0.35667494393873245
+L 5 3 3
+L 6 4 4
+L 7 4 -4
+L 8 3 -3
+D 9 5 4 5 6 -1.6094379124341003 5 7 -1.2039728043259361 8 6 -0.916290731874155 8 7 -2.3025850929940455
+D 10 6 1 4 9 0.0
diff --git a/temp.sdd b/temp.sdd
new file mode 100644
index 00000000..12ab2652
--- /dev/null
+++ b/temp.sdd
@@ -0,0 +1,24 @@
+c ids of sdd nodes start at 0
+c sdd nodes appear bottom-up, children before parents
+c 
+c file syntax:
+c sdd count-of-sdd-nodes
+c F id-of-false-sdd-node
+c T id-of-true-sdd-node
+c L id-of-literal-sdd-node id-of-vtree literal
+c D id-of-decomposition-sdd-node id-of-vtree number-of-elements {id-of-prime id-of-sub}*
+c 
+c File generated by Juice.jl
+c 
+sdd 20
+L 0 0 1
+L 1 1 2
+L 2 1 -2
+L 3 0 -1
+D 4 2 4 0 1 0 2 3 1 3 2
+L 5 3 3
+L 6 4 4
+L 7 4 -4
+L 8 3 -3
+D 9 5 4 5 6 5 7 8 6 8 7
+D 10 6 1 4 9
diff --git a/temp.vtree b/temp.vtree
new file mode 100644
index 00000000..84eee02b
--- /dev/null
+++ b/temp.vtree
@@ -0,0 +1,17 @@
+c ids of vtree nodes start at 0
+c ids of variables start at 1
+c vtree nodes appear bottom-up, children before parents
+c
+c file syntax:
+c vtree number-of-nodes-in-vtree
+c L id-of-leaf-vtree-node id-of-variable
+c I id-of-internal-vtree-node id-of-left-child id-of-right-child
+c
+vtree 7
+L 0 1
+L 1 2
+I 2 0 1
+L 3 3
+L 4 4
+I 5 3 4
+I 6 2 5
diff --git a/test/LoadSave/circuit_savers_test.jl b/test/LoadSave/circuit_savers_test.jl
index a973654b..d8696f07 100644
--- a/test/LoadSave/circuit_savers_test.jl
+++ b/test/LoadSave/circuit_savers_test.jl
@@ -3,23 +3,23 @@ using LogicCircuits
 using ProbabilisticCircuits
 
 @testset "Circuit saver test" begin
-    # mktempdir() do tmp
+    mktempdir() do tmp
 
-    #     circuit, vtree = load_struct_prob_circuit(
-    #                         zoo_psdd_file("little_4var.psdd"), zoo_vtree_file("little_4var.vtree"))
+        circuit, vtree = load_struct_prob_circuit(
+                            zoo_psdd_file("little_4var.psdd"), zoo_vtree_file("little_4var.vtree"))
 
-    #     # load, save, and load as .psdd
-    #     # TODO reinstate after fix Struct Prob Circuit
-    #     # save_circuit("$tmp/temp.psdd", circuit, vtree)
-    #     save_vtree(vtree, "$tmp/temp.vtree");
+        # load, save, and load as .psdd
+        # TODO reinstate after fix Struct Prob Circuit
+        save_circuit("$tmp/temp.psdd", circuit, vtree)
+        save_vtree(vtree, "$tmp/temp.vtree");
 
-    #     load_struct_prob_circuit("$tmp/temp.psdd", "$tmp/temp.vtree")
+        load_struct_prob_circuit("$tmp/temp.psdd", "$tmp/temp.vtree")
         
-    #     # save and load as .sdd
-    #     # save_circuit("$tmp/temp.sdd", PlainLogicCircuit(circuit), vtree)
-    #     save_vtree(vtree, "$tmp/temp.vtree")
+        # save and load as .sdd
+        save_circuit("$tmp/temp.sdd", PlainStructLogicCircuit(circuit), vtree)
+        save_vtree(vtree, "$tmp/temp.vtree")
 
-    # end
+    end
     
     #TODO add some actual @test statements
     @test true
diff --git a/test/Probabilistic/informations_tests.jl b/test/Probabilistic/informations_tests.jl
index f696ebf1..f80f41c5 100644
--- a/test/Probabilistic/informations_tests.jl
+++ b/test/Probabilistic/informations_tests.jl
@@ -18,8 +18,8 @@ using ProbabilisticCircuits
 
     # KLD Tests #
     # KLD base tests
-    pr_constraint_cache = Dict{Tuple{StructProbCircuit, Union{StructProbCircuit, StructLogicCircuit}}, Float64}()
-    kl_divergence_cache = Dict{Tuple{StructProbCircuit, StructProbCircuit}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
+    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
 
     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
     # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
@@ -41,7 +41,7 @@ using ProbabilisticCircuits
     # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
     @test abs(kl_divergence(pc1, pc2) - 0.5672800167911778) < 1e-8
 
-    kl_divergence_cache = Dict{Tuple{StructProbCircuit, StructProbCircuit}, Float64}()
+    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
     # @test abs(kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
     # @test abs(kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
     # @test abs(kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
@@ -55,7 +55,7 @@ end
     pc, vtree = load_struct_prob_circuit(
                     zoo_psdd_file("simple2.4.psdd"), simplevtree)
 
-    cache = Dict{Tuple{StructProbCircuit, Union{StructProbCircuit, StructLogicCircuit}}, Float64}()
+    cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
 
     @test abs(pr_constraint(pc, pc, cache) - 1.0) < 1e-8
     # @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
@@ -74,7 +74,7 @@ end
     pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
     pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
 
-    pr_constraint_cache = Dict{Tuple{StructProbCircuit, Union{StructProbCircuit, StructLogicCircuit}}, Float64}()
+    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
     @test abs(pr_constraint(pc1, pc2, pr_constraint_cache) - 1.0) < 1e-8
     # @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
     # @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8

From 89f650060295d18f2b6d9e59531a7c2a89901db6 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sun, 26 Jul 2020 00:48:57 -0700
Subject: [PATCH 035/131] rm file

---
 temp.psdd  | 23 -----------------------
 temp.sdd   | 24 ------------------------
 temp.vtree | 17 -----------------
 3 files changed, 64 deletions(-)
 delete mode 100644 temp.psdd
 delete mode 100644 temp.sdd
 delete mode 100644 temp.vtree

diff --git a/temp.psdd b/temp.psdd
deleted file mode 100644
index 4c059178..00000000
--- a/temp.psdd
+++ /dev/null
@@ -1,23 +0,0 @@
-c ids of psdd nodes start at 0
-c psdd nodes appear bottom-up, children before parents
-c 
-c file syntax:
-c psdd count-of-sdd-nodes
-c L id-of-literal-sdd-node id-of-vtree literal
-c T id-of-trueNode-sdd-node id-of-vtree variable log(litProb)
-c D id-of-decomposition-sdd-node id-of-vtree number-of-elements {id-of-prime id-of-sub log(elementProb)}*
-c 
-c File generated by Juice.jl
-c 
-psdd 20
-L 0 0 1
-L 1 1 2
-L 2 1 -2
-L 3 0 -1
-D 4 2 4 0 1 -2.3025850929940455 0 2 -2.3025850929940455 3 1 -2.3025850929940455 3 2 -0.35667494393873245
-L 5 3 3
-L 6 4 4
-L 7 4 -4
-L 8 3 -3
-D 9 5 4 5 6 -1.6094379124341003 5 7 -1.2039728043259361 8 6 -0.916290731874155 8 7 -2.3025850929940455
-D 10 6 1 4 9 0.0
diff --git a/temp.sdd b/temp.sdd
deleted file mode 100644
index 12ab2652..00000000
--- a/temp.sdd
+++ /dev/null
@@ -1,24 +0,0 @@
-c ids of sdd nodes start at 0
-c sdd nodes appear bottom-up, children before parents
-c 
-c file syntax:
-c sdd count-of-sdd-nodes
-c F id-of-false-sdd-node
-c T id-of-true-sdd-node
-c L id-of-literal-sdd-node id-of-vtree literal
-c D id-of-decomposition-sdd-node id-of-vtree number-of-elements {id-of-prime id-of-sub}*
-c 
-c File generated by Juice.jl
-c 
-sdd 20
-L 0 0 1
-L 1 1 2
-L 2 1 -2
-L 3 0 -1
-D 4 2 4 0 1 0 2 3 1 3 2
-L 5 3 3
-L 6 4 4
-L 7 4 -4
-L 8 3 -3
-D 9 5 4 5 6 5 7 8 6 8 7
-D 10 6 1 4 9
diff --git a/temp.vtree b/temp.vtree
deleted file mode 100644
index 84eee02b..00000000
--- a/temp.vtree
+++ /dev/null
@@ -1,17 +0,0 @@
-c ids of vtree nodes start at 0
-c ids of variables start at 1
-c vtree nodes appear bottom-up, children before parents
-c
-c file syntax:
-c vtree number-of-nodes-in-vtree
-c L id-of-leaf-vtree-node id-of-variable
-c I id-of-internal-vtree-node id-of-left-child id-of-right-child
-c
-vtree 7
-L 0 1
-L 1 2
-I 2 0 1
-L 3 3
-L 4 4
-I 5 3 4
-I 6 2 5

From 9d5ee03f961dda8b090ac3f837f83b7cae807a36 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Mon, 27 Jul 2020 01:46:49 -0700
Subject: [PATCH 036/131] use element notation on vtrees

---
 src/Probabilistic/structured_prob_nodes.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/Probabilistic/structured_prob_nodes.jl b/src/Probabilistic/structured_prob_nodes.jl
index 8b2e2a70..11fa2050 100644
--- a/src/Probabilistic/structured_prob_nodes.jl
+++ b/src/Probabilistic/structured_prob_nodes.jl
@@ -25,7 +25,7 @@ mutable struct StructProbLiteralNode <: StructProbLeafNode
     data
     counter::UInt32
     StructProbLiteralNode(l,v) = begin
-        @assert lit2var(l) ∈ variables(v) 
+        @assert lit2var(l) ∈ v 
         new(l, v, nothing, 0)
     end
 end

From fcc278d995ee48648bf119cecbd8e156f1c7c6cd Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 31 Jul 2020 18:09:44 -0700
Subject: [PATCH 037/131] logsumexp -> logaddexp

---
 src/Mixtures/todo/EMLearner.jl  |  2 +-
 src/Mixtures/todo/Mixtures.jl   |  4 ++--
 src/Probabilistic/exp_flows.jl  | 10 +++++-----
 src/Probabilistic/parameters.jl |  2 +-
 4 files changed, 9 insertions(+), 9 deletions(-)

diff --git a/src/Mixtures/todo/EMLearner.jl b/src/Mixtures/todo/EMLearner.jl
index 8ad45ce7..738379cc 100644
--- a/src/Mixtures/todo/EMLearner.jl
+++ b/src/Mixtures/todo/EMLearner.jl
@@ -117,7 +117,7 @@ end
 
 "Compute the component weights for each example from likelihoods"
 function component_weights_per_example(log_p_of_x_and_c)
-    log_p_of_x = logsumexp(log_p_of_x_and_c, 2) # marginalize out components
+    log_p_of_x = logaddexp(log_p_of_x_and_c, 2) # marginalize out components
     log_p_of_given_x_query_c = mapslices(col -> col .- log_p_of_x, log_p_of_x_and_c, dims=[1])
     p_of_given_x_query_c = exp.(log_p_of_given_x_query_c) # no more risk of underflow, so go to linear space
     @assert sum(p_of_given_x_query_c) ≈ size(log_p_of_x_and_c, 1) # each row has proability 1
diff --git a/src/Mixtures/todo/Mixtures.jl b/src/Mixtures/todo/Mixtures.jl
index 88d3498d..2337ccc9 100644
--- a/src/Mixtures/todo/Mixtures.jl
+++ b/src/Mixtures/todo/Mixtures.jl
@@ -119,7 +119,7 @@ end
 
 function log_likelihood_per_instance(mixture::FlatMixtureWithFlow, batch::PlainXData{Bool})::Vector{Float64}
     log_p_of_x_and_c = log_likelihood_per_instance_component(mixture, batch)
-    logsumexp(log_p_of_x_and_c, 2)
+    logaddexp(log_p_of_x_and_c, 2)
 end
 
 function log_likelihood_per_instance(mixture::MetaMixture, batches::XBatches{Bool})::Vector{Float64}
@@ -128,7 +128,7 @@ end
 
 function log_likelihood_per_instance(mixture::MetaMixture, batches::PlainXData{Bool})::Vector{Float64}
     log_p_of_x_and_c = log_likelihood_per_instance_component(mixture, batch)
-    logsumexp(log_p_of_x_and_c, 2)
+    logaddexp(log_p_of_x_and_c, 2)
 end
 
 # Log likelihoods per instance and component (including mixture weight likelihood)
diff --git a/src/Probabilistic/exp_flows.jl b/src/Probabilistic/exp_flows.jl
index 204a63c3..8049e52b 100644
--- a/src/Probabilistic/exp_flows.jl
+++ b/src/Probabilistic/exp_flows.jl
@@ -1,7 +1,7 @@
 export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
 
 
-using StatsFuns: logsumexp
+using StatsFuns: logaddexp
 
 # TODO move to LogicCircuits
 # TODO downflow struct
@@ -97,9 +97,9 @@ function evaluate_exp(root::ProbCircuit, data;
             log_thetas = n.log_thetas
             c1 = call(@inbounds children(n)[1])::ExpUpFlow
             c2 = call(@inbounds children(n)[2])::ExpUpFlow
-            x = flowop(c1, log_thetas[1], c2, log_thetas[2], logsumexp)
+            x = flowop(c1, log_thetas[1], c2, log_thetas[2], logaddexp)
             for (i, c) in enumerate(children(n)[3:end])
-                accumulate(x, call(c), log_thetas[i+2], logsumexp)
+                accumulate(x, call(c), log_thetas[i+2], logaddexp)
             end
             return x
         end
@@ -174,12 +174,12 @@ function compute_exp_flows(circuit::ProbCircuit, data)
                     for i = 1:2
                         downflow_c = downflow(@inbounds children(c)[i])
                         accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
-                        .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
+                        .+ upflow2_c.sub_flow .- upflow_n, logaddexp)
                     end
                 else
                     upflow1_c = (c.data::ExpUpDownFlow1).upflow
                     downflow_c = downflow(c)
-                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
+                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logaddexp)
                 end
             end 
         end
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index fe3887e6..055575cd 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -17,7 +17,7 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
                 @. pn.log_thetas = log((children_flows + uniform_pseudocount) / smoothed_flow)
                 @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
                 # normalize away any leftover error
-                pn.log_thetas .-= logsumexp(pn.log_thetas)
+                pn.log_thetas .-= logaddexp(pn.log_thetas)
             end
         end
     end

From 9b4b511c1b1a0060c15e0a63aa4ef28c09060180 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Mon, 3 Aug 2020 22:49:05 -0700
Subject: [PATCH 038/131] rm epsilon in log(0)

---
 src/Probabilistic/exp_flows.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/Probabilistic/exp_flows.jl b/src/Probabilistic/exp_flows.jl
index 204a63c3..b6847230 100644
--- a/src/Probabilistic/exp_flows.jl
+++ b/src/Probabilistic/exp_flows.jl
@@ -54,7 +54,7 @@ const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
 function evaluate_exp(root::ProbCircuit, data;
                    nload = nload, nsave = nsave, reset=true)::Vector{Float64}
     n_ex::Int = num_examples(data)
-    ϵ = 1e-300
+    ϵ = 0.0
 
     @inline f_lit(n) = begin
         uf = convert(Vector{Int8}, feature_values(data, variable(n)))

From 1ecd28a1ce0447ef59431dddbaf80249a8396870 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Mon, 3 Aug 2020 23:35:35 -0700
Subject: [PATCH 039/131] fix

---
 src/Probabilistic/exp_flows.jl | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/Probabilistic/exp_flows.jl b/src/Probabilistic/exp_flows.jl
index 189ed08b..5dea47a9 100644
--- a/src/Probabilistic/exp_flows.jl
+++ b/src/Probabilistic/exp_flows.jl
@@ -5,14 +5,14 @@ using StatsFuns: logaddexp
 
 # TODO move to LogicCircuits
 # TODO downflow struct
-using LogicCircuits: UpFlow, UpFlow1, UpDownFlow, UpDownFlow1, UpDownFlow2
+using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
 
 """
 Get upflow from logic circuit
 """
 @inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
 @inline get_upflow(elems::UpDownFlow1) = elems.upflow
-@inline get_upflow(elems::UpFlow) = UpFlow1(elems)
+@inline get_upflow(elems::UpFlow) = materialize(elems)
 
 """
 Get the node/edge flow from logic circuit

From d2fa8be171feb56ecc09330918865a3372e1cf7d Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Thu, 6 Aug 2020 03:06:32 -0700
Subject: [PATCH 040/131] revise queries

---
 src/LoadSave/circuit_line_compiler.jl |  2 +-
 src/Logistic/queries.jl               | 41 +++++++++++++++++++++---
 test/Logistic/logistic_tests.jl       | 29 -----------------
 test/Logistic/queries_tests.jl        | 46 +++++++++++++++++++++++++++
 4 files changed, 84 insertions(+), 34 deletions(-)
 delete mode 100644 test/Logistic/logistic_tests.jl
 create mode 100644 test/Logistic/queries_tests.jl

diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index a0d09d7e..02879f55 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -111,7 +111,7 @@ function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicCircui
 
     function compile(ln::BiasLine)
         root = id2logisticnode(ln.node_id)::Logistic⋁Node
-        # @assert length(node.thetas) == 1
+        # @assert length(root.thetas) == 1
         root.thetas[1,:] .= ln.weights
     end
 
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 7c80e625..ce9b09d5 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -1,10 +1,15 @@
-export class_conditional_likelihood_per_instance
+export class_conditional_likelihood_per_instance, accuracy, predict_class
+
+using LogicCircuits: UpDownFlow1, flow_and
 
-using ..Probabilistic: get_downflow, get_upflow
 """
 Class Conditional Probability
 """
-function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
+@inline function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
+    
+    @inline downflow(or_parent::Logistic⋁Node, c) = 
+        (c.data isa UpDownFlow1) ? c.data.downflow : flow_and(or_parent.data.downflow, c.data)
+    
     compute_flows(lc, data)
     likelihoods = zeros(num_examples(data), classes)
     foreach(lc) do ln
@@ -12,11 +17,39 @@ function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes
             # For each class. orig.thetas is 2D so used eachcol
             for (idx, thetaC) in enumerate(eachcol(ln.thetas))
                 foreach(children(ln), thetaC) do c, theta
-                    likelihoods[:, idx] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
+                    down_flow = Float64.(downflow(ln, c))
+                    @. likelihoods[:, idx] += down_flow * theta
                 end
             end
         end
     end
+    
+    @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
     likelihoods
 end
 
+"""
+Class Predictions
+"""
+@inline function predict_class(lc::LogisticCircuit, classes::Int, data)
+    class_likelihoods = class_conditional_likelihood_per_instance(lc, classes, data)
+    predict_class(class_likelihoods)
+end
+
+@inline function predict_class(class_likelihoods::AbstractMatrix)
+    _, mxindex = findmax(class_likelihoods; dims=2)
+    dropdims(getindex.(mxindex, 2); dims=2)
+end
+
+"""
+Prediction accuracy
+"""
+@inline accuracy(predicted_class::Vector, labels) = 
+    Float64(sum(@. predicted_class == labels)) / length(labels)
+
+@inline accuracy(lc::LogisticCircuit, classes::Int, data, labels) = 
+    accuracy(predict_class(lc, classes, data), labels)
+
+@inline accuracy(class_likelihoods::AbstractMatrix, labels) = 
+    accuracy(predict_class(class_likelihoods), labels)
+
diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
deleted file mode 100644
index 3461a064..00000000
--- a/test/Logistic/logistic_tests.jl
+++ /dev/null
@@ -1,29 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-# This tests are supposed to test queries on the circuits
-@testset "Logistic Circuit Class Conditional" begin
-    # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
-    # match with python version.
-
-    EPS = 1e-7;
-    logistic_circuit = zoo_lc("little_4var.circuit", 2);
-    @test logistic_circuit isa LogisticCircuit;
-
-    # Step 1. Check Probabilities for 3 samples
-    data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
-    
-    true_prob = [3.43147972 4.66740416; 
-                4.27595352 2.83503504;
-                3.67415087 4.93793472]
-            
-    CLASSES = 2
-    calc_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
-    
-    for i = 1:3
-        for j = 1:2
-            @test true_prob[i,j] ≈ calc_prob[i,j] atol= EPS;
-        end
-    end
-end
\ No newline at end of file
diff --git a/test/Logistic/queries_tests.jl b/test/Logistic/queries_tests.jl
new file mode 100644
index 00000000..76e1035f
--- /dev/null
+++ b/test/Logistic/queries_tests.jl
@@ -0,0 +1,46 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+# This tests are supposed to test queries on the circuits
+@testset "Logistic Circuit Class Conditional" begin
+    # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
+    # match with python version.
+    
+    CLASSES = 2
+
+    logistic_circuit = zoo_lc("little_4var.circuit", CLASSES)
+    @test logistic_circuit isa LogisticCircuit
+
+    # check probabilities for binary samples
+    data = @. Bool([0 0 0 0; 0 1 1 0; 0 0 1 1])
+    # true_weight_func = [3.43147972 4.66740416; 
+    #                     4.27595352 2.83503504;
+    #                     3.67415087 4.93793472]
+    true_prob = [0.96867400053 0.99069084464;
+                 0.98629173861 0.94453994990;
+                 0.97525681816 0.99288164437]
+            
+    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    for i = 1:3
+        for j = 1:2
+            @test true_prob[i,j] ≈ class_prob[i,j]
+        end
+    end
+
+    # check probabilities for float samples
+    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    for i = 1:3
+        for j = 1:2
+            @test true_prob[i,j] ≈ class_prob[i,j]
+        end
+    end
+
+    # check predicted_classes
+    true_labels = [2, 1, 2]
+    predicted_classes = predict_class(logistic_circuit, CLASSES, data)
+    @test all(@. predicted_classes == true_labels)
+    
+    # check accuracy
+    @test accuracy(logistic_circuit, CLASSES, data, true_labels) == 1.0
+end
\ No newline at end of file

From a8ea225bd9ab350ce4048fe6afe1f050acf3f92b Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Thu, 6 Aug 2020 03:26:12 -0700
Subject: [PATCH 041/131] retain old functions to mitigate errors

---
 src/Logistic/queries.jl            | 25 ++++++++++++++++++++++++-
 test/Reasoning/expectation_test.jl |  4 ++--
 2 files changed, 26 insertions(+), 3 deletions(-)

diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index ce9b09d5..7420c3f3 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -1,6 +1,29 @@
-export class_conditional_likelihood_per_instance, accuracy, predict_class
+export class_conditional_weights_per_instance, 
+       class_conditional_likelihood_per_instance, 
+       accuracy, predict_class
 
 using LogicCircuits: UpDownFlow1, flow_and
+using ..Probabilistic: get_downflow, get_upflow
+
+"""
+Class Conditional Weights
+"""
+# This is the old implementation. It is retained to pass the exptation tests.
+function class_conditional_weights_per_instance(lc::LogisticCircuit,  classes::Int, data)
+    compute_flows(lc, data)
+    likelihoods = zeros(num_examples(data), classes)
+    foreach(lc) do ln
+        if ln isa Logistic⋁Node
+            # For each class. orig.thetas is 2D so used eachcol
+            for (idx, thetaC) in enumerate(eachcol(ln.thetas))
+                foreach(children(ln), thetaC) do c, theta
+                    likelihoods[:, idx] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
+                end
+            end
+        end
+    end
+    likelihoods
+end
 
 """
 Class Conditional Probability
diff --git a/test/Reasoning/expectation_test.jl b/test/Reasoning/expectation_test.jl
index c8aafc50..9ad55b98 100644
--- a/test/Reasoning/expectation_test.jl
+++ b/test/Reasoning/expectation_test.jl
@@ -14,7 +14,7 @@ function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data
         calc_p = log_likelihood_per_instance(pc, cur_data_all)
         calc_p = exp.(calc_p)
 
-        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+        calc_f = class_conditional_weights_per_instance(lc, CLASSES, cur_data_all)
         true_exp[i, :] = sum(calc_p .* calc_f, dims=1)
         true_exp[i, :] ./= sum(calc_p) #p_observed
     end
@@ -47,7 +47,7 @@ function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLA
         calc_p = log_likelihood_per_instance(pc, cur_data_all)
         calc_p = exp.(calc_p)
 
-        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+        calc_f = class_conditional_weights_per_instance(lc, CLASSES, cur_data_all)
         true_mom[i, :] = sum(calc_p .* (calc_f .^ moment), dims=1)
         true_mom[i, :] ./= sum(calc_p) #p_observed
     end

From 4a974cbd6336bc20e7564900ac7c965de10cdf03 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 7 Aug 2020 05:44:56 -0700
Subject: [PATCH 042/131] [logistic circuits] parameter learning

---
 src/Logistic/Logistic.jl        |  1 +
 src/Logistic/parameters.jl      | 50 ++++++++++++++++++++
 src/Logistic/queries.jl         | 23 ++++++----
 test/Logistic/logistic_tests.jl | 81 +++++++++++++++++++++++++++++++++
 test/Logistic/queries_tests.jl  | 46 -------------------
 5 files changed, 145 insertions(+), 56 deletions(-)
 create mode 100644 src/Logistic/parameters.jl
 create mode 100644 test/Logistic/logistic_tests.jl
 delete mode 100644 test/Logistic/queries_tests.jl

diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index c657449f..b09f76d0 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -5,6 +5,7 @@ using ..Utils
 
 include("logistic_nodes.jl")
 include("queries.jl")
+include("parameters.jl")
 
 # TODO learning
 
diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
new file mode 100644
index 00000000..7756b8e1
--- /dev/null
+++ b/src/Logistic/parameters.jl
@@ -0,0 +1,50 @@
+export learn_parameters
+
+using LogicCircuits: compute_flows
+"""
+Maximum likilihood estimation of parameters given data through gradient descent
+"""
+function learn_parameters(lc::LogisticCircuit, classes::Int, data, labels; num_epochs=30, step_size=0.1, flows_computed=false)
+
+    @inline function one_hot(labels::Vector, classes::Int)        
+        one_hot_labels = zeros(length(labels), classes)
+        for (i, j) in enumerate(labels)
+            one_hot_labels[i, j] = 1.0
+        end
+        one_hot_labels
+    end
+
+    one_hot_labels = one_hot(labels, classes)
+    if !flows_computed
+        compute_flows(lc, data)
+    end
+
+    for _ = 1:num_epochs
+        class_probs = class_conditional_likelihood_per_instance(lc, classes, data; flows_computed=true)
+        update_parameters(lc, class_probs, one_hot_labels)
+    end
+
+    nothing
+end
+
+
+@inline function update_parameters(lc::LogisticCircuit, class_probs, one_hot_labels; step_size=0.1)
+    error = class_probs .- one_hot_labels
+
+    foreach(lc) do ln
+        if ln isa Logistic⋁Node
+            #TODO; check whether einsum would speed up calculations here
+            # For each class. orig.thetas is 2D so used eachcol
+            for (class, thetaC) in enumerate(eachcol(ln.thetas))
+                for (idx, c) in enumerate(children(ln))
+                    down_flow = Float64.(downflow(ln, c))
+                    thetaC[idx] -= step_size * sum(error[:, class] .* down_flow) / length(down_flow)
+                end
+            end
+        end
+    end
+    
+    nothing
+end
+
+
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 7420c3f3..7640a0fa 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -1,6 +1,6 @@
 export class_conditional_weights_per_instance, 
        class_conditional_likelihood_per_instance, 
-       accuracy, predict_class
+       downflow, accuracy, predict_class
 
 using LogicCircuits: UpDownFlow1, flow_and
 using ..Probabilistic: get_downflow, get_upflow
@@ -15,9 +15,9 @@ function class_conditional_weights_per_instance(lc::LogisticCircuit,  classes::I
     foreach(lc) do ln
         if ln isa Logistic⋁Node
             # For each class. orig.thetas is 2D so used eachcol
-            for (idx, thetaC) in enumerate(eachcol(ln.thetas))
+            for (class, thetaC) in enumerate(eachcol(ln.thetas))
                 foreach(children(ln), thetaC) do c, theta
-                    likelihoods[:, idx] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
+                    likelihoods[:, class] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
                 end
             end
         end
@@ -28,20 +28,20 @@ end
 """
 Class Conditional Probability
 """
-@inline function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
-    
-    @inline downflow(or_parent::Logistic⋁Node, c) = 
-        (c.data isa UpDownFlow1) ? c.data.downflow : flow_and(or_parent.data.downflow, c.data)
+@inline function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
+    if !flows_computed
+        compute_flows(lc, data)
+    end
     
-    compute_flows(lc, data)
     likelihoods = zeros(num_examples(data), classes)
+    #TODO; check whether einsum would speed up calculations here
     foreach(lc) do ln
         if ln isa Logistic⋁Node
             # For each class. orig.thetas is 2D so used eachcol
-            for (idx, thetaC) in enumerate(eachcol(ln.thetas))
+            for (class, thetaC) in enumerate(eachcol(ln.thetas))
                 foreach(children(ln), thetaC) do c, theta
                     down_flow = Float64.(downflow(ln, c))
-                    @. likelihoods[:, idx] += down_flow * theta
+                    @. likelihoods[:, class] += down_flow * theta
                 end
             end
         end
@@ -51,6 +51,9 @@ Class Conditional Probability
     likelihoods
 end
 
+@inline downflow(or_parent::Logistic⋁Node, c) = 
+    (c.data isa UpDownFlow1) ? c.data.downflow : flow_and(or_parent.data.downflow, c.data)
+
 """
 Class Predictions
 """
diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
new file mode 100644
index 00000000..5c83fb9a
--- /dev/null
+++ b/test/Logistic/logistic_tests.jl
@@ -0,0 +1,81 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+# This tests are supposed to test queries on the circuits
+@testset "Logistic Circuit Query and Parameter Tests" begin
+    # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
+    # match with python version.
+    
+    CLASSES = 2
+
+    logistic_circuit = zoo_lc("little_4var.circuit", CLASSES)
+    @test logistic_circuit isa LogisticCircuit
+
+    # check probabilities for binary samples
+    data = @. Bool([0 0 0 0; 0 1 1 0; 0 0 1 1])
+    # true_weight_func = [3.43147972 4.66740416; 
+    #                     4.27595352 2.83503504;
+    #                     3.67415087 4.93793472]
+    true_prob = [0.9686740004857587 0.9906908446064048;
+                 0.9862917386522077 0.9445399501015433;
+                 0.9752568180725943 0.9928816444023877]
+            
+    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    for i = 1:size(true_prob)[1]
+        for j = 1:CLASSES
+            @test true_prob[i,j] ≈ class_prob[i,j]
+        end
+    end
+
+    # check probabilities for float samples
+    data = Float64.(data)
+    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    for i = 1:size(true_prob)[1]
+        for j = 1:CLASSES
+            @test true_prob[i,j] ≈ class_prob[i,j]
+        end
+    end
+
+    # check predicted_classes
+    true_labels = [2, 1, 2]
+    predicted_classes = predict_class(logistic_circuit, CLASSES, data)
+    @test all(predicted_classes .== true_labels)
+    
+    # check accuracy
+    @test accuracy(logistic_circuit, CLASSES, data, true_labels) == 1.0
+
+    # check parameter updates
+    original_literal_parameters = Dict{Int, Vector{Float64}}()
+    foreach(logistic_circuit) do ln
+        if ln isa Logistic⋁Node
+            foreach(ln.children, eachrow(ln.thetas)) do c, theta
+                if c isa LogisticLiteral
+                    original_literal_parameters[c.literal] = copy(theta)
+                end
+            end
+        end
+    end
+    
+    one_hot_labels = [0.0 1.0;
+                      1.0 0.0;
+                      0.0 1.0]
+    true_error = true_prob .- one_hot_labels
+    step_size = 0.1
+    learn_parameters(logistic_circuit, CLASSES, data, true_labels; num_epochs=1, step_size=step_size, flows_computed=true)
+    
+    foreach(logistic_circuit) do ln
+        if ln isa Logistic⋁Node
+            foreach(ln.children, eachrow(ln.thetas)) do c, theta
+                if c isa LogisticLiteral
+                    for class = 1:CLASSES
+                        true_update_amount = -step_size * sum(c.data.upflow .* true_error[:, class]) / size(true_error)[1]
+                        updated_amount = theta[class] - original_literal_parameters[c.literal][class]
+                        @test updated_amount ≈ true_update_amount
+                    end
+                end
+            end
+        end
+    end
+
+end
\ No newline at end of file
diff --git a/test/Logistic/queries_tests.jl b/test/Logistic/queries_tests.jl
deleted file mode 100644
index 76e1035f..00000000
--- a/test/Logistic/queries_tests.jl
+++ /dev/null
@@ -1,46 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-# This tests are supposed to test queries on the circuits
-@testset "Logistic Circuit Class Conditional" begin
-    # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
-    # match with python version.
-    
-    CLASSES = 2
-
-    logistic_circuit = zoo_lc("little_4var.circuit", CLASSES)
-    @test logistic_circuit isa LogisticCircuit
-
-    # check probabilities for binary samples
-    data = @. Bool([0 0 0 0; 0 1 1 0; 0 0 1 1])
-    # true_weight_func = [3.43147972 4.66740416; 
-    #                     4.27595352 2.83503504;
-    #                     3.67415087 4.93793472]
-    true_prob = [0.96867400053 0.99069084464;
-                 0.98629173861 0.94453994990;
-                 0.97525681816 0.99288164437]
-            
-    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
-    for i = 1:3
-        for j = 1:2
-            @test true_prob[i,j] ≈ class_prob[i,j]
-        end
-    end
-
-    # check probabilities for float samples
-    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
-    for i = 1:3
-        for j = 1:2
-            @test true_prob[i,j] ≈ class_prob[i,j]
-        end
-    end
-
-    # check predicted_classes
-    true_labels = [2, 1, 2]
-    predicted_classes = predict_class(logistic_circuit, CLASSES, data)
-    @test all(@. predicted_classes == true_labels)
-    
-    # check accuracy
-    @test accuracy(logistic_circuit, CLASSES, data, true_labels) == 1.0
-end
\ No newline at end of file

From 159b5d9c1d7274991e7009c16133900560fbd082 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 7 Aug 2020 18:06:45 -0700
Subject: [PATCH 043/131] [logistic circuits] speed up queries

---
 Project.toml            |  4 ++++
 src/Logistic/queries.jl | 40 ++++++++++++++++++----------------------
 2 files changed, 22 insertions(+), 22 deletions(-)

diff --git a/Project.toml b/Project.toml
index cc639b0c..3e0ef01a 100644
--- a/Project.toml
+++ b/Project.toml
@@ -19,6 +19,8 @@ SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf"
 Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2"
 StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91"
 StatsFuns = "4c63d2b9-4356-54db-8cca-17b64c39e42c"
+LoopVectorization = "bdcacae8-1622-11e9-2a5c-532679323890"
+MLDatasets = "eb30cadb-4394-5ae3-aed4-317e484a6458"
 
 [compat]
 BlossomV = "0.4"
@@ -32,4 +34,6 @@ Reexport = "0.2"
 SimpleWeightedGraphs = "1.1"
 StatsBase = "0.33"
 StatsFuns = "0.9"
+LoopVectorization = "0.8.20"
+MLDatasets = "0.4, 0.5"
 julia = "1.5"
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 7640a0fa..aa4a7981 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -2,23 +2,25 @@ export class_conditional_weights_per_instance,
        class_conditional_likelihood_per_instance, 
        downflow, accuracy, predict_class
 
-using LogicCircuits: UpDownFlow1, flow_and
+using LogicCircuits: UpDownFlow1, flow_and, or_nodes
 using ..Probabilistic: get_downflow, get_upflow
+using LoopVectorization: @avx
 
 """
 Class Conditional Weights
 """
 # This is the old implementation. It is retained to pass the exptation tests.
-function class_conditional_weights_per_instance(lc::LogisticCircuit,  classes::Int, data)
-    compute_flows(lc, data)
+function class_conditional_weights_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
+    if !flows_computed
+        compute_flows(lc, data)
+    end
+
     likelihoods = zeros(num_examples(data), classes)
-    foreach(lc) do ln
-        if ln isa Logistic⋁Node
-            # For each class. orig.thetas is 2D so used eachcol
-            for (class, thetaC) in enumerate(eachcol(ln.thetas))
-                foreach(children(ln), thetaC) do c, theta
-                    likelihoods[:, class] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
-                end
+    foreach(or_nodes(lc)) do ln
+        # For each class. orig.thetas is 2D so used eachcol
+        for (class, thetaC) in enumerate(eachcol(ln.thetas))
+            foreach(children(ln), thetaC) do c, theta
+                likelihoods[:, class] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
             end
         end
     end
@@ -34,20 +36,14 @@ Class Conditional Probability
     end
     
     likelihoods = zeros(num_examples(data), classes)
-    #TODO; check whether einsum would speed up calculations here
-    foreach(lc) do ln
-        if ln isa Logistic⋁Node
-            # For each class. orig.thetas is 2D so used eachcol
-            for (class, thetaC) in enumerate(eachcol(ln.thetas))
-                foreach(children(ln), thetaC) do c, theta
-                    down_flow = Float64.(downflow(ln, c))
-                    @. likelihoods[:, class] += down_flow * theta
-                end
-            end
-        end
+    foreach(or_nodes(lc)) do ln
+        foreach(eachrow(ln.thetas), children(ln)) do theta, c
+            flow = Float64.(downflow(ln, c))
+            @avx @. likelihoods +=  flow * theta'
+        end        
     end
     
-    @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
+    @avx @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
     likelihoods
 end
 

From 3354c76ff85815515a18836481b6b88914d403bc Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 7 Aug 2020 18:12:27 -0700
Subject: [PATCH 044/131] [logistic circuits] speed up queries

---
 src/Logistic/queries.jl | 9 ++++-----
 1 file changed, 4 insertions(+), 5 deletions(-)

diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index aa4a7981..1e60b16d 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -17,13 +17,12 @@ function class_conditional_weights_per_instance(lc::LogisticCircuit,  classes::I
 
     likelihoods = zeros(num_examples(data), classes)
     foreach(or_nodes(lc)) do ln
-        # For each class. orig.thetas is 2D so used eachcol
-        for (class, thetaC) in enumerate(eachcol(ln.thetas))
-            foreach(children(ln), thetaC) do c, theta
-                likelihoods[:, class] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
-            end
+        foreach(eachrow(ln.thetas), children(ln)) do theta, c
+            flow = Float64.(get_downflow(ln) .& get_upflow(c))
+            @avx @. likelihoods += flow * theta'
         end
     end
+    
     likelihoods
 end
 

From 25e046c0dedc5208395e2468f18d8f691a70c4c6 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 7 Aug 2020 19:50:03 -0700
Subject: [PATCH 045/131] [logistic circuits] speed up parameter learning

---
 src/Logistic/parameters.jl | 23 +++++++++++------------
 1 file changed, 11 insertions(+), 12 deletions(-)

diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
index 7756b8e1..329b90f5 100644
--- a/src/Logistic/parameters.jl
+++ b/src/Logistic/parameters.jl
@@ -1,6 +1,8 @@
 export learn_parameters
 
-using LogicCircuits: compute_flows
+using LogicCircuits: compute_flows, or_nodes
+using LoopVectorization: @avx
+
 """
 Maximum likilihood estimation of parameters given data through gradient descent
 """
@@ -29,18 +31,15 @@ end
 
 
 @inline function update_parameters(lc::LogisticCircuit, class_probs, one_hot_labels; step_size=0.1)
+    num_samples = Float64(size(one_hot_labels)[1])
     error = class_probs .- one_hot_labels
-
-    foreach(lc) do ln
-        if ln isa Logistic⋁Node
-            #TODO; check whether einsum would speed up calculations here
-            # For each class. orig.thetas is 2D so used eachcol
-            for (class, thetaC) in enumerate(eachcol(ln.thetas))
-                for (idx, c) in enumerate(children(ln))
-                    down_flow = Float64.(downflow(ln, c))
-                    thetaC[idx] -= step_size * sum(error[:, class] .* down_flow) / length(down_flow)
-                end
-            end
+    
+    foreach(or_nodes(lc)) do ln
+        foreach(eachrow(ln.thetas), children(ln)) do theta, c
+            flow = Float64.(downflow(ln, c))
+            @avx update_amount = flow' * error / num_samples * step_size
+            update_amount = dropdims(update_amount; dims=1)
+            @avx @. theta -= update_amount
         end
     end
     

From 0e94776f8ed7656daf2e75bc237b8aadb2c5db06 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Wed, 12 Aug 2020 13:17:25 -0700
Subject: [PATCH 046/131] [wip] renaming; some speed benchmark test results

---
 src/Logistic/logistic_nodes.jl     |  4 +-
 src/Logistic/parameters.jl         |  2 +-
 src/Logistic/queries.jl            | 94 ++++++++++++++++++++++--------
 test/Logistic/logistic_tests.jl    | 15 ++---
 test/Reasoning/expectation_test.jl |  4 +-
 5 files changed, 83 insertions(+), 36 deletions(-)

diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index 950dd8c8..632867d8 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -54,11 +54,11 @@ A logistic disjunction node (Or node)
 """
 mutable struct Logistic⋁Node <: LogisticInnerNode
     children::Vector{<:LogisticCircuit}
-    thetas::Array{Float64, 2}
+    thetas::Array{Float32, 2}
     data
     counter::UInt32
     Logistic⋁Node(children, class::Int) = begin
-        new(convert(Vector{LogisticCircuit}, children), init_array(Float64, length(children), class), nothing, 0)
+        new(convert(Vector{LogisticCircuit}, children), init_array(Float32, length(children), class), nothing, 0)
     end
 end
 
diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
index 329b90f5..1bb8219c 100644
--- a/src/Logistic/parameters.jl
+++ b/src/Logistic/parameters.jl
@@ -22,7 +22,7 @@ function learn_parameters(lc::LogisticCircuit, classes::Int, data, labels; num_e
     end
 
     for _ = 1:num_epochs
-        class_probs = class_conditional_likelihood_per_instance(lc, classes, data; flows_computed=true)
+        class_probs = class_likelihood_per_instance(lc, classes, data; flows_computed=true)
         update_parameters(lc, class_probs, one_hot_labels)
     end
 
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 1e60b16d..f4324637 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -1,59 +1,105 @@
-export class_conditional_weights_per_instance, 
-       class_conditional_likelihood_per_instance, 
-       downflow, accuracy, predict_class
+export class_weights_per_instance, class_likelihood_per_instance, downflow, accuracy, predict_class, 
+    do_nothing_test, access_flow_test, dummy_calculation_test, dummy_calculation_test2
 
-using LogicCircuits: UpDownFlow1, flow_and, or_nodes
+using LogicCircuits: UpDownFlow1, UpDownFlow2, or_nodes
 using ..Probabilistic: get_downflow, get_upflow
-using LoopVectorization: @avx
+using LoopVectorization: @avx, vifelse
+
 
 """
-Class Conditional Weights
+Class Conditional Probability
 """
-# This is the old implementation. It is retained to pass the exptation tests.
-function class_conditional_weights_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
+# with flows computed (2.03 s (80704 allocations: 3.32 MiB))
+# 5.136 s (275778 allocations: 6.99 GiB) on mnist.circuit
+@inline function class_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
     if !flows_computed
         compute_flows(lc, data)
     end
+    
+    weights = class_weights_per_instance(lc, classes, data; flows_computed=true)
+    @avx @. 1.0 / (1.0 + exp(-weights))
+end
 
-    likelihoods = zeros(num_examples(data), classes)
+@inline function class_weights_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
+    if !flows_computed
+        compute_flows(lc, data)
+    end
+    
+    weights = zeros(num_examples(data), classes)
     foreach(or_nodes(lc)) do ln
         foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            flow = Float64.(get_downflow(ln) .& get_upflow(c))
-            @avx @. likelihoods += flow * theta'
-        end
+            flow = Float32.(downflow(ln, c))
+            @avx @. weights +=  flow * theta'
+        end        
     end
     
+    weights
+end
+
+# 5.795 ms (72350 allocations: 6.58 MiB)
+@inline function do_nothing_test(lc::LogisticCircuit,  classes::Int, data)
+    likelihoods = zeros(num_examples(data), classes)
+    foreach(or_nodes(lc)) do ln
+        foreach(eachrow(ln.thetas), children(ln)) do theta, c
+            nothing
+        end        
+    end
+    @avx @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
     likelihoods
 end
 
-"""
-Class Conditional Probability
-"""
-@inline function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
-    if !flows_computed
-        compute_flows(lc, data)
+# 1.574 s (193840 allocations: 6.98 GiB)
+@inline function access_flow_test(lc::LogisticCircuit,  classes::Int, data)
+    foreach(or_nodes(lc)) do ln
+        foreach(eachrow(ln.thetas), children(ln)) do theta, c
+            flow = Float32.(downflow(ln, c)) 
+        end        
     end
-    
+    nothing
+end
+
+# 2.943 s (82272 allocations: 6.74 MiB)
+@inline function dummy_calculation_test(lc::LogisticCircuit,  classes::Int, data)
     likelihoods = zeros(num_examples(data), classes)
     foreach(or_nodes(lc)) do ln
         foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            flow = Float64.(downflow(ln, c))
-            @avx @. likelihoods +=  flow * theta'
+            @avx @. likelihoods += likelihoods
+        end        
+    end
+    @avx @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
+    likelihoods
+end
+
+# 4.790 s (193843 allocations: 6.99 GiB)
+@inline function dummy_calculation_test2(lc::LogisticCircuit,  classes::Int, data)
+    likelihoods = zeros(num_examples(data), classes)
+    foreach(or_nodes(lc)) do ln
+        foreach(eachrow(ln.thetas), children(ln)) do theta, c
+            flow = Float32.(downflow(ln, c))
+            @avx @. likelihoods += likelihoods
         end        
     end
-    
     @avx @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
     likelihoods
 end
 
 @inline downflow(or_parent::Logistic⋁Node, c) = 
-    (c.data isa UpDownFlow1) ? c.data.downflow : flow_and(or_parent.data.downflow, c.data)
+    (c.data isa UpDownFlow1) ? c.data.downflow : flow_and(or_parent.data.downflow, c.data, or_parent.data.upflow)
+
+@inline flow_and(downflow_n::BitVector, c_flow::UpDownFlow2, upflow_n::BitVector) = 
+    @. downflow_n & c_flow.prime_flow & c_flow.sub_flow
+
+@inline flow_and(downflow_n::Vector{<:AbstractFloat}, c_flow::UpDownFlow2, upflow_n::Vector{<:AbstractFloat}) = 
+    @avx @. downflow_n * c_flow.prime_flow * make_finite(c_flow.sub_flow/upflow_n)
+
+@inline make_finite(x::T) where T = vifelse(isfinite(x), x, zero(T))
+
 
 """
 Class Predictions
 """
 @inline function predict_class(lc::LogisticCircuit, classes::Int, data)
-    class_likelihoods = class_conditional_likelihood_per_instance(lc, classes, data)
+    class_likelihoods = class_likelihood_per_instance(lc, classes, data)
     predict_class(class_likelihoods)
 end
 
diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
index 5c83fb9a..a58ddc76 100644
--- a/test/Logistic/logistic_tests.jl
+++ b/test/Logistic/logistic_tests.jl
@@ -17,11 +17,11 @@ using ProbabilisticCircuits
     # true_weight_func = [3.43147972 4.66740416; 
     #                     4.27595352 2.83503504;
     #                     3.67415087 4.93793472]
-    true_prob = [0.9686740004857587 0.9906908446064048;
-                 0.9862917386522077 0.9445399501015433;
-                 0.9752568180725943 0.9928816444023877]
+    true_prob = [0.9686740008311808 0.9906908445371728;
+                 0.9862917392724188 0.9445399509069984; 
+                 0.9752568185086389 0.9928816444223209]
             
-    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    class_prob = class_likelihood_per_instance(logistic_circuit, CLASSES, data)
     for i = 1:size(true_prob)[1]
         for j = 1:CLASSES
             @test true_prob[i,j] ≈ class_prob[i,j]
@@ -29,8 +29,8 @@ using ProbabilisticCircuits
     end
 
     # check probabilities for float samples
-    data = Float64.(data)
-    class_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    data = Float32.(data)
+    class_prob = class_likelihood_per_instance(logistic_circuit, CLASSES, data)
     for i = 1:size(true_prob)[1]
         for j = 1:CLASSES
             @test true_prob[i,j] ≈ class_prob[i,j]
@@ -60,6 +60,7 @@ using ProbabilisticCircuits
     one_hot_labels = [0.0 1.0;
                       1.0 0.0;
                       0.0 1.0]
+    one_hot_labels = Float32.(one_hot_labels)
     true_error = true_prob .- one_hot_labels
     step_size = 0.1
     learn_parameters(logistic_circuit, CLASSES, data, true_labels; num_epochs=1, step_size=step_size, flows_computed=true)
@@ -71,7 +72,7 @@ using ProbabilisticCircuits
                     for class = 1:CLASSES
                         true_update_amount = -step_size * sum(c.data.upflow .* true_error[:, class]) / size(true_error)[1]
                         updated_amount = theta[class] - original_literal_parameters[c.literal][class]
-                        @test updated_amount ≈ true_update_amount
+                        @test updated_amount ≈ true_update_amount atol=1e-7
                     end
                 end
             end
diff --git a/test/Reasoning/expectation_test.jl b/test/Reasoning/expectation_test.jl
index 9ad55b98..4f886b74 100644
--- a/test/Reasoning/expectation_test.jl
+++ b/test/Reasoning/expectation_test.jl
@@ -14,7 +14,7 @@ function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data
         calc_p = log_likelihood_per_instance(pc, cur_data_all)
         calc_p = exp.(calc_p)
 
-        calc_f = class_conditional_weights_per_instance(lc, CLASSES, cur_data_all)
+        calc_f = class_weights_per_instance(lc, CLASSES, cur_data_all)
         true_exp[i, :] = sum(calc_p .* calc_f, dims=1)
         true_exp[i, :] ./= sum(calc_p) #p_observed
     end
@@ -47,7 +47,7 @@ function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLA
         calc_p = log_likelihood_per_instance(pc, cur_data_all)
         calc_p = exp.(calc_p)
 
-        calc_f = class_conditional_weights_per_instance(lc, CLASSES, cur_data_all)
+        calc_f = class_weights_per_instance(lc, CLASSES, cur_data_all)
         true_mom[i, :] = sum(calc_p .* (calc_f .^ moment), dims=1)
         true_mom[i, :] ./= sum(calc_p) #p_observed
     end

From 2f287c4d97573b731a12b4835598afa84fcf3df3 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sat, 15 Aug 2020 17:36:36 -0700
Subject: [PATCH 047/131] clt init

---
 src/Probabilistic/exp_flows.jl                |  10 +-
 src/Probabilistic/informations.jl             |   4 +-
 src/Probabilistic/parameters.jl               |  22 +-
 src/Probabilistic/queries.jl                  |  20 +-
 src/ProbabilisticCircuits.jl                  |   5 +-
 src/StructureLearner/CircuitBuilder.jl        | 133 ---------
 src/StructureLearner/PSDDInitializer.jl       | 275 ------------------
 src/StructureLearner/StructureLearner.jl      |  17 +-
 .../{ChowLiuTree.jl => chow_liu_tree.jl}      |  18 +-
 src/StructureLearner/init.jl                  | 167 +++++++++++
 src/Utils/Utils.jl                            |   2 +-
 src/Utils/informations.jl                     |  17 +-
 test/StructureLearner/CircuitBuilderTest.jl   |  24 --
 ...wLiuTreeTest.jl => chow_liu_tree_tests.jl} |   3 +-
 .../{PSDDInitializerTest.jl => init_tests.jl} |  17 +-
 test/runtests.jl                              |   2 +-
 16 files changed, 233 insertions(+), 503 deletions(-)
 delete mode 100644 src/StructureLearner/CircuitBuilder.jl
 delete mode 100644 src/StructureLearner/PSDDInitializer.jl
 rename src/StructureLearner/{ChowLiuTree.jl => chow_liu_tree.jl} (84%)
 create mode 100644 src/StructureLearner/init.jl
 delete mode 100644 test/StructureLearner/CircuitBuilderTest.jl
 rename test/StructureLearner/{ChowLiuTreeTest.jl => chow_liu_tree_tests.jl} (87%)
 rename test/StructureLearner/{PSDDInitializerTest.jl => init_tests.jl} (52%)

diff --git a/src/Probabilistic/exp_flows.jl b/src/Probabilistic/exp_flows.jl
index 5dea47a9..5dc4eac6 100644
--- a/src/Probabilistic/exp_flows.jl
+++ b/src/Probabilistic/exp_flows.jl
@@ -1,7 +1,7 @@
 export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
 
 
-using StatsFuns: logaddexp
+using StatsFuns: logsumexp
 
 # TODO move to LogicCircuits
 # TODO downflow struct
@@ -97,9 +97,9 @@ function evaluate_exp(root::ProbCircuit, data;
             log_thetas = n.log_thetas
             c1 = call(@inbounds children(n)[1])::ExpUpFlow
             c2 = call(@inbounds children(n)[2])::ExpUpFlow
-            x = flowop(c1, log_thetas[1], c2, log_thetas[2], logaddexp)
+            x = flowop(c1, log_thetas[1], c2, log_thetas[2], logsumexp)
             for (i, c) in enumerate(children(n)[3:end])
-                accumulate(x, call(c), log_thetas[i+2], logaddexp)
+                accumulate(x, call(c), log_thetas[i+2], logsumexp)
             end
             return x
         end
@@ -174,12 +174,12 @@ function compute_exp_flows(circuit::ProbCircuit, data)
                     for i = 1:2
                         downflow_c = downflow(@inbounds children(c)[i])
                         accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
-                        .+ upflow2_c.sub_flow .- upflow_n, logaddexp)
+                        .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
                     end
                 else
                     upflow1_c = (c.data::ExpUpDownFlow1).upflow
                     downflow_c = downflow(c)
-                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logaddexp)
+                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
                 end
             end 
         end
diff --git a/src/Probabilistic/informations.jl b/src/Probabilistic/informations.jl
index d3208ad2..bc6e14c9 100644
--- a/src/Probabilistic/informations.jl
+++ b/src/Probabilistic/informations.jl
@@ -1,4 +1,4 @@
-export pr_constraint, kl_divergence, entropy
+export pr_constraint, kl_divergence
 
 const StrutCircuit = Union{ProbCircuit, StructLogicCircuit}
 const KLDCache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}
@@ -66,6 +66,8 @@ end
 """"
 Calculate entropy of the distribution of the input psdd."
 """
+
+import ..Utils: entropy
 function entropy(psdd_node::StructProb⋁Node, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 055575cd..87186cfa 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -1,4 +1,5 @@
-export estimate_parameters
+export estimate_parameters, uniform_parameters
+using StatsFuns: logsumexp
 
 """
 Maximum likilihood estimation of parameters given data
@@ -7,7 +8,7 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data)
     compute_flows(pc, data)
     foreach(pc) do pn
-        if pn isa Prob⋁Node
+        if is⋁gate(pn)
             if num_children(pn) == 1
                 pn.log_thetas .= 0.0
             else
@@ -17,11 +18,26 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
                 @. pn.log_thetas = log((children_flows + uniform_pseudocount) / smoothed_flow)
                 @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
                 # normalize away any leftover error
-                pn.log_thetas .-= logaddexp(pn.log_thetas)
+                pn.log_thetas .-= logsumexp(pn.log_thetas)
             end
         end
     end
 end
 
 
+"""
+Uniform distribution
+"""
+function uniform_parameters(pc::ProbCircuit)
+    foreach(pc) do pn
+        if is⋁gate(pn)
+            if num_children(pn) == 1
+                pn.log_thetas .= 0.0
+            else
+                pn.log_thetas .= log.(ones(Float64, num_children(pn)) ./ num_children(pn))
+            end
+        end
+    end
+end
+
 # TODO add em paramaters learning 
\ No newline at end of file
diff --git a/src/Probabilistic/queries.jl b/src/Probabilistic/queries.jl
index 77650b3a..917e9fc7 100644
--- a/src/Probabilistic/queries.jl
+++ b/src/Probabilistic/queries.jl
@@ -12,7 +12,7 @@ function log_likelihood_per_instance(pc::ProbCircuit, data)
     indices = init_array(Bool, num_examples(data))::BitVector
     
     ll(n::ProbCircuit) = ()
-    ll(n::Prob⋁Node) = begin
+    ll(n::Union{Prob⋁Node, StructProb⋁Node}) = begin
         if num_children(n) != 1 # other nodes have no effect on likelihood
             foreach(children(n), n.log_thetas) do c, log_theta
                 indices = get_downflow(n, c)
@@ -50,7 +50,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
     ans = falses(num_examples(evidence), num_features(evidence))
     active_samples = trues(num_examples(evidence))
 
-    function mpe_simulate(node::ProbLiteralNode, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{ProbLiteralNode, StructProbLiteralNode}, active_samples::BitVector, result::BitMatrix)
         if ispositive(node)
             result[active_samples, variable(node)] .= 1
         else
@@ -58,7 +58,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
         end
     end
     
-    function mpe_simulate(node::Prob⋁Node, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{Prob⋁Node, StructProb⋁Node}, active_samples::BitVector, result::BitMatrix)
         prs = zeros(length(children(node)), size(active_samples)[1] )
         @simd  for i=1:length(children(node))
             prs[i,:] .= get_exp_upflow(children(node)[i]) .+ (node.log_thetas[i])
@@ -72,7 +72,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
         end
     end
     
-    function mpe_simulate(node::Prob⋀Node, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{Prob⋀Node, StructProb⋀Node}, active_samples::BitVector, result::BitMatrix)
         for child in children(node)
             mpe_simulate(child, active_samples, result)
         end
@@ -92,16 +92,16 @@ Sample from a PSDD without any evidence
 """
 function sample(circuit::ProbCircuit)::AbstractVector{Bool}
 
-    simulate(node::ProbLiteralNode) = begin
+    simulate(node::Union{ProbLiteralNode, StructProbLiteralNode}) = begin
         inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
-    simulate(node::Prob⋁Node) = begin
+    simulate(node::Union{Prob⋁Node, StructProb⋁Node}) = begin
         idx = sample(exp.(node.log_thetas))
         simulate(children(node)[idx])
     end
 
-    simulate(node::Prob⋀Node) = foreach(simulate, children(node))
+    simulate(node::Union{Prob⋀Node, StructProb⋀Node}) = foreach(simulate, children(node))
 
     inst = Dict{Var,Int64}()
     simulate(circuit)
@@ -121,17 +121,17 @@ function sample(circuit::ProbCircuit, evidence)::AbstractVector{Bool}
 
     @assert num_examples(evidence) == 1 "evidence have to be one example"
     
-    simulate(node::ProbLiteralNode) = begin
+    simulate(node::Union{ProbLiteralNode, StructProbLiteralNode}) = begin
         inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
-    function simulate(node::Prob⋁Node)
+    function simulate(node::Union{Prob⋁Node, StructProb⋁Node})
         prs = [get_exp_upflow(ch)[1] for ch in children(node)] # #evidence == 1
         idx = sample(exp.(node.log_thetas .+ prs))
         simulate(children(node)[idx])
     end
     
-    simulate(node::Prob⋀Node) = foreach(simulate, children(node))
+    simulate(node::Union{Prob⋀Node, StructProb⋀Node}) = foreach(simulate, children(node))
 
     evaluate_exp(circuit, evidence)
 
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 6f62186d..e9ec78e3 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -16,8 +16,7 @@ include("Probabilistic/Probabilistic.jl")
 include("Logistic/Logistic.jl")
 include("LoadSave/LoadSave.jl")
 include("Reasoning/Reasoning.jl")
-
-# include("StructureLearner/StructureLearner.jl")
+include("StructureLearner/StructureLearner.jl")
 
 
 # USE CHILD MODULES (in order to re-export some functions)
@@ -25,6 +24,6 @@ include("Reasoning/Reasoning.jl")
 @reexport using .Logistic
 @reexport using .LoadSave
 @reexport using .Reasoning
-# @reexport using .StructureLearner
+@reexport using .StructureLearner
 
 end
diff --git a/src/StructureLearner/CircuitBuilder.jl b/src/StructureLearner/CircuitBuilder.jl
deleted file mode 100644
index fe73532b..00000000
--- a/src/StructureLearner/CircuitBuilder.jl
+++ /dev/null
@@ -1,133 +0,0 @@
-using LightGraphs: topological_sort_by_dfs, outneighbors
-using MetaGraphs: get_prop
-
-
-"convert literal+/- to probability value 0/1"
-@inline lit2value(l::Lit)::Int = (l > 0 ? 1 : 0)
-
-"""
-Learning from data a circuit with several structure learning algorithms
-"""
-function learn_probabilistic_circuit(data::Union{XData, WXData}; 
-        pseudocount = 1.0, algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"))::ProbCircuit
-    if algo == "chow-liu"
-        clt = learn_chow_liu_tree(data; algo_kwargs...)
-        pc = compile_prob_circuit_from_clt(clt)
-        estimate_parameters(pc, convert(XBatches,data); pseudocount = pseudocount)
-        pc 
-    else
-        error("Cannot learn a probabilistic circuit with algorithm $algo")
-    end
-end
-
-"Build decomposable probability circuits from Chow-Liu tree"
-function compile_prob_circuit_from_clt(clt::CLT)::ProbCircuit
-    topo_order = Var.(reverse(topological_sort_by_dfs(clt::CLT))) #order to parse the node
-    lin = Vector{ProbCircuit}()
-    node_cache = Dict{Lit, LogicCircuit}()
-    prob_cache = ProbCache()
-    parent = parent_vector(clt)
-
-    prob_children(n)::Vector{<:ProbCircuit{<:node_type_deprecated(n)}} =  
-        collect(ProbCircuit{<:node_type_deprecated(n)}, map(c -> prob_cache[c], children(n)))
-
-    "default order of circuit node, from left to right: +/1 -/0"
-
-    "compile leaf node into circuits"
-    function compile_leaf(ln::Var)
-        pos = LiteralNode( var2lit(ln))
-        neg = LiteralNode(-var2lit(ln))
-        node_cache[var2lit(ln)] = pos
-        node_cache[-var2lit(ln)] = neg
-        pos2 = ProbLiteral(pos)
-        neg2 = ProbLiteral(neg)
-        push!(lin, pos2)
-        push!(lin, neg2)
-        prob_cache[pos] = pos2
-        prob_cache[neg] = neg2
-    end
-
-    "compile inner disjunction node"
-    function compile_⋁inner(ln::Lit, children::Vector{Var})::Vector{Plain⋁Node}
-        logical_nodes = Vector{Plain⋁Node}()
-        v = lit2value(ln)
-
-        for c in children
-            #build logical ciruits
-            temp = Plain⋁Node([node_cache[lit] for lit in [var2lit(c), - var2lit(c)]])
-            push!(logical_nodes, temp)
-            n = Prob⋁(temp, prob_children(temp))
-            prob_cache[temp] = n
-            n.log_thetas = zeros(Float64, 2)
-            cpt = get_prop(clt, c, :cpt)
-            weights = [cpt[(1, v)], cpt[(0, v)]]
-            n.log_thetas = log.(weights)
-            push!(lin, n)
-        end
-
-        return logical_nodes
-    end
-
-    "compile inner conjunction node into circuits, left node is indicator, rest nodes are disjunction children nodes"
-    function compile_⋀inner(indicator::Lit, children::Vector{Plain⋁Node})
-        leaf = node_cache[indicator]
-        temp = Plain⋀Node(vcat([leaf], children))
-        node_cache[indicator] = temp
-        n = Prob⋀(temp, prob_children(temp))
-        prob_cache[temp] = n
-        push!(lin, n)
-    end
-
-    "compile inner node, 1 inner variable to 2 leaf nodes, 2 * num_children disjunction nodes and 2 conjunction nodes"
-    function compile_inner(ln::Var, children::Vector{Var})
-        compile_leaf(ln)
-        pos⋁ = compile_⋁inner(var2lit(ln), children)
-        neg⋁ = compile_⋁inner(-var2lit(ln), children)
-        compile_⋀inner(var2lit(ln), pos⋁)
-        compile_⋀inner(-var2lit(ln), neg⋁)
-    end
-
-    "compile root, add another disjunction node"
-    function compile_root(root::Var)
-        temp = Plain⋁Node([node_cache[s] for s in [var2lit(root), -var2lit(root)]])
-        n = Prob⋁(temp, prob_children(temp))
-        prob_cache[temp] = n
-        n.log_thetas = zeros(Float64, 2)
-        cpt = get_prop(clt, root, :cpt)
-        weights = [cpt[1], cpt[0]]
-        n.log_thetas = log.(weights)
-        push!(lin, n)
-        return n
-    end
-
-    function compile_independent_roots(roots::Vector{ProbCircuit})
-        temp = Plain⋀Node([c.origin for c in roots])
-        n = Prob⋀(temp, prob_children(temp))
-        prob_cache[temp] = n
-        push!(lin, n)
-        temp = Plain⋁Node([temp])
-        n = Prob⋁{LogicCircuit}(temp, prob_children(temp))
-        prob_cache[temp] = n
-        n.log_thetas = [0.0]
-        push!(lin, n)
-    end
-
-    roots = Vector{ProbCircuit}()
-    for id in topo_order
-        children = Var.(outneighbors(clt, id))
-        if isequal(children, [])
-            compile_leaf(id)
-        else
-            compile_inner(id, children)
-        end
-        if 0 == parent[id]
-            push!(roots, compile_root(id))
-        end
-    end
-
-    if length(roots) > 1
-        compile_independent_roots(roots)
-    end
-
-    return lin
-end
diff --git a/src/StructureLearner/PSDDInitializer.jl b/src/StructureLearner/PSDDInitializer.jl
deleted file mode 100644
index 7a086875..00000000
--- a/src/StructureLearner/PSDDInitializer.jl
+++ /dev/null
@@ -1,275 +0,0 @@
-using ..Utils
-
-"Map from literal to LogicCircuit"
-const LitCache = Dict{Lit, LogicCircuit}
-
-"Use literal to represent constraint (1 to X, -1 to not X), 0 to represent true"
-const ⊤ = convert(Lit, 0)
-
-"""
-Learning from data a structured-decomposable circuit with several structure learning algorithms
-"""
-function learn_struct_prob_circuit(data::Union{XData, WXData}; 
-        pseudocount = 1.0, algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"), vtree = "chow-liu", vtree_kwargs=(vtree_mode="balanced",))
-    if algo == "chow-liu"
-        clt = learn_chow_liu_tree(data; algo_kwargs...)
-        vtree = learn_vtree_from_clt(clt; vtree_kwargs...);
-        pc = compile_psdd_from_clt(clt, vtree);
-        estimate_parameters(pc, convert(XBatches,data); pseudocount = pseudocount)
-        pc, vtree
-    else
-        error("Cannot learn a structured-decomposable circuit with algorithm $algo")
-    end
-end
-
-#############
-# Learn PlainVtree from CLT
-#############
-
-"
-Learn a vtree from clt,
-with strategy (close to) `linear` or `balanced`
-"
-function learn_vtree_from_clt(clt::CLT; vtree_mode::String)::PlainVtree
-    roots = [i for (i, x) in enumerate(parent_vector(clt)) if x == 0]
-    rootnode = construct_children(Var.(roots), clt, vtree_mode)
-
-    return linearize(rootnode)
-end
-
-function construct_node(v::Var, clt::CLT, strategy::String)::PlainVtree
-    children = Var.(outneighbors(clt, v))
-    if isempty(children) # leaf node
-        return PlainVtreeLeafNode(v)
-    else
-        right = construct_children(children, clt, strategy)
-        return add_parent(v, right)
-    end
-end
-
-function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::PlainVtree
-    sorted_vars = sort(collect(children))
-    children_nodes = Vector{PlainVtree}()
-    foreach(x -> push!(children_nodes, construct_node(x, clt, strategy)), sorted_vars)
-
-    if strategy == "linear"
-        construct_children_linear(children_nodes, clt)
-    elseif strategy == "balanced"
-        construct_children_balanced(children_nodes, clt)
-    else
-        throw("Unknown type of strategy")
-    end
-end
-
-function construct_children_linear(children_nodes::Vector{PlainVtree}, clt::CLT)::PlainVtree
-    children_nodes = Iterators.Stateful(reverse(children_nodes))
-
-    right = popfirst!(children_nodes)
-    for left in children_nodes
-        right = PlainVtreeInnerNode(left, right)
-    end
-    return right
-end
-
-function construct_children_balanced(children_nodes::Vector{PlainVtree}, clt::CLT)::PlainVtree
-    if length(children_nodes) == 1
-        return children_nodes[1]
-    elseif length(children_nodes) == 2
-        return PlainVtreeInnerNode(children_nodes[1], children_nodes[2])
-    else
-        len = trunc(Int64, length(children_nodes) / 2)
-        left = construct_children_balanced(children_nodes[1 : len], clt)
-        right = construct_children_balanced(children_nodes[len + 1 : end], clt)
-        return PlainVtreeInnerNode(left, right)
-    end
-end
-
-function add_parent(parent::Var, children::PlainVtree)
-    return PlainVtreeInnerNode(PlainVtreeLeafNode(parent), children)
-end
-
-#####################
-# Compile PSDD from CLT and vtree
-#####################
-
-"Compile a psdd circuit from clt and vtree"
-function compile_psdd_from_clt(clt::MetaDiGraph, vtree::PlainVtree)
-    order = linearize(vtree[end])
-    parent_clt = Var.(parent_vector(clt))
-
-    lin = Vector{ProbCircuit}()
-    prob_cache = ProbCache()
-    lit_cache = LitCache()
-    v2p = Dict{PlainVtree, ProbCircuit}()
-
-    get_params(cpt::Dict) = length(cpt) == 2 ? [cpt[1], cpt[0]] : [cpt[(1,1)], cpt[(0,1)], cpt[(1,0)], cpt[(0,0)]]
-    function add_mapping!(v::PlainVtree, circuits::ProbCircuit)
-        if !haskey(v2p, v); v2p[v] = Vector{ProbCircuit}(); end
-        foreach(c -> if !(c in v2p[v]) push!(v2p[v], c);end, circuits)
-    end
-
-    # compile vtree leaf node to terminal/true node
-    function compile_from_vtree_node(v::PlainVtreeLeafNode)
-        var = v.var
-        children = Var.(outneighbors(clt, var))
-        cpt = get_prop(clt, var, :cpt)
-        parent = parent_clt[var]
-        if isequal(children, [])
-            circuit = compile_true_nodes(var, v, get_params(cpt), lit_cache, prob_cache, lin)
-        else
-            circuit = compile_canonical_literals(var, v, get_params(cpt), lit_cache, prob_cache, lin)
-        end
-        add_mapping!(v, circuit)
-    end
-
-    # compile to decision node
-    function compile_from_vtree_node(v::PlainVtreeInnerNode)
-        left_var = left_most_descendent(v.left).var
-        right_var = left_most_descendent(v.right).var
-        left_circuit = v2p[v.left]
-        right_circuit = v2p[v.right]
-
-        if parent_clt[left_var] == parent_clt[right_var] # two nodes are independent, compile to seperate decision nodes
-            circuit = [compile_decision_node([l], [r], v, [1.0], prob_cache, lin) for (l, r) in zip(left_circuit, right_circuit)]
-        elseif left_var == parent_clt[right_var] # conditioned on left
-            cpt = get_prop(clt, left_var, :cpt)
-            circuit = compile_decision_nodes(left_circuit, right_circuit, v, get_params(cpt), prob_cache, lin)
-        else
-            throw("PlainVtree are not learned from the same CLT")
-        end
-        add_mapping!(v, circuit)
-    end
-
-    foreach(compile_from_vtree_node, vtree)
-    return lin
-end
-
-#####################
-# Construct probabilistic circuit node
-#####################
-
-prob_children(n, prob_cache) =  
-    collect(ProbCircuit{<:StructLogicCircuit}, map(c -> prob_cache[c], n.children))
-
-"Add leaf nodes to circuit `lin`"
-function add_prob_leaf_node(var::Var, vtree::PlainVtreeLeafNode, lit_cache::LitCache, prob_cache::ProbCache, lin)
-    pos = PlainStructLiteralNode{PlainVtree}( var2lit(var), vtree)
-    neg = PlainStructLiteralNode{PlainVtree}(-var2lit(var), vtree)
-    lit_cache[var2lit(var)] = pos
-    lit_cache[-var2lit(var)] = neg
-    pos2 = ProbLiteral(pos)
-    neg2 = ProbLiteral(neg)
-    prob_cache[pos] = pos2
-    prob_cache[neg] = neg2
-    push!(lin, pos2)
-    push!(lin, neg2)
-    return (pos2, neg2)
-end
-
-"Add prob⋀ node to circuit `lin`"
-function add_prob⋀_node(children::ProbCircuit, vtree::PlainVtreeInnerNode, prob_cache::ProbCache, lin)::Prob⋀
-    logic = PlainStruct⋀Node{PlainVtree}([c.origin for c in children], vtree)
-    prob = Prob⋀(logic, prob_children(logic, prob_cache))
-    prob_cache[logic] = prob
-    push!(lin, prob)
-    return prob
-end
-
-"Add prob⋁ node to circuit `lin`"
-function add_prob⋁_node(children::ProbCircuit, vtree::PlainVtree, thetas::Vector{Float64}, prob_cache::ProbCache, lin)::Prob⋁
-    logic = PlainStruct⋁Node{PlainVtree}([c.origin for c in children], vtree)
-    prob = Prob⋁(logic, prob_children(logic, prob_cache))
-    prob.log_thetas = log.(thetas)
-    prob_cache[logic] = prob
-    push!(lin, prob)
-    return prob
-end
-
-"Construct decision nodes given `primes` and `subs`"
-function compile_decision_node(primes::ProbCircuit, subs::ProbCircuit, vtree::PlainVtreeInnerNode, params::Vector{Float64}, prob_cache::ProbCache, lin)
-    elements = [add_prob⋀_node([prime, sub], vtree, prob_cache, lin) for (prime, sub) in zip(primes, subs)]
-    return add_prob⋁_node(elements, vtree, params, prob_cache, lin)
-end
-
-"Construct literal nodes given variable `var`"
-function compile_canonical_literals(var::Var, vtree::PlainVtreeLeafNode, probs::Vector{Float64}, lit_cache::LitCache, prob_cache::ProbCache, lin)
-    (pos, neg) = add_prob_leaf_node(var, vtree, lit_cache, prob_cache, lin)
-    return [pos, neg]
-end
-
-"Construct true nodes given variable `var`"
-function compile_true_nodes(var::Var, vtree::PlainVtreeLeafNode, probs::Vector{Float64}, lit_cache::LitCache, prob_cache::ProbCache, lin)
-    (pos, neg) = add_prob_leaf_node(var, vtree, lit_cache, prob_cache, lin)
-    return [add_prob⋁_node([pos, neg], vtree, probs[i:i+1], prob_cache, lin) for i in 1:2:length(probs)]
-end
-
-"Construct decision nodes conditiond on different distribution"
-function compile_decision_nodes(primes::ProbCircuit, subs::ProbCircuit, vtree::PlainVtreeInnerNode, params::Vector{Float64}, prob_cache::ProbCache, lin)
-    return [compile_decision_node(primes, subs, vtree, params[i:i+1], prob_cache, lin) for i in 1:2:length(params)]
-end
-
-#####################
-# Map and cache constraints
-#####################
-
-function set_base(index, n::PlainStructLiteralNode, bases)
-    if ispositive(n)
-        bases[n][variable(n)] = 1
-    else
-        bases[n][variable(n)] = -1
-    end
-end
-
-function set_base(index, n::PlainStruct⋁Node, bases)
-    len = num_children(n)
-    temp = sum([bases[c] for c in n.children])
-    bases[n] = map(x-> if x == len 1; elseif -x == len; -1; else 0; end, temp)
-end
-
-function set_base(index, n::PlainStruct⋀Node, bases)
-    bases[n] = sum([bases[c] for c in n.children])
-end
-
-function calculate_all_bases(circuit::ProbCircuit)::BaseCache
-    num_var = num_variables(circuit[end].origin.vtree)
-    bases = BaseCache()
-    foreach(n -> bases[n.origin] = fill(⊤, num_var), circuit)
-    foreach(n -> set_base(n[1], n[2].origin, bases), enumerate(circuit))
-    @assert all(bases[circuit[end].origin] .== ⊤) "Base of root node should be true"
-    return bases
-end
-
-#####################
-# Compile fully factorized PSDD from vtree, all variables are independent initially
-#####################
-
-function compile_fully_factorized_psdd_from_vtree(vtree::PlainVtree)::ProbCircuit
-
-    function ful_factor_node(v::PlainVtreeLeafNode, lit_cache::LitCache, prob_cache::ProbCache, v2n, lin)
-        var = variables(v)[1]
-        pos, neg = add_prob_leaf_node(var, v, lit_cache, prob_cache, lin)
-        prob_or = add_prob⋁_node([pos, neg], v, [0.5, 0.5], prob_cache, lin)
-        v2n[v] = prob_or
-        nothing
-    end
-
-    function ful_factor_node(v::PlainVtreeInnerNode, lit_cache::LitCache, prob_cache::ProbCache, v2n, lin)
-        left = v2n[v.left]
-        right = v2n[v.right]
-        prob_and = add_prob⋀_node([left, right], v, prob_cache, lin)
-        prob_or = add_prob⋁_node([prob_and], v, [1.0], prob_cache, lin)
-        v2n[v] = prob_or
-        nothing
-    end
-
-    lin = Vector{ProbCircuit}()
-    prob_cache = ProbCache()
-    lit_cache = LitCache()
-    v2n = Dict{PlainVtree, ProbCircuit}()
-
-    for v in vtree
-        ful_factor_node(v, lit_cache, prob_cache, v2n, lin)
-    end
-
-    lin
-end
diff --git a/src/StructureLearner/StructureLearner.jl b/src/StructureLearner/StructureLearner.jl
index b21c0ad7..92d2cf46 100644
--- a/src/StructureLearner/StructureLearner.jl
+++ b/src/StructureLearner/StructureLearner.jl
@@ -2,23 +2,12 @@ module StructureLearner
 
 using LogicCircuits
 using ..Utils
-
 using ..Probabilistic
-using ..IO
-
-export
-# ChowLiuTree
-learn_chow_liu_tree, parent_vector, print_tree, CLT,
+using ..LoadSave
 
-# CircuitBuilder
-compile_prob_circuit_from_clt, learn_probabilistic_circuit, BaseCache, ⊤, LitCache,
 
-# PSDDInitializer
-learn_struct_prob_circuit,
-learn_vtree_from_clt, compile_psdd_from_clt,compile_fully_factorized_psdd_from_vtree
+include("chow_liu_tree.jl")
+include("init.jl")
 
-include("ChowLiuTree.jl")
-include("CircuitBuilder.jl")
-include("PSDDInitializer.jl")
 
 end
diff --git a/src/StructureLearner/ChowLiuTree.jl b/src/StructureLearner/chow_liu_tree.jl
similarity index 84%
rename from src/StructureLearner/ChowLiuTree.jl
rename to src/StructureLearner/chow_liu_tree.jl
index b2581869..ff9ca1ab 100644
--- a/src/StructureLearner/ChowLiuTree.jl
+++ b/src/StructureLearner/chow_liu_tree.jl
@@ -1,5 +1,6 @@
-using LightGraphs: SimpleGraph, SimpleDiGraph, complete_graph, add_edge!, kruskal_mst, bfs_tree, center, 
-    connected_components, induced_subgraph, nv, ne, edges, vertices, src, dst
+export CLT, learn_chow_liu_tree, parent_vector
+using LightGraphs: SimpleGraph, SimpleDiGraph, complete_graph, add_edge!, kruskal_mst, 
+    bfs_tree, center, connected_components, induced_subgraph, nv, ne, edges, vertices, src, dst
 using SimpleWeightedGraphs: SimpleWeightedGraph
 using MetaGraphs: MetaDiGraph, set_prop!, props
 
@@ -16,15 +17,12 @@ const CLT = MetaDiGraph
 learn a Chow-Liu tree from training set `train_x`, with Laplace smoothing factor `α`, specifying the tree root by `clt_root`
 return a `CLT`
 """
-function learn_chow_liu_tree(train_x::XData; α = 1.0, clt_root="graph_center")::CLT
-    learn_chow_liu_tree(WXData(train_x);α=α, clt_root=clt_root)
-end
-
-function learn_chow_liu_tree(train_x::WXData; α = 1.0, clt_root="graph_center")::CLT
+function learn_chow_liu_tree(train_x; α = 1.0, clt_root="graph_center",
+        weight=ones(Float64, num_examples(train_x)))::CLT
     features_num = num_features(train_x)
 
     # calculate mutual information
-    (dis_cache, MI) = mutual_information(feature_matrix(train_x), Data.weights(train_x); α = α)
+    (dis_cache, MI) = mutual_information(train_x, weight; α = α)
 
     # maximum spanning tree/ forest
     g = SimpleWeightedGraph(complete_graph(features_num))
@@ -91,9 +89,7 @@ function parent_vector(tree::CLT)::Vector{Int64}
     return v
 end
 
-#####################
-# Methods for test
-#####################
+import LogicCircuits: print_tree
 "Print edges and vertices of a ChowLiu tree"
 function print_tree(clt::CLT)
     for e in edges(clt) print(e); print(" ");end
diff --git a/src/StructureLearner/init.jl b/src/StructureLearner/init.jl
new file mode 100644
index 00000000..a25838c5
--- /dev/null
+++ b/src/StructureLearner/init.jl
@@ -0,0 +1,167 @@
+export learn_struct_prob_circuit, learn_vtree_from_clt, compile_sdd_from_clt
+using LightGraphs: outneighbors
+using MetaGraphs: get_prop
+
+"""
+Learning from data a structured-decomposable circuit with several structure learning algorithms
+"""
+function learn_struct_prob_circuit(data;
+        pseudocount = 1.0, 
+        algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"), 
+        vtree = "chow-liu", vtree_kwargs=(vtree_mode="balanced",))    
+    if algo == "chow-liu"
+        clt = learn_chow_liu_tree(data; algo_kwargs...)
+        vtree = learn_vtree_from_clt(clt; vtree_kwargs...)
+        lc = compile_sdd_from_clt(clt, vtree)
+        pc = ProbCircuit(lc)
+        estimate_parameters(pc, data; pseudocount=pseudocount)
+        pc, vtree
+    else
+        error("Cannot learn a structured-decomposable circuit with algorithm $algo")
+    end
+end
+
+#############
+# Learn PlainVtree from CLT
+#############
+
+"
+Learn a vtree from clt,
+with strategy (close to) `linear` or `balanced`
+"
+function learn_vtree_from_clt(clt::CLT; vtree_mode::String)::PlainVtree
+    roots = [i for (i, x) in enumerate(parent_vector(clt)) if x == 0]
+    rootnode = construct_children(Var.(roots), clt, vtree_mode)
+
+    return rootnode
+end
+
+function construct_node(v::Var, clt::CLT, strategy::String)::PlainVtree
+    children = Var.(outneighbors(clt, v))
+    if isempty(children) # leaf node
+        return PlainVtreeLeafNode(v)
+    else
+        right = construct_children(children, clt, strategy)
+        return add_parent(v, right)
+    end
+end
+
+function construct_children(children::Vector{Var}, clt::CLT, strategy::String)::PlainVtree
+    sorted_vars = sort(collect(children))
+    children_nodes = Vector{PlainVtree}()
+    foreach(x -> push!(children_nodes, construct_node(x, clt, strategy)), sorted_vars)
+
+    if strategy == "linear"
+        construct_children_linear(children_nodes, clt)
+    elseif strategy == "balanced"
+        construct_children_balanced(children_nodes, clt)
+    else
+        throw("Unknown type of strategy")
+    end
+end
+
+function construct_children_linear(children_nodes::Vector{PlainVtree}, clt::CLT)::PlainVtree
+    children_nodes = Iterators.Stateful(reverse(children_nodes))
+
+    right = popfirst!(children_nodes)
+    for left in children_nodes
+        right = PlainVtreeInnerNode(left, right)
+    end
+    return right
+end
+
+function construct_children_balanced(children_nodes::Vector{PlainVtree}, clt::CLT)::PlainVtree
+    if length(children_nodes) == 1
+        return children_nodes[1]
+    elseif length(children_nodes) == 2
+        return PlainVtreeInnerNode(children_nodes[1], children_nodes[2])
+    else
+        len = trunc(Int64, length(children_nodes) / 2)
+        left = construct_children_balanced(children_nodes[1 : len], clt)
+        right = construct_children_balanced(children_nodes[len + 1 : end], clt)
+        return PlainVtreeInnerNode(left, right)
+    end
+end
+
+function add_parent(parent::Var, children::PlainVtree)
+    return PlainVtreeInnerNode(PlainVtreeLeafNode(parent), children)
+end
+
+#####################
+# Compile PSDD from CLT and vtree
+#####################
+
+"Compile a psdd circuit from clt and vtree"
+function compile_sdd_from_clt(clt::CLT, vtree::PlainVtree)::PlainStructLogicCircuit
+
+    parent_clt = Var.(parent_vector(clt))
+    v2p = Dict{PlainVtree, Vector{PlainStructLogicCircuit}}()
+    
+    function add_mapping!(v::PlainVtree, circuits)
+        if !haskey(v2p, v); v2p[v] = Vector{PlainStructLogicCircuit}(); end
+        foreach(c -> if !(c in v2p[v]) push!(v2p[v], c);end, circuits)
+    end
+
+    # compile vtree leaf node to terminal/true node
+    function compile_from_vtree_node(v::PlainVtreeLeafNode)
+        var = v.var
+        children = Var.(outneighbors(clt, var))
+        cpt = get_prop(clt, var, :cpt)
+        parent = parent_clt[var]
+        if isequal(children, [])
+            circuit = compile_true_nodes(var, v; num=length(cpt) ÷ 2)
+        else
+            circuit = compile_canonical_literals(var, v)
+        end
+        add_mapping!(v, circuit)
+        nothing
+    end
+
+    # compile to decision node
+    function compile_from_vtree_node(v::PlainVtreeInnerNode)
+        left_var = left_most_descendent(v.left).var
+        right_var = left_most_descendent(v.right).var
+        left_circuit = v2p[v.left]
+        right_circuit = v2p[v.right]
+
+        if parent_clt[left_var] == parent_clt[right_var] # two nodes are independent, compile to seperate decision nodes
+            circuit = [compile_decision_node([l], [r], v) for (l, r) in zip(left_circuit, right_circuit)]
+        elseif left_var == parent_clt[right_var] # conditioned on left
+            cpt = get_prop(clt, left_var, :cpt)
+            circuit = compile_decision_nodes(left_circuit, right_circuit, v; num=length(cpt) ÷ 2)
+        else
+            throw("PlainVtree are not learned from the same CLT")
+        end
+        add_mapping!(v, circuit)
+        nothing
+    end
+
+    foreach(compile_from_vtree_node, vtree)
+
+    v2p[vtree][end]
+end
+
+#####################
+# Construct circuit node
+#####################
+"Construct decision nodes given `primes` and `subs`"
+function compile_decision_node(primes::Vector{<:PlainStructLogicCircuit}, subs::Vector{<:PlainStructLogicCircuit}, vtree::PlainVtreeInnerNode)
+    elements = [conjoin(prime, sub; use_vtree=vtree) for (prime, sub) in zip(primes, subs)]
+    return disjoin(elements; use_vtree=vtree)
+end
+
+"Construct literal nodes given variable `var`"
+function compile_canonical_literals(var::Var, vtree::PlainVtreeLeafNode)
+    return [PlainStructLiteralNode( var2lit(var), vtree), PlainStructLiteralNode(-var2lit(var), vtree)]
+end
+
+"Construct true nodes given variable `var`"
+function compile_true_nodes(var::Var, vtree::PlainVtreeLeafNode; num)
+    pos, neg = compile_canonical_literals(var, vtree)
+    return [disjoin([pos, neg]; use_vtree = vtree) for _ in 1 : num]
+end
+
+"Construct decision nodes conditiond on different distribution"
+function compile_decision_nodes(primes::Vector{<:PlainStructLogicCircuit}, subs::Vector{<:PlainStructLogicCircuit}, vtree::PlainVtreeInnerNode; num)
+    return [compile_decision_node(primes, subs, vtree) for _ in 1 : num]
+end
diff --git a/src/Utils/Utils.jl b/src/Utils/Utils.jl
index 24c120b6..9bf1f2fc 100644
--- a/src/Utils/Utils.jl
+++ b/src/Utils/Utils.jl
@@ -6,6 +6,6 @@ module Utils
 
 include("misc.jl")
 include("decorators.jl")
-# include("informations.jl")
+include("informations.jl")
 
 end #module
diff --git a/src/Utils/informations.jl b/src/Utils/informations.jl
index 9787b237..d2933590 100644
--- a/src/Utils/informations.jl
+++ b/src/Utils/informations.jl
@@ -1,6 +1,7 @@
 export entropy, conditional_entropy, mutual_information
 using Statistics
 using StatsFuns: xlogx, xlogy
+using LogicCircuits: issomething
 
 "Cache pairwise / marginal distribution for all variables in one dataset"
 mutable struct DisCache
@@ -14,11 +15,11 @@ DisCache(num) = DisCache(Array{Float64}(undef, num, num, 4), Array{Float64}(unde
 #####################
 # Methods for pairwise and marginal distribution
 #####################
-@inline get_parameters(bm::AbstractMatrix{<:Bool}, α, w=nothing) = size(bm)[2], issomething(w) ? sum(w) : size(bm)[1], @. Float64(bm), @. Float64(!bm)
+@inline get_parameters(bm, α, w=nothing) = size(bm)[2], issomething(w) ? sum(w) : size(bm)[1], convert(Matrix{Float64}, bm), convert(Matrix{Float64}, .!bm)
 
-function cache_distributions(bm::AbstractMatrix{<:Bool}, w::Union{Nothing, AbstractVector{<:AbstractFloat}}=nothing; α, flag=(pairwise=true, marginal=true))
+function cache_distributions(bm, w::Union{Nothing, Vector}=nothing; α, flag=(pairwise=true, marginal=true))
     # parameters
-    D, N, (m, notm) = get_parameters(bm, α, w)
+    D, N, m, notm = get_parameters(bm, α, w)
     dis_cache = DisCache(D)
     base = N + 4 * α
     w = isnothing(w) ? ones(Float64, N) : w
@@ -58,18 +59,14 @@ function mutual_information(dis_cache::DisCache)
 end
 
 "Calculate mutual information of given bit matrix `bm`, example weights `w`, and smoothing pseudocount `α`"
-function mutual_information(bm::AbstractMatrix{<:Bool}, w::Union{Nothing, AbstractVector{<:AbstractFloat}}=nothing; α)
+function mutual_information(bm, w::Union{Nothing, Vector}=nothing; α)
     dis_cache = cache_distributions(bm, w; α=α)
     mi = mutual_information(dis_cache)
     return (dis_cache, mi)
 end
 
-function mutual_information(train_x::PlainXData, w::Union{Nothing, AbstractVector{<:AbstractFloat}}=nothing; α)
-    mutual_information(feature_matrix(train_x), w; α=α)
-end
-
 "Calculate set mutual information"
-function set_mutual_information(mi::Matrix, sets::Vector{Vector{Var}})::Matrix
+function set_mutual_information(mi::Matrix, sets::Vector{Vector})::Matrix
     len = length(sets)
     if len == size(mi)[1]
         return mi
@@ -96,7 +93,7 @@ function entropy(bm::AbstractMatrix{<:Bool}, w::Union{Nothing, AbstractVector{<:
     return (dis_cache, entropy(dis_cache))
 end
 
-function sum_entropy_given_x(bm::AbstractMatrix{<:Bool}, x::Var, w::Union{Nothing, AbstractVector{<:AbstractFloat}}=nothing; α)::Float64
+function sum_entropy_given_x(bm::AbstractMatrix{<:Bool}, x, w::Union{Nothing, AbstractVector{<:AbstractFloat}}=nothing; α)::Float64
     @assert x <= size(bm)[2]
     vars = [1 : x-1; x+1 : size(bm)[2]]
     indexes_left = bm[:,x].== 0
diff --git a/test/StructureLearner/CircuitBuilderTest.jl b/test/StructureLearner/CircuitBuilderTest.jl
deleted file mode 100644
index 40c38db5..00000000
--- a/test/StructureLearner/CircuitBuilderTest.jl
+++ /dev/null
@@ -1,24 +0,0 @@
-using Test: @test, @testset
-using LogicCircuits
-using ProbabilisticCircuits
-
-@testset "Probabilistic circuits learner tests" begin
-    data = dataset(twenty_datasets("nltcs"); do_shuffle=false, batch_size=-1)
-    train_x = train(data)
-    pc = learn_probabilistic_circuit(train_x; pseudocount = 1.0, algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"))
-    
-    # simple test
-    @test pc isa ProbCircuit
-    @test check_parameter_integrity(pc)
-    @test num_parameters(pc) == 62 
-    @test pc[26].log_thetas[1] ≈ -0.023528423773273476 atol=1.0e-7
-
-    # all evidence sums to 1
-    N = num_features(train_x);
-    data_all = XData(generate_data_all(N))
-    fc = FlowΔ(pc, max_batch_size(train_x), Bool, opts_accumulate_flows)
-    calc_prob_all = log_likelihood_per_instance(fc, data_all)
-    calc_prob_all = exp.(calc_prob_all)
-    sum_prob_all = sum(calc_prob_all)
-    @test sum_prob_all ≈ 1 atol = 1.0e-7;
-end
\ No newline at end of file
diff --git a/test/StructureLearner/ChowLiuTreeTest.jl b/test/StructureLearner/chow_liu_tree_tests.jl
similarity index 87%
rename from test/StructureLearner/ChowLiuTreeTest.jl
rename to test/StructureLearner/chow_liu_tree_tests.jl
index ff624ef0..24b2fb8c 100644
--- a/test/StructureLearner/ChowLiuTreeTest.jl
+++ b/test/StructureLearner/chow_liu_tree_tests.jl
@@ -5,8 +5,7 @@ using LogicCircuits
 using ProbabilisticCircuits
 
 @testset "Chow-Liu Tree learner tests" begin
-    data = dataset(twenty_datasets("nltcs"); do_shuffle=false, batch_size=-1)
-    train_x = train(data)
+    train_x, _, _ = twenty_datasets("nltcs")
     clt = learn_chow_liu_tree(train_x; α=1.0, clt_root="graph_center")
     pv = parent_vector(clt)
 
diff --git a/test/StructureLearner/PSDDInitializerTest.jl b/test/StructureLearner/init_tests.jl
similarity index 52%
rename from test/StructureLearner/PSDDInitializerTest.jl
rename to test/StructureLearner/init_tests.jl
index cd8b51a3..d2986e88 100644
--- a/test/StructureLearner/PSDDInitializerTest.jl
+++ b/test/StructureLearner/init_tests.jl
@@ -3,15 +3,13 @@ using LogicCircuits
 using ProbabilisticCircuits
 
 @testset "Probabilistic circuits learner tests" begin
-    data = dataset(twenty_datasets("nltcs"); do_shuffle=false, batch_size=-1)
-    train_x = train(data)
-    (pc, vtree) = learn_struct_prob_circuit(train_x; pseudocount = 1.0, algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"),
-            vtree = "chow-liu", vtree_kwargs=(vtree_mode="balanced",))
+    train_x, _, _ = twenty_datasets("nltcs")
+    (pc, vtree) = learn_struct_prob_circuit(train_x)
     
     # simple test
     @test pc isa ProbCircuit
     @test vtree isa PlainVtree
-    @test num_variables(vtree) == num_features(data)
+    @test num_variables(vtree) == num_features(train_x)
     @test check_parameter_integrity(pc)
     @test num_parameters(pc) == 74 
 
@@ -20,14 +18,13 @@ using ProbabilisticCircuits
 
     # is structured decomposable 
     for (n, vars) in variables_by_node(pc)
-        @test vars == BitSet(variables(origin(n).vtree))
+        @test vars == BitSet(variables(n.vtree))
     end
 
     # all evidence sums to 1
-    N = num_features(train_x);
-    data_all = XData(generate_data_all(N))
-    fc = FlowΔ(pc, max_batch_size(train_x), Bool, opts_accumulate_flows)
-    calc_prob_all = log_likelihood_per_instance(fc, data_all)
+    N = num_features(train_x)
+    data_all = generate_data_all(N)
+    calc_prob_all = log_likelihood_per_instance(pc, data_all)
     calc_prob_all = exp.(calc_prob_all)
     sum_prob_all = sum(calc_prob_all)
     @test sum_prob_all ≈ 1 atol = 1.0e-7;
diff --git a/test/runtests.jl b/test/runtests.jl
index bddbc3e2..e0920969 100644
--- a/test/runtests.jl
+++ b/test/runtests.jl
@@ -12,4 +12,4 @@ end
 using Jive
 
 # TODO reinstate after refactoring all modules
-runtests(@__DIR__, skip=["runtests.jl", "helper", "StructureLearner", "Mixtures", "Utils"])
+runtests(@__DIR__, skip=["runtests.jl", "helper", "Mixtures", "StructureLearner/VtreeLearnerTest.jl"])

From 5f546ae6489d22a263000c35fc0514c732186e26 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sun, 16 Aug 2020 12:50:38 -0700
Subject: [PATCH 048/131] add structure learn

---
 src/Probabilistic/structured_prob_nodes.jl | 78 +++++++++++++++++++++-
 src/StructureLearner/StructureLearner.jl   |  2 +
 src/StructureLearner/heuristics.jl         | 69 +++++++++++++++++++
 src/StructureLearner/learner.jl            | 39 +++++++++++
 4 files changed, 187 insertions(+), 1 deletion(-)
 create mode 100644 src/StructureLearner/heuristics.jl
 create mode 100644 src/StructureLearner/learner.jl

diff --git a/src/Probabilistic/structured_prob_nodes.jl b/src/Probabilistic/structured_prob_nodes.jl
index 11fa2050..cfcf2ec9 100644
--- a/src/Probabilistic/structured_prob_nodes.jl
+++ b/src/Probabilistic/structured_prob_nodes.jl
@@ -105,7 +105,83 @@ end
 
 @inline ProbCircuit(circuit::PlainLogicCircuit) = PlainProbCircuit(circuit)
 
-# TODO: import LogicCircuits: conjoin, disjoin, compile # make available for extension 
+import LogicCircuits: conjoin, disjoin, compile, vtree, vtree_safe # make available for extension
+
+"Get the vtree corresponding to the argument, or nothing if the node has no vtree"
+@inline vtree(n::StructProbCircuit) = n.vtree
+@inline vtree_safe(n::StructProbInnerNode) = vtree(n)
+@inline vtree_safe(n::StructProbLiteralNode) = vtree(n)
+
+conjoin(arguments::Vector{<:StructProbCircuit};
+        reuse=nothing, use_vtree=nothing) =
+        conjoin(arguments...; reuse, use_vtree)
+
+function conjoin(a1::StructProbCircuit,  
+                 a2::StructProbCircuit;
+                 reuse=nothing, use_vtree=nothing) 
+    reuse isa StructProb⋀Node && reuse.prime == a1 && reuse.sub == a2 && return reuse
+    !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
+    # if isconstantgate(a1) && isconstantgate(a2) && !(use_vtree isa Vtree)
+    #     # constant nodes don't have a vtree: resolve to a constant
+    #     return StructProbCircuit(istrue(a1) && istrue(a2))
+    # end
+    !(use_vtree isa Vtree) && (use_vtree = find_inode(vtree_safe(a1), vtree_safe(a2)))
+    return StructProb⋀Node(a1, a2, use_vtree)
+end
+
+# ProbCircuit has a default argument for respects: its root's vtree
+respects_vtree(circuit::ProbCircuit) = 
+    respects_vtree(circuit, vtree(circuit))
+
+@inline disjoin(xs::StructProbCircuit...) = disjoin(collect(xs))
+
+function disjoin(arguments::Vector{<:StructProbCircuit};
+                 reuse=nothing, use_vtree=nothing)
+    @assert length(arguments) > 0
+    reuse isa StructProb⋁Node && reuse.children == arguments && return reuse
+    !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
+    # if all(isconstantgate, arguments) && !(use_vtree isa Vtree)
+    #     # constant nodes don't have a vtree: resolve to a constant
+    #     return StructProbCircuit(any(constant, arguments))
+    # end
+    !(use_vtree isa Vtree) && (use_vtree = mapreduce(vtree_safe, lca, arguments))
+    return StructProb⋁Node(arguments, use_vtree)
+end
+
+# Syntactic sugar for compile with a vtree
+(t::Tuple{<:Type,<:Vtree})(arg) = compile(t[1], t[2], arg)
+(t::Tuple{<:Vtree,<:Type})(arg) = compile(t[2], t[1], arg)
+
+# claim `StructProbCircuit` as the default `ProbCircuit` implementation that has a vtree
+compile(::Type{ProbCircuit}, args...) =
+    compile(StructProbCircuit, args...)
+
+compile(vtree::Vtree, arg) = 
+    compile(ProbCircuit,vtree,arg)
+
+compile(::Type{<:StructProbCircuit}, ::Vtree, b::Bool) =
+    compile(StructProbCircuit, b)
+
+"The unique splain tructured logical false constant" # act as a place holder in `condition`
+const structfalse = PlainStructFalseNode(nothing, 0)
+
+compile(::Type{<:StructProbCircuit}, b::Bool) =
+    b ? structtrue : structfalse
+
+
+
+compile(::Type{<:StructProbCircuit}, vtree::Vtree, l::Lit) =
+    PlainStructLiteralNode(l,find_leaf(lit2var(l),vtree))
+
+
+function compile(::Type{<:StructProbCircuit}, vtree::Vtree, circuit::StructProbCircuit)
+    f_con(n) = error("ProbCircuit does not have a constant node")
+    f_lit(n) = compile(StructProbCircuit, vtree, literal(n))
+    f_a(n, cns) = conjoin(cns...) # note: this will use the LCA as vtree node
+    f_o(n, cns) = disjoin(cns) # note: this will use the LCA as vtree node
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, StructProbCircuit)
+end
+
 
 function check_parameter_integrity(circuit::ProbCircuit)
     for node in or_nodes(circuit)
diff --git a/src/StructureLearner/StructureLearner.jl b/src/StructureLearner/StructureLearner.jl
index 92d2cf46..29cfa16e 100644
--- a/src/StructureLearner/StructureLearner.jl
+++ b/src/StructureLearner/StructureLearner.jl
@@ -8,6 +8,8 @@ using ..LoadSave
 
 include("chow_liu_tree.jl")
 include("init.jl")
+include("heuristics.jl")
+include("learner.jl")
 
 
 end
diff --git a/src/StructureLearner/heuristics.jl b/src/StructureLearner/heuristics.jl
new file mode 100644
index 00000000..95c00e1e
--- /dev/null
+++ b/src/StructureLearner/heuristics.jl
@@ -0,0 +1,69 @@
+
+using LinearAlgebra: diagind
+"""
+Pick the edge with maximum flow
+"""
+function eFlow(candidates::Vector{Tuple{Node, Node}})
+    edge2flows = map(candidates) do (or, and)
+        sum(get_downflow(or, and))
+    end
+    (max_flow, max_edge_id) = findmax(edge2flows)
+    candidates[max_edge_id], max_flow
+end
+
+"""
+Pick the variable with maximum sum of mutual information
+"""
+function vMI(edge, vars::Vector{Var}, train_x)
+    examples_id = get_downflow(edge...)  
+    sub_matrix = train_x[examples_id, vars]
+    (_, mi) = mutual_information(sub_matrix; α=1.0)
+    mi[diagind(mi)] .= 0
+    scores = dropdims(sum(mi, dims = 1), dims = 1)
+    var = vars[argmax(scores)]
+    score = maximum(scores)
+    var, score
+end
+
+"""
+Pick the edge randomly
+"""
+function eRand(candidates::Vector{Tuple{Node, Node}})
+    return rand(candidates)
+end
+
+"""
+Pick the variable randomly
+"""
+function vRand(vars::Vector{Var})
+    lits = collect(Set{Lit}(scope[and]))
+    vars =  Var.(intersect(filter(l -> l > 0, lits), - filter(l -> l < 0, lits)))
+    return Var(rand(vars))
+end
+
+function heuristic_loss(circuit::LogicCircuit, train_x; pick_edge="eFlow", pick_var="vMI")
+    candidates, scope = split_candidates(circuit)
+    compute_flows(circuit, train_x)
+    if pick_edge == "eFlow"
+        edge, flow = eFlow(candidates)
+    elseif pick_edge == "eRand"
+        edge = eRand(candidates)
+    else
+        error("Heuristics $pick_edge to pick edge is undefined.")
+    end
+
+    or, and = edge
+    lits = collect(Set{Lit}(scope[and]))
+    vars =  Var.(intersect(filter(l -> l > 0, lits), - filter(l -> l < 0, lits)))
+
+    if pick_var == "vMI"
+        var, score = vMI(edge, vars, train_x)
+    elseif pick_var == "vRand"
+        var = vRand(vars)
+    else
+        error("Heuristics $pick_var to pick variable is undefined.")
+    end
+
+    return (or, and), var
+end
+
diff --git a/src/StructureLearner/learner.jl b/src/StructureLearner/learner.jl
new file mode 100644
index 00000000..4ac904a9
--- /dev/null
+++ b/src/StructureLearner/learner.jl
@@ -0,0 +1,39 @@
+export learn_single_model
+using LogicCircuits: split_step, struct_learn
+using Statistics: mean
+using Random
+"""
+Learn structure decomposable circuits
+"""
+function learn_single_model(train_x;
+        pick_edge="eFlow", pick_var="vMI", depth=1, 
+        pseudocount=1.0,
+        sanity_check=true,
+        maxiter=typemax(Int),
+        seed=1337)
+
+    # init
+    Random.seed!(seed)
+    pc, vtree = learn_struct_prob_circuit(train_x)
+
+    # structure_update
+    loss(circuit) = heuristic_loss(circuit, train_x; pick_edge=pick_edge, pick_var=pick_var)
+    pc_split_step(circuit) = begin
+        c::ProbCircuit, = split_step(circuit; loss=loss, depth=depth, sanity_check=sanity_check)
+        estimate_parameters(c, train_x; pseudocount=pseudocount)
+        return c, missing
+    end
+    iter = 0
+    log_per_iter(circuit) = begin
+        ll = EVI(circuit, train_x)
+        println("Log likelihood of iteration $iter is $(mean(ll))")
+        println()
+        iter += 1
+        false
+    end
+    log_per_iter(pc)
+    pc = struct_learn(pc; 
+        primitives=[pc_split_step], kwargs=Dict(pc_split_step=>()), 
+        maxiter=maxiter, stop=log_per_iter)
+end
+

From 38add39e27cf06bf7b67341bd287e5ecee1d2b0b Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Sun, 16 Aug 2020 16:28:30 -0700
Subject: [PATCH 049/131] add emsembles circuits & em

---
 Project.toml                               |   1 +
 src/Mixtures/Mixtures.jl                   |  11 ++
 src/Mixtures/deprecated/Clustering.jl      |  21 ----
 src/Mixtures/em.jl                         | 118 +++++++++++++++++++++
 src/Mixtures/shared_prob_nodes.jl          |  81 ++++++++++++++
 src/Probabilistic/prob_nodes.jl            |   2 +
 src/Probabilistic/structured_prob_nodes.jl |  35 ++----
 src/ProbabilisticCircuits.jl               |   2 +
 8 files changed, 224 insertions(+), 47 deletions(-)
 create mode 100644 src/Mixtures/Mixtures.jl
 delete mode 100644 src/Mixtures/deprecated/Clustering.jl
 create mode 100644 src/Mixtures/em.jl
 create mode 100644 src/Mixtures/shared_prob_nodes.jl

diff --git a/Project.toml b/Project.toml
index cc639b0c..cb10d139 100644
--- a/Project.toml
+++ b/Project.toml
@@ -7,6 +7,7 @@ BlossomV = "6c721016-9dae-5d90-abf6-67daaccb2332"
 Clustering = "aaaa29a8-35af-508c-8bc3-b662a17a0fe5"
 DataStructures = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8"
 LightGraphs = "093fc24a-ae57-5d10-9952-331d41423f4d"
+LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 LogicCircuits = "a7847b3b-b7f1-4dd5-83c3-60e0aa0f8599"
 MetaGraphs = "626554b9-1ddb-594c-aa3c-2596fe9399a5"
 Metis = "2679e427-3c69-5b7f-982b-ece356f1e94b"
diff --git a/src/Mixtures/Mixtures.jl b/src/Mixtures/Mixtures.jl
new file mode 100644
index 00000000..d837d53b
--- /dev/null
+++ b/src/Mixtures/Mixtures.jl
@@ -0,0 +1,11 @@
+module Mixtures
+
+using LogicCircuits
+using ..Utils
+using ..Probabilistic
+using ..LoadSave
+
+include("shared_prob_nodes.jl")
+include("em.jl")
+
+end
\ No newline at end of file
diff --git a/src/Mixtures/deprecated/Clustering.jl b/src/Mixtures/deprecated/Clustering.jl
deleted file mode 100644
index 47c30403..00000000
--- a/src/Mixtures/deprecated/Clustering.jl
+++ /dev/null
@@ -1,21 +0,0 @@
-using Clustering
-
-function clustering(train_x::XData, mix_num::Int64; maxiter=200)::XBatches{<:Bool}
-    if mix_num == 1
-        return convert(XBatches, train_x)
-    end
-    
-    n = num_examples(train_x)
-    X = feature_matrix(train_x)'
-
-    println("Running K-means clustering algorithm with num of components $mix_num, maximum iterations $maxiter")
-    R = kmeans(X, mix_num; maxiter=maxiter)
-    @assert nclusters(R) == mix_num
-    a = assignments(R)
-
-    clustered_train_x = Vector{PlainXData{Bool,BitMatrix}}()
-    for k in 1 : mix_num
-        push!(clustered_train_x, XData(convert(BitMatrix, X[:, findall(x -> x == k, a)]')))
-    end
-    return clustered_train_x
-end
\ No newline at end of file
diff --git a/src/Mixtures/em.jl b/src/Mixtures/em.jl
new file mode 100644
index 00000000..2f35f3f4
--- /dev/null
+++ b/src/Mixtures/em.jl
@@ -0,0 +1,118 @@
+export one_step_em, component_weights_per_example, initial_weights, clustering,
+log_likelihood_per_instance_per_component, estimate_parameters_cached, learn_em_model
+using Statistics: mean
+using LinearAlgebra: normalize!
+using Clustering: kmeans, nclusters, assignments
+
+function one_step_em(spc, train_x, component_weights;pseudocount)
+    # E step
+    lls = log_likelihood_per_instance_per_component(spc, train_x)
+    lls .+= log.(component_weights)
+
+    example_weights = component_weights_per_example(lls)
+    component_weights .= sum(example_weights, dims=1)
+    normalize!(component_weights, 1.0)
+
+    # M step
+    estimate_parameters_cached(spc, example_weights; pseudocount=pseudocount)
+    logsumexp(lls, 2), component_weights
+end
+
+function component_weights_per_example(log_p_of_x_and_c)
+    log_p_of_x = logsumexp(log_p_of_x_and_c, 2) # marginalize out components
+    log_p_of_given_x_query_c = mapslices(col -> col .- log_p_of_x, log_p_of_x_and_c, dims=[1])
+    p_of_given_x_query_c = exp.(log_p_of_given_x_query_c) # no more risk of underflow, so go to linear space
+    @assert sum(p_of_given_x_query_c) ≈ size(log_p_of_x_and_c, 1) "$(sum(p_of_given_x_query_c)) != $(size(log_p_of_x_and_c))"# each row has proability 1
+    Matrix(p_of_given_x_query_c)
+end
+
+function initial_weights(train_x, mix_num::Int64; alg="cluster")::Vector{Float64}
+    if alg == "cluster"
+        clustered = clustering(train_x, mix_num)
+        counting = Float64.(num_examples.(clustered))
+        return normalize!(counting, 1)
+    elseif alg == "random"
+        return normalize!(rand(Float64, mix_num), 1)
+    else
+        error("Initialize weights algorithm is $undefined")
+    end
+end
+
+function clustering(train_x, mix_num::Int64; maxiter=200)::Vector
+    train_x = Matrix(train_x)
+    if mix_num == 1
+        return [train_x]
+    end
+    
+    n = num_examples(train_x)
+
+    R = kmeans(train_x, mix_num; maxiter=maxiter)
+    @assert nclusters(R) == mix_num
+    a = assignments(R)
+
+    clustered_train_x = Vector()
+    for k in 1 : mix_num
+        push!(clustered_train_x, train_x[:, findall(x -> x == k, a)]')
+    end
+
+    return clustered_train_x
+end
+
+function log_likelihood_per_instance_per_component(pc::SharedProbCircuit, data)
+    @assert isbinarydata(data) "Can only calculate EVI on Bool data"
+    
+    compute_flows(pc, data)
+    num_mix = num_components(pc)
+    log_likelihoods = zeros(Float64, num_examples(data), num_mix)
+    indices = init_array(Bool, num_examples(data))::BitVector
+    
+    
+    ll(n::SharedProbCircuit) = ()
+    ll(n::SharedProb⋁Node) = begin
+        if num_children(n) != 1 # other nodes have no effect on likelihood
+            for i in 1 : num_children(n)
+                c = children(n)[i]
+                log_theta = reshape(n.log_thetas[i, :], 1, num_mix)
+                indices = get_downflow(n, c)
+                view(log_likelihoods, indices::BitVector, :) .+=  log_theta # see MixedProductKernelBenchmark.jl
+            end
+         end
+    end
+
+    foreach(ll, pc)
+    log_likelihoods
+end
+
+function estimate_parameters_cached(pc::SharedProbCircuit, example_weights; pseudocount::Float64)
+    foreach(pc) do pn
+        if is⋁gate(pn)
+            if num_children(pn) == 1
+                pn.log_thetas .= 0.0
+            else
+                smoothed_flow = Float64.(sum(example_weights[get_downflow(pn), :], dims=1)) .+ pseudocount
+                uniform_pseudocount = pseudocount / num_children(pn)
+                children_flows = vcat(map(c -> sum(example_weights[get_downflow(pn, c), :], dims=1), children(pn))...)
+                @. pn.log_thetas = log((children_flows + uniform_pseudocount) / smoothed_flow)
+                @assert all(sum(exp.(pn.log_thetas), dims=1) .≈ 1.0) "Parameters do not sum to one locally"
+                # normalize away any leftover error
+                pn.log_thetas .-= logsumexp(pn.log_thetas, dims=1)
+            end
+        end
+    end
+end
+
+function learn_em_model(pc, train_x;
+        num_mix=5,
+        pseudocount=1.0,
+        maxiter=typemax(Int))
+    spc = SharedProbCircuit(pc, num_mix)
+    compute_flows(spc, train_x)
+    estimate_parameters_cached(spc, ones(Float64, num_examples(train_x), num_mix) ./ num_mix; pseudocount=pseudocount)
+    component_weights = reshape(initial_weights(train_x, num_mix), 1, num_mix)
+
+    for iter in 1 : maxiter
+        @assert isapprox(sum(component_weights), 1.0; atol=1e-10)
+        lls, component_weights = one_step_em(spc, train_x, component_weights; pseudocount=pseudocount)
+        println("Log likelihood per instance is $(mean(lls))")
+    end
+end
\ No newline at end of file
diff --git a/src/Mixtures/shared_prob_nodes.jl b/src/Mixtures/shared_prob_nodes.jl
new file mode 100644
index 00000000..2d4f180f
--- /dev/null
+++ b/src/Mixtures/shared_prob_nodes.jl
@@ -0,0 +1,81 @@
+export SharedProbCircuit, SharedProbLeafNode, SharedProbInnerNode, SharedProbLiteralNode,
+SharedProb⋀Node, SharedProb⋁Node, num_components
+
+#####################
+# Probabilistic circuits which share the same structure
+#####################
+
+"""
+Root of the probabilistic circuit node hierarchy
+"""
+abstract type SharedProbCircuit <: LogicCircuit end
+
+"""
+A probabilistic leaf node
+"""
+abstract type SharedProbLeafNode <: SharedProbCircuit end
+
+"""
+A probabilistic inner node
+"""
+abstract type SharedProbInnerNode <: SharedProbCircuit end
+
+"""
+A probabilistic literal node
+"""
+mutable struct SharedProbLiteralNode <: SharedProbLeafNode
+    literal::Lit
+    data
+    counter::UInt32
+    SharedProbLiteralNode(l) = new(l, nothing, 0)
+end
+
+"""
+A probabilistic conjunction node (And node)
+"""
+mutable struct SharedProb⋀Node <: SharedProbInnerNode
+    children::Vector{<:SharedProbCircuit}
+    data
+    counter::UInt32
+    SharedProb⋀Node(children) = new(convert(Vector{SharedProbCircuit}, children), nothing, 0)
+end
+
+"""
+A probabilistic disjunction node (Or node)
+"""
+mutable struct SharedProb⋁Node <: SharedProbInnerNode
+    children::Vector{<:SharedProbCircuit}
+    log_thetas::Matrix{Float64}
+    data
+    counter::UInt32
+    SharedProb⋁Node(children, n_mixture) = begin
+        new(convert(Vector{SharedProbCircuit}, children), init_array(Float64, length(children), n_mixture), nothing, 0)
+    end
+end
+
+#####################
+# traits
+#####################
+
+import LogicCircuits.GateType # make available for extension
+@inline GateType(::Type{<:SharedProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:SharedProb⋀Node}) = ⋀Gate()
+@inline GateType(::Type{<:SharedProb⋁Node}) = ⋁Gate()
+
+#####################
+# constructors and conversions
+#####################
+
+function SharedProbCircuit(circuit::LogicCircuit, num_mixture::Int64)::SharedProbCircuit
+    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = SharedProbLiteralNode(literal(n))
+    f_a(n, cn) = SharedProb⋀Node(cn)
+    f_o(n, cn) = SharedProb⋁Node(cn, num_mixture)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, SharedProbCircuit)
+end
+
+
+import LogicCircuits: children # make available for extension
+
+@inline children(n::SharedProbInnerNode) = n.children
+@inline num_components(n::SharedProbCircuit) = size(n.log_thetas)[2]
diff --git a/src/Probabilistic/prob_nodes.jl b/src/Probabilistic/prob_nodes.jl
index f002baea..96694851 100644
--- a/src/Probabilistic/prob_nodes.jl
+++ b/src/Probabilistic/prob_nodes.jl
@@ -1,6 +1,8 @@
 export PlainProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
 Prob⋁Node
 
+using LogicCircuits: LogicCircuit
+
 #####################
 # Infrastructure for probabilistic circuit nodes
 #####################
diff --git a/src/Probabilistic/structured_prob_nodes.jl b/src/Probabilistic/structured_prob_nodes.jl
index cfcf2ec9..cc064d9f 100644
--- a/src/Probabilistic/structured_prob_nodes.jl
+++ b/src/Probabilistic/structured_prob_nodes.jl
@@ -68,10 +68,15 @@ import LogicCircuits.GateType # make available for extension
 # methods
 #####################
 
-import LogicCircuits: children # make available for extension
+import LogicCircuits: children, vtree, vtree_safe # make available for extension
 @inline children(n::StructProb⋁Node) = n.children
 @inline children(n::StructProb⋀Node) = [n.prime,n.sub]
 
+"Get the vtree corresponding to the argument, or nothing if the node has no vtree"
+@inline vtree(n::StructProbCircuit) = n.vtree
+@inline vtree_safe(n::StructProbInnerNode) = vtree(n)
+@inline vtree_safe(n::StructProbLiteralNode) = vtree(n)
+
 import ..Utils: num_parameters
 @inline num_parameters(c::StructProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
 
@@ -105,12 +110,7 @@ end
 
 @inline ProbCircuit(circuit::PlainLogicCircuit) = PlainProbCircuit(circuit)
 
-import LogicCircuits: conjoin, disjoin, compile, vtree, vtree_safe # make available for extension
-
-"Get the vtree corresponding to the argument, or nothing if the node has no vtree"
-@inline vtree(n::StructProbCircuit) = n.vtree
-@inline vtree_safe(n::StructProbInnerNode) = vtree(n)
-@inline vtree_safe(n::StructProbLiteralNode) = vtree(n)
+import LogicCircuits: conjoin, disjoin, compile # make available for extension
 
 conjoin(arguments::Vector{<:StructProbCircuit};
         reuse=nothing, use_vtree=nothing) =
@@ -121,10 +121,6 @@ function conjoin(a1::StructProbCircuit,
                  reuse=nothing, use_vtree=nothing) 
     reuse isa StructProb⋀Node && reuse.prime == a1 && reuse.sub == a2 && return reuse
     !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
-    # if isconstantgate(a1) && isconstantgate(a2) && !(use_vtree isa Vtree)
-    #     # constant nodes don't have a vtree: resolve to a constant
-    #     return StructProbCircuit(istrue(a1) && istrue(a2))
-    # end
     !(use_vtree isa Vtree) && (use_vtree = find_inode(vtree_safe(a1), vtree_safe(a2)))
     return StructProb⋀Node(a1, a2, use_vtree)
 end
@@ -140,36 +136,23 @@ function disjoin(arguments::Vector{<:StructProbCircuit};
     @assert length(arguments) > 0
     reuse isa StructProb⋁Node && reuse.children == arguments && return reuse
     !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
-    # if all(isconstantgate, arguments) && !(use_vtree isa Vtree)
-    #     # constant nodes don't have a vtree: resolve to a constant
-    #     return StructProbCircuit(any(constant, arguments))
-    # end
     !(use_vtree isa Vtree) && (use_vtree = mapreduce(vtree_safe, lca, arguments))
     return StructProb⋁Node(arguments, use_vtree)
 end
 
-# Syntactic sugar for compile with a vtree
-(t::Tuple{<:Type,<:Vtree})(arg) = compile(t[1], t[2], arg)
-(t::Tuple{<:Vtree,<:Type})(arg) = compile(t[2], t[1], arg)
-
 # claim `StructProbCircuit` as the default `ProbCircuit` implementation that has a vtree
 compile(::Type{ProbCircuit}, args...) =
     compile(StructProbCircuit, args...)
 
-compile(vtree::Vtree, arg) = 
-    compile(ProbCircuit,vtree,arg)
-
 compile(::Type{<:StructProbCircuit}, ::Vtree, b::Bool) =
     compile(StructProbCircuit, b)
 
-"The unique splain tructured logical false constant" # act as a place holder in `condition`
-const structfalse = PlainStructFalseNode(nothing, 0)
+# act as a place holder in `condition`
+using LogicCircuits: structfalse
 
 compile(::Type{<:StructProbCircuit}, b::Bool) =
     b ? structtrue : structfalse
 
-
-
 compile(::Type{<:StructProbCircuit}, vtree::Vtree, l::Lit) =
     PlainStructLiteralNode(l,find_leaf(lit2var(l),vtree))
 
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index e9ec78e3..f02f5b58 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -17,6 +17,7 @@ include("Logistic/Logistic.jl")
 include("LoadSave/LoadSave.jl")
 include("Reasoning/Reasoning.jl")
 include("StructureLearner/StructureLearner.jl")
+include("Mixtures/Mixtures.jl")
 
 
 # USE CHILD MODULES (in order to re-export some functions)
@@ -25,5 +26,6 @@ include("StructureLearner/StructureLearner.jl")
 @reexport using .LoadSave
 @reexport using .Reasoning
 @reexport using .StructureLearner
+@reexport using .Mixtures
 
 end

From 495ed9a9633163a5830223a096456b778093f7a8 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Sun, 16 Aug 2020 19:01:49 -0700
Subject: [PATCH 050/131] [test] expectation: bypass precision problem

---
 test/Reasoning/expectation_test.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/test/Reasoning/expectation_test.jl b/test/Reasoning/expectation_test.jl
index 4f886b74..97d1cc8a 100644
--- a/test/Reasoning/expectation_test.jl
+++ b/test/Reasoning/expectation_test.jl
@@ -3,7 +3,7 @@ using LogicCircuits
 using ProbabilisticCircuits
 
 function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int)
-    EPS = 1e-7;
+    EPS = 1e-5;
     COUNT = size(data)[1]
     # Compute True expectation brute force
     true_exp = zeros(COUNT, CLASSES)

From cffa0f89b084daa3462cb283528582cd7b58cb42 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Sun, 16 Aug 2020 22:39:31 -0700
Subject: [PATCH 051/131] [feature] logistic circuit: gpu support

---
 Project.toml                                  |   2 +
 src/Logistic/Logistic.jl                      |   5 +-
 .../{parameters.jl => learn_parameters.jl}    |   0
 src/Logistic/parameter_circuit.jl             | 127 ++++++++++++++++++
 4 files changed, 132 insertions(+), 2 deletions(-)
 rename src/Logistic/{parameters.jl => learn_parameters.jl} (100%)
 create mode 100644 src/Logistic/parameter_circuit.jl

diff --git a/Project.toml b/Project.toml
index 3e0ef01a..368a92ad 100644
--- a/Project.toml
+++ b/Project.toml
@@ -5,6 +5,7 @@ version = "0.1.1"
 [deps]
 BlossomV = "6c721016-9dae-5d90-abf6-67daaccb2332"
 Clustering = "aaaa29a8-35af-508c-8bc3-b662a17a0fe5"
+CUDA = "052768ef-5323-5732-b1bb-66c8b64840ba"
 DataStructures = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8"
 LightGraphs = "093fc24a-ae57-5d10-9952-331d41423f4d"
 LogicCircuits = "a7847b3b-b7f1-4dd5-83c3-60e0aa0f8599"
@@ -25,6 +26,7 @@ MLDatasets = "eb30cadb-4394-5ae3-aed4-317e484a6458"
 [compat]
 BlossomV = "0.4"
 Clustering = "0.14"
+CUDA = "1.2"
 DataStructures = "0.17"
 LightGraphs = "1.3"
 LogicCircuits = "0.1.1"
diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index b09f76d0..cd45019e 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -5,8 +5,9 @@ using ..Utils
 
 include("logistic_nodes.jl")
 include("queries.jl")
-include("parameters.jl")
+include("parameter_circuit.jl")
+include("learn_parameters.jl")
 
-# TODO learning
+# TODO structure learning
 
 end
\ No newline at end of file
diff --git a/src/Logistic/parameters.jl b/src/Logistic/learn_parameters.jl
similarity index 100%
rename from src/Logistic/parameters.jl
rename to src/Logistic/learn_parameters.jl
diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
new file mode 100644
index 00000000..1a88c68a
--- /dev/null
+++ b/src/Logistic/parameter_circuit.jl
@@ -0,0 +1,127 @@
+using CUDA
+using LogicCircuits
+
+export ParameterCircuit, CuParameterCircuit
+export class_likelihood_and_flow, class_weights_and_flow
+
+# In a parameter circuit,
+# 1 is true, 2 is false
+const TRUE_BITS = Int32(1)
+const FALSE_BITS = Int32(2)
+# 3:nf+2 are nf positive literals
+# nf+3:2nf+2 are nf negative literals
+# 2nf+2:end are inner decision nodes
+
+struct ParameterCircuit
+    decisions::Matrix{Int32}
+    elements::Matrix{Int32}
+    parameters::Matrix{Float32}
+end
+
+
+ParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Integer) = begin
+    @assert is⋁gate(circuit)
+    decisions::Vector{Int32} = Vector{Int32}()
+    elements::Vector{Int32} = Vector{Int32}()
+    parameters::Vector{Float32} = Vector{Float32}()
+    num_decisions::Int32 = 2 * num_features + 2
+    num_elements::Int32 = 0
+    # num_parameters always equals num_elements
+    
+    f_con(n) = istrue(n) ? TRUE_BITS : FALSE_BITS
+    f_lit(n) = ispositive(n) ? Int32(2 + variable(n)) : Int32(2 + num_features + variable(n))
+    f_and(n, cs) = begin
+        @assert length(cs) == 2
+        Int32[cs[1], cs[2]]
+    end
+    f_or(n, cs) = begin
+        first_element = num_elements + 1
+        foreach(cs, eachrow(n.thetas)) do c, theta
+            @assert size(theta)[1] == nc
+            append!(parameters, theta)
+            num_elements += 1
+            if c isa Vector{Int32}
+                @assert length(c) == 2
+                push!(elements, c[1], c[2])
+            else
+                @assert c isa Int32
+                push!(elements, c, TRUE_BITS)
+            end
+        end
+        num_decisions += 1
+        push!(decisions, first_element, num_elements)
+        num_decisions
+    end
+    foldup_aggregate(circuit, f_con, f_lit, f_and, f_or, Union{Int32, Vector{Int32}})
+    decisions2 = reshape(decisions, 2, :)
+    elements2 = reshape(elements, 2, :) 
+    parameters_nc = reshape(parameters, nc, :)
+    @assert size(elements2)[2] == size(parameters_nc)[2]
+    return ParameterCircuit(decisions2, elements2, parameters_nc)
+end
+
+struct CuParameterCircuit
+    decisions::CuMatrix{Int32}
+    elements::CuMatrix{Int32}
+    parameters::CuMatrix{Float32}
+    CuParameterCircuit(parameter_circuit::ParameterCircuit) = new(CuMatrix(parameter_circuit.decisions), CuMatrix(parameter_circuit.elements), CuMatrix(parameter_circuit.parameters))
+end
+
+function class_likelihood_and_flow(parameter_circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
+    cw, flow = class_weights_and_flow(parameter_circuit, nc, data, reuse_up, reuse_down)
+    return @. 1.0 / (1.0 + exp(-cw)), flow
+end
+
+function class_weights_and_flow(parameter_circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
+    ne = num_examples(data)
+    nf = num_features(data)
+    nd = size(parameter_circuit.decisions)[2]
+    nl = 2 + 2 * nf
+    
+    v = value_matrix(CuMatrix, ne, nl + nd, reuse_up)
+    flow = if reuse_down isa CuArray{Float32} && size(reuse_down) == (ne, nl + nd)
+        reuse_down
+    else
+        CUDA.zeros(Float32, ne, nl + nd)
+    end
+    cw = CUDA.zeros(Float32, ne, nc)
+    
+    set_leaf_layer(v, data)
+    num_threads_per_block = 256
+    numblocks = ceil(Int, ne/num_threads_per_block)
+    CUDA.@sync begin
+        @cuda threads=num_threads_per_block blocks=numblocks class_weights_flow_kernel_cuda(cw, flow, v, parameter_circuit.decisions, parameter_circuit.elements, parameter_circuit.parameters, ne, nc, nd, nl)
+    end
+    return cw, flow
+end
+
+function class_weights_flow_kernel_cuda(cw, flow, v, decisions, elements, parameters, ne, nc, nd, nl)
+    evaluate_kernel_cuda(v, decisions, elements, ne, nd, nl)
+
+    index = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    stride = blockDim().x * gridDim().x
+    for j = index:stride:ne
+        flow[j, nl + nd] = v[j, nl + nd]
+        for i = nd:-1:1
+            first_elem = decisions[1, i]
+            last_elem = decisions[2, i]
+            n_up = v[j, nl + i]
+            if n_up > zero(Float32)
+                n_down = flow[j, nl + i]
+                for k = first_elem:last_elem
+                    e1 = elements[1, k]
+                    e2 = elements[2, k]
+                    c_up = v[j, e1] * v[j, e2]
+                    additional_flow = c_up / n_up * n_down
+                    flow[j, e1] += additional_flow
+                    flow[j, e2] += additional_flow
+                    for class = 1:nc
+                        cw[j, class] += additional_flow * parameters[class, k]
+                    end
+                end
+            end
+        end
+    end
+    
+    return nothing
+end
\ No newline at end of file

From 973ff15bd51fa9358c4af5d94bb7f64ab1303702 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 17 Aug 2020 01:08:09 -0700
Subject: [PATCH 052/131] [feature] logistic circuit: gpu w/ auto batch

---
 src/Logistic/parameter_circuit.jl | 193 ++++++++++++++++++++++++++++--
 1 file changed, 185 insertions(+), 8 deletions(-)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index 1a88c68a..c0ca6d7c 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -4,6 +4,10 @@ using LogicCircuits
 export ParameterCircuit, CuParameterCircuit
 export class_likelihood_and_flow, class_weights_and_flow
 
+export LayeredParameterCircuit, CuLayeredParameterCircuit
+export class_likelihood_and_flow2, class_weights_and_flow2
+
+
 # In a parameter circuit,
 # 1 is true, 2 is false
 const TRUE_BITS = Int32(1)
@@ -12,13 +16,13 @@ const FALSE_BITS = Int32(2)
 # nf+3:2nf+2 are nf negative literals
 # 2nf+2:end are inner decision nodes
 
+
 struct ParameterCircuit
     decisions::Matrix{Int32}
     elements::Matrix{Int32}
     parameters::Matrix{Float32}
 end
 
-
 ParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Integer) = begin
     @assert is⋁gate(circuit)
     decisions::Vector{Int32} = Vector{Int32}()
@@ -67,15 +71,15 @@ struct CuParameterCircuit
     CuParameterCircuit(parameter_circuit::ParameterCircuit) = new(CuMatrix(parameter_circuit.decisions), CuMatrix(parameter_circuit.elements), CuMatrix(parameter_circuit.parameters))
 end
 
-function class_likelihood_and_flow(parameter_circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
-    cw, flow = class_weights_and_flow(parameter_circuit, nc, data, reuse_up, reuse_down)
+function class_likelihood_and_flow(circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
+    cw, flow = class_weights_and_flow(circuit, nc, data, reuse_up, reuse_down)
     return @. 1.0 / (1.0 + exp(-cw)), flow
 end
 
-function class_weights_and_flow(parameter_circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
+function class_weights_and_flow(circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
     ne = num_examples(data)
     nf = num_features(data)
-    nd = size(parameter_circuit.decisions)[2]
+    nd = size(circuit.decisions)[2]
     nl = 2 + 2 * nf
     
     v = value_matrix(CuMatrix, ne, nl + nd, reuse_up)
@@ -90,12 +94,12 @@ function class_weights_and_flow(parameter_circuit::CuParameterCircuit, nc::Integ
     num_threads_per_block = 256
     numblocks = ceil(Int, ne/num_threads_per_block)
     CUDA.@sync begin
-        @cuda threads=num_threads_per_block blocks=numblocks class_weights_flow_kernel_cuda(cw, flow, v, parameter_circuit.decisions, parameter_circuit.elements, parameter_circuit.parameters, ne, nc, nd, nl)
+        @cuda threads=num_threads_per_block blocks=numblocks pass_down_and_sum_cw_layer_kernel_cuda(cw, flow, v, circuit.decisions, circuit.elements, circuit.parameters, ne, nc, nd, nl)
     end
     return cw, flow
 end
 
-function class_weights_flow_kernel_cuda(cw, flow, v, decisions, elements, parameters, ne, nc, nd, nl)
+function pass_down_and_sum_cw_layer_kernel_cuda(cw, flow, v, decisions, elements, parameters, ne, nc, nd, nl)
     evaluate_kernel_cuda(v, decisions, elements, ne, nd, nl)
 
     index = (blockIdx().x - 1) * blockDim().x + threadIdx().x
@@ -124,4 +128,177 @@ function class_weights_flow_kernel_cuda(cw, flow, v, decisions, elements, parame
     end
     
     return nothing
-end
\ No newline at end of file
+end
+
+
+
+struct ParameterLayer
+    decisions::Matrix{Int32}
+    elements::Matrix{Int32}
+    parameters::Matrix{Float32}
+end
+
+struct LayeredParameterCircuit
+    layers::Vector{ParameterLayer}
+end
+
+LayeredParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Integer) = begin
+    @assert is⋁gate(circuit)
+    decisions::Vector{Vector{Int32}} = Vector{Vector{Int32}}()
+    elements::Vector{Vector{Int32}} = Vector{Vector{Int32}}()
+    parameters::Vector{Vector{Float32}} = Vector{Vector{Float32}}()
+    num_decisions::Int32 = 2 * num_features + 2
+    num_elements::Vector{Int32} = Vector{Int32}()
+    # num_parameters always equals num_elements
+
+    ensure_layer(i) = begin
+        if length(decisions) < i
+            # add a new layer
+            push!(decisions, Int32[])
+            push!(elements, Int32[])
+            push!(parameters, Float32[])
+            push!(num_elements, 0)
+        end
+    end
+    
+    f_con(n) = LayeredDecisionId(0, istrue(n) ? TRUE_BITS : FALSE_BITS)
+    f_lit(n) = LayeredDecisionId(0, 
+        ispositive(n) ? Int32(2 + variable(n)) : Int32(2 + num_features + variable(n)))
+
+    f_and(n, cs) = begin
+        @assert length(cs) == 2
+        LayeredDecisionId[cs[1], cs[2]]
+    end
+    f_or(n, cs) = begin
+        num_decisions += 1
+        # determine layer
+        layer_id = zero(Int32)
+        for c in cs
+            if c isa Vector{LayeredDecisionId}
+                @assert length(c) == 2
+                layer_id = max(layer_id, c[1].layer_id, c[2].layer_id)
+            else
+                @assert c isa LayeredDecisionId
+                layer_id = max(layer_id, c.layer_id)
+            end
+        end
+        layer_id += 1
+        ensure_layer(layer_id)
+        first_element = num_elements[layer_id] + 1
+        foreach(cs, eachrow(n.thetas)) do c, theta
+            @assert size(theta)[1] == nc
+            append!(parameters[layer_id], theta)
+            num_elements[layer_id] += 1
+            if c isa Vector{LayeredDecisionId}
+                push!(elements[layer_id], c[1].decision_id, c[2].decision_id)
+            else
+                push!(elements[layer_id], c.decision_id, TRUE_BITS)
+            end
+        end
+        push!(decisions[layer_id], num_decisions, first_element, num_elements[layer_id])
+        LayeredDecisionId(layer_id, num_decisions)
+    end
+
+    foldup_aggregate(circuit, f_con, f_lit, f_and, f_or, 
+        Union{LayeredDecisionId,Vector{LayeredDecisionId}})
+    
+    layers = map(decisions, elements, parameters) do d, e, p
+        ParameterLayer(reshape(d, 3, :), reshape(e, 2, :), reshape(p, nc, :))
+    end
+    return LayeredParameterCircuit(layers)
+end
+
+struct CuParameterLayer
+    decisions::CuMatrix{Int32}
+    elements::CuMatrix{Int32}
+    parameters::CuMatrix{Float32}
+    CuParameterLayer(l::ParameterLayer) = new(CuMatrix(l.decisions), CuMatrix(l.elements), CuMatrix(l.parameters))
+end
+
+struct CuLayeredParameterCircuit
+    layers::Vector{CuParameterLayer}
+    CuLayeredParameterCircuit(l::LayeredParameterCircuit) = new(map(CuParameterLayer, l.layers))
+end
+
+num_decisions(l::CuParameterLayer) = size(l.decisions)[2]
+num_decisions(l::CuLayeredParameterCircuit) = sum(num_decisions, l.layers)
+
+function class_likelihood_and_flow2(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
+    cw, flow = class_weights_and_flow2(circuit, nc, data, reuse_up, reuse_down)
+    return @. 1.0 / (1.0 + exp(-cw)), flow
+end
+
+function class_weights_and_flow2(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
+    ne = num_examples(data)
+    nf = num_features(data)
+    nd = num_decisions(circuit)
+    nl = 2 + 2 * nf
+    v = value_matrix(CuMatrix, ne, nl + nd, reuse_up)
+    set_leaf_layer(v, data)
+    
+    dec_per_thread = 8
+    CUDA.@sync for layer in circuit.layers
+        ndl = num_decisions(layer)
+        num_threads = balance_threads(ne, ndl / dec_per_thread, 8)
+        num_blocks = (ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)) 
+        @cuda threads=num_threads blocks=num_blocks evaluate_layer_kernel_cuda2(v, layer.decisions, layer.elements)
+    end
+
+    flow = if reuse_down isa CuArray{Float32} && size(reuse_down) == (ne, nl + nd)
+        reuse_down .= zero(Float32)
+        reuse_down
+    else
+        CUDA.zeros(Float32, ne, nl + nd)
+    end
+    flow[:,end] .= v[:,end] # set flow at root
+    cw = CUDA.zeros(Float32, ne, nc) # initialize class_weights
+    
+    dec_per_thread = 4
+    CUDA.@sync for layer in Iterators.reverse(circuit.layers)
+        ndl = num_decisions(layer)
+        num_threads = balance_threads(ne, ndl / dec_per_thread, 8)
+        num_blocks = (ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)) 
+        @cuda threads=num_threads blocks=num_blocks pass_down_and_sum_cw_layer_kernel_cuda2(cw, flow, v, layer.decisions, layer.elements, layer.parameters)
+    end
+    
+    return cw, flow
+end
+
+function pass_down_and_sum_cw_layer_kernel_cuda2(cw, flow, v, decisions, elements, parameters)
+    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+    stride_x = blockDim().x * gridDim().x
+    stride_y = blockDim().y * gridDim().y
+    ne, nc = size(cw)
+    _, num_decisions = size(decisions)
+    
+    for j = index_x:stride_x:ne
+        for i = index_y:stride_y:num_decisions
+            decision_id = @inbounds decisions[1, i]
+            first_elem = @inbounds decisions[2, i]
+            last_elem = @inbounds decisions[3, i]
+            n_up = @inbounds v[j, decision_id]
+            if n_up > zero(Float32)
+                n_down = @inbounds flow[j, decision_id]
+                for e = first_elem:last_elem
+                    e1 = @inbounds elements[1, e]
+                    e2 = @inbounds elements[2, e]
+                    c_up = @inbounds (v[j, e1] * v[j, e2])
+                    additional_flow = c_up / n_up * n_down
+                    # following needs to be memory safe
+                    CUDA.@atomic flow[j, e1] += additional_flow #atomic is automatically inbounds
+                    CUDA.@atomic flow[j, e2] += additional_flow #atomic is automatically inbounds
+                    for class=1:nc
+                        CUDA.@atomic cw[j, class] += additional_flow * parameters[class, e]
+                    end
+                end
+            end
+        end
+    end
+    
+    return nothing
+end
+
+
+
+# TODO; paramter learning
\ No newline at end of file

From d8822530fb34e30d95811880e53858529d184b66 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 17 Aug 2020 01:19:19 -0700
Subject: [PATCH 053/131] [test] expectation: bypass precision problem

---
 test/Reasoning/expectation_test.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/test/Reasoning/expectation_test.jl b/test/Reasoning/expectation_test.jl
index 97d1cc8a..8959c381 100644
--- a/test/Reasoning/expectation_test.jl
+++ b/test/Reasoning/expectation_test.jl
@@ -36,7 +36,7 @@ function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data
 end
 
 function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int, moment::Int)
-    EPS = 1e-7;
+    EPS = 1e-5;
     COUNT = size(data)[1]
     # Compute True moment brute force
     true_mom = zeros(COUNT, CLASSES)

From 6eccc2f1a3fb393af0696e2695bef46748688237 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 17 Aug 2020 04:32:41 -0700
Subject: [PATCH 054/131] [refactor] logistic circuits: reuse bit_circuit

---
 src/Logistic/parameter_circuit.jl | 241 ++++++------------------------
 1 file changed, 44 insertions(+), 197 deletions(-)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index c0ca6d7c..93959780 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -1,145 +1,17 @@
 using CUDA
 using LogicCircuits
 
-export ParameterCircuit, CuParameterCircuit
-export class_likelihood_and_flow, class_weights_and_flow
-
 export LayeredParameterCircuit, CuLayeredParameterCircuit
-export class_likelihood_and_flow2, class_weights_and_flow2
-
+export class_likelihood_and_flow, class_weights_and_flow
 
-# In a parameter circuit,
+# in a parameter circuit
 # 1 is true, 2 is false
-const TRUE_BITS = Int32(1)
-const FALSE_BITS = Int32(2)
-# 3:nf+2 are nf positive literals
-# nf+3:2nf+2 are nf negative literals
-# 2nf+2:end are inner decision nodes
-
-
-struct ParameterCircuit
-    decisions::Matrix{Int32}
-    elements::Matrix{Int32}
-    parameters::Matrix{Float32}
-end
-
-ParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Integer) = begin
-    @assert is⋁gate(circuit)
-    decisions::Vector{Int32} = Vector{Int32}()
-    elements::Vector{Int32} = Vector{Int32}()
-    parameters::Vector{Float32} = Vector{Float32}()
-    num_decisions::Int32 = 2 * num_features + 2
-    num_elements::Int32 = 0
-    # num_parameters always equals num_elements
-    
-    f_con(n) = istrue(n) ? TRUE_BITS : FALSE_BITS
-    f_lit(n) = ispositive(n) ? Int32(2 + variable(n)) : Int32(2 + num_features + variable(n))
-    f_and(n, cs) = begin
-        @assert length(cs) == 2
-        Int32[cs[1], cs[2]]
-    end
-    f_or(n, cs) = begin
-        first_element = num_elements + 1
-        foreach(cs, eachrow(n.thetas)) do c, theta
-            @assert size(theta)[1] == nc
-            append!(parameters, theta)
-            num_elements += 1
-            if c isa Vector{Int32}
-                @assert length(c) == 2
-                push!(elements, c[1], c[2])
-            else
-                @assert c isa Int32
-                push!(elements, c, TRUE_BITS)
-            end
-        end
-        num_decisions += 1
-        push!(decisions, first_element, num_elements)
-        num_decisions
-    end
-    foldup_aggregate(circuit, f_con, f_lit, f_and, f_or, Union{Int32, Vector{Int32}})
-    decisions2 = reshape(decisions, 2, :)
-    elements2 = reshape(elements, 2, :) 
-    parameters_nc = reshape(parameters, nc, :)
-    @assert size(elements2)[2] == size(parameters_nc)[2]
-    return ParameterCircuit(decisions2, elements2, parameters_nc)
-end
-
-struct CuParameterCircuit
-    decisions::CuMatrix{Int32}
-    elements::CuMatrix{Int32}
-    parameters::CuMatrix{Float32}
-    CuParameterCircuit(parameter_circuit::ParameterCircuit) = new(CuMatrix(parameter_circuit.decisions), CuMatrix(parameter_circuit.elements), CuMatrix(parameter_circuit.parameters))
-end
-
-function class_likelihood_and_flow(circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
-    cw, flow = class_weights_and_flow(circuit, nc, data, reuse_up, reuse_down)
-    return @. 1.0 / (1.0 + exp(-cw)), flow
-end
-
-function class_weights_and_flow(circuit::CuParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
-    ne = num_examples(data)
-    nf = num_features(data)
-    nd = size(circuit.decisions)[2]
-    nl = 2 + 2 * nf
-    
-    v = value_matrix(CuMatrix, ne, nl + nd, reuse_up)
-    flow = if reuse_down isa CuArray{Float32} && size(reuse_down) == (ne, nl + nd)
-        reuse_down
-    else
-        CUDA.zeros(Float32, ne, nl + nd)
-    end
-    cw = CUDA.zeros(Float32, ne, nc)
-    
-    set_leaf_layer(v, data)
-    num_threads_per_block = 256
-    numblocks = ceil(Int, ne/num_threads_per_block)
-    CUDA.@sync begin
-        @cuda threads=num_threads_per_block blocks=numblocks pass_down_and_sum_cw_layer_kernel_cuda(cw, flow, v, circuit.decisions, circuit.elements, circuit.parameters, ne, nc, nd, nl)
-    end
-    return cw, flow
-end
-
-function pass_down_and_sum_cw_layer_kernel_cuda(cw, flow, v, decisions, elements, parameters, ne, nc, nd, nl)
-    evaluate_kernel_cuda(v, decisions, elements, ne, nd, nl)
-
-    index = (blockIdx().x - 1) * blockDim().x + threadIdx().x
-    stride = blockDim().x * gridDim().x
-    for j = index:stride:ne
-        flow[j, nl + nd] = v[j, nl + nd]
-        for i = nd:-1:1
-            first_elem = decisions[1, i]
-            last_elem = decisions[2, i]
-            n_up = v[j, nl + i]
-            if n_up > zero(Float32)
-                n_down = flow[j, nl + i]
-                for k = first_elem:last_elem
-                    e1 = elements[1, k]
-                    e2 = elements[2, k]
-                    c_up = v[j, e1] * v[j, e2]
-                    additional_flow = c_up / n_up * n_down
-                    flow[j, e1] += additional_flow
-                    flow[j, e2] += additional_flow
-                    for class = 1:nc
-                        cw[j, class] += additional_flow * parameters[class, k]
-                    end
-                end
-            end
-        end
-    end
-    
-    return nothing
-end
-
-
-
-struct ParameterLayer
-    decisions::Matrix{Int32}
-    elements::Matrix{Int32}
-    parameters::Matrix{Float32}
-end
+const TRUE_ID = Int32(1)
+const FALSE_ID = Int32(2)
 
 struct LayeredParameterCircuit
-    layers::Vector{ParameterLayer}
+    layered_circuit::LayeredBitCircuit
+    layered_parameters::Vector{Matrix{Float32}}
 end
 
 LayeredParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Integer) = begin
@@ -161,7 +33,7 @@ LayeredParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Int
         end
     end
     
-    f_con(n) = LayeredDecisionId(0, istrue(n) ? TRUE_BITS : FALSE_BITS)
+    f_con(n) = LayeredDecisionId(0, istrue(n) ? TRUE_ID : FALSE_ID)
     f_lit(n) = LayeredDecisionId(0, 
         ispositive(n) ? Int32(2 + variable(n)) : Int32(2 + num_features + variable(n)))
 
@@ -192,7 +64,7 @@ LayeredParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Int
             if c isa Vector{LayeredDecisionId}
                 push!(elements[layer_id], c[1].decision_id, c[2].decision_id)
             else
-                push!(elements[layer_id], c.decision_id, TRUE_BITS)
+                push!(elements[layer_id], c.decision_id, TRUE_ID)
             end
         end
         push!(decisions[layer_id], num_decisions, first_element, num_elements[layer_id])
@@ -202,69 +74,55 @@ LayeredParameterCircuit(circuit::LogisticCircuit, nc::Integer, num_features::Int
     foldup_aggregate(circuit, f_con, f_lit, f_and, f_or, 
         Union{LayeredDecisionId,Vector{LayeredDecisionId}})
     
-    layers = map(decisions, elements, parameters) do d, e, p
-        ParameterLayer(reshape(d, 3, :), reshape(e, 2, :), reshape(p, nc, :))
+    circuit_layers = map(decisions, elements) do d, e
+        Layer(reshape(d, 3, :), reshape(e, 2, :))
     end
-    return LayeredParameterCircuit(layers)
-end
-
-struct CuParameterLayer
-    decisions::CuMatrix{Int32}
-    elements::CuMatrix{Int32}
-    parameters::CuMatrix{Float32}
-    CuParameterLayer(l::ParameterLayer) = new(CuMatrix(l.decisions), CuMatrix(l.elements), CuMatrix(l.parameters))
+    parameter_layers = map(parameters) do p
+        reshape(p, nc, :)
+    end
+    return LayeredParameterCircuit(LayeredBitCircuit(circuit_layers), parameter_layers)
 end
 
 struct CuLayeredParameterCircuit
-    layers::Vector{CuParameterLayer}
-    CuLayeredParameterCircuit(l::LayeredParameterCircuit) = new(map(CuParameterLayer, l.layers))
+    layered_circuit::CuLayeredBitCircuit
+    layered_parameters::Vector{CuMatrix{Float32}}
+    CuLayeredParameterCircuit(l::LayeredParameterCircuit) = new(CuLayeredBitCircuit(l.layered_circuit), map(CuMatrix, l.layered_parameters))
 end
 
-num_decisions(l::CuParameterLayer) = size(l.decisions)[2]
-num_decisions(l::CuLayeredParameterCircuit) = sum(num_decisions, l.layers)
-
-function class_likelihood_and_flow2(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
-    cw, flow = class_weights_and_flow2(circuit, nc, data, reuse_up, reuse_down)
+function class_likelihood_and_flow(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cw=nothing)
+    cw, flow = class_weights_and_flow(circuit, nc, data, reuse_up, reuse_down, reuse_cw)
     return @. 1.0 / (1.0 + exp(-cw)), flow
 end
 
-function class_weights_and_flow2(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing)
-    ne = num_examples(data)
-    nf = num_features(data)
-    nd = num_decisions(circuit)
-    nl = 2 + 2 * nf
-    v = value_matrix(CuMatrix, ne, nl + nd, reuse_up)
-    set_leaf_layer(v, data)
-    
-    dec_per_thread = 8
-    CUDA.@sync for layer in circuit.layers
-        ndl = num_decisions(layer)
-        num_threads = balance_threads(ne, ndl / dec_per_thread, 8)
-        num_blocks = (ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)) 
-        @cuda threads=num_threads blocks=num_blocks evaluate_layer_kernel_cuda2(v, layer.decisions, layer.elements)
-    end
+function class_weights_and_flow(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cw=nothing)
+    _, edge_flow, _ = compute_flows2(circuit.layered_circuit, data, reuse_up, reuse_down)
+    cw = calculate_class_weights(circuit, nc, data, edge_flow, reuse_cw)
+    return cw, edge_flow
+end
 
-    flow = if reuse_down isa CuArray{Float32} && size(reuse_down) == (ne, nl + nd)
-        reuse_down .= zero(Float32)
-        reuse_down
+function calculate_class_weights(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, flow, reuse_cw=nothing)
+    ne = num_examples(data)
+    cw = if reuse_cw isa CuMatrix{Float32} && size(reuse_cw) == (ne, nc)
+        reuse_cw .= zero(Float32)
+        reuse_cw
     else
-        CUDA.zeros(Float32, ne, nl + nd)
+        CUDA.zeros(Float32, ne, nc)
     end
-    flow[:,end] .= v[:,end] # set flow at root
-    cw = CUDA.zeros(Float32, ne, nc) # initialize class_weights
-    
-    dec_per_thread = 4
-    CUDA.@sync for layer in Iterators.reverse(circuit.layers)
-        ndl = num_decisions(layer)
+
+    dec_per_thread = 8
+    CUDA.@sync for i = 1:length(circuit.layered_circuit.layers)
+        circuit_layer = circuit.layered_circuit.layers[i]
+        parameter_layer = circuit.layered_parameters[i]
+        ndl = num_decisions(circuit_layer)
         num_threads = balance_threads(ne, ndl / dec_per_thread, 8)
         num_blocks = (ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)) 
-        @cuda threads=num_threads blocks=num_blocks pass_down_and_sum_cw_layer_kernel_cuda2(cw, flow, v, layer.decisions, layer.elements, layer.parameters)
+        @cuda threads=num_threads blocks=num_blocks calculate_class_weights_layer_kernel_cuda(cw, flow, circuit_layer.decisions, parameter_layer)
     end
     
-    return cw, flow
+    return cw
 end
 
-function pass_down_and_sum_cw_layer_kernel_cuda2(cw, flow, v, decisions, elements, parameters)
+function calculate_class_weights_layer_kernel_cuda(cw, flow, decisions, parameters)
     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
     index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
     stride_x = blockDim().x * gridDim().x
@@ -274,23 +132,12 @@ function pass_down_and_sum_cw_layer_kernel_cuda2(cw, flow, v, decisions, element
     
     for j = index_x:stride_x:ne
         for i = index_y:stride_y:num_decisions
-            decision_id = @inbounds decisions[1, i]
             first_elem = @inbounds decisions[2, i]
             last_elem = @inbounds decisions[3, i]
-            n_up = @inbounds v[j, decision_id]
-            if n_up > zero(Float32)
-                n_down = @inbounds flow[j, decision_id]
-                for e = first_elem:last_elem
-                    e1 = @inbounds elements[1, e]
-                    e2 = @inbounds elements[2, e]
-                    c_up = @inbounds (v[j, e1] * v[j, e2])
-                    additional_flow = c_up / n_up * n_down
-                    # following needs to be memory safe
-                    CUDA.@atomic flow[j, e1] += additional_flow #atomic is automatically inbounds
-                    CUDA.@atomic flow[j, e2] += additional_flow #atomic is automatically inbounds
-                    for class=1:nc
-                        CUDA.@atomic cw[j, class] += additional_flow * parameters[class, e]
-                    end
+            for e = first_elem:last_elem
+                # following needs to be memory safe
+                for class=1:nc
+                    CUDA.@atomic cw[j, class] += flow[j, e] * parameters[class, e] #atomic is automatically inbounds
                 end
             end
         end
@@ -301,4 +148,4 @@ end
 
 
 
-# TODO; paramter learning
\ No newline at end of file
+# TODO; parameter learning
\ No newline at end of file

From 7e6ffead080b316b7d3ad2d01178f419cd5326ec Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 17 Aug 2020 07:10:19 -0700
Subject: [PATCH 055/131] [fix] parameter_circuit: edge flow

---
 src/Logistic/parameter_circuit.jl | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index 93959780..974e34e0 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -2,7 +2,7 @@ using CUDA
 using LogicCircuits
 
 export LayeredParameterCircuit, CuLayeredParameterCircuit
-export class_likelihood_and_flow, class_weights_and_flow
+export class_likelihood, class_weights
 
 # in a parameter circuit
 # 1 is true, 2 is false
@@ -89,15 +89,15 @@ struct CuLayeredParameterCircuit
     CuLayeredParameterCircuit(l::LayeredParameterCircuit) = new(CuLayeredBitCircuit(l.layered_circuit), map(CuMatrix, l.layered_parameters))
 end
 
-function class_likelihood_and_flow(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cw=nothing)
-    cw, flow = class_weights_and_flow(circuit, nc, data, reuse_up, reuse_down, reuse_cw)
-    return @. 1.0 / (1.0 + exp(-cw)), flow
+function class_likelihood(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cp=nothing)
+    cw, node_flow, edge_flow, v = class_weights(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
+    return @. 1.0 / (1.0 + exp(-cw)), node_flow, edge_flow, v
 end
 
-function class_weights_and_flow(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cw=nothing)
-    _, edge_flow, _ = compute_flows2(circuit.layered_circuit, data, reuse_up, reuse_down)
+function class_weights(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cw=nothing)
+    node_flow, edge_flow, v = compute_flows2(circuit.layered_circuit, data, reuse_up, reuse_down)
     cw = calculate_class_weights(circuit, nc, data, edge_flow, reuse_cw)
-    return cw, edge_flow
+    return cw, node_flow, edge_flow, v
 end
 
 function calculate_class_weights(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, flow, reuse_cw=nothing)
@@ -112,11 +112,12 @@ function calculate_class_weights(circuit::CuLayeredParameterCircuit, nc::Integer
     dec_per_thread = 8
     CUDA.@sync for i = 1:length(circuit.layered_circuit.layers)
         circuit_layer = circuit.layered_circuit.layers[i]
+        flow_layer = flow[i]
         parameter_layer = circuit.layered_parameters[i]
         ndl = num_decisions(circuit_layer)
         num_threads = balance_threads(ne, ndl / dec_per_thread, 8)
         num_blocks = (ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)) 
-        @cuda threads=num_threads blocks=num_blocks calculate_class_weights_layer_kernel_cuda(cw, flow, circuit_layer.decisions, parameter_layer)
+        @cuda threads=num_threads blocks=num_blocks calculate_class_weights_layer_kernel_cuda(cw, flow_layer, circuit_layer.decisions, parameter_layer)
     end
     
     return cw

From 1e6d67ab72c3b3fa64b22d64090f8f5fef6bee98 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 17 Aug 2020 14:37:41 -0700
Subject: [PATCH 056/131] [feature] logistic circuit: learn parameter w/ gpu

---
 src/Logistic/parameter_circuit.jl | 71 ++++++++++++++++++++++++++++---
 1 file changed, 65 insertions(+), 6 deletions(-)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index 974e34e0..2cab8367 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -3,6 +3,7 @@ using LogicCircuits
 
 export LayeredParameterCircuit, CuLayeredParameterCircuit
 export class_likelihood, class_weights
+export one_hot, learn_parameters, update_parameters
 
 # in a parameter circuit
 # 1 is true, 2 is false
@@ -91,7 +92,8 @@ end
 
 function class_likelihood(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cp=nothing)
     cw, node_flow, edge_flow, v = class_weights(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
-    return @. 1.0 / (1.0 + exp(-cw)), node_flow, edge_flow, v
+    one = Float32(1.0)
+    return @. one / (one + exp(-cw)), node_flow, edge_flow, v
 end
 
 function class_weights(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cw=nothing)
@@ -109,14 +111,14 @@ function calculate_class_weights(circuit::CuLayeredParameterCircuit, nc::Integer
         CUDA.zeros(Float32, ne, nc)
     end
 
-    dec_per_thread = 8
+    dec_per_thread = 4
     CUDA.@sync for i = 1:length(circuit.layered_circuit.layers)
         circuit_layer = circuit.layered_circuit.layers[i]
         flow_layer = flow[i]
         parameter_layer = circuit.layered_parameters[i]
         ndl = num_decisions(circuit_layer)
         num_threads = balance_threads(ne, ndl / dec_per_thread, 8)
-        num_blocks = (ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)) 
+        num_blocks = ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)
         @cuda threads=num_threads blocks=num_blocks calculate_class_weights_layer_kernel_cuda(cw, flow_layer, circuit_layer.decisions, parameter_layer)
     end
     
@@ -136,9 +138,9 @@ function calculate_class_weights_layer_kernel_cuda(cw, flow, decisions, paramete
             first_elem = @inbounds decisions[2, i]
             last_elem = @inbounds decisions[3, i]
             for e = first_elem:last_elem
-                # following needs to be memory safe
+                # following are memory safe
                 for class=1:nc
-                    CUDA.@atomic cw[j, class] += flow[j, e] * parameters[class, e] #atomic is automatically inbounds
+                    @inbounds cw[j, class] += @inbounds flow[j, e] * parameters[class, e] 
                 end
             end
         end
@@ -148,5 +150,62 @@ function calculate_class_weights_layer_kernel_cuda(cw, flow, decisions, paramete
 end
 
 
+function one_hot(labels::Vector, nc::Integer)    
+    ne = length(labels) 
+    one_hot_labels = zeros(Float32, ne, nc)
+    for (i, j) in enumerate(labels)
+        one_hot_labels[i, j + 1] = 1.0
+    end
+    one_hot_labels
+end
+
+function learn_parameters(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, labels::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cp=nothing, num_epochs=20, step_size=0.0001)
+    cp, node_flow, edge_flow, v = class_likelihood(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
+    update_parameters(circuit, labels, cp, edge_flow, step_size)
+    for _ = 2:num_epochs
+        cp, node_flow, edge_flow, v = class_likelihood(circuit, nc, data, v, (node_flow, edge_flow), cp)
+        update_parameters(circuit, labels, cp, edge_flow, step_size)
+    end
+    return nothing
+end
+
+function update_parameters(circuit::CuLayeredParameterCircuit, labels, cp, flow, step_size=0.0001)
+    _, nc = size(labels)
+    step_size = Float32(step_size)
+    class_per_thread = 1
+    CUDA.@sync for i = 1:length(circuit.layered_circuit.layers)
+        circuit_layer = circuit.layered_circuit.layers[i]
+        flow_layer = flow[i]
+        parameter_layer = circuit.layered_parameters[i]
+        ndl = num_decisions(circuit_layer)
+        num_threads = balance_threads(ndl, nc / class_per_thread, 8)
+        num_blocks = ceil(Int, ndl / num_threads[1]), ceil(Int, ndl / num_threads[2] / class_per_thread)
+        @cuda threads=num_threads blocks=num_blocks update_parameters_layer_kernel_cuda(labels, cp, flow_layer, circuit_layer.decisions, parameter_layer, step_size)
+    end
+    return nothing
+end
 
-# TODO; parameter learning
\ No newline at end of file
+function update_parameters_layer_kernel_cuda(labels, cp, flow, decisions, parameters, step_size)
+    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+    stride_x = blockDim().x * gridDim().x
+    stride_y = blockDim().y * gridDim().y
+    ne, nc = size(labels)
+    _, num_decisions = size(decisions)
+    
+    for class = index_y:stride_y:nc
+        for i = index_x:stride_x:num_decisions
+            first_elem = @inbounds decisions[2, i]
+            last_elem = @inbounds decisions[3, i]
+            for e = first_elem:last_elem
+                for j = 1:ne
+                    u = @inbounds flow[j, e] * (cp[j, class] - labels[j, class]) * step_size
+                    # following are memory safe
+                    @inbounds parameters[class, e] -= u 
+                end
+            end
+        end
+    end
+    
+    return nothing
+end
\ No newline at end of file

From 6c0c19a7320662d9dcc88df50e5cf5b4b87fabe9 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 17 Aug 2020 14:55:11 -0700
Subject: [PATCH 057/131] [fix] logistic circuit: memory safe

---
 src/Logistic/parameter_circuit.jl | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index 2cab8367..48b340e5 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -138,9 +138,9 @@ function calculate_class_weights_layer_kernel_cuda(cw, flow, decisions, paramete
             first_elem = @inbounds decisions[2, i]
             last_elem = @inbounds decisions[3, i]
             for e = first_elem:last_elem
-                # following are memory safe
+                # following needs to be memory safe
                 for class=1:nc
-                    @inbounds cw[j, class] += @inbounds flow[j, e] * parameters[class, e] 
+                    @CUDA.atomic cw[j, class] += flow[j, e] * parameters[class, e] # atomic is automatically inbounds
                 end
             end
         end

From 68f11feafa6d4bdd4161148a08d0295ab1dec34a Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Wed, 19 Aug 2020 22:10:16 -0500
Subject: [PATCH 058/131] [feature] logistic circuit: recover edge flow from v
 and node_flow

---
 src/Logistic/parameter_circuit.jl | 39 ++++++++++++++++++-------------
 1 file changed, 23 insertions(+), 16 deletions(-)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index 48b340e5..91da4bb7 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -91,18 +91,18 @@ struct CuLayeredParameterCircuit
 end
 
 function class_likelihood(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cp=nothing)
-    cw, node_flow, edge_flow, v = class_weights(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
+    cw, flow, v = class_weights(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
     one = Float32(1.0)
-    return @. one / (one + exp(-cw)), node_flow, edge_flow, v
+    return @. one / (one + exp(-cw)), flow, v
 end
 
 function class_weights(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cw=nothing)
-    node_flow, edge_flow, v = compute_flows2(circuit.layered_circuit, data, reuse_up, reuse_down)
-    cw = calculate_class_weights(circuit, nc, data, edge_flow, reuse_cw)
-    return cw, node_flow, edge_flow, v
+    flow, v = compute_flows2(circuit.layered_circuit, data, reuse_up, reuse_down)
+    cw = calculate_class_weights(circuit, nc, data, v, flow, reuse_cw)
+    return cw, flow, v
 end
 
-function calculate_class_weights(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, flow, reuse_cw=nothing)
+function calculate_class_weights(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, v, flow, reuse_cw=nothing)
     ne = num_examples(data)
     cw = if reuse_cw isa CuMatrix{Float32} && size(reuse_cw) == (ne, nc)
         reuse_cw .= zero(Float32)
@@ -114,18 +114,17 @@ function calculate_class_weights(circuit::CuLayeredParameterCircuit, nc::Integer
     dec_per_thread = 4
     CUDA.@sync for i = 1:length(circuit.layered_circuit.layers)
         circuit_layer = circuit.layered_circuit.layers[i]
-        flow_layer = flow[i]
         parameter_layer = circuit.layered_parameters[i]
         ndl = num_decisions(circuit_layer)
         num_threads = balance_threads(ne, ndl / dec_per_thread, 8)
         num_blocks = ceil(Int, ne / num_threads[1]), ceil(Int, ndl / num_threads[2] / dec_per_thread)
-        @cuda threads=num_threads blocks=num_blocks calculate_class_weights_layer_kernel_cuda(cw, flow_layer, circuit_layer.decisions, parameter_layer)
+        @cuda threads=num_threads blocks=num_blocks calculate_class_weights_layer_kernel_cuda(cw, v, flow, circuit_layer.decisions, circuit_layer.elements, parameter_layer)
     end
     
     return cw
 end
 
-function calculate_class_weights_layer_kernel_cuda(cw, flow, decisions, parameters)
+function calculate_class_weights_layer_kernel_cuda(cw, v, flow, decisions, elements, parameters)
     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
     index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
     stride_x = blockDim().x * gridDim().x
@@ -135,12 +134,21 @@ function calculate_class_weights_layer_kernel_cuda(cw, flow, decisions, paramete
     
     for j = index_x:stride_x:ne
         for i = index_y:stride_y:num_decisions
-            first_elem = @inbounds decisions[2, i]
-            last_elem = @inbounds decisions[3, i]
-            for e = first_elem:last_elem
-                # following needs to be memory safe
-                for class=1:nc
-                    @CUDA.atomic cw[j, class] += flow[j, e] * parameters[class, e] # atomic is automatically inbounds
+            decision_id = @inbounds decisions[1, i]
+            n_up = @inbounds v[j, decision_id]
+            if n_up > zero(Float32)
+                first_elem = @inbounds decisions[2, i]
+                last_elem = @inbounds decisions[3, i]
+                n_down = @inbounds flow[j, decision_id]
+                for e = first_elem:last_elem
+                    e1 = @inbounds elements[1,first_elem]
+                    e2 = @inbounds elements[2,first_elem]
+                    e_up = @inbounds (v[j, e1] * v[j, e2])
+                    edge_flow = e_up / n_up * n_down
+                    # following needs to be memory safe
+                    for class=1:nc
+                        @CUDA.atomic cw[j, class] += edge_flow * parameters[class, e] # atomic is automatically inbounds
+                    end
                 end
             end
         end
@@ -149,7 +157,6 @@ function calculate_class_weights_layer_kernel_cuda(cw, flow, decisions, paramete
     return nothing
 end
 
-
 function one_hot(labels::Vector, nc::Integer)    
     ne = length(labels) 
     one_hot_labels = zeros(Float32, ne, nc)

From c0f902031b8d89027aaa45f4d2e9c37a01644990 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 22 Aug 2020 13:55:15 -0500
Subject: [PATCH 059/131] BitCircuit-based parameter learning on CPU

---
 .gitignore                      |  3 +-
 Project.toml                    |  2 ++
 src/Probabilistic/parameters.jl | 58 +++++++++++++++++++++++++++++++++
 3 files changed, 62 insertions(+), 1 deletion(-)

diff --git a/.gitignore b/.gitignore
index 2ec4662b..b4bd018e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -10,4 +10,5 @@
 *.vscode
 **checkpoint.ipynb
 *Manifest.toml
-docs/build/
\ No newline at end of file
+docs/build/
+scratch/
\ No newline at end of file
diff --git a/Project.toml b/Project.toml
index cb10d139..5f58ad73 100644
--- a/Project.toml
+++ b/Project.toml
@@ -4,11 +4,13 @@ version = "0.1.1"
 
 [deps]
 BlossomV = "6c721016-9dae-5d90-abf6-67daaccb2332"
+CUDA = "052768ef-5323-5732-b1bb-66c8b64840ba"
 Clustering = "aaaa29a8-35af-508c-8bc3-b662a17a0fe5"
 DataStructures = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8"
 LightGraphs = "093fc24a-ae57-5d10-9952-331d41423f4d"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 LogicCircuits = "a7847b3b-b7f1-4dd5-83c3-60e0aa0f8599"
+LoopVectorization = "bdcacae8-1622-11e9-2a5c-532679323890"
 MetaGraphs = "626554b9-1ddb-594c-aa3c-2596fe9399a5"
 Metis = "2679e427-3c69-5b7f-982b-ece356f1e94b"
 Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 87186cfa..9e24d7d6 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -1,5 +1,8 @@
 export estimate_parameters, uniform_parameters
+
 using StatsFuns: logsumexp
+using CUDA
+using LoopVectorization
 
 """
 Maximum likilihood estimation of parameters given data
@@ -24,6 +27,61 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     end
 end
 
+function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
+    @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
+    bc = BitCircuit(pc, data; reset=false) #TODO: avoid resetting bit, do it at the end when collecting results
+    log_params, node_flow, edge_flow = if isgpu(data)
+        error("todo")
+    else
+        estimate_parameters2_cpu(bc, pseudocount)
+    end
+    compute_values_flows(bc, data; node_flow, edge_flow)
+    log_params_cpu::Vector{Float64} = to_cpu(log_params)
+    foreach_reset(pc) do pn
+        if is⋁gate(pn)
+            if num_children(pn) == 1
+                pn.log_thetas .= 0.0
+            else
+                id = (pn.data::NodeId).node_id
+                @inbounds els_start = bc.nodes[1,id]
+                @inbounds els_end = bc.nodes[2,id]
+                @inbounds @views pn.log_thetas .= log_params_cpu[els_start:els_end]
+                @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
+                pn.log_thetas .-= logsumexp(pn.log_thetas) # normalize away any leftover error
+            end
+        end
+    end
+end
+
+function estimate_parameters2_cpu(bc, pseudocount)
+    # no need to synchronize, since each computation is unique to a decision node
+    node_counts::Vector{UInt} = Vector{UInt}(undef, num_nodes(bc))
+    log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
+
+    @inline function node_flow_cpu(flows, values, dec_id, els_start, els_end, locks)
+        if els_start != els_end
+            @inbounds node_counts[dec_id] = sum(1:size(flows,1)) do i
+                count_ones(flows[i, dec_id]) 
+            end
+        end
+        nothing
+    end
+    
+    @inline function edge_flow_cpu(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
+        log_theta = if els_start != els_end
+            edge_count = sum(1:size(flows,1)) do i
+                @inbounds count_ones(values[i, p] & values[i, s] & flows[i, dec_id]) 
+            end
+            log((edge_count+pseudocount/(els_end-els_start+1))/(node_counts[dec_id]+pseudocount))
+        else
+            zero(Float64)
+        end
+        @inbounds log_params[el_id] = log_theta
+        nothing
+    end
+
+    return (log_params, node_flow_cpu, edge_flow_cpu)
+end
 
 """
 Uniform distribution

From b97060c9a3e7e47dbb176d91ea70569425b5b5bb Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 23 Aug 2020 03:12:46 -0500
Subject: [PATCH 060/131] GPU parameter learning

---
 src/Probabilistic/parameters.jl | 71 ++++++++++++++++++++++++++-------
 1 file changed, 57 insertions(+), 14 deletions(-)

diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 9e24d7d6..7c705844 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -30,13 +30,13 @@ end
 function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
     bc = BitCircuit(pc, data; reset=false) #TODO: avoid resetting bit, do it at the end when collecting results
-    log_params, node_flow, edge_flow = if isgpu(data)
-        error("todo")
+    on_node, on_edge, get_params = if isgpu(data)
+        estimate_parameters2_gpu(bc, pseudocount)
     else
         estimate_parameters2_cpu(bc, pseudocount)
     end
-    compute_values_flows(bc, data; node_flow, edge_flow)
-    log_params_cpu::Vector{Float64} = to_cpu(log_params)
+    compute_values_flows(bc, data; on_node, on_edge)
+    params::Vector{Float64} = get_params()
     foreach_reset(pc) do pn
         if is⋁gate(pn)
             if num_children(pn) == 1
@@ -45,12 +45,13 @@ function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
                 id = (pn.data::NodeId).node_id
                 @inbounds els_start = bc.nodes[1,id]
                 @inbounds els_end = bc.nodes[2,id]
-                @inbounds @views pn.log_thetas .= log_params_cpu[els_start:els_end]
-                @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
+                @inbounds @views pn.log_thetas .= params[els_start:els_end]
+                @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally: $(sum(exp.(pn.log_thetas))); $(pn.log_thetas)"
                 pn.log_thetas .-= logsumexp(pn.log_thetas) # normalize away any leftover error
             end
         end
     end
+    params
 end
 
 function estimate_parameters2_cpu(bc, pseudocount)
@@ -58,7 +59,7 @@ function estimate_parameters2_cpu(bc, pseudocount)
     node_counts::Vector{UInt} = Vector{UInt}(undef, num_nodes(bc))
     log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
 
-    @inline function node_flow_cpu(flows, values, dec_id, els_start, els_end, locks)
+    @inline function on_node(flows, values, dec_id, els_start, els_end, locks)
         if els_start != els_end
             @inbounds node_counts[dec_id] = sum(1:size(flows,1)) do i
                 count_ones(flows[i, dec_id]) 
@@ -67,20 +68,62 @@ function estimate_parameters2_cpu(bc, pseudocount)
         nothing
     end
     
-    @inline function edge_flow_cpu(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
-        log_theta = if els_start != els_end
+    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
+        if els_start != els_end
             edge_count = sum(1:size(flows,1)) do i
                 @inbounds count_ones(values[i, p] & values[i, s] & flows[i, dec_id]) 
             end
-            log((edge_count+pseudocount/(els_end-els_start+1))/(node_counts[dec_id]+pseudocount))
-        else
-            zero(Float64)
+            # TODO do the log before the division?
+            log_param = log((edge_count+pseudocount/(els_end-els_start+1))
+                            /(node_counts[dec_id]+pseudocount))
+            @inbounds log_params[el_id] = log_param
+        end
+        nothing
+    end
+
+    get_params() = log_params
+
+    return (on_node, on_edge, get_params)
+end
+
+function estimate_parameters2_gpu(bc, pseudocount)
+    node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
+    edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
+    params::CuVector{Float64} = CuVector{Float64}(undef, num_elements(bc))
+    params .= -100
+    # need to manually cudaconvert closure variables
+    node_counts_device = CUDA.cudaconvert(node_counts)
+    edge_counts_device = CUDA.cudaconvert(edge_counts)
+    params_device = CUDA.cudaconvert(params)
+    
+    @inline function on_node(flows, values, dec_id, els_start, els_end, ex_id)
+        if els_start != els_end
+            @inbounds c::Int32 = count_ones(flows[ex_id, dec_id]) # cast for @atomic to be happy
+            CUDA.@atomic node_counts_device[dec_id] += c
+        end
+        if isone(ex_id) # only do this once
+            for i=els_start:els_end
+                params_device[i] = pseudocount/(els_end-els_start+1)
+            end
+        end
+        nothing
+    end
+    
+    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
+        if els_start != els_end
+            c::Int32 = count_ones(edge_flow) # cast for @atomic to be happy
+            CUDA.@atomic edge_counts_device[el_id] += c
         end
-        @inbounds log_params[el_id] = log_theta
         nothing
     end
 
-    return (log_params, node_flow_cpu, edge_flow_cpu)
+    function get_params()
+        parent_counts = @views node_counts[bc.elements[1,:]]
+        params .= log.((params .+ edge_counts) ./ (parent_counts .+ pseudocount))
+        to_cpu(params)
+    end
+
+    return (on_node, on_edge, get_params)
 end
 
 """

From a0ac5c8af3473cc17a773d3f8055e802223460fb Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 23 Aug 2020 03:45:56 -0500
Subject: [PATCH 061/131] NodeId type annotation

---
 src/Probabilistic/parameters.jl | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 7c705844..42eeb4cb 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -42,7 +42,7 @@ function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
             if num_children(pn) == 1
                 pn.log_thetas .= 0.0
             else
-                id = (pn.data::NodeId).node_id
+                id = (pn.data::⋁NodeId).node_id
                 @inbounds els_start = bc.nodes[1,id]
                 @inbounds els_end = bc.nodes[2,id]
                 @inbounds @views pn.log_thetas .= params[els_start:els_end]
@@ -90,7 +90,6 @@ function estimate_parameters2_gpu(bc, pseudocount)
     node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
     edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
     params::CuVector{Float64} = CuVector{Float64}(undef, num_elements(bc))
-    params .= -100
     # need to manually cudaconvert closure variables
     node_counts_device = CUDA.cudaconvert(node_counts)
     edge_counts_device = CUDA.cudaconvert(edge_counts)

From 2fcc73838d02f8e9058a2d13a858c6f7edec6760 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 23 Aug 2020 20:06:21 -0500
Subject: [PATCH 062/131] minor changes

---
 src/Probabilistic/parameters.jl | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 42eeb4cb..50fab9ea 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -29,7 +29,7 @@ end
 
 function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
-    bc = BitCircuit(pc, data; reset=false) #TODO: avoid resetting bit, do it at the end when collecting results
+    bc = BitCircuit(pc, data; reset=false)
     on_node, on_edge, get_params = if isgpu(data)
         estimate_parameters2_gpu(bc, pseudocount)
     else
@@ -40,7 +40,7 @@ function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
     foreach_reset(pc) do pn
         if is⋁gate(pn)
             if num_children(pn) == 1
-                pn.log_thetas .= 0.0
+                pn.log_thetas .= zero(Float64)
             else
                 id = (pn.data::⋁NodeId).node_id
                 @inbounds els_start = bc.nodes[1,id]
@@ -118,7 +118,7 @@ function estimate_parameters2_gpu(bc, pseudocount)
 
     function get_params()
         parent_counts = @views node_counts[bc.elements[1,:]]
-        params .= log.((params .+ edge_counts) ./ (parent_counts .+ pseudocount))
+        params .= log.(params .+ edge_counts) .- log.(parent_counts .+ pseudocount)
         to_cpu(params)
     end
 

From 38da4f7294908abeb16b77ece2cc61921e04dae2 Mon Sep 17 00:00:00 2001
From: Pasha Khosravi <khosravipasha@gmail.com>
Date: Thu, 27 Aug 2020 06:54:51 -0700
Subject: [PATCH 063/131] fix test build

---
 test/Project.toml | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/test/Project.toml b/test/Project.toml
index 90671629..37e12102 100644
--- a/test/Project.toml
+++ b/test/Project.toml
@@ -1,6 +1,12 @@
 [deps]
+DataFrames = "a93c6f00-e57d-5684-b7b6-d8193f3e46c0"
 Distributed = "8ba89e20-285c-5b6f-9357-94700520ee1b"
 Jive = "ba5e3d4b-8524-549f-bc71-e76ad9e9deed"
 Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
+
+[compat]
+DataFrames = "0.21"
+Jive = "0.2.10"
+julia = "1.5"
\ No newline at end of file

From b82163c078e467df5a76fc9d85b1fc159d8b9e12 Mon Sep 17 00:00:00 2001
From: Pasha Khosravi <khosravipasha@gmail.com>
Date: Thu, 27 Aug 2020 07:11:52 -0700
Subject: [PATCH 064/131] add test deps

---
 test/Project.toml | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/test/Project.toml b/test/Project.toml
index 37e12102..8f317fa7 100644
--- a/test/Project.toml
+++ b/test/Project.toml
@@ -1,12 +1,14 @@
 [deps]
+CUDA = "052768ef-5323-5732-b1bb-66c8b64840ba"
 DataFrames = "a93c6f00-e57d-5684-b7b6-d8193f3e46c0"
 Distributed = "8ba89e20-285c-5b6f-9357-94700520ee1b"
 Jive = "ba5e3d4b-8524-549f-bc71-e76ad9e9deed"
+LogicCircuits = "a7847b3b-b7f1-4dd5-83c3-60e0aa0f8599"
 Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
 
 [compat]
 DataFrames = "0.21"
-Jive = "0.2.10"
-julia = "1.5"
\ No newline at end of file
+Jive = "0.2"
+julia = "1.5"

From 1c9ffeb466ce937c4a158a7dcb53db8945b44eb8 Mon Sep 17 00:00:00 2001
From: Pasha Khosravi <khosravipasha@gmail.com>
Date: Thu, 27 Aug 2020 07:24:53 -0700
Subject: [PATCH 065/131] fix test error

---
 test/structured_prob_nodes_tests.jl | 1 +
 1 file changed, 1 insertion(+)

diff --git a/test/structured_prob_nodes_tests.jl b/test/structured_prob_nodes_tests.jl
index 2947c9f5..984fa65b 100644
--- a/test/structured_prob_nodes_tests.jl
+++ b/test/structured_prob_nodes_tests.jl
@@ -1,6 +1,7 @@
 using Test
 using LogicCircuits
 using ProbabilisticCircuits
+using DataFrames: DataFrame
 
 
 @testset "structured probabilistic circuit nodes" begin

From 1ddd63f15d454fbccdc7db9c484109f4add1cdd4 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 29 Aug 2020 20:39:46 -0500
Subject: [PATCH 066/131] bugfix

---
 src/Probabilistic/parameters.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 50fab9ea..84dc0571 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -29,7 +29,7 @@ end
 
 function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
-    bc = BitCircuit(pc, data; reset=false)
+    bc = BitCircuit(pc, data; reset=false, on_gpu = isgpu(data))
     on_node, on_edge, get_params = if isgpu(data)
         estimate_parameters2_gpu(bc, pseudocount)
     else

From cfe5a6fc5624313f0e3a5b74b0bae084f85552a5 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 29 Aug 2020 21:03:46 -0500
Subject: [PATCH 067/131] temproarily remove broken code

---
 src/Logistic/queries.jl             |  42 +--
 src/Probabilistic/exp_flows.jl      | 398 +++++++++++++-------------
 src/Probabilistic/parameters.jl     |  28 +-
 src/Utils/misc.jl                   |   3 +-
 test/Logistic/logistic_tests.jl     |  48 ++--
 test/Probabilistic/queries_tests.jl | 424 ++++++++++++++--------------
 test/Reasoning/expectation_test.jl  | 284 ++++++++++---------
 test/StructureLearner/init_tests.jl |  67 +++--
 8 files changed, 647 insertions(+), 647 deletions(-)

diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 7c80e625..a89b4984 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -1,22 +1,24 @@
-export class_conditional_likelihood_per_instance
+#TODO: reinstate
 
-using ..Probabilistic: get_downflow, get_upflow
-"""
-Class Conditional Probability
-"""
-function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
-    compute_flows(lc, data)
-    likelihoods = zeros(num_examples(data), classes)
-    foreach(lc) do ln
-        if ln isa Logistic⋁Node
-            # For each class. orig.thetas is 2D so used eachcol
-            for (idx, thetaC) in enumerate(eachcol(ln.thetas))
-                foreach(children(ln), thetaC) do c, theta
-                    likelihoods[:, idx] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
-                end
-            end
-        end
-    end
-    likelihoods
-end
+# export class_conditional_likelihood_per_instance
+
+# using ..Probabilistic: get_downflow, get_upflow
+# """
+# Class Conditional Probability
+# """
+# function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
+#     compute_flows(lc, data)
+#     likelihoods = zeros(num_examples(data), classes)
+#     foreach(lc) do ln
+#         if ln isa Logistic⋁Node
+#             # For each class. orig.thetas is 2D so used eachcol
+#             for (idx, thetaC) in enumerate(eachcol(ln.thetas))
+#                 foreach(children(ln), thetaC) do c, theta
+#                     likelihoods[:, idx] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
+#                 end
+#             end
+#         end
+#     end
+#     likelihoods
+# end
 
diff --git a/src/Probabilistic/exp_flows.jl b/src/Probabilistic/exp_flows.jl
index 5dc4eac6..d356bdc3 100644
--- a/src/Probabilistic/exp_flows.jl
+++ b/src/Probabilistic/exp_flows.jl
@@ -1,217 +1,219 @@
-export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
-
-
-using StatsFuns: logsumexp
-
-# TODO move to LogicCircuits
-# TODO downflow struct
-using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
-
-"""
-Get upflow from logic circuit
-"""
-@inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
-@inline get_upflow(elems::UpDownFlow1) = elems.upflow
-@inline get_upflow(elems::UpFlow) = materialize(elems)
-
-"""
-Get the node/edge flow from logic circuit
-"""
-function get_downflow(n::LogicCircuit; root=nothing)::BitVector
-    downflow(x::UpDownFlow1) = x.downflow
-    downflow(x::UpDownFlow2) = begin
-        ors = or_nodes(root)
-        p = findall(p -> n in children(p), ors)
-        @assert length(p) == 1
-        get_downflow(ors[p[1]], n)
-    end
-    downflow(n.data)
-end
-
-function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
-    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-    get_downflow(n) .& get_upflow(c)
-end
-
-#####################
-# performance-critical queries related to circuit flows
-#####################
-
-"Container for circuit flows represented as a float vector"
-const ExpUpFlow1 = Vector{Float64}
-
-"Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
-struct ExpUpFlow2
-    prime_flow::Vector{Float64}
-    sub_flow::Vector{Float64}
-end
-
-const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
-
-@inline ExpUpFlow1(elems::ExpUpFlow1) = elems
-@inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
-
-function evaluate_exp(root::ProbCircuit, data;
-                   nload = nload, nsave = nsave, reset=true)::Vector{Float64}
-    n_ex::Int = num_examples(data)
-    ϵ = 0.0
-
-    @inline f_lit(n) = begin
-        uf = convert(Vector{Int8}, feature_values(data, variable(n)))
-        if ispositive(n)
-            uf[uf.==-1] .= 1
-        else
-            uf .= 1 .- uf
-            uf[uf.==2] .= 1
-        end
-        uf = convert(Vector{Float64}, uf)
-        uf .= log.(uf .+ ϵ)
-    end
+#TODO: reinstate in new framework
+
+# export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
+
+
+# using StatsFuns: logsumexp
+
+# # TODO move to LogicCircuits
+# # TODO downflow struct
+# using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
+
+# """
+# Get upflow from logic circuit
+# """
+# @inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
+# @inline get_upflow(elems::UpDownFlow1) = elems.upflow
+# @inline get_upflow(elems::UpFlow) = materialize(elems)
+
+# """
+# Get the node/edge flow from logic circuit
+# """
+# function get_downflow(n::LogicCircuit; root=nothing)::BitVector
+#     downflow(x::UpDownFlow1) = x.downflow
+#     downflow(x::UpDownFlow2) = begin
+#         ors = or_nodes(root)
+#         p = findall(p -> n in children(p), ors)
+#         @assert length(p) == 1
+#         get_downflow(ors[p[1]], n)
+#     end
+#     downflow(n.data)
+# end
+
+# function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
+#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+#     get_downflow(n) .& get_upflow(c)
+# end
+
+# #####################
+# # performance-critical queries related to circuit flows
+# #####################
+
+# "Container for circuit flows represented as a float vector"
+# const ExpUpFlow1 = Vector{Float64}
+
+# "Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
+# struct ExpUpFlow2
+#     prime_flow::Vector{Float64}
+#     sub_flow::Vector{Float64}
+# end
+
+# const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
+
+# @inline ExpUpFlow1(elems::ExpUpFlow1) = elems
+# @inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
+
+# function evaluate_exp(root::ProbCircuit, data;
+#                    nload = nload, nsave = nsave, reset=true)::Vector{Float64}
+#     n_ex::Int = num_examples(data)
+#     ϵ = 0.0
+
+#     @inline f_lit(n) = begin
+#         uf = convert(Vector{Int8}, feature_values(data, variable(n)))
+#         if ispositive(n)
+#             uf[uf.==-1] .= 1
+#         else
+#             uf .= 1 .- uf
+#             uf[uf.==2] .= 1
+#         end
+#         uf = convert(Vector{Float64}, uf)
+#         uf .= log.(uf .+ ϵ)
+#     end
     
-    @inline f_con(n) = begin
-        uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
-        uf .= log.(uf .+ ϵ)
-    end
+#     @inline f_con(n) = begin
+#         uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
+#         uf .= log.(uf .+ ϵ)
+#     end
     
-    @inline fa(n, call) = begin
-        if num_children(n) == 1
-            return ExpUpFlow1(call(@inbounds children(n)[1]))
-        else
-            c1 = call(@inbounds children(n)[1])::ExpUpFlow
-            c2 = call(@inbounds children(n)[2])::ExpUpFlow
-            if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
-                return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
-            end
-            x = flowop(c1, c2, +)
-            for c in children(n)[3:end]
-                accumulate(x, call(c), +)
-            end
-            return x
-        end
-    end
+#     @inline fa(n, call) = begin
+#         if num_children(n) == 1
+#             return ExpUpFlow1(call(@inbounds children(n)[1]))
+#         else
+#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
+#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
+#             if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
+#                 return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
+#             end
+#             x = flowop(c1, c2, +)
+#             for c in children(n)[3:end]
+#                 accumulate(x, call(c), +)
+#             end
+#             return x
+#         end
+#     end
     
-    @inline fo(n, call) = begin
-        if num_children(n) == 1
-            return ExpUpFlow1(call(@inbounds children(n)[1]))
-        else
-            log_thetas = n.log_thetas
-            c1 = call(@inbounds children(n)[1])::ExpUpFlow
-            c2 = call(@inbounds children(n)[2])::ExpUpFlow
-            x = flowop(c1, log_thetas[1], c2, log_thetas[2], logsumexp)
-            for (i, c) in enumerate(children(n)[3:end])
-                accumulate(x, call(c), log_thetas[i+2], logsumexp)
-            end
-            return x
-        end
-    end
+#     @inline fo(n, call) = begin
+#         if num_children(n) == 1
+#             return ExpUpFlow1(call(@inbounds children(n)[1]))
+#         else
+#             log_thetas = n.log_thetas
+#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
+#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
+#             x = flowop(c1, log_thetas[1], c2, log_thetas[2], logsumexp)
+#             for (i, c) in enumerate(children(n)[3:end])
+#                 accumulate(x, call(c), log_thetas[i+2], logsumexp)
+#             end
+#             return x
+#         end
+#     end
     
-    # ensure flow us Flow1 at the root, even when it's a conjunction
-    root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
-    return nsave(root, root_flow)
-end
+#     # ensure flow us Flow1 at the root, even when it's a conjunction
+#     root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
+#     return nsave(root, root_flow)
+# end
 
-@inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
-    op.(ExpUpFlow1(x), ExpUpFlow1(y))
+# @inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
+#     op.(ExpUpFlow1(x), ExpUpFlow1(y))
 
-@inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
-    op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
+# @inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
+#     op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
 
-import Base.accumulate
-@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
-    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
+# import Base.accumulate
+# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
+#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
 
-@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
-    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
+# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
+#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
 
 
-#####################
-# downward pass
-#####################
+# #####################
+# # downward pass
+# #####################
 
-struct ExpUpDownFlow1
-    upflow::ExpUpFlow1
-    downflow::Vector{Float64}
-    ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
-end
+# struct ExpUpDownFlow1
+#     upflow::ExpUpFlow1
+#     downflow::Vector{Float64}
+#     ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
+# end
 
-const ExpUpDownFlow2 = ExpUpFlow2
+# const ExpUpDownFlow2 = ExpUpFlow2
 
-const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
+# const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
 
 
-function compute_exp_flows(circuit::ProbCircuit, data)
+# function compute_exp_flows(circuit::ProbCircuit, data)
 
-    # upward pass
-    @inline upflow!(n, v) = begin
-        n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
-        v
-    end
+#     # upward pass
+#     @inline upflow!(n, v) = begin
+#         n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
+#         v
+#     end
 
-    @inline upflow(n) = begin
-        d = n.data::ExpUpDownFlow
-        (d isa ExpUpDownFlow1) ? d.upflow : d
-    end
+#     @inline upflow(n) = begin
+#         d = n.data::ExpUpDownFlow
+#         (d isa ExpUpDownFlow1) ? d.upflow : d
+#     end
 
-    evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
+#     evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
     
-    # downward pass
-
-    @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
-    @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
-
-    downflow(circuit) .= 0.0
-
-    foreach_down(circuit; setcounter=false) do n
-        if isinner(n) && !isfactorized(n)
-            downflow_n = downflow(n)
-            upflow_n = upflow(n)
-            for ite in 1 : num_children(n)
-                c = children(n)[ite]
-                log_theta = is⋀gate(n) ? 0.0 : n.log_thetas[ite]
-                if isfactorized(c)
-                    upflow2_c = c.data::ExpUpDownFlow2
-                    # propagate one level further down
-                    for i = 1:2
-                        downflow_c = downflow(@inbounds children(c)[i])
-                        accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
-                        .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
-                    end
-                else
-                    upflow1_c = (c.data::ExpUpDownFlow1).upflow
-                    downflow_c = downflow(c)
-                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
-                end
-            end 
-        end
-        nothing
-    end
-    nothing
-end
-
-
-"""
-Get upflow of a probabilistic circuit
-"""
-@inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
-@inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
-@inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
-
-"""
-Get the node/edge downflow from probabilistic circuit
-"""
-function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
-    downflow(x::ExpUpDownFlow1) = x.downflow
-    downflow(x::ExpUpDownFlow2) = begin
-        ors = or_nodes(root)
-        p = findall(p -> n in children(p), ors)
-        @assert length(p) == 1
-        get_exp_downflow(ors[p[1]], n)
-    end
-    downflow(n.data)
-end
-
-function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
-    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-    log_theta = n.log_thetas[findfirst(x -> x == c, children(n))]
-    return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
-end
\ No newline at end of file
+#     # downward pass
+
+#     @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
+#     @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
+
+#     downflow(circuit) .= 0.0
+
+#     foreach_down(circuit; setcounter=false) do n
+#         if isinner(n) && !isfactorized(n)
+#             downflow_n = downflow(n)
+#             upflow_n = upflow(n)
+#             for ite in 1 : num_children(n)
+#                 c = children(n)[ite]
+#                 log_theta = is⋀gate(n) ? 0.0 : n.log_thetas[ite]
+#                 if isfactorized(c)
+#                     upflow2_c = c.data::ExpUpDownFlow2
+#                     # propagate one level further down
+#                     for i = 1:2
+#                         downflow_c = downflow(@inbounds children(c)[i])
+#                         accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
+#                         .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
+#                     end
+#                 else
+#                     upflow1_c = (c.data::ExpUpDownFlow1).upflow
+#                     downflow_c = downflow(c)
+#                     accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
+#                 end
+#             end 
+#         end
+#         nothing
+#     end
+#     nothing
+# end
+
+
+# """
+# Get upflow of a probabilistic circuit
+# """
+# @inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
+# @inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
+# @inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
+
+# """
+# Get the node/edge downflow from probabilistic circuit
+# """
+# function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
+#     downflow(x::ExpUpDownFlow1) = x.downflow
+#     downflow(x::ExpUpDownFlow2) = begin
+#         ors = or_nodes(root)
+#         p = findall(p -> n in children(p), ors)
+#         @assert length(p) == 1
+#         get_exp_downflow(ors[p[1]], n)
+#     end
+#     downflow(n.data)
+# end
+
+# function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
+#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+#     log_theta = n.log_thetas[findfirst(x -> x == c, children(n))]
+#     return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
+# end
\ No newline at end of file
diff --git a/src/Probabilistic/parameters.jl b/src/Probabilistic/parameters.jl
index 84dc0571..e8e144f5 100644
--- a/src/Probabilistic/parameters.jl
+++ b/src/Probabilistic/parameters.jl
@@ -8,32 +8,12 @@ using LoopVectorization
 Maximum likilihood estimation of parameters given data
 """
 function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
-    @assert isbinarydata(data)
-    compute_flows(pc, data)
-    foreach(pc) do pn
-        if is⋁gate(pn)
-            if num_children(pn) == 1
-                pn.log_thetas .= 0.0
-            else
-                smoothed_flow = Float64(sum(get_downflow(pn))) + pseudocount
-                uniform_pseudocount = pseudocount / num_children(pn)
-                children_flows = map(c -> sum(get_downflow(pn, c)), children(pn))
-                @. pn.log_thetas = log((children_flows + uniform_pseudocount) / smoothed_flow)
-                @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally"
-                # normalize away any leftover error
-                pn.log_thetas .-= logsumexp(pn.log_thetas)
-            end
-        end
-    end
-end
-
-function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
     bc = BitCircuit(pc, data; reset=false, on_gpu = isgpu(data))
     on_node, on_edge, get_params = if isgpu(data)
-        estimate_parameters2_gpu(bc, pseudocount)
+        estimate_parameters_gpu(bc, pseudocount)
     else
-        estimate_parameters2_cpu(bc, pseudocount)
+        estimate_parameters_cpu(bc, pseudocount)
     end
     compute_values_flows(bc, data; on_node, on_edge)
     params::Vector{Float64} = get_params()
@@ -54,7 +34,7 @@ function estimate_parameters2(pc::ProbCircuit, data; pseudocount::Float64)
     params
 end
 
-function estimate_parameters2_cpu(bc, pseudocount)
+function estimate_parameters_cpu(bc, pseudocount)
     # no need to synchronize, since each computation is unique to a decision node
     node_counts::Vector{UInt} = Vector{UInt}(undef, num_nodes(bc))
     log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
@@ -86,7 +66,7 @@ function estimate_parameters2_cpu(bc, pseudocount)
     return (on_node, on_edge, get_params)
 end
 
-function estimate_parameters2_gpu(bc, pseudocount)
+function estimate_parameters_gpu(bc, pseudocount)
     node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
     edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
     params::CuVector{Float64} = CuVector{Float64}(undef, num_elements(bc))
diff --git a/src/Utils/misc.jl b/src/Utils/misc.jl
index 7b1c39f7..15d33338 100644
--- a/src/Utils/misc.jl
+++ b/src/Utils/misc.jl
@@ -1,6 +1,7 @@
 export to_long_mi,
     generate_all, generate_data_all
 
+using DataFrames
 
 ###################
 # Misc.
@@ -63,5 +64,5 @@ function generate_data_all(N::Int)
             transpose(parse.(Bool, split(bitstring(mask)[end-N+1:end], "")))
         );
     end
-    data_all
+    DataFrame(data_all)
 end
diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
index 3461a064..db741936 100644
--- a/test/Logistic/logistic_tests.jl
+++ b/test/Logistic/logistic_tests.jl
@@ -1,29 +1,31 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
+#TODO: reinstate
 
-# This tests are supposed to test queries on the circuits
-@testset "Logistic Circuit Class Conditional" begin
-    # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
-    # match with python version.
+# using Test
+# using LogicCircuits
+# using ProbabilisticCircuits
 
-    EPS = 1e-7;
-    logistic_circuit = zoo_lc("little_4var.circuit", 2);
-    @test logistic_circuit isa LogisticCircuit;
+# # This tests are supposed to test queries on the circuits
+# @testset "Logistic Circuit Class Conditional" begin
+#     # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
+#     # match with python version.
 
-    # Step 1. Check Probabilities for 3 samples
-    data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
+#     EPS = 1e-7;
+#     logistic_circuit = zoo_lc("little_4var.circuit", 2);
+#     @test logistic_circuit isa LogisticCircuit;
+
+#     # Step 1. Check Probabilities for 3 samples
+#     data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
     
-    true_prob = [3.43147972 4.66740416; 
-                4.27595352 2.83503504;
-                3.67415087 4.93793472]
+#     true_prob = [3.43147972 4.66740416; 
+#                 4.27595352 2.83503504;
+#                 3.67415087 4.93793472]
             
-    CLASSES = 2
-    calc_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
+#     CLASSES = 2
+#     calc_prob = class_conditional_likelihood_per_instance(logistic_circuit, CLASSES, data)
     
-    for i = 1:3
-        for j = 1:2
-            @test true_prob[i,j] ≈ calc_prob[i,j] atol= EPS;
-        end
-    end
-end
\ No newline at end of file
+#     for i = 1:3
+#         for j = 1:2
+#             @test true_prob[i,j] ≈ calc_prob[i,j] atol= EPS;
+#         end
+#     end
+# end
\ No newline at end of file
diff --git a/test/Probabilistic/queries_tests.jl b/test/Probabilistic/queries_tests.jl
index d157e63d..3e1af1f9 100644
--- a/test/Probabilistic/queries_tests.jl
+++ b/test/Probabilistic/queries_tests.jl
@@ -1,212 +1,214 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-@testset "Probability of Full Evidence" begin
-    # Uses a PSDD with 4 variables, and tests 3 of the configurations to
-    # match with python. Also tests all probabilities sum up to 1.
-
-    EPS = 1e-7;
-    prob_circuit = zoo_psdd("little_4var.psdd");
-    @test prob_circuit isa ProbCircuit;
-
-    # Step 1. Check Probabilities for 3 samples
-    data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
-    true_prob = [0.07; 0.03; 0.13999999999999999]
-
-    calc_prob = log_likelihood_per_instance(prob_circuit, data)
-    calc_prob = exp.(calc_prob)
-
-    for i = 1:3
-        @test true_prob[i] ≈ calc_prob[i] atol= EPS;
-    end
-
-    # Step 2. Add up all probabilities and see if they add up to one
-    N = 4;
-    data_all = generate_data_all(N)
-
-    calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all)
-    calc_prob_all = exp.(calc_prob_all)
-    sum_prob_all = sum(calc_prob_all)
-
-    @test 1 ≈ sum_prob_all atol = EPS;
-end
-
-@testset "Probability of partial Evidence (marginals)" begin
-    EPS = 1e-7;
-    prob_circuit = zoo_psdd("little_4var.psdd");
-
-    data = Int8.([0 0 0 0; 0 1 1 0; 0 0 1 1;
-                0 0 0 -1; -1 1 0 -1; -1 -1 -1 -1; 0 -1 -1 -1])
-    true_prob = [0.07; 0.03; 0.13999999999999999;
-                    0.3499999999999; 0.1; 1.0; 0.8]
-
-    calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data)
-    calc_prob = exp.(calc_prob)
-
-    for i = 1:length(true_prob)
-        @test true_prob[i] ≈ calc_prob[i] atol= EPS;
-    end
-end
-
-@testset "Marginal Pass Down" begin
-    EPS = 1e-7;
-    prob_circuit = zoo_psdd("little_4var.psdd");
-    logic_circuit = PlainLogicCircuit(prob_circuit)
-
-    N = 4
-    data_full = Bool.(generate_data_all(N))
-
-    # Comparing with down pass with fully obeserved data
-    compute_flows(logic_circuit, data_full)
-    compute_exp_flows(prob_circuit, data_full)
-
-    lin_prob = linearize(prob_circuit)
-    lin_logic = linearize(logic_circuit)
-    for i in 1 : length(lin_prob)
-        pn = lin_prob[i]
-        ln = lin_logic[i]
-        @test all(isapprox.(exp.(get_exp_downflow(pn; root=prob_circuit)), 
-            get_downflow(ln; root=logic_circuit), atol=EPS))
-    end
-
-    # Validating one example with missing features done by hand
-    data_partial = Int8.([-1 1 -1 1])
-    prob_circuit = zoo_psdd("little_4var.psdd");
-    compute_exp_flows(prob_circuit, data_partial)
-
-    # (node index, correct down_flow_value)
-    true_vals = [(1, 0.5),
-                (2, 1.0),
-                (3, 0.5),
-                (4, 0.0),
-                (5, 0.0),
-                (6, 0.5),
-                (7, 0.5),
-                (8, 0.0),
-                (9, 1.0),
-                (10, 1/3),
-                (11, 1),
-                (12, 1/3),
-                (13, 0.0),
-                (14, 0.0),
-                (15, 2/3),
-                (16, 2/3),
-                (17, 0.0),
-                (18, 1.0),
-                (19, 1.0),
-                (20, 1.0)]
-    lin = linearize(prob_circuit)
+#TODO: reinstate
+
+# using Test
+# using LogicCircuits
+# using ProbabilisticCircuits
+
+# @testset "Probability of Full Evidence" begin
+#     # Uses a PSDD with 4 variables, and tests 3 of the configurations to
+#     # match with python. Also tests all probabilities sum up to 1.
+
+#     EPS = 1e-7;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+#     @test prob_circuit isa ProbCircuit;
+
+#     # Step 1. Check Probabilities for 3 samples
+#     data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
+#     true_prob = [0.07; 0.03; 0.13999999999999999]
+
+#     calc_prob = log_likelihood_per_instance(prob_circuit, data)
+#     calc_prob = exp.(calc_prob)
+
+#     for i = 1:3
+#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
+#     end
+
+#     # Step 2. Add up all probabilities and see if they add up to one
+#     N = 4;
+#     data_all = generate_data_all(N)
+
+#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all)
+#     calc_prob_all = exp.(calc_prob_all)
+#     sum_prob_all = sum(calc_prob_all)
+
+#     @test 1 ≈ sum_prob_all atol = EPS;
+# end
+
+# @testset "Probability of partial Evidence (marginals)" begin
+#     EPS = 1e-7;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+
+#     data = Int8.([0 0 0 0; 0 1 1 0; 0 0 1 1;
+#                 0 0 0 -1; -1 1 0 -1; -1 -1 -1 -1; 0 -1 -1 -1])
+#     true_prob = [0.07; 0.03; 0.13999999999999999;
+#                     0.3499999999999; 0.1; 1.0; 0.8]
+
+#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data)
+#     calc_prob = exp.(calc_prob)
+
+#     for i = 1:length(true_prob)
+#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
+#     end
+# end
+
+# @testset "Marginal Pass Down" begin
+#     EPS = 1e-7;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+#     logic_circuit = PlainLogicCircuit(prob_circuit)
+
+#     N = 4
+#     data_full = Bool.(generate_data_all(N))
+
+#     # Comparing with down pass with fully obeserved data
+#     compute_flows(logic_circuit, data_full)
+#     compute_exp_flows(prob_circuit, data_full)
+
+#     lin_prob = linearize(prob_circuit)
+#     lin_logic = linearize(logic_circuit)
+#     for i in 1 : length(lin_prob)
+#         pn = lin_prob[i]
+#         ln = lin_logic[i]
+#         @test all(isapprox.(exp.(get_exp_downflow(pn; root=prob_circuit)), 
+#             get_downflow(ln; root=logic_circuit), atol=EPS))
+#     end
+
+#     # Validating one example with missing features done by hand
+#     data_partial = Int8.([-1 1 -1 1])
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+#     compute_exp_flows(prob_circuit, data_partial)
+
+#     # (node index, correct down_flow_value)
+#     true_vals = [(1, 0.5),
+#                 (2, 1.0),
+#                 (3, 0.5),
+#                 (4, 0.0),
+#                 (5, 0.0),
+#                 (6, 0.5),
+#                 (7, 0.5),
+#                 (8, 0.0),
+#                 (9, 1.0),
+#                 (10, 1/3),
+#                 (11, 1),
+#                 (12, 1/3),
+#                 (13, 0.0),
+#                 (14, 0.0),
+#                 (15, 2/3),
+#                 (16, 2/3),
+#                 (17, 0.0),
+#                 (18, 1.0),
+#                 (19, 1.0),
+#                 (20, 1.0)]
+#     lin = linearize(prob_circuit)
     
-    for ind_val in true_vals
-        @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
-    end
-end
-
-function test_mpe_brute_force(prob_circuit, evidence)
-    EPS = 1e-9;
-    result = MPE(prob_circuit, evidence);
-    for idx = 1 : num_examples(evidence)
-        marg = generate_all(evidence[idx,:])
-        lls = log_likelihood_per_instance(prob_circuit, marg);
-        brute_mpe = marg[argmax(lls), :]
-
-        # Compare and validate p(result[idx]) == p(brute_mpe)
-        comp_data = vcat(result[idx,:]',  brute_mpe')
-        lls2 = log_likelihood_per_instance(prob_circuit, comp_data);
-
-        @test lls2[1] ≈ lls2[2] atol= EPS
-    end
-end
-
-@testset "MPE Brute Force Test Small (4 var)" begin
-    prob_circuit = zoo_psdd("little_4var.psdd");
-    evidence = Int8.( [-1 0 0 0;
-                                0 -1 -1 0;
-                                1 1 1 -1;
-                                1 0 1 0;
-                                -1 -1 -1 1;
-                                -1 -1 -1 -1] )
-
-    test_mpe_brute_force(prob_circuit, evidence)
-
-end
-
-@testset "MPE Brute Force Test Big (15 var)" begin
-    N = 15
-    COUNT = 10
-
-    prob_circuit = zoo_psdd("exp-D15-N1000-C4.psdd");
-    evidence = Int8.(rand( (-1,0,1), (COUNT, N)))
-
-    test_mpe_brute_force(prob_circuit, evidence)
-end
-
-@testset "Sampling Test" begin
-    EPS = 1e-2;
-    prob_circuit = zoo_psdd("little_4var.psdd");
-
-    N = 4;
-    data_all = generate_data_all(N);
-
-    calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all);
-    calc_prob_all = exp.(calc_prob_all);
-
-    using DataStructures
-    hist = DefaultDict{AbstractString,Float64}(0.0)
-
-    Nsamples = 1000 * 1000
-    for i = 1:Nsamples
-        cur = join(Int.(sample(prob_circuit)))
-        hist[cur] += 1
-    end
-
-    for k in keys(hist)
-        hist[k] /= Nsamples
-    end
-
-    for k in keys(hist)
-        cur = parse(Int32, k, base=2) + 1 # cause Julia arrays start at 1 :(
-        @test calc_prob_all[cur] ≈ hist[k] atol= EPS;
-    end
-
-
-end
-
-using DataStructures
-@testset "Sampling With Evidence" begin
-    # TODO (pashak) this test should be improved by adding few more cases
-    EPS = 1e-2;
-    prob_circuit = zoo_psdd("little_4var.psdd");
-
-    N = 4;
-    data = Int8.([0 -1 0 -1])
-    calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data);
-    calc_prob = exp.(calc_prob);
-
-    data_all = Int8.([0 0 0 0;
-                    0 0 0 1;
-                    0 1 0 0;
-                    0 1 0 1;]);
-    calc_prob_all = marginal_log_likelihood_per_instance(prob_circuit, data_all);
-    calc_prob_all = exp.(calc_prob_all);
-
-    calc_prob_all ./= calc_prob[1]
-
-    hist = DefaultDict{AbstractString,Float64}(0.0)
-
-    Nsamples = 1000 * 1000
-    for i = 1:Nsamples
-        cur = join(Int.(sample(prob_circuit, data)))
-        hist[cur] += 1
-    end
-
-    for k in keys(hist)
-        hist[k] /= Nsamples
-    end
-
-    for ind = 1:4
-        cur = join(data_all[ind, :])
-        @test calc_prob_all[ind] ≈ hist[cur] atol= EPS;
-    end
-end
\ No newline at end of file
+#     for ind_val in true_vals
+#         @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
+#     end
+# end
+
+# function test_mpe_brute_force(prob_circuit, evidence)
+#     EPS = 1e-9;
+#     result = MPE(prob_circuit, evidence);
+#     for idx = 1 : num_examples(evidence)
+#         marg = generate_all(evidence[idx,:])
+#         lls = log_likelihood_per_instance(prob_circuit, marg);
+#         brute_mpe = marg[argmax(lls), :]
+
+#         # Compare and validate p(result[idx]) == p(brute_mpe)
+#         comp_data = vcat(result[idx,:]',  brute_mpe')
+#         lls2 = log_likelihood_per_instance(prob_circuit, comp_data);
+
+#         @test lls2[1] ≈ lls2[2] atol= EPS
+#     end
+# end
+
+# @testset "MPE Brute Force Test Small (4 var)" begin
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+#     evidence = Int8.( [-1 0 0 0;
+#                                 0 -1 -1 0;
+#                                 1 1 1 -1;
+#                                 1 0 1 0;
+#                                 -1 -1 -1 1;
+#                                 -1 -1 -1 -1] )
+
+#     test_mpe_brute_force(prob_circuit, evidence)
+
+# end
+
+# @testset "MPE Brute Force Test Big (15 var)" begin
+#     N = 15
+#     COUNT = 10
+
+#     prob_circuit = zoo_psdd("exp-D15-N1000-C4.psdd");
+#     evidence = Int8.(rand( (-1,0,1), (COUNT, N)))
+
+#     test_mpe_brute_force(prob_circuit, evidence)
+# end
+
+# @testset "Sampling Test" begin
+#     EPS = 1e-2;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+
+#     N = 4;
+#     data_all = generate_data_all(N);
+
+#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all);
+#     calc_prob_all = exp.(calc_prob_all);
+
+#     using DataStructures
+#     hist = DefaultDict{AbstractString,Float64}(0.0)
+
+#     Nsamples = 1000 * 1000
+#     for i = 1:Nsamples
+#         cur = join(Int.(sample(prob_circuit)))
+#         hist[cur] += 1
+#     end
+
+#     for k in keys(hist)
+#         hist[k] /= Nsamples
+#     end
+
+#     for k in keys(hist)
+#         cur = parse(Int32, k, base=2) + 1 # cause Julia arrays start at 1 :(
+#         @test calc_prob_all[cur] ≈ hist[k] atol= EPS;
+#     end
+
+
+# end
+
+# using DataStructures
+# @testset "Sampling With Evidence" begin
+#     # TODO (pashak) this test should be improved by adding few more cases
+#     EPS = 1e-2;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+
+#     N = 4;
+#     data = Int8.([0 -1 0 -1])
+#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data);
+#     calc_prob = exp.(calc_prob);
+
+#     data_all = Int8.([0 0 0 0;
+#                     0 0 0 1;
+#                     0 1 0 0;
+#                     0 1 0 1;]);
+#     calc_prob_all = marginal_log_likelihood_per_instance(prob_circuit, data_all);
+#     calc_prob_all = exp.(calc_prob_all);
+
+#     calc_prob_all ./= calc_prob[1]
+
+#     hist = DefaultDict{AbstractString,Float64}(0.0)
+
+#     Nsamples = 1000 * 1000
+#     for i = 1:Nsamples
+#         cur = join(Int.(sample(prob_circuit, data)))
+#         hist[cur] += 1
+#     end
+
+#     for k in keys(hist)
+#         hist[k] /= Nsamples
+#     end
+
+#     for ind = 1:4
+#         cur = join(data_all[ind, :])
+#         @test calc_prob_all[ind] ≈ hist[cur] atol= EPS;
+#     end
+# end
\ No newline at end of file
diff --git a/test/Reasoning/expectation_test.jl b/test/Reasoning/expectation_test.jl
index c8aafc50..0e498e88 100644
--- a/test/Reasoning/expectation_test.jl
+++ b/test/Reasoning/expectation_test.jl
@@ -1,142 +1,144 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int)
-    EPS = 1e-7;
-    COUNT = size(data)[1]
-    # Compute True expectation brute force
-    true_exp = zeros(COUNT, CLASSES)
-    for i in 1:COUNT
-        row = data[i, :]
-        cur_data_all = generate_all(row)
-
-        calc_p = log_likelihood_per_instance(pc, cur_data_all)
-        calc_p = exp.(calc_p)
-
-        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
-        true_exp[i, :] = sum(calc_p .* calc_f, dims=1)
-        true_exp[i, :] ./= sum(calc_p) #p_observed
-    end
-
-    # Compute Circuit Expect
-    calc_exp, cache = Expectation(pc, lc, data);
-    for i = 1:COUNT
-        for j = 1:CLASSES
-            @test true_exp[i,j] ≈ calc_exp[i,j] atol= EPS;
-        end
-    end    
-    # Compute Bottom Up Expectation
-    calc_exp_2, exp_flow = ExpectationUpward(pc, lc, data);
-    for i = 1:COUNT
-        for j = 1:CLASSES
-            @test true_exp[i,j] ≈ calc_exp_2[i,j] atol= EPS;
-        end
-    end
-end
-
-function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int, moment::Int)
-    EPS = 1e-7;
-    COUNT = size(data)[1]
-    # Compute True moment brute force
-    true_mom = zeros(COUNT, CLASSES)
-    for i in 1:COUNT
-        row = data[i, :]
-        cur_data_all = generate_all(row)
-
-        calc_p = log_likelihood_per_instance(pc, cur_data_all)
-        calc_p = exp.(calc_p)
-
-        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
-        true_mom[i, :] = sum(calc_p .* (calc_f .^ moment), dims=1)
-        true_mom[i, :] ./= sum(calc_p) #p_observed
-    end
-
-    # Compute Circuit Moment
-    calc_mom, cache = Moment(pc, lc, data, moment);
-    for i = 1:COUNT
-        for j = 1:CLASSES
-            @test (true_mom[i,j] / (calc_mom[i,j] )) ≈ 1.0 atol= EPS;
-        end
-    end    
-end
-
-
-@testset "Expectation Brute Force Test Small (4 Var)" begin
-    psdd_file       = "little_4var.psdd"
-    logistic_file   = "little_4var.circuit"
-    CLASSES = 2
-    N = 4
-
-    pc = zoo_psdd(psdd_file);
-    lc = zoo_lc(logistic_file, CLASSES);
-    data = Int8.([
-                        0 0 0 0; 
-                        0 1 1 0; 
-                        0 0 1 1;
-                        -1 -1 -1 -1;
-                        -1 0 1 -1;
-                        0 1 -1 1;
-                        1 -1 0 -1;
-                        -1 0 1 -1;
-                        -1 -1 0 1;
-                        -1 -1 -1 1;
-                        -1 -1 -1 0;
-                        ]);
-
-    test_expectation_brute_force(pc, lc, data, CLASSES)
-end
-
-
-@testset "Expectation Brute Force Test Big (15 Var)" begin
-    psdd_file       = "exp-D15-N1000-C4.psdd"
-    logistic_file   = "exp-D15-N1000-C4.circuit"
-    CLASSES = 4
-    N = 15
-    COUNT = 10
-
-    pc = zoo_psdd(psdd_file);
-    lc = zoo_lc(logistic_file, CLASSES);
-    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
+#TODO: reinstate
+
+# using Test
+# using LogicCircuits
+# using ProbabilisticCircuits
+
+# function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int)
+#     EPS = 1e-7;
+#     COUNT = size(data)[1]
+#     # Compute True expectation brute force
+#     true_exp = zeros(COUNT, CLASSES)
+#     for i in 1:COUNT
+#         row = data[i, :]
+#         cur_data_all = generate_all(row)
+
+#         calc_p = log_likelihood_per_instance(pc, cur_data_all)
+#         calc_p = exp.(calc_p)
+
+#         calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+#         true_exp[i, :] = sum(calc_p .* calc_f, dims=1)
+#         true_exp[i, :] ./= sum(calc_p) #p_observed
+#     end
+
+#     # Compute Circuit Expect
+#     calc_exp, cache = Expectation(pc, lc, data);
+#     for i = 1:COUNT
+#         for j = 1:CLASSES
+#             @test true_exp[i,j] ≈ calc_exp[i,j] atol= EPS;
+#         end
+#     end    
+#     # Compute Bottom Up Expectation
+#     calc_exp_2, exp_flow = ExpectationUpward(pc, lc, data);
+#     for i = 1:COUNT
+#         for j = 1:CLASSES
+#             @test true_exp[i,j] ≈ calc_exp_2[i,j] atol= EPS;
+#         end
+#     end
+# end
+
+# function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int, moment::Int)
+#     EPS = 1e-7;
+#     COUNT = size(data)[1]
+#     # Compute True moment brute force
+#     true_mom = zeros(COUNT, CLASSES)
+#     for i in 1:COUNT
+#         row = data[i, :]
+#         cur_data_all = generate_all(row)
+
+#         calc_p = log_likelihood_per_instance(pc, cur_data_all)
+#         calc_p = exp.(calc_p)
+
+#         calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+#         true_mom[i, :] = sum(calc_p .* (calc_f .^ moment), dims=1)
+#         true_mom[i, :] ./= sum(calc_p) #p_observed
+#     end
+
+#     # Compute Circuit Moment
+#     calc_mom, cache = Moment(pc, lc, data, moment);
+#     for i = 1:COUNT
+#         for j = 1:CLASSES
+#             @test (true_mom[i,j] / (calc_mom[i,j] )) ≈ 1.0 atol= EPS;
+#         end
+#     end    
+# end
+
+
+# @testset "Expectation Brute Force Test Small (4 Var)" begin
+#     psdd_file       = "little_4var.psdd"
+#     logistic_file   = "little_4var.circuit"
+#     CLASSES = 2
+#     N = 4
+
+#     pc = zoo_psdd(psdd_file);
+#     lc = zoo_lc(logistic_file, CLASSES);
+#     data = Int8.([
+#                         0 0 0 0; 
+#                         0 1 1 0; 
+#                         0 0 1 1;
+#                         -1 -1 -1 -1;
+#                         -1 0 1 -1;
+#                         0 1 -1 1;
+#                         1 -1 0 -1;
+#                         -1 0 1 -1;
+#                         -1 -1 0 1;
+#                         -1 -1 -1 1;
+#                         -1 -1 -1 0;
+#                         ]);
+
+#     test_expectation_brute_force(pc, lc, data, CLASSES)
+# end
+
+
+# @testset "Expectation Brute Force Test Big (15 Var)" begin
+#     psdd_file       = "exp-D15-N1000-C4.psdd"
+#     logistic_file   = "exp-D15-N1000-C4.circuit"
+#     CLASSES = 4
+#     N = 15
+#     COUNT = 10
+
+#     pc = zoo_psdd(psdd_file);
+#     lc = zoo_lc(logistic_file, CLASSES);
+#     data = Int8.(rand( (-1,0,1), (COUNT, N) ))
     
-    test_expectation_brute_force(pc, lc, data, CLASSES)
-end
-
-
-@testset "Moment Brute Force Test Small (4 Var)" begin
-    psdd_file       = "little_4var.psdd"
-    logistic_file   = "little_4var.circuit";
-    CLASSES = 2
-    N = 4
-    COUNT = 100
-
-    pc = zoo_psdd(psdd_file);
-    lc = zoo_lc(logistic_file, CLASSES);
-    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
-
-    test_moment_brute_force(pc, lc, data, CLASSES, 1)
-    test_moment_brute_force(pc, lc, data, CLASSES, 2)
-    test_moment_brute_force(pc, lc, data, CLASSES, 3)
-    test_moment_brute_force(pc, lc, data, CLASSES, 4)
-    test_moment_brute_force(pc, lc, data, CLASSES, 10)
-    test_moment_brute_force(pc, lc, data, CLASSES, 15)
-end
-
-@testset "Moment Brute Force Test Big (15 Var)" begin
-    psdd_file       = "exp-D15-N1000-C4.psdd"
-    logistic_file   = "exp-D15-N1000-C4.circuit";
-    CLASSES = 4
-    N = 15
-    COUNT = 10
-
-    pc = zoo_psdd(psdd_file);
-    lc = zoo_lc(logistic_file, CLASSES);
-    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
-
-    test_moment_brute_force(pc, lc, data, CLASSES, 1)
-    test_moment_brute_force(pc, lc, data, CLASSES, 2)
-    test_moment_brute_force(pc, lc, data, CLASSES, 3)
-    test_moment_brute_force(pc, lc, data, CLASSES, 4)
-    test_moment_brute_force(pc, lc, data, CLASSES, 10)
-    test_moment_brute_force(pc, lc, data, CLASSES, 15)
-end
\ No newline at end of file
+#     test_expectation_brute_force(pc, lc, data, CLASSES)
+# end
+
+
+# @testset "Moment Brute Force Test Small (4 Var)" begin
+#     psdd_file       = "little_4var.psdd"
+#     logistic_file   = "little_4var.circuit";
+#     CLASSES = 2
+#     N = 4
+#     COUNT = 100
+
+#     pc = zoo_psdd(psdd_file);
+#     lc = zoo_lc(logistic_file, CLASSES);
+#     data = Int8.(rand( (-1,0,1), (COUNT, N) ))
+
+#     test_moment_brute_force(pc, lc, data, CLASSES, 1)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 2)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 3)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 4)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 10)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 15)
+# end
+
+# @testset "Moment Brute Force Test Big (15 Var)" begin
+#     psdd_file       = "exp-D15-N1000-C4.psdd"
+#     logistic_file   = "exp-D15-N1000-C4.circuit";
+#     CLASSES = 4
+#     N = 15
+#     COUNT = 10
+
+#     pc = zoo_psdd(psdd_file);
+#     lc = zoo_lc(logistic_file, CLASSES);
+#     data = Int8.(rand( (-1,0,1), (COUNT, N) ))
+
+#     test_moment_brute_force(pc, lc, data, CLASSES, 1)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 2)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 3)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 4)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 10)
+#     test_moment_brute_force(pc, lc, data, CLASSES, 15)
+# end
\ No newline at end of file
diff --git a/test/StructureLearner/init_tests.jl b/test/StructureLearner/init_tests.jl
index d2986e88..b8063df3 100644
--- a/test/StructureLearner/init_tests.jl
+++ b/test/StructureLearner/init_tests.jl
@@ -1,31 +1,40 @@
-using Test: @test, @testset
-using LogicCircuits
-using ProbabilisticCircuits
+# TODO: reinstate
 
-@testset "Probabilistic circuits learner tests" begin
-    train_x, _, _ = twenty_datasets("nltcs")
-    (pc, vtree) = learn_struct_prob_circuit(train_x)
+# using Test: @test, @testset
+# using LogicCircuits
+# using ProbabilisticCircuits
+
+# @testset "Probabilistic circuits learner tests" begin
+#     train_x, _, _ = twenty_datasets("nltcs")
+
+#     @assert train_x isa DataFrame
+#     @assert isbinarydata(train_x)
+
+#     (pc, vtree) = learn_struct_prob_circuit(train_x)
     
-    # simple test
-    @test pc isa ProbCircuit
-    @test vtree isa PlainVtree
-    @test num_variables(vtree) == num_features(train_x)
-    @test check_parameter_integrity(pc)
-    @test num_parameters(pc) == 74 
-
-    # test below has started to fail -- unclear whether that is a bug or randomness...?
-    # @test pc[28].log_thetas[1] ≈ -1.1870882896239272 atol=1.0e-7
-
-    # is structured decomposable 
-    for (n, vars) in variables_by_node(pc)
-        @test vars == BitSet(variables(n.vtree))
-    end
-
-    # all evidence sums to 1
-    N = num_features(train_x)
-    data_all = generate_data_all(N)
-    calc_prob_all = log_likelihood_per_instance(pc, data_all)
-    calc_prob_all = exp.(calc_prob_all)
-    sum_prob_all = sum(calc_prob_all)
-    @test sum_prob_all ≈ 1 atol = 1.0e-7;
-end
\ No newline at end of file
+#     # simple test
+#     @test pc isa ProbCircuit
+#     @test vtree isa PlainVtree
+#     @test num_variables(vtree) == num_features(train_x)
+#     @test check_parameter_integrity(pc)
+#     @test num_parameters(pc) == 74 
+
+#     # test below has started to fail -- unclear whether that is a bug or randomness...?
+#     # @test pc[28].log_thetas[1] ≈ -1.1870882896239272 atol=1.0e-7
+
+#     # is structured decomposable 
+#     for (n, vars) in variables_by_node(pc)
+#         @test vars == BitSet(variables(n.vtree))
+#     end
+
+#     # all evidence sums to 1
+#     N = num_features(train_x)
+#     data_all = generate_data_all(N)
+#     @assert data_all isa DataFrame
+#     @assert isbinarydata(data_all)
+
+#     calc_prob_all = log_likelihood_per_instance(pc, data_all)
+#     calc_prob_all = exp.(calc_prob_all)
+#     sum_prob_all = sum(calc_prob_all)
+#     @test sum_prob_all ≈ 1 atol = 1.0e-7;
+# end
\ No newline at end of file

From e635c2f121394d948da41e05501986007e352da6 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 29 Aug 2020 21:36:26 -0500
Subject: [PATCH 068/131] remove submodules

---
 Project.toml                                  |   2 +
 docs/src/api/internals/logistic.md            |   5 -
 docs/src/api/internals/probabilistic.md       |   5 -
 docs/src/api/internals/reasoning.md           |   5 -
 docs/src/api/internals/structureLearner.md    |   5 -
 src/IO/CircuitLineCompiler.jl                 | 115 ------------------
 src/LoadSave/LoadSave.jl                      |   5 +-
 src/Logistic/Logistic.jl                      |  11 --
 src/Mixtures/Mixtures.jl                      |  11 --
 src/Probabilistic/Probabilistic.jl            |  13 --
 src/ProbabilisticCircuits.jl                  |  33 +++--
 src/Reasoning/Reasoning.jl                    |  11 --
 src/StructureLearner/StructureLearner.jl      |  15 ---
 src/{Probabilistic => }/exp_flows.jl          |   0
 src/{Probabilistic => }/informations.jl       |   0
 src/{Logistic => logistic}/logistic_nodes.jl  |   0
 src/{Logistic => logistic}/queries.jl         |   0
 .../deprecated/Bagging.jl                     |   0
 src/{Mixtures => mixtures}/em.jl              |   0
 .../shared_prob_nodes.jl                      |   0
 src/{Mixtures => mixtures}/todo/EMLearner.jl  |   0
 src/{Mixtures => mixtures}/todo/Mixtures.jl   |   0
 src/{Probabilistic => }/parameters.jl         |   0
 src/{Probabilistic => }/prob_nodes.jl         |   0
 src/{Probabilistic => }/queries.jl            |   0
 .../exp_flow_circuits.jl                      |   0
 src/{Reasoning => reasoning}/expectation.jl   |   0
 .../structured_prob_nodes.jl                  |   0
 .../VtreeLearner.jl                           |   0
 .../chow_liu_tree.jl                          |   0
 .../heuristics.jl                             |   0
 .../init.jl                                   |   0
 .../learner.jl                                |   0
 33 files changed, 24 insertions(+), 212 deletions(-)
 delete mode 100644 docs/src/api/internals/logistic.md
 delete mode 100644 docs/src/api/internals/probabilistic.md
 delete mode 100644 docs/src/api/internals/reasoning.md
 delete mode 100644 docs/src/api/internals/structureLearner.md
 delete mode 100644 src/IO/CircuitLineCompiler.jl
 delete mode 100644 src/Logistic/Logistic.jl
 delete mode 100644 src/Mixtures/Mixtures.jl
 delete mode 100644 src/Probabilistic/Probabilistic.jl
 delete mode 100644 src/Reasoning/Reasoning.jl
 delete mode 100644 src/StructureLearner/StructureLearner.jl
 rename src/{Probabilistic => }/exp_flows.jl (100%)
 rename src/{Probabilistic => }/informations.jl (100%)
 rename src/{Logistic => logistic}/logistic_nodes.jl (100%)
 rename src/{Logistic => logistic}/queries.jl (100%)
 rename src/{Mixtures => mixtures}/deprecated/Bagging.jl (100%)
 rename src/{Mixtures => mixtures}/em.jl (100%)
 rename src/{Mixtures => mixtures}/shared_prob_nodes.jl (100%)
 rename src/{Mixtures => mixtures}/todo/EMLearner.jl (100%)
 rename src/{Mixtures => mixtures}/todo/Mixtures.jl (100%)
 rename src/{Probabilistic => }/parameters.jl (100%)
 rename src/{Probabilistic => }/prob_nodes.jl (100%)
 rename src/{Probabilistic => }/queries.jl (100%)
 rename src/{Reasoning => reasoning}/exp_flow_circuits.jl (100%)
 rename src/{Reasoning => reasoning}/expectation.jl (100%)
 rename src/{Probabilistic => }/structured_prob_nodes.jl (100%)
 rename src/{StructureLearner => structurelearner}/VtreeLearner.jl (100%)
 rename src/{StructureLearner => structurelearner}/chow_liu_tree.jl (100%)
 rename src/{StructureLearner => structurelearner}/heuristics.jl (100%)
 rename src/{StructureLearner => structurelearner}/init.jl (100%)
 rename src/{StructureLearner => structurelearner}/learner.jl (100%)

diff --git a/Project.toml b/Project.toml
index 5f58ad73..7094194f 100644
--- a/Project.toml
+++ b/Project.toml
@@ -6,6 +6,7 @@ version = "0.1.1"
 BlossomV = "6c721016-9dae-5d90-abf6-67daaccb2332"
 CUDA = "052768ef-5323-5732-b1bb-66c8b64840ba"
 Clustering = "aaaa29a8-35af-508c-8bc3-b662a17a0fe5"
+DataFrames = "a93c6f00-e57d-5684-b7b6-d8193f3e46c0"
 DataStructures = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8"
 LightGraphs = "093fc24a-ae57-5d10-9952-331d41423f4d"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
@@ -25,6 +26,7 @@ StatsFuns = "4c63d2b9-4356-54db-8cca-17b64c39e42c"
 
 [compat]
 BlossomV = "0.4"
+CUDA = "1.2"
 Clustering = "0.14"
 DataStructures = "0.17"
 LightGraphs = "1.3"
diff --git a/docs/src/api/internals/logistic.md b/docs/src/api/internals/logistic.md
deleted file mode 100644
index 6fc07a5e..00000000
--- a/docs/src/api/internals/logistic.md
+++ /dev/null
@@ -1,5 +0,0 @@
-# Logistic
-
-```@autodocs
-Modules = [Logistic]
-```
diff --git a/docs/src/api/internals/probabilistic.md b/docs/src/api/internals/probabilistic.md
deleted file mode 100644
index 8d045097..00000000
--- a/docs/src/api/internals/probabilistic.md
+++ /dev/null
@@ -1,5 +0,0 @@
-# Probabilistic
-
-```@autodocs
-Modules = [ProbabilisticCircuits.Probabilistic]
-```
\ No newline at end of file
diff --git a/docs/src/api/internals/reasoning.md b/docs/src/api/internals/reasoning.md
deleted file mode 100644
index e8428ba2..00000000
--- a/docs/src/api/internals/reasoning.md
+++ /dev/null
@@ -1,5 +0,0 @@
-# Reasoning
-
-```@autodocs
-Modules = [ProbabilisticCircuits.Reasoning]
-```
diff --git a/docs/src/api/internals/structureLearner.md b/docs/src/api/internals/structureLearner.md
deleted file mode 100644
index 78ab902f..00000000
--- a/docs/src/api/internals/structureLearner.md
+++ /dev/null
@@ -1,5 +0,0 @@
-# StructureLearner
-
-```@autodocs
-Modules = [ProbabilisticCircuits.StructureLearner]
-```
diff --git a/src/IO/CircuitLineCompiler.jl b/src/IO/CircuitLineCompiler.jl
deleted file mode 100644
index 604a2e5e..00000000
--- a/src/IO/CircuitLineCompiler.jl
+++ /dev/null
@@ -1,115 +0,0 @@
-#####################
-# Compilers to ProbabilisticCircuits data structures starting from already parsed line objects
-#####################
-
-# reuse some internal infrastructure of LogicCircuits' IO module
-using LogicCircuits.IO: CircuitFormatLines, CircuitFormatLine, VtreeFormatLines, CircuitHeaderLine, UnweightedLiteralLine, WeightedLiteralLine, DecisionLine, LCElement, BiasLine, WeightedNamedConstantLine, PSDDElement, CircuitCommentLine, ID,
-compile_smooth_struct_logical_m, compile_smooth_logical_m
-
-"""
-Compile lines into a probabilistic circuit.
-"""
-function compile_prob(lines::CircuitFormatLines)::ProbΔ
-    # first compile a logic circuit
-    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
-    decorate_prob(lines, logic_circuit, id2lognode)
-end
-
-"""
-Compile lines into a logistic circuit.
-"""
-function compile_logistic(lines::CircuitFormatLines, classes::Int)::LogisticΔ
-    # first compile a logic circuit
-    logic_circuit, id2lognode = compile_smooth_logical_m(lines)
-    decorate_logistic(lines, logic_circuit, classes, id2lognode)
-end
-
-"""
-Compile circuit and vtree lines into a structured probabilistic circuit (one whose logic circuit origin is structured).
-"""
-function compile_struct_prob(circuit_lines::CircuitFormatLines, vtree_lines::VtreeFormatLines)
-    logic_circuit, vtree, id2vtree, id2lognode = compile_smooth_struct_logical_m(circuit_lines, vtree_lines)
-    prob_circuit = decorate_prob(circuit_lines, logic_circuit, id2lognode)
-    return prob_circuit, vtree
-end
-
-function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicΔ, id2lognode::Dict{ID,<:LogicCircuit})::ProbΔ
-    # set up cache mapping logic circuit nodes to their probabilistic decorator
-    lognode2probnode = ProbCache()
-    # build a corresponding probabilistic circuit
-    prob_circuit = ProbΔ(logic_circuit,lognode2probnode)
-    # map from line node ids to probabilistic circuit nodes
-    id2probnode(id) = lognode2probnode[id2lognode[id]]
-
-    # go through lines again and update the probabilistic circuit node parameters
-
-    function compile(ln::CircuitFormatLine)
-        error("Compilation of line $ln into probabilistic circuit is not supported")
-    end
-    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
-        # do nothing
-    end
-    function compile(ln::WeightedNamedConstantLine)
-        @assert lnconstant(ln) == true
-        node = id2probnode(ln.node_id)::Prob⋁
-        node.log_thetas .= [ln.weight, log1p(-exp(ln.weight)) ]
-    end
-    function compile(ln::DecisionLine{<:PSDDElement})
-        node = id2probnode(ln.node_id)::Prob⋁
-        node.log_thetas .= [x.weight for x in ln.elements]
-    end
-    for ln in lines
-        compile(ln)
-    end
-
-    prob_circuit
-end
-
-
-function decorate_logistic(lines::CircuitFormatLines, logic_circuit::LogicΔ, 
-                            classes::Int, id2lognode::Dict{ID,<:LogicCircuit})::LogisticΔ
-                        
-    # set up cache mapping logic circuit nodes to their logistic decorator
-    log2logistic = LogisticCache()
-    # build a corresponding probabilistic circuit
-    logistic_circuit = LogisticΔ(logic_circuit, classes, log2logistic)
-    # map from line node ids to probabilistic circuit nodes
-    id2logisticnode(id) = log2logistic[id2lognode[id]]
-
-    # go through lines again and update the probabilistic circuit node parameters
-
-    function compile(ln::CircuitFormatLine)
-        error("Compilation of line $ln into logistic circuit is not supported")
-    end
-    function compile(::Union{CircuitHeaderLine,CircuitCommentLine,UnweightedLiteralLine})
-        # do nothing
-    end
-
-    function compile(ln::CircuitHeaderLine)
-        # do nothing
-    end
-
-    function compile(ln::WeightedLiteralLine)
-        node = id2logisticnode(ln.node_id)::Logistic⋁
-        node.thetas[1, :] .= ln.weights
-    end
-
-    function compile(ln::DecisionLine{<:LCElement})
-        node = id2logisticnode(ln.node_id)::Logistic⋁
-        for (ind, elem) in enumerate(ln.elements)
-            node.thetas[ind, :] .= elem.weights
-        end
-    end
-
-    function compile(ln::BiasLine)
-        node = id2logisticnode(ln.node_id)::Logistic⋁
-        # @assert length(node.thetas) == 1
-        node.thetas[1,:] .= ln.weights
-    end
-
-    for ln in lines
-        compile(ln)
-    end
-
-    logistic_circuit
-end
\ No newline at end of file
diff --git a/src/LoadSave/LoadSave.jl b/src/LoadSave/LoadSave.jl
index e5b72dee..c28a0c77 100644
--- a/src/LoadSave/LoadSave.jl
+++ b/src/LoadSave/LoadSave.jl
@@ -1,11 +1,10 @@
 module LoadSave
 
 using LogicCircuits
-using ..Utils
-using ..Probabilistic
-using ..Logistic
+using ...ProbabilisticCircuits
 
 include("circuit_line_compiler.jl")
 include("circuit_loaders.jl")
 include("circuit_savers.jl")
+
 end
\ No newline at end of file
diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
deleted file mode 100644
index c657449f..00000000
--- a/src/Logistic/Logistic.jl
+++ /dev/null
@@ -1,11 +0,0 @@
-module Logistic
-
-using LogicCircuits
-using ..Utils
-
-include("logistic_nodes.jl")
-include("queries.jl")
-
-# TODO learning
-
-end
\ No newline at end of file
diff --git a/src/Mixtures/Mixtures.jl b/src/Mixtures/Mixtures.jl
deleted file mode 100644
index d837d53b..00000000
--- a/src/Mixtures/Mixtures.jl
+++ /dev/null
@@ -1,11 +0,0 @@
-module Mixtures
-
-using LogicCircuits
-using ..Utils
-using ..Probabilistic
-using ..LoadSave
-
-include("shared_prob_nodes.jl")
-include("em.jl")
-
-end
\ No newline at end of file
diff --git a/src/Probabilistic/Probabilistic.jl b/src/Probabilistic/Probabilistic.jl
deleted file mode 100644
index 5d46fd92..00000000
--- a/src/Probabilistic/Probabilistic.jl
+++ /dev/null
@@ -1,13 +0,0 @@
-module Probabilistic
-
-using LogicCircuits
-using ..Utils
-
-include("prob_nodes.jl")
-include("structured_prob_nodes.jl")
-include("exp_flows.jl")
-include("queries.jl")
-include("informations.jl")
-include("parameters.jl")
-
-end
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index f02f5b58..732a0979 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -10,22 +10,29 @@ using LogicCircuits
 include("Utils/Utils.jl")
 @reexport using .Utils
 
+include("prob_nodes.jl")
+include("structured_prob_nodes.jl")
+include("exp_flows.jl")
+include("queries.jl")
+include("informations.jl")
+include("parameters.jl")
 
-# INCLUDE CHILD MODULES
-include("Probabilistic/Probabilistic.jl")
-include("Logistic/Logistic.jl")
-include("LoadSave/LoadSave.jl")
-include("Reasoning/Reasoning.jl")
-include("StructureLearner/StructureLearner.jl")
-include("Mixtures/Mixtures.jl")
+include("logistic/logistic_nodes.jl")
+include("logistic/queries.jl")
+
+include("reasoning/expectation.jl")
+include("reasoning/exp_flow_circuits.jl")
+
+include("mixtures/shared_prob_nodes.jl")
+include("mixtures/em.jl")
 
+include("structurelearner/chow_liu_tree.jl")
+include("structurelearner/init.jl")
+include("structurelearner/heuristics.jl")
+include("structurelearner/learner.jl")
 
-# USE CHILD MODULES (in order to re-export some functions)
-@reexport using .Probabilistic
-@reexport using .Logistic
+
+include("LoadSave/LoadSave.jl")
 @reexport using .LoadSave
-@reexport using .Reasoning
-@reexport using .StructureLearner
-@reexport using .Mixtures
 
 end
diff --git a/src/Reasoning/Reasoning.jl b/src/Reasoning/Reasoning.jl
deleted file mode 100644
index a87f0145..00000000
--- a/src/Reasoning/Reasoning.jl
+++ /dev/null
@@ -1,11 +0,0 @@
-module Reasoning
-
-using LogicCircuits
-using ..Utils
-using ..Probabilistic
-using ..Logistic
-
-include("expectation.jl")
-include("exp_flow_circuits.jl")
-
-end
\ No newline at end of file
diff --git a/src/StructureLearner/StructureLearner.jl b/src/StructureLearner/StructureLearner.jl
deleted file mode 100644
index 29cfa16e..00000000
--- a/src/StructureLearner/StructureLearner.jl
+++ /dev/null
@@ -1,15 +0,0 @@
-module StructureLearner
-
-using LogicCircuits
-using ..Utils
-using ..Probabilistic
-using ..LoadSave
-
-
-include("chow_liu_tree.jl")
-include("init.jl")
-include("heuristics.jl")
-include("learner.jl")
-
-
-end
diff --git a/src/Probabilistic/exp_flows.jl b/src/exp_flows.jl
similarity index 100%
rename from src/Probabilistic/exp_flows.jl
rename to src/exp_flows.jl
diff --git a/src/Probabilistic/informations.jl b/src/informations.jl
similarity index 100%
rename from src/Probabilistic/informations.jl
rename to src/informations.jl
diff --git a/src/Logistic/logistic_nodes.jl b/src/logistic/logistic_nodes.jl
similarity index 100%
rename from src/Logistic/logistic_nodes.jl
rename to src/logistic/logistic_nodes.jl
diff --git a/src/Logistic/queries.jl b/src/logistic/queries.jl
similarity index 100%
rename from src/Logistic/queries.jl
rename to src/logistic/queries.jl
diff --git a/src/Mixtures/deprecated/Bagging.jl b/src/mixtures/deprecated/Bagging.jl
similarity index 100%
rename from src/Mixtures/deprecated/Bagging.jl
rename to src/mixtures/deprecated/Bagging.jl
diff --git a/src/Mixtures/em.jl b/src/mixtures/em.jl
similarity index 100%
rename from src/Mixtures/em.jl
rename to src/mixtures/em.jl
diff --git a/src/Mixtures/shared_prob_nodes.jl b/src/mixtures/shared_prob_nodes.jl
similarity index 100%
rename from src/Mixtures/shared_prob_nodes.jl
rename to src/mixtures/shared_prob_nodes.jl
diff --git a/src/Mixtures/todo/EMLearner.jl b/src/mixtures/todo/EMLearner.jl
similarity index 100%
rename from src/Mixtures/todo/EMLearner.jl
rename to src/mixtures/todo/EMLearner.jl
diff --git a/src/Mixtures/todo/Mixtures.jl b/src/mixtures/todo/Mixtures.jl
similarity index 100%
rename from src/Mixtures/todo/Mixtures.jl
rename to src/mixtures/todo/Mixtures.jl
diff --git a/src/Probabilistic/parameters.jl b/src/parameters.jl
similarity index 100%
rename from src/Probabilistic/parameters.jl
rename to src/parameters.jl
diff --git a/src/Probabilistic/prob_nodes.jl b/src/prob_nodes.jl
similarity index 100%
rename from src/Probabilistic/prob_nodes.jl
rename to src/prob_nodes.jl
diff --git a/src/Probabilistic/queries.jl b/src/queries.jl
similarity index 100%
rename from src/Probabilistic/queries.jl
rename to src/queries.jl
diff --git a/src/Reasoning/exp_flow_circuits.jl b/src/reasoning/exp_flow_circuits.jl
similarity index 100%
rename from src/Reasoning/exp_flow_circuits.jl
rename to src/reasoning/exp_flow_circuits.jl
diff --git a/src/Reasoning/expectation.jl b/src/reasoning/expectation.jl
similarity index 100%
rename from src/Reasoning/expectation.jl
rename to src/reasoning/expectation.jl
diff --git a/src/Probabilistic/structured_prob_nodes.jl b/src/structured_prob_nodes.jl
similarity index 100%
rename from src/Probabilistic/structured_prob_nodes.jl
rename to src/structured_prob_nodes.jl
diff --git a/src/StructureLearner/VtreeLearner.jl b/src/structurelearner/VtreeLearner.jl
similarity index 100%
rename from src/StructureLearner/VtreeLearner.jl
rename to src/structurelearner/VtreeLearner.jl
diff --git a/src/StructureLearner/chow_liu_tree.jl b/src/structurelearner/chow_liu_tree.jl
similarity index 100%
rename from src/StructureLearner/chow_liu_tree.jl
rename to src/structurelearner/chow_liu_tree.jl
diff --git a/src/StructureLearner/heuristics.jl b/src/structurelearner/heuristics.jl
similarity index 100%
rename from src/StructureLearner/heuristics.jl
rename to src/structurelearner/heuristics.jl
diff --git a/src/StructureLearner/init.jl b/src/structurelearner/init.jl
similarity index 100%
rename from src/StructureLearner/init.jl
rename to src/structurelearner/init.jl
diff --git a/src/StructureLearner/learner.jl b/src/structurelearner/learner.jl
similarity index 100%
rename from src/StructureLearner/learner.jl
rename to src/structurelearner/learner.jl

From 86181ab61c4a985d0b227857b338441a754cc0ee Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 30 Aug 2020 01:42:47 -0500
Subject: [PATCH 069/131] prob nodes

---
 src/LoadSave/circuit_savers.jl         |  12 +--
 src/ProbabilisticCircuits.jl           |  37 ++++-----
 src/Utils/Utils.jl                     |   1 -
 src/Utils/decorators.jl                |  10 ---
 src/Utils/misc.jl                      |   2 +-
 src/abstract_prob_nodes.jl             |  67 +++++++++++++++
 src/informations.jl                    |  26 +++---
 src/mixtures/em.jl                     |   2 +-
 src/mixtures/shared_prob_nodes.jl      |  34 ++++----
 src/plain_prob_nodes.jl                | 108 +++++++++++++++++++++++++
 src/prob_nodes.jl                      |  96 ----------------------
 src/queries.jl                         |  20 ++---
 src/reasoning/exp_flow_circuits.jl     |  14 ++--
 src/reasoning/expectation.jl           |  28 +++----
 src/structured_prob_nodes.jl           |  48 +++++------
 test/Probabilistic/prob_nodes_tests.jl |   6 +-
 16 files changed, 290 insertions(+), 221 deletions(-)
 delete mode 100644 src/Utils/decorators.jl
 create mode 100644 src/abstract_prob_nodes.jl
 create mode 100644 src/plain_prob_nodes.jl
 delete mode 100644 src/prob_nodes.jl

diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 2a3788be..99353283 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -15,17 +15,17 @@ using LogicCircuits.LoadSave: SDDElement,
 #####################
 
 "Decompile for psdd circuit, used during saving of circuits to file" 
-decompile(n::StructProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine = 
+decompile(n::StructPlainProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine = 
     UnweightedLiteralLine(node2id[n], vtree2id[n.vtree], literal(n), true)
 
-make_element(n::StructProb⋀Node, w::AbstractFloat, node2id) = 
+make_element(n::StructPlainMulNode, w::AbstractFloat, node2id) = 
     PSDDElement(node2id[children(n)[1]],  node2id[children(n)[2]], w)
 
 istrue_node(n)::Bool = 
     is⋁gate(n) && num_children(n) == 2 && GateType(children(n)[1]) isa LiteralGate && GateType(children(n)[2]) isa LiteralGate && 
     ispositive(children(n)[1]) && isnegative(children(n)[2])
 
-function decompile(n::StructProb⋁Node, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
+function decompile(n::StructPlainSumNode, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
     if istrue_node(n)
         WeightedNamedConstantLine(node2id[n], vtree2id[n.vtree], lit2var(children(n)[1].literal), n.log_thetas[1]) # TODO
     else
@@ -139,13 +139,13 @@ function save_as_dot(circuit::ProbCircuit, file::String)
     end
 
     for n in reverse(circuit)
-        if n isa Prob⋀Node
+        if n isa PlainMulNode
             write(f, "$(node_cache[n]) [label=\"*$(node_cache[n])\"]\n")
         elseif n isa Prob⋁
             write(f, "$(node_cache[n]) [label=\"+$(node_cache[n])\"]\n")
-        elseif n isa ProbLiteralNode && ispositive(n)
+        elseif n isa PlainProbLiteralNode && ispositive(n)
             write(f, "$(node_cache[n]) [label=\"+$(variable(n.origin))\"]\n")
-        elseif n isa ProbLiteralNode && isnegative(n)
+        elseif n isa PlainProbLiteralNode && isnegative(n)
             write(f, "$(node_cache[n]) [label=\"-$(variable(n.origin))\"]\n")
         else
             throw("unknown ProbCircuit type")
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 732a0979..991787bb 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -10,29 +10,30 @@ using LogicCircuits
 include("Utils/Utils.jl")
 @reexport using .Utils
 
-include("prob_nodes.jl")
-include("structured_prob_nodes.jl")
-include("exp_flows.jl")
-include("queries.jl")
-include("informations.jl")
-include("parameters.jl")
+include("abstract_prob_nodes.jl")
+include("plain_prob_nodes.jl")
+# include("structured_prob_nodes.jl")
+# include("exp_flows.jl")
+# include("queries.jl")
+# include("informations.jl")
+# include("parameters.jl")
 
-include("logistic/logistic_nodes.jl")
-include("logistic/queries.jl")
+# include("logistic/logistic_nodes.jl")
+# include("logistic/queries.jl")
 
-include("reasoning/expectation.jl")
-include("reasoning/exp_flow_circuits.jl")
+# include("reasoning/expectation.jl")
+# include("reasoning/exp_flow_circuits.jl")
 
-include("mixtures/shared_prob_nodes.jl")
-include("mixtures/em.jl")
+# include("mixtures/shared_prob_nodes.jl")
+# include("mixtures/em.jl")
 
-include("structurelearner/chow_liu_tree.jl")
-include("structurelearner/init.jl")
-include("structurelearner/heuristics.jl")
-include("structurelearner/learner.jl")
+# include("structurelearner/chow_liu_tree.jl")
+# include("structurelearner/init.jl")
+# include("structurelearner/heuristics.jl")
+# include("structurelearner/learner.jl")
 
 
-include("LoadSave/LoadSave.jl")
-@reexport using .LoadSave
+# include("LoadSave/LoadSave.jl")
+# @reexport using .LoadSave
 
 end
diff --git a/src/Utils/Utils.jl b/src/Utils/Utils.jl
index 9bf1f2fc..b8ef7cac 100644
--- a/src/Utils/Utils.jl
+++ b/src/Utils/Utils.jl
@@ -5,7 +5,6 @@ that could be useful in any Julia project
 module Utils
 
 include("misc.jl")
-include("decorators.jl")
 include("informations.jl")
 
 end #module
diff --git a/src/Utils/decorators.jl b/src/Utils/decorators.jl
deleted file mode 100644
index bc83dd31..00000000
--- a/src/Utils/decorators.jl
+++ /dev/null
@@ -1,10 +0,0 @@
-export num_parameters
-
-#####################
-# functions that need to be implemented for logistic circuit and probability circuit
-#####################
-
-"""
-Get the number of parameters of a given decorator node/circuit
-"""
-function num_parameters end
\ No newline at end of file
diff --git a/src/Utils/misc.jl b/src/Utils/misc.jl
index 15d33338..642ba70e 100644
--- a/src/Utils/misc.jl
+++ b/src/Utils/misc.jl
@@ -7,7 +7,6 @@ using DataFrames
 # Misc.
 ####################
 
-
 function to_long_mi(m::Matrix{Float64}, min_int, max_int)::Matrix{Int64}
     δmi = maximum(m) - minimum(m)
     δint = max_int - min_int
@@ -17,6 +16,7 @@ end
 ###################
 # One-Hot Encoding
 ####################
+
 """
 One-hot encode data (2-D Array) based on categories (1-D Array)
 Each row of the return value is a concatenation of one-hot encoding of elements of the same row in data
diff --git a/src/abstract_prob_nodes.jl b/src/abstract_prob_nodes.jl
new file mode 100644
index 00000000..7b6e4d8b
--- /dev/null
+++ b/src/abstract_prob_nodes.jl
@@ -0,0 +1,67 @@
+export ProbCircuit,
+    multiply, summate, ismul, issum,
+    num_parameters,
+    mul_nodes, sum_nodes
+
+using LogicCircuits: LogicCircuit
+
+#####################
+# Abstract probabilistic circuit nodes
+#####################
+
+"Root of the probabilistic circuit node hierarchy"
+abstract type ProbCircuit <: LogicCircuit end
+
+#####################
+# node functions that need to be implemented for each type of circuit
+#####################
+
+import ..Utils.children # make available for extension by concrete types
+import LogicCircuits.compile # make available for extension by concrete types
+
+"Multiply nodes into a single circuit"
+function multiply end
+
+"Sum nodes into a single circuit"
+function summate end
+
+#####################
+# derived functions
+#####################
+
+"Is the node a multiplication?"
+@inline ismul(n) = GateType(n) isa ⋀Gate
+"Is the node a summation?"
+@inline issum(n) = GateType(n) isa ⋁Gate
+
+"Count the number of parameters in the circuit"
+@inline num_parameters(c::ProbCircuit) = 
+    sum(n -> num_parameters(n), sum_nodes(c))
+
+#####################
+# methods to easily construct circuits
+#####################
+
+@inline multiply(xs::PlainProbCircuit...) = multiply(collect(xs))
+@inline summate(xs::PlainProbCircuit...) = summate(collect(xs))
+
+import LogicCircuits: conjoin, disjoin # make available for extension
+
+# alias conjoin/disjoin using mul/sum terminology
+@inline conjoin(args::Vector{<:ProbCircuit}; reuse=nothing) = 
+    multiply(args; reuse)
+@inline disjoin(args::Vector{<:ProbCircuit}; reuse=nothing) = 
+    summate(args; reuse)
+
+@inline Base.:*(x::ProbCircuit, y::ProbCircuit) = multiply(x,y)
+@inline Base.:+(x::ProbCircuit, y::ProbCircuit) = summate(x,y)
+
+#####################
+# circuit inspection
+#####################
+
+"Get the list of multiplication nodes in a given circuit"
+mul_nodes(c::ProbCircuit) = ⋀_nodes(c)
+
+"Get the list of summation nodes in a given circuit"
+sum_nodes(c::ProbCircuit) = ⋁_nodes(c)
diff --git a/src/informations.jl b/src/informations.jl
index bc6e14c9..ade07e3d 100644
--- a/src/informations.jl
+++ b/src/informations.jl
@@ -18,7 +18,7 @@ function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
         return cache[psdd_node, sdd_node]
     
     # Boundary cases
-    elseif psdd_node isa StructProbLiteralNode
+    elseif psdd_node isa StructPlainProbLiteralNode
         # Both are literals, just check whether they agrees with each other 
         if isliteralgate(sdd_node)
             if literal(psdd_node) == literal(sdd_node)
@@ -38,7 +38,7 @@ function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
         end
     
     # The psdd is true
-    elseif children(psdd_node)[1] isa StructProbLiteralNode 
+    elseif children(psdd_node)[1] isa StructPlainProbLiteralNode 
         theta = exp(psdd_node.log_thetas[1])
         return get!(cache, (psdd_node, sdd_node),
             theta * pr_constraint(children(psdd_node)[1], sdd_node, cache) +
@@ -68,10 +68,10 @@ Calculate entropy of the distribution of the input psdd."
 """
 
 import ..Utils: entropy
-function entropy(psdd_node::StructProb⋁Node, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
+function entropy(psdd_node::StructPlainSumNode, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
-    elseif children(psdd_node)[1] isa StructProbLiteralNode
+    elseif children(psdd_node)[1] isa StructPlainProbLiteralNode
         return get!(psdd_entropy_cache, psdd_node,
             - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
             exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2])
@@ -88,27 +88,27 @@ function entropy(psdd_node::StructProb⋁Node, psdd_entropy_cache::Dict{ProbCirc
     end
 end
 
-function entropy(psdd_node::StructProb⋀Node, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructPlainMulNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, children(psdd_node)[1], entropy(children(psdd_node)[1], psdd_entropy_cache)) +
         get!(psdd_entropy_cache, children(psdd_node)[2], entropy(children(psdd_node)[2], psdd_entropy_cache))
 end
 
-function entropy(psdd_node::StructProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructPlainProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, psdd_node, 0.0)
 end
 
 "Calculate KL divergence calculation for psdds that are not necessarily identical"
-function kl_divergence(psdd_node1::StructProb⋁Node, psdd_node2::StructProb⋁Node,
+function kl_divergence(psdd_node1::StructPlainSumNode, psdd_node2::StructPlainSumNode,
         kl_divergence_cache::KLDCache=KLDCache(), pr_constraint_cache::PRCache=PRCache())
-    @assert !(psdd_node1 isa StructProb⋀Node || psdd_node2 isa StructProb⋀Node) "Prob⋀ not a valid PSDD node for KL-Divergence"
+    @assert !(psdd_node1 isa StructPlainMulNode || psdd_node2 isa StructPlainMulNode) "Prob⋀ not a valid PSDD node for KL-Divergence"
 
     # Check if both nodes are normalized for same vtree node
     @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[(psdd_node1, psdd_node2)]
-    elseif children(psdd_node1)[1] isa StructProbLiteralNode
-        if psdd_node2 isa StructProbLiteralNode
+    elseif children(psdd_node1)[1] isa StructPlainProbLiteralNode
+        if psdd_node2 isa StructPlainProbLiteralNode
             kl_divergence(children(psdd_node1)[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             if literal(children(psdd_node1)[1]) == literal(psdd_node2)
@@ -169,7 +169,7 @@ function kl_divergence(psdd_node1::StructProb⋁Node, psdd_node2::StructProb⋁N
     end
 end
 
-function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructProbLiteralNode,
+function kl_divergence(psdd_node1::StructPlainProbLiteralNode, psdd_node2::StructPlainProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     # Check if literals are over same variables in vtree
    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
@@ -182,7 +182,7 @@ function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructProb
     end
 end
 
-function kl_divergence(psdd_node1::StructProb⋁Node, psdd_node2::StructProbLiteralNode,
+function kl_divergence(psdd_node1::StructPlainSumNode, psdd_node2::StructPlainProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
@@ -203,7 +203,7 @@ function kl_divergence(psdd_node1::StructProb⋁Node, psdd_node2::StructProbLite
     end
 end
 
-function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructProb⋁Node,
+function kl_divergence(psdd_node1::StructPlainProbLiteralNode, psdd_node2::StructPlainSumNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
diff --git a/src/mixtures/em.jl b/src/mixtures/em.jl
index 2f35f3f4..ddb1d518 100644
--- a/src/mixtures/em.jl
+++ b/src/mixtures/em.jl
@@ -68,7 +68,7 @@ function log_likelihood_per_instance_per_component(pc::SharedProbCircuit, data)
     
     
     ll(n::SharedProbCircuit) = ()
-    ll(n::SharedProb⋁Node) = begin
+    ll(n::SharedPlainSumNode) = begin
         if num_children(n) != 1 # other nodes have no effect on likelihood
             for i in 1 : num_children(n)
                 c = children(n)[i]
diff --git a/src/mixtures/shared_prob_nodes.jl b/src/mixtures/shared_prob_nodes.jl
index 2d4f180f..e1af2011 100644
--- a/src/mixtures/shared_prob_nodes.jl
+++ b/src/mixtures/shared_prob_nodes.jl
@@ -1,5 +1,5 @@
-export SharedProbCircuit, SharedProbLeafNode, SharedProbInnerNode, SharedProbLiteralNode,
-SharedProb⋀Node, SharedProb⋁Node, num_components
+export SharedProbCircuit, SharedPlainProbLeafNode, SharedPlainProbInnerNode, SharedPlainProbLiteralNode,
+SharedPlainMulNode, SharedPlainSumNode, num_components
 
 #####################
 # Probabilistic circuits which share the same structure
@@ -13,42 +13,42 @@ abstract type SharedProbCircuit <: LogicCircuit end
 """
 A probabilistic leaf node
 """
-abstract type SharedProbLeafNode <: SharedProbCircuit end
+abstract type SharedPlainProbLeafNode <: SharedProbCircuit end
 
 """
 A probabilistic inner node
 """
-abstract type SharedProbInnerNode <: SharedProbCircuit end
+abstract type SharedPlainProbInnerNode <: SharedProbCircuit end
 
 """
 A probabilistic literal node
 """
-mutable struct SharedProbLiteralNode <: SharedProbLeafNode
+mutable struct SharedPlainProbLiteralNode <: SharedPlainProbLeafNode
     literal::Lit
     data
     counter::UInt32
-    SharedProbLiteralNode(l) = new(l, nothing, 0)
+    SharedPlainProbLiteralNode(l) = new(l, nothing, 0)
 end
 
 """
 A probabilistic conjunction node (And node)
 """
-mutable struct SharedProb⋀Node <: SharedProbInnerNode
+mutable struct SharedPlainMulNode <: SharedPlainProbInnerNode
     children::Vector{<:SharedProbCircuit}
     data
     counter::UInt32
-    SharedProb⋀Node(children) = new(convert(Vector{SharedProbCircuit}, children), nothing, 0)
+    SharedPlainMulNode(children) = new(convert(Vector{SharedProbCircuit}, children), nothing, 0)
 end
 
 """
 A probabilistic disjunction node (Or node)
 """
-mutable struct SharedProb⋁Node <: SharedProbInnerNode
+mutable struct SharedPlainSumNode <: SharedPlainProbInnerNode
     children::Vector{<:SharedProbCircuit}
     log_thetas::Matrix{Float64}
     data
     counter::UInt32
-    SharedProb⋁Node(children, n_mixture) = begin
+    SharedPlainSumNode(children, n_mixture) = begin
         new(convert(Vector{SharedProbCircuit}, children), init_array(Float64, length(children), n_mixture), nothing, 0)
     end
 end
@@ -58,9 +58,9 @@ end
 #####################
 
 import LogicCircuits.GateType # make available for extension
-@inline GateType(::Type{<:SharedProbLiteralNode}) = LiteralGate()
-@inline GateType(::Type{<:SharedProb⋀Node}) = ⋀Gate()
-@inline GateType(::Type{<:SharedProb⋁Node}) = ⋁Gate()
+@inline GateType(::Type{<:SharedPlainProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:SharedPlainMulNode}) = ⋀Gate()
+@inline GateType(::Type{<:SharedPlainSumNode}) = ⋁Gate()
 
 #####################
 # constructors and conversions
@@ -68,14 +68,14 @@ import LogicCircuits.GateType # make available for extension
 
 function SharedProbCircuit(circuit::LogicCircuit, num_mixture::Int64)::SharedProbCircuit
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = SharedProbLiteralNode(literal(n))
-    f_a(n, cn) = SharedProb⋀Node(cn)
-    f_o(n, cn) = SharedProb⋁Node(cn, num_mixture)
+    f_lit(n) = SharedPlainProbLiteralNode(literal(n))
+    f_a(n, cn) = SharedPlainMulNode(cn)
+    f_o(n, cn) = SharedPlainSumNode(cn, num_mixture)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, SharedProbCircuit)
 end
 
 
 import LogicCircuits: children # make available for extension
 
-@inline children(n::SharedProbInnerNode) = n.children
+@inline children(n::SharedPlainProbInnerNode) = n.children
 @inline num_components(n::SharedProbCircuit) = size(n.log_thetas)[2]
diff --git a/src/plain_prob_nodes.jl b/src/plain_prob_nodes.jl
new file mode 100644
index 00000000..68ced299
--- /dev/null
+++ b/src/plain_prob_nodes.jl
@@ -0,0 +1,108 @@
+export PlainProbCircuit, 
+    PlainProbLeafNode, PlainProbInnerNode, 
+    PlainProbLiteralNode, PlainMulNode, PlainSumNode
+
+#####################
+# Plain probabilistic circuit nodes
+#####################
+
+"Root of the plain probabilistic circuit node hierarchy"
+abstract type PlainProbCircuit <: ProbCircuit end
+
+"A probabilistic leaf node"
+abstract type PlainProbLeafNode <: PlainProbCircuit end
+
+"A probabilistic inner node"
+abstract type PlainProbInnerNode <: PlainProbCircuit end
+
+"A probabilistic literal node"
+mutable struct PlainProbLiteralNode <: PlainProbLeafNode
+    literal::Lit
+    data
+    counter::UInt32
+    PlainProbLiteralNode(l) = new(l, nothing, 0)
+end
+
+"A probabilistic conjunction node (multiplication node)"
+mutable struct PlainMulNode <: PlainProbInnerNode
+    children::Vector{PlainProbCircuit}
+    data
+    counter::UInt32
+    PlainMulNode(children) = begin
+        new(convert(Vector{PlainProbCircuit}, children), nothing, 0)
+    end
+end
+
+"A probabilistic disjunction node (summation node)"
+mutable struct PlainSumNode <: PlainProbInnerNode
+    children::Vector{PlainProbCircuit}
+    log_thetas::Vector{Float64}
+    data
+    counter::UInt32
+    PlainSumNode(c) = begin
+        new(c, init_array(Float64, length(children)), nothing, 0)
+    end
+end
+
+#####################
+# traits
+#####################
+
+import LogicCircuits.GateType # make available for extension
+
+@inline GateType(::Type{<:PlainProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:PlainMulNode}) = ⋀Gate()
+@inline GateType(::Type{<:PlainSumNode}) = ⋁Gate()
+
+#####################
+# methods
+#####################
+
+import LogicCircuits: children # make available for extension
+@inline children(n::PlainProbInnerNode) = n.children
+
+@inline num_parameters(n::PlainSumNode) = num_children(n)
+
+#####################
+# constructors and conversions
+#####################
+
+function multiply(arguments::Vector{<:PlainProbCircuit};
+                 reuse=nothing)
+    @assert length(arguments) > 0
+    reuse isa PlainMulNode && children(reuse) == arguments && return reuse
+    return PlainMulNode(arguments)
+end
+
+function summate(arguments::Vector{<:PlainProbCircuit};
+                    reuse=nothing)
+    @assert length(arguments) > 0
+    reuse isa PlainSumNode && children(reuse) == arguments && return reuse
+    return PlainSumNode(arguments)
+end
+
+# claim `PlainProbCircuit` as the default `ProbCircuit` implementation
+compile(::Type{ProbCircuit}, args...) =
+    compile(PlainProbCircuit, args...)
+
+compile(::Type{<:PlainProbCircuit}, ::Bool) =
+    error("Probabilistic circuits do not have constant leafs.")
+
+compile(::Type{<:PlainProbCircuit}, l::Lit) =
+    PlainProbLiteralNode(l)
+
+function compile(::Type{<:PlainProbCircuit}, circuit::LogicCircuit)
+    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
+    f_lit(n) = compile(PlainProbCircuit, literal(n))
+    f_a(_, cns) = multiply(cns)
+    f_o(_, cns) = summate(cns)
+    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainProbCircuit)
+end
+
+fully_factorized_circuit(::Type{ProbCircuit}, n::Int) =
+    fully_factorized_circuit(PlainProbCircuit, n)
+
+function fully_factorized_circuit(::Type{<:PlainProbCircuit}, n::Int)
+    ff_logic_circuit = fully_factorized_circuit(PlainLogicCircuit, n)
+    compile(PlainProbCircuit, ff_logic_circuit)
+end
\ No newline at end of file
diff --git a/src/prob_nodes.jl b/src/prob_nodes.jl
deleted file mode 100644
index 96694851..00000000
--- a/src/prob_nodes.jl
+++ /dev/null
@@ -1,96 +0,0 @@
-export PlainProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
-Prob⋁Node
-
-using LogicCircuits: LogicCircuit
-
-#####################
-# Infrastructure for probabilistic circuit nodes
-#####################
-
-"Root of the probabilistic circuit node hierarchy"
-abstract type PlainProbCircuit <: LogicCircuit end
-
-"""
-A probabilistic leaf node
-"""
-abstract type ProbLeafNode <: PlainProbCircuit end
-
-"""
-A probabilistic inner node
-"""
-abstract type ProbInnerNode <: PlainProbCircuit end
-
-"""
-A probabilistic literal node
-"""
-mutable struct ProbLiteralNode <: ProbLeafNode
-    literal::Lit
-    data
-    counter::UInt32
-    ProbLiteralNode(l) = new(l, nothing, 0)
-end
-
-"""
-A probabilistic conjunction node (And node)
-"""
-mutable struct Prob⋀Node <: ProbInnerNode
-    children::Vector{<:PlainProbCircuit}
-    data
-    counter::UInt32
-    Prob⋀Node(children) = begin
-        new(convert(Vector{PlainProbCircuit}, children), nothing, 0)
-    end
-end
-
-"""
-A probabilistic disjunction node (Or node)
-"""
-mutable struct Prob⋁Node <: ProbInnerNode
-    children::Vector{<:PlainProbCircuit}
-    log_thetas::Vector{Float64}
-    data
-    counter::UInt32
-    Prob⋁Node(children) = begin
-        new(convert(Vector{PlainProbCircuit}, children), init_array(Float64, length(children)), nothing, 0)
-    end
-end
-
-#####################
-# traits
-#####################
-
-import LogicCircuits.GateType # make available for extension
-
-@inline GateType(::Type{<:ProbLiteralNode}) = LiteralGate()
-@inline GateType(::Type{<:Prob⋀Node}) = ⋀Gate()
-@inline GateType(::Type{<:Prob⋁Node}) = ⋁Gate()
-
-#####################
-# methods
-#####################
-
-import LogicCircuits: children # make available for extension
-@inline children(n::ProbInnerNode) = n.children
-
-import ..Utils: num_parameters
-@inline num_parameters(c::PlainProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
-
-#####################
-# constructors and conversions
-#####################
-
-function PlainProbCircuit(circuit::PlainLogicCircuit)::PlainProbCircuit
-    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = ProbLiteralNode(literal(n))
-    f_a(n, cn) = Prob⋀Node(cn)
-    f_o(n, cn) = Prob⋁Node(cn)
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainProbCircuit)
-end
-
-function PlainLogicCircuit(circuit::PlainProbCircuit)::PlainLogicCircuit
-    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = PlainLiteralNode(literal(n))
-    f_a(n, cn) = Plain⋀Node(cn)
-    f_o(n, cn) = Plain⋁Node(cn)
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainLogicCircuit)
-end
diff --git a/src/queries.jl b/src/queries.jl
index 917e9fc7..91b0f2e7 100644
--- a/src/queries.jl
+++ b/src/queries.jl
@@ -12,7 +12,7 @@ function log_likelihood_per_instance(pc::ProbCircuit, data)
     indices = init_array(Bool, num_examples(data))::BitVector
     
     ll(n::ProbCircuit) = ()
-    ll(n::Union{Prob⋁Node, StructProb⋁Node}) = begin
+    ll(n::Union{PlainSumNode, StructPlainSumNode}) = begin
         if num_children(n) != 1 # other nodes have no effect on likelihood
             foreach(children(n), n.log_thetas) do c, log_theta
                 indices = get_downflow(n, c)
@@ -50,7 +50,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
     ans = falses(num_examples(evidence), num_features(evidence))
     active_samples = trues(num_examples(evidence))
 
-    function mpe_simulate(node::Union{ProbLiteralNode, StructProbLiteralNode}, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{PlainProbLiteralNode, StructPlainProbLiteralNode}, active_samples::BitVector, result::BitMatrix)
         if ispositive(node)
             result[active_samples, variable(node)] .= 1
         else
@@ -58,7 +58,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
         end
     end
     
-    function mpe_simulate(node::Union{Prob⋁Node, StructProb⋁Node}, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{PlainSumNode, StructPlainSumNode}, active_samples::BitVector, result::BitMatrix)
         prs = zeros(length(children(node)), size(active_samples)[1] )
         @simd  for i=1:length(children(node))
             prs[i,:] .= get_exp_upflow(children(node)[i]) .+ (node.log_thetas[i])
@@ -72,7 +72,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
         end
     end
     
-    function mpe_simulate(node::Union{Prob⋀Node, StructProb⋀Node}, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{PlainMulNode, StructPlainMulNode}, active_samples::BitVector, result::BitMatrix)
         for child in children(node)
             mpe_simulate(child, active_samples, result)
         end
@@ -92,16 +92,16 @@ Sample from a PSDD without any evidence
 """
 function sample(circuit::ProbCircuit)::AbstractVector{Bool}
 
-    simulate(node::Union{ProbLiteralNode, StructProbLiteralNode}) = begin
+    simulate(node::Union{PlainProbLiteralNode, StructPlainProbLiteralNode}) = begin
         inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
-    simulate(node::Union{Prob⋁Node, StructProb⋁Node}) = begin
+    simulate(node::Union{PlainSumNode, StructPlainSumNode}) = begin
         idx = sample(exp.(node.log_thetas))
         simulate(children(node)[idx])
     end
 
-    simulate(node::Union{Prob⋀Node, StructProb⋀Node}) = foreach(simulate, children(node))
+    simulate(node::Union{PlainMulNode, StructPlainMulNode}) = foreach(simulate, children(node))
 
     inst = Dict{Var,Int64}()
     simulate(circuit)
@@ -121,17 +121,17 @@ function sample(circuit::ProbCircuit, evidence)::AbstractVector{Bool}
 
     @assert num_examples(evidence) == 1 "evidence have to be one example"
     
-    simulate(node::Union{ProbLiteralNode, StructProbLiteralNode}) = begin
+    simulate(node::Union{PlainProbLiteralNode, StructPlainProbLiteralNode}) = begin
         inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
-    function simulate(node::Union{Prob⋁Node, StructProb⋁Node})
+    function simulate(node::Union{PlainSumNode, StructPlainSumNode})
         prs = [get_exp_upflow(ch)[1] for ch in children(node)] # #evidence == 1
         idx = sample(exp.(node.log_thetas .+ prs))
         simulate(children(node)[idx])
     end
     
-    simulate(node::Union{Prob⋀Node, StructProb⋀Node}) = foreach(simulate, children(node))
+    simulate(node::Union{PlainMulNode, StructPlainMulNode}) = foreach(simulate, children(node))
 
     evaluate_exp(circuit, evidence)
 
diff --git a/src/reasoning/exp_flow_circuits.jl b/src/reasoning/exp_flow_circuits.jl
index 363e7229..eef7575b 100644
--- a/src/reasoning/exp_flow_circuits.jl
+++ b/src/reasoning/exp_flow_circuits.jl
@@ -37,7 +37,7 @@ function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, :
     sizehint!(cache, (num_nodes(pc) + num_nodes(lc))*4÷3)
     expFlowCircuit = Vector{ExpFlowNode}()
 
-    function ExpflowTraverse(n::Prob⋁Node, m::Logistic⋁Node) 
+    function ExpflowTraverse(n::PlainSumNode, m::Logistic⋁Node) 
         get!(cache, Pair(n, m)) do
             ch = [ ExpflowTraverse(i, j) for i in children(n) for j in children(m)]
             node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
@@ -45,7 +45,7 @@ function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, :
             return node
         end
     end
-    function ExpflowTraverse(n::Prob⋀Node, m::Logistic⋀Node) 
+    function ExpflowTraverse(n::PlainMulNode, m::Logistic⋀Node) 
         get!(cache, Pair(n, m)) do
             ch = [ ExpflowTraverse(z[1], z[2]) for z in zip(children(n), children(m)) ]
             node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
@@ -53,7 +53,7 @@ function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, :
             return node
         end
     end
-    function ExpflowTraverse(n::ProbLiteralNode, m::Logistic⋁Node) 
+    function ExpflowTraverse(n::PlainProbLiteralNode, m::Logistic⋁Node) 
         get!(cache, Pair(n, m)) do
             ch = Vector{ExpFlowNode{F}}() # TODO
             node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
@@ -61,7 +61,7 @@ function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, :
             return node
         end
     end
-    function ExpflowTraverse(n::ProbLiteralNode, m::LogisticLiteral) 
+    function ExpflowTraverse(n::PlainProbLiteralNode, m::LogisticLiteral) 
         get!(cache, Pair(n, m)) do
             ch = Vector{ExpFlowNode{F}}() # TODO
             node = UpExpFlow{F}(n, m, ch, fmem(), fgmem())
@@ -95,7 +95,7 @@ function exp_pass_up_node(node::ExpFlowNode{E}, data) where E
     pType = typeof(node.p_origin)
     fType = typeof(node.f_origin)
 
-    if node.p_origin isa Prob⋁Node && node.f_origin isa Logistic⋁Node
+    if node.p_origin isa PlainSumNode && node.f_origin isa Logistic⋁Node
         #todo this ordering might be different than the ExpFlowNode children
         pthetas = [exp(node.p_origin.log_thetas[i])
                     for i in 1:length(children(node.p_origin)) for j in 1:length(children(node.f_origin))]
@@ -109,12 +109,12 @@ function exp_pass_up_node(node::ExpFlowNode{E}, data) where E
             node.fg .+= (pthetas[z] .* fthetas[z]) .* children(node)[z].f
             node.fg .+= pthetas[z] .* children(node)[z].fg
         end
-    elseif node.p_origin isa Prob⋀Node && node.f_origin isa Logistic⋀Node
+    elseif node.p_origin isa PlainMulNode && node.f_origin isa Logistic⋀Node
         node.f .= children(node)[1].f .* children(node)[2].f # assume 2 children
         node.fg .= (children(node)[1].f .* children(node)[2].fg) .+
                    (children(node)[2].f .* children(node)[1].fg)
 
-    elseif node.p_origin isa ProbLiteralNode 
+    elseif node.p_origin isa PlainProbLiteralNode 
         if node.f_origin isa Logistic⋁Node
             m = children(node.f_origin)[1]
         elseif node.f_origin isa LogisticLiteral
diff --git a/src/reasoning/expectation.jl b/src/reasoning/expectation.jl
index 85e573c3..9bc70047 100644
--- a/src/reasoning/expectation.jl
+++ b/src/reasoning/expectation.jl
@@ -95,7 +95,7 @@ end
 # exp_f (pr-constraint) is originally from:
 #   Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
 
-function exp_f(n::Prob⋁Node, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::PlainSumNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
         pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
@@ -108,7 +108,7 @@ function exp_f(n::Prob⋁Node, m::Logistic⋁Node, data, cache::Union{Expectatio
     end
 end
 
-function exp_f(n::Prob⋀Node, m::Logistic⋀Node, data, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::PlainMulNode, m::Logistic⋀Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = ones(1 , num_examples(data) )
         @fastmath for (i,j) in zip(children(n), children(m))
@@ -120,7 +120,7 @@ function exp_f(n::Prob⋀Node, m::Logistic⋀Node, data, cache::Union{Expectatio
 end
 
 
-@inline function exp_f(n::ProbLiteralNode, m::LogisticLiteral, data, cache::Union{ExpectationCache, MomentCache})
+@inline function exp_f(n::PlainProbLiteralNode, m::LogisticLiteral, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
         var = lit2var(literal(m))
@@ -141,7 +141,7 @@ end
 """
 Has to be a Logistic⋁Node with only one child, which is a leaf node 
 """
-@inline function exp_f(n::ProbLiteralNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
+@inline function exp_f(n::PlainProbLiteralNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         exp_f(n, children(m)[1], data, cache)
     end
@@ -151,7 +151,7 @@ end
 ######## exp_g, exp_fg
 ########################################################################
 
-@inline function exp_g(n::Prob⋁Node, m::Logistic⋁Node, data, cache::ExpectationCache)
+@inline function exp_g(n::PlainSumNode, m::Logistic⋁Node, data, cache::ExpectationCache)
     exp_fg(n, m, data, cache) # exp_fg and exp_g are the same for OR nodes
 end
 
@@ -165,7 +165,7 @@ end
 # end
 
 
-function exp_fg(n::Prob⋁Node, m::Logistic⋁Node, data, cache::ExpectationCache)
+function exp_fg(n::PlainSumNode, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         value = zeros(classes(m) , num_examples(data) )
         pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
@@ -179,7 +179,7 @@ function exp_fg(n::Prob⋁Node, m::Logistic⋁Node, data, cache::ExpectationCach
     end
 end
 
-function exp_fg(n::Prob⋀Node, m::Logistic⋀Node, data, cache::ExpectationCache)
+function exp_fg(n::PlainMulNode, m::Logistic⋀Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         # Assuming 2 children
         value = exp_f(children(n)[1], children(m)[1], data, cache) .* exp_fg(children(n)[2], children(m)[2], data, cache)
@@ -192,13 +192,13 @@ end
 """
 Has to be a Logistic⋁Node with only one child, which is a leaf node 
 """
-@inline function exp_fg(n::ProbLiteralNode, m::Logistic⋁Node, data, cache::ExpectationCache)
+@inline function exp_fg(n::PlainProbLiteralNode, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         m.thetas[1,:] .* exp_f(n, m, data, cache)
     end
 end
 
-@inline function exp_fg(n::ProbLiteralNode, m::LogisticLiteral, data, cache::ExpectationCache)
+@inline function exp_fg(n::PlainProbLiteralNode, m::LogisticLiteral, data, cache::ExpectationCache)
     #dont know how many classes, boradcasting does the job
     zeros(1 , num_examples(data)) 
 end
@@ -207,7 +207,7 @@ end
 ######## moment_g, moment_fg
 ########################################################################
 
-@inline function moment_g(n::Prob⋁Node, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
+@inline function moment_g(n::PlainSumNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         moment_fg(n, m, data, moment, cache)
     end
@@ -216,7 +216,7 @@ end
 """
 Calculating  E[g^k * f]
 """
-function moment_fg(n::Prob⋁Node, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
+function moment_fg(n::PlainSumNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
@@ -235,13 +235,13 @@ function moment_fg(n::Prob⋁Node, m::Logistic⋁Node, data, moment::Int, cache:
     end
 end
 
-@inline function moment_fg(n::ProbLiteralNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
+@inline function moment_fg(n::PlainProbLiteralNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         m.thetas[1,:].^(moment) .* exp_f(n, m, data, cache)
     end
 end
 
-@inline function moment_fg(n::ProbLiteralNode, m::LogisticLiteral, data, moment::Int, cache::MomentCache)
+@inline function moment_fg(n::PlainProbLiteralNode, m::LogisticLiteral, data, moment::Int, cache::MomentCache)
     #dont know how many classes, boradcasting does the job
     if moment == 0
         exp_f(n, m, data, cache)
@@ -250,7 +250,7 @@ end
     end
 end
 
-function moment_fg(n::Prob⋀Node, m::Logistic⋀Node, data, moment::Int, cache::MomentCache)
+function moment_fg(n::PlainMulNode, m::Logistic⋀Node, data, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
diff --git a/src/structured_prob_nodes.jl b/src/structured_prob_nodes.jl
index cc064d9f..cd0f9fc6 100644
--- a/src/structured_prob_nodes.jl
+++ b/src/structured_prob_nodes.jl
@@ -1,5 +1,5 @@
-export ProbCircuit, StructProbCircuit,  StructProbLeafNode, StructProbInnerNode,
-    StructProbLiteralNode, StructProb⋀Node, StructProb⋁Node, check_parameter_integrity
+export ProbCircuit, StructProbCircuit,  StructPlainProbLeafNode, StructPlainProbInnerNode,
+    StructPlainProbLiteralNode, StructPlainMulNode, StructPlainSumNode, check_parameter_integrity
 
 #####################
 # Prob circuits that are structured,
@@ -13,31 +13,31 @@ abstract type StructProbCircuit <: StructLogicCircuit end
 const ProbCircuit = Union{StructProbCircuit, PlainProbCircuit}
 
 "A plain structured probabilistic leaf node"
-abstract type StructProbLeafNode <: StructProbCircuit end
+abstract type StructPlainProbLeafNode <: StructProbCircuit end
 
 "A plain structured probabilistic inner node"
-abstract type StructProbInnerNode <: StructProbCircuit end
+abstract type StructPlainProbInnerNode <: StructProbCircuit end
 
 "A plain structured probabilistic literal leaf node, representing the positive or negative literal of its variable"
-mutable struct StructProbLiteralNode <: StructProbLeafNode
+mutable struct StructPlainProbLiteralNode <: StructPlainProbLeafNode
     literal::Lit
     vtree::Vtree
     data
     counter::UInt32
-    StructProbLiteralNode(l,v) = begin
+    StructPlainProbLiteralNode(l,v) = begin
         @assert lit2var(l) ∈ v 
         new(l, v, nothing, 0)
     end
 end
 
 "A plain structured probabilistic conjunction node"
-mutable struct StructProb⋀Node <: StructProbInnerNode
+mutable struct StructPlainMulNode <: StructPlainProbInnerNode
     prime::StructProbCircuit
     sub::StructProbCircuit
     vtree::Vtree
     data
     counter::UInt32
-    StructProb⋀Node(p,s,v) = begin
+    StructPlainMulNode(p,s,v) = begin
         @assert isinner(v) "Structured conjunctions must respect inner vtree node"
         @assert varsubset_left(vtree(p),v) "$p does not go left in $v"
         @assert varsubset_right(vtree(s),v) "$s does not go right in $v"
@@ -46,13 +46,13 @@ mutable struct StructProb⋀Node <: StructProbInnerNode
 end
 
 "A plain structured probabilistic disjunction node"
-mutable struct StructProb⋁Node <: StructProbInnerNode
+mutable struct StructPlainSumNode <: StructPlainProbInnerNode
     children::Vector{<:StructProbCircuit}
     log_thetas::Vector{Float64}
     vtree::Vtree # could be leaf or inner
     data
     counter::UInt32
-    StructProb⋁Node(c, v) = new(c, init_array(Float64, length(c)), v, nothing, 0)
+    StructPlainSumNode(c, v) = new(c, init_array(Float64, length(c)), v, nothing, 0)
 end
 
 #####################
@@ -60,22 +60,22 @@ end
 #####################
 
 import LogicCircuits.GateType # make available for extension
-@inline GateType(::Type{<:StructProbLiteralNode}) = LiteralGate()
-@inline GateType(::Type{<:StructProb⋀Node}) = ⋀Gate()
-@inline GateType(::Type{<:StructProb⋁Node}) = ⋁Gate()
+@inline GateType(::Type{<:StructPlainProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:StructPlainMulNode}) = ⋀Gate()
+@inline GateType(::Type{<:StructPlainSumNode}) = ⋁Gate()
 
 #####################
 # methods
 #####################
 
 import LogicCircuits: children, vtree, vtree_safe # make available for extension
-@inline children(n::StructProb⋁Node) = n.children
-@inline children(n::StructProb⋀Node) = [n.prime,n.sub]
+@inline children(n::StructPlainSumNode) = n.children
+@inline children(n::StructPlainMulNode) = [n.prime,n.sub]
 
 "Get the vtree corresponding to the argument, or nothing if the node has no vtree"
 @inline vtree(n::StructProbCircuit) = n.vtree
-@inline vtree_safe(n::StructProbInnerNode) = vtree(n)
-@inline vtree_safe(n::StructProbLiteralNode) = vtree(n)
+@inline vtree_safe(n::StructPlainProbInnerNode) = vtree(n)
+@inline vtree_safe(n::StructPlainProbLiteralNode) = vtree(n)
 
 import ..Utils: num_parameters
 @inline num_parameters(c::StructProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
@@ -86,12 +86,12 @@ import ..Utils: num_parameters
 
 function StructProbCircuit(circuit::PlainStructLogicCircuit)::StructProbCircuit
     f_con(n) = error("Cannot construct a struct probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = StructProbLiteralNode(literal(n), vtree(n))
+    f_lit(n) = StructPlainProbLiteralNode(literal(n), vtree(n))
     f_a(n, cn) = begin
         @assert length(cn)==2
-        StructProb⋀Node(cn[1], cn[2], vtree(n))
+        StructPlainMulNode(cn[1], cn[2], vtree(n))
     end
-    f_o(n, cn) = StructProb⋁Node(cn, vtree(n))
+    f_o(n, cn) = StructPlainSumNode(cn, vtree(n))
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, StructProbCircuit)
 end 
 
@@ -119,10 +119,10 @@ conjoin(arguments::Vector{<:StructProbCircuit};
 function conjoin(a1::StructProbCircuit,  
                  a2::StructProbCircuit;
                  reuse=nothing, use_vtree=nothing) 
-    reuse isa StructProb⋀Node && reuse.prime == a1 && reuse.sub == a2 && return reuse
+    reuse isa StructPlainMulNode && reuse.prime == a1 && reuse.sub == a2 && return reuse
     !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
     !(use_vtree isa Vtree) && (use_vtree = find_inode(vtree_safe(a1), vtree_safe(a2)))
-    return StructProb⋀Node(a1, a2, use_vtree)
+    return StructPlainMulNode(a1, a2, use_vtree)
 end
 
 # ProbCircuit has a default argument for respects: its root's vtree
@@ -134,10 +134,10 @@ respects_vtree(circuit::ProbCircuit) =
 function disjoin(arguments::Vector{<:StructProbCircuit};
                  reuse=nothing, use_vtree=nothing)
     @assert length(arguments) > 0
-    reuse isa StructProb⋁Node && reuse.children == arguments && return reuse
+    reuse isa StructPlainSumNode && reuse.children == arguments && return reuse
     !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
     !(use_vtree isa Vtree) && (use_vtree = mapreduce(vtree_safe, lca, arguments))
-    return StructProb⋁Node(arguments, use_vtree)
+    return StructPlainSumNode(arguments, use_vtree)
 end
 
 # claim `StructProbCircuit` as the default `ProbCircuit` implementation that has a vtree
diff --git a/test/Probabilistic/prob_nodes_tests.jl b/test/Probabilistic/prob_nodes_tests.jl
index 6f25bbc6..1872e85a 100644
--- a/test/Probabilistic/prob_nodes_tests.jl
+++ b/test/Probabilistic/prob_nodes_tests.jl
@@ -12,9 +12,9 @@ include("../helper/plain_logic_circuits.jl")
     
     # traits
     @test p1 isa ProbCircuit
-    @test p1 isa Prob⋁Node
-    @test children(p1)[1] isa Prob⋀Node
-    @test lit3 isa ProbLiteralNode
+    @test p1 isa PlainSumNode
+    @test children(p1)[1] isa PlainMulNode
+    @test lit3 isa PlainProbLiteralNode
     @test GateType(p1) isa ⋁Gate
     @test GateType(children(p1)[1]) isa ⋀Gate
     @test GateType(lit3) isa LiteralGate

From 65486206cf893a738aefd41786fbd8f99c8d6078 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 30 Aug 2020 02:02:40 -0500
Subject: [PATCH 070/131] disable broken tests during refactoring

---
 src/ProbabilisticCircuits.jl                          |  2 +-
 src/abstract_prob_nodes.jl                            |  9 ++++-----
 src/plain_prob_nodes.jl                               |  7 +++++--
 test/{ => broken}/LoadSave/circuit_loaders_tests.jl   |  0
 test/{ => broken}/LoadSave/circuit_savers_test.jl     |  0
 test/{ => broken}/Logistic/logistic_tests.jl          |  0
 test/{ => broken}/Mixtures/EMLearnerTest.jl           |  0
 test/{ => broken}/Probabilistic/informations_tests.jl |  0
 test/{ => broken}/Probabilistic/parameters_tests.jl   |  0
 test/{ => broken}/Probabilistic/queries_tests.jl      |  0
 test/{ => broken}/Reasoning/expectation_test.jl       |  0
 .../{ => broken}/StructureLearner/VtreeLearnerTest.jl |  0
 .../StructureLearner/chow_liu_tree_tests.jl           |  0
 test/{ => broken}/StructureLearner/init_tests.jl      |  0
 test/{ => broken}/Utils/informations_tests.jl         |  0
 .../prob_nodes_tests.jl => plain_prob_nodes_tests.jl} | 11 ++++++++---
 test/runtests.jl                                      |  2 +-
 17 files changed, 19 insertions(+), 12 deletions(-)
 rename test/{ => broken}/LoadSave/circuit_loaders_tests.jl (100%)
 rename test/{ => broken}/LoadSave/circuit_savers_test.jl (100%)
 rename test/{ => broken}/Logistic/logistic_tests.jl (100%)
 rename test/{ => broken}/Mixtures/EMLearnerTest.jl (100%)
 rename test/{ => broken}/Probabilistic/informations_tests.jl (100%)
 rename test/{ => broken}/Probabilistic/parameters_tests.jl (100%)
 rename test/{ => broken}/Probabilistic/queries_tests.jl (100%)
 rename test/{ => broken}/Reasoning/expectation_test.jl (100%)
 rename test/{ => broken}/StructureLearner/VtreeLearnerTest.jl (100%)
 rename test/{ => broken}/StructureLearner/chow_liu_tree_tests.jl (100%)
 rename test/{ => broken}/StructureLearner/init_tests.jl (100%)
 rename test/{ => broken}/Utils/informations_tests.jl (100%)
 rename test/{Probabilistic/prob_nodes_tests.jl => plain_prob_nodes_tests.jl} (82%)

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 991787bb..1e023f08 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -5,7 +5,7 @@ module ProbabilisticCircuits
 # USE EXTERNAL MODULES
 
 using Reexport
-using LogicCircuits
+@reexport using LogicCircuits
 
 include("Utils/Utils.jl")
 @reexport using .Utils
diff --git a/src/abstract_prob_nodes.jl b/src/abstract_prob_nodes.jl
index 7b6e4d8b..8226c203 100644
--- a/src/abstract_prob_nodes.jl
+++ b/src/abstract_prob_nodes.jl
@@ -16,8 +16,7 @@ abstract type ProbCircuit <: LogicCircuit end
 # node functions that need to be implemented for each type of circuit
 #####################
 
-import ..Utils.children # make available for extension by concrete types
-import LogicCircuits.compile # make available for extension by concrete types
+import LogicCircuits: children, compile # extend
 
 "Multiply nodes into a single circuit"
 function multiply end
@@ -36,14 +35,14 @@ function summate end
 
 "Count the number of parameters in the circuit"
 @inline num_parameters(c::ProbCircuit) = 
-    sum(n -> num_parameters(n), sum_nodes(c))
+    sum(n -> num_parameters_node(n), sum_nodes(c))
 
 #####################
 # methods to easily construct circuits
 #####################
 
-@inline multiply(xs::PlainProbCircuit...) = multiply(collect(xs))
-@inline summate(xs::PlainProbCircuit...) = summate(collect(xs))
+@inline multiply(xs::ProbCircuit...) = multiply(collect(xs))
+@inline summate(xs::ProbCircuit...) = summate(collect(xs))
 
 import LogicCircuits: conjoin, disjoin # make available for extension
 
diff --git a/src/plain_prob_nodes.jl b/src/plain_prob_nodes.jl
index 68ced299..a0892710 100644
--- a/src/plain_prob_nodes.jl
+++ b/src/plain_prob_nodes.jl
@@ -40,7 +40,7 @@ mutable struct PlainSumNode <: PlainProbInnerNode
     data
     counter::UInt32
     PlainSumNode(c) = begin
-        new(c, init_array(Float64, length(children)), nothing, 0)
+        new(c, init_array(Float64, length(c)), nothing, 0)
     end
 end
 
@@ -61,7 +61,8 @@ import LogicCircuits.GateType # make available for extension
 import LogicCircuits: children # make available for extension
 @inline children(n::PlainProbInnerNode) = n.children
 
-@inline num_parameters(n::PlainSumNode) = num_children(n)
+"Count the number of parameters in the node"
+@inline num_parameters_node(n::PlainSumNode) = num_children(n)
 
 #####################
 # constructors and conversions
@@ -99,6 +100,8 @@ function compile(::Type{<:PlainProbCircuit}, circuit::LogicCircuit)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainProbCircuit)
 end
 
+import LogicCircuits: fully_factorized_circuit #extend
+
 fully_factorized_circuit(::Type{ProbCircuit}, n::Int) =
     fully_factorized_circuit(PlainProbCircuit, n)
 
diff --git a/test/LoadSave/circuit_loaders_tests.jl b/test/broken/LoadSave/circuit_loaders_tests.jl
similarity index 100%
rename from test/LoadSave/circuit_loaders_tests.jl
rename to test/broken/LoadSave/circuit_loaders_tests.jl
diff --git a/test/LoadSave/circuit_savers_test.jl b/test/broken/LoadSave/circuit_savers_test.jl
similarity index 100%
rename from test/LoadSave/circuit_savers_test.jl
rename to test/broken/LoadSave/circuit_savers_test.jl
diff --git a/test/Logistic/logistic_tests.jl b/test/broken/Logistic/logistic_tests.jl
similarity index 100%
rename from test/Logistic/logistic_tests.jl
rename to test/broken/Logistic/logistic_tests.jl
diff --git a/test/Mixtures/EMLearnerTest.jl b/test/broken/Mixtures/EMLearnerTest.jl
similarity index 100%
rename from test/Mixtures/EMLearnerTest.jl
rename to test/broken/Mixtures/EMLearnerTest.jl
diff --git a/test/Probabilistic/informations_tests.jl b/test/broken/Probabilistic/informations_tests.jl
similarity index 100%
rename from test/Probabilistic/informations_tests.jl
rename to test/broken/Probabilistic/informations_tests.jl
diff --git a/test/Probabilistic/parameters_tests.jl b/test/broken/Probabilistic/parameters_tests.jl
similarity index 100%
rename from test/Probabilistic/parameters_tests.jl
rename to test/broken/Probabilistic/parameters_tests.jl
diff --git a/test/Probabilistic/queries_tests.jl b/test/broken/Probabilistic/queries_tests.jl
similarity index 100%
rename from test/Probabilistic/queries_tests.jl
rename to test/broken/Probabilistic/queries_tests.jl
diff --git a/test/Reasoning/expectation_test.jl b/test/broken/Reasoning/expectation_test.jl
similarity index 100%
rename from test/Reasoning/expectation_test.jl
rename to test/broken/Reasoning/expectation_test.jl
diff --git a/test/StructureLearner/VtreeLearnerTest.jl b/test/broken/StructureLearner/VtreeLearnerTest.jl
similarity index 100%
rename from test/StructureLearner/VtreeLearnerTest.jl
rename to test/broken/StructureLearner/VtreeLearnerTest.jl
diff --git a/test/StructureLearner/chow_liu_tree_tests.jl b/test/broken/StructureLearner/chow_liu_tree_tests.jl
similarity index 100%
rename from test/StructureLearner/chow_liu_tree_tests.jl
rename to test/broken/StructureLearner/chow_liu_tree_tests.jl
diff --git a/test/StructureLearner/init_tests.jl b/test/broken/StructureLearner/init_tests.jl
similarity index 100%
rename from test/StructureLearner/init_tests.jl
rename to test/broken/StructureLearner/init_tests.jl
diff --git a/test/Utils/informations_tests.jl b/test/broken/Utils/informations_tests.jl
similarity index 100%
rename from test/Utils/informations_tests.jl
rename to test/broken/Utils/informations_tests.jl
diff --git a/test/Probabilistic/prob_nodes_tests.jl b/test/plain_prob_nodes_tests.jl
similarity index 82%
rename from test/Probabilistic/prob_nodes_tests.jl
rename to test/plain_prob_nodes_tests.jl
index 1872e85a..4c83c70e 100644
--- a/test/Probabilistic/prob_nodes_tests.jl
+++ b/test/plain_prob_nodes_tests.jl
@@ -2,14 +2,17 @@ using Test
 using LogicCircuits
 using ProbabilisticCircuits
 
-include("../helper/plain_logic_circuits.jl")
+include("helper/plain_logic_circuits.jl")
 
 @testset "probabilistic circuit nodes" begin
+
     c1 = little_3var()
+
+    @test isdisjoint(linearize(ProbCircuit(c1)), linearize(ProbCircuit(c1)))
+    
     p1 = ProbCircuit(c1)
     lit3 = children(children(p1)[1])[1]
-    @test isempty(intersect(linearize(ProbCircuit(c1)), linearize(ProbCircuit(c1))))
-    
+
     # traits
     @test p1 isa ProbCircuit
     @test p1 isa PlainSumNode
@@ -30,4 +33,6 @@ include("../helper/plain_logic_circuits.jl")
     @test num_nodes(p1) == 15
     @test num_edges(p1) == 18
 
+    r1 = fully_factorized_circuit(ProbCircuit,10)
+    
 end
\ No newline at end of file
diff --git a/test/runtests.jl b/test/runtests.jl
index e0920969..6c0ce54c 100644
--- a/test/runtests.jl
+++ b/test/runtests.jl
@@ -12,4 +12,4 @@ end
 using Jive
 
 # TODO reinstate after refactoring all modules
-runtests(@__DIR__, skip=["runtests.jl", "helper", "Mixtures", "StructureLearner/VtreeLearnerTest.jl"])
+runtests(@__DIR__, skip=["runtests.jl", "helper", "broken"])

From 235df8da7d8b39027b906b9c04a0b86949cf8e91 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 30 Aug 2020 02:24:13 -0500
Subject: [PATCH 071/131] reinstate `parameters.jl`

---
 src/ProbabilisticCircuits.jl                  |  3 ++-
 test/broken/Probabilistic/parameters_tests.jl |  8 --------
 test/parameters_tests.jl                      | 16 ++++++++++++++++
 test/plain_prob_nodes_tests.jl                |  3 ++-
 4 files changed, 20 insertions(+), 10 deletions(-)
 delete mode 100644 test/broken/Probabilistic/parameters_tests.jl
 create mode 100644 test/parameters_tests.jl

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 1e023f08..8f56a49f 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -12,11 +12,12 @@ include("Utils/Utils.jl")
 
 include("abstract_prob_nodes.jl")
 include("plain_prob_nodes.jl")
+include("parameters.jl")
+
 # include("structured_prob_nodes.jl")
 # include("exp_flows.jl")
 # include("queries.jl")
 # include("informations.jl")
-# include("parameters.jl")
 
 # include("logistic/logistic_nodes.jl")
 # include("logistic/queries.jl")
diff --git a/test/broken/Probabilistic/parameters_tests.jl b/test/broken/Probabilistic/parameters_tests.jl
deleted file mode 100644
index 0f953904..00000000
--- a/test/broken/Probabilistic/parameters_tests.jl
+++ /dev/null
@@ -1,8 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-# TODO add tests
-@testset "MLE tests" begin
-    @test true
-end
\ No newline at end of file
diff --git a/test/parameters_tests.jl b/test/parameters_tests.jl
new file mode 100644
index 00000000..3c05f660
--- /dev/null
+++ b/test/parameters_tests.jl
@@ -0,0 +1,16 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+using DataFrames: DataFrame
+
+@testset "MLE tests" begin
+    
+    dfb = DataFrame(BitMatrix([true false; true true; false true]))
+    r = fully_factorized_circuit(ProbCircuit,num_features(dfb))
+    estimate_parameters(r,dfb; pseudocount=1.0)
+
+    # TODO test identical likelihoods with
+    # ll1  = LogicCircuits.Utils.fully_factorized_log_likelihood(dfb; pseudocount=1)
+    # ll0 = LogicCircuits.Utils.fully_factorized_log_likelihood(dfb)
+
+end
\ No newline at end of file
diff --git a/test/plain_prob_nodes_tests.jl b/test/plain_prob_nodes_tests.jl
index 4c83c70e..eb43baec 100644
--- a/test/plain_prob_nodes_tests.jl
+++ b/test/plain_prob_nodes_tests.jl
@@ -34,5 +34,6 @@ include("helper/plain_logic_circuits.jl")
     @test num_edges(p1) == 18
 
     r1 = fully_factorized_circuit(ProbCircuit,10)
-    
+    @test num_parameters(r1) == 2*10+1
+
 end
\ No newline at end of file

From d20a06966c725f88904cb39e505ead4199cb5897 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 30 Aug 2020 22:13:09 -0500
Subject: [PATCH 072/131] reinstate structured probabilistic circuits and add
 tests

---
 src/LoadSave/circuit_savers.jl      |   6 +-
 src/ProbabilisticCircuits.jl        |   3 +-
 src/abstract_prob_nodes.jl          |  10 +++
 src/informations.jl                 |  26 +++---
 src/plain_prob_nodes.jl             |   3 -
 src/queries.jl                      |  20 ++---
 src/structured_prob_nodes.jl        | 135 ++++++++++------------------
 test/plain_prob_nodes_tests.jl      |   5 +-
 test/structured_prob_nodes_tests.jl | 100 +++++++++++++++++++++
 9 files changed, 189 insertions(+), 119 deletions(-)
 create mode 100644 test/structured_prob_nodes_tests.jl

diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 99353283..180e54a2 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -15,17 +15,17 @@ using LogicCircuits.LoadSave: SDDElement,
 #####################
 
 "Decompile for psdd circuit, used during saving of circuits to file" 
-decompile(n::StructPlainProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine = 
+decompile(n::StructProbLiteralNode, node2id, vtree2id)::UnweightedLiteralLine = 
     UnweightedLiteralLine(node2id[n], vtree2id[n.vtree], literal(n), true)
 
-make_element(n::StructPlainMulNode, w::AbstractFloat, node2id) = 
+make_element(n::StructMulNode, w::AbstractFloat, node2id) = 
     PSDDElement(node2id[children(n)[1]],  node2id[children(n)[2]], w)
 
 istrue_node(n)::Bool = 
     is⋁gate(n) && num_children(n) == 2 && GateType(children(n)[1]) isa LiteralGate && GateType(children(n)[2]) isa LiteralGate && 
     ispositive(children(n)[1]) && isnegative(children(n)[2])
 
-function decompile(n::StructPlainSumNode, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
+function decompile(n::StructSumNode, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
     if istrue_node(n)
         WeightedNamedConstantLine(node2id[n], vtree2id[n.vtree], lit2var(children(n)[1].literal), n.log_thetas[1]) # TODO
     else
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 8f56a49f..83b3588d 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -14,7 +14,8 @@ include("abstract_prob_nodes.jl")
 include("plain_prob_nodes.jl")
 include("parameters.jl")
 
-# include("structured_prob_nodes.jl")
+include("structured_prob_nodes.jl")
+
 # include("exp_flows.jl")
 # include("queries.jl")
 # include("informations.jl")
diff --git a/src/abstract_prob_nodes.jl b/src/abstract_prob_nodes.jl
index 8226c203..4d9c0127 100644
--- a/src/abstract_prob_nodes.jl
+++ b/src/abstract_prob_nodes.jl
@@ -55,6 +55,9 @@ import LogicCircuits: conjoin, disjoin # make available for extension
 @inline Base.:*(x::ProbCircuit, y::ProbCircuit) = multiply(x,y)
 @inline Base.:+(x::ProbCircuit, y::ProbCircuit) = summate(x,y)
 
+compile(::Type{<:ProbCircuit}, ::Bool) =
+    error("Probabilistic circuits do not have constant leafs.")
+
 #####################
 # circuit inspection
 #####################
@@ -64,3 +67,10 @@ mul_nodes(c::ProbCircuit) = ⋀_nodes(c)
 
 "Get the list of summation nodes in a given circuit"
 sum_nodes(c::ProbCircuit) = ⋁_nodes(c)
+
+function check_parameter_integrity(circuit::ProbCircuit)
+    for node in sum_nodes(circuit)
+        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
+    end
+    true
+end
\ No newline at end of file
diff --git a/src/informations.jl b/src/informations.jl
index ade07e3d..67d0f3af 100644
--- a/src/informations.jl
+++ b/src/informations.jl
@@ -18,7 +18,7 @@ function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
         return cache[psdd_node, sdd_node]
     
     # Boundary cases
-    elseif psdd_node isa StructPlainProbLiteralNode
+    elseif psdd_node isa StructProbLiteralNode
         # Both are literals, just check whether they agrees with each other 
         if isliteralgate(sdd_node)
             if literal(psdd_node) == literal(sdd_node)
@@ -38,7 +38,7 @@ function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
         end
     
     # The psdd is true
-    elseif children(psdd_node)[1] isa StructPlainProbLiteralNode 
+    elseif children(psdd_node)[1] isa StructProbLiteralNode 
         theta = exp(psdd_node.log_thetas[1])
         return get!(cache, (psdd_node, sdd_node),
             theta * pr_constraint(children(psdd_node)[1], sdd_node, cache) +
@@ -68,10 +68,10 @@ Calculate entropy of the distribution of the input psdd."
 """
 
 import ..Utils: entropy
-function entropy(psdd_node::StructPlainSumNode, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
+function entropy(psdd_node::StructSumNode, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
     if psdd_node in keys(psdd_entropy_cache)
         return psdd_entropy_cache[psdd_node]
-    elseif children(psdd_node)[1] isa StructPlainProbLiteralNode
+    elseif children(psdd_node)[1] isa StructProbLiteralNode
         return get!(psdd_entropy_cache, psdd_node,
             - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
             exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2])
@@ -88,27 +88,27 @@ function entropy(psdd_node::StructPlainSumNode, psdd_entropy_cache::Dict{ProbCir
     end
 end
 
-function entropy(psdd_node::StructPlainMulNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructMulNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, children(psdd_node)[1], entropy(children(psdd_node)[1], psdd_entropy_cache)) +
         get!(psdd_entropy_cache, children(psdd_node)[2], entropy(children(psdd_node)[2], psdd_entropy_cache))
 end
 
-function entropy(psdd_node::StructPlainProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+function entropy(psdd_node::StructProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
     return get!(psdd_entropy_cache, psdd_node, 0.0)
 end
 
 "Calculate KL divergence calculation for psdds that are not necessarily identical"
-function kl_divergence(psdd_node1::StructPlainSumNode, psdd_node2::StructPlainSumNode,
+function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructSumNode,
         kl_divergence_cache::KLDCache=KLDCache(), pr_constraint_cache::PRCache=PRCache())
-    @assert !(psdd_node1 isa StructPlainMulNode || psdd_node2 isa StructPlainMulNode) "Prob⋀ not a valid PSDD node for KL-Divergence"
+    @assert !(psdd_node1 isa StructMulNode || psdd_node2 isa StructMulNode) "Prob⋀ not a valid PSDD node for KL-Divergence"
 
     # Check if both nodes are normalized for same vtree node
     @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
     if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
         return kl_divergence_cache[(psdd_node1, psdd_node2)]
-    elseif children(psdd_node1)[1] isa StructPlainProbLiteralNode
-        if psdd_node2 isa StructPlainProbLiteralNode
+    elseif children(psdd_node1)[1] isa StructProbLiteralNode
+        if psdd_node2 isa StructProbLiteralNode
             kl_divergence(children(psdd_node1)[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             if literal(children(psdd_node1)[1]) == literal(psdd_node2)
@@ -169,7 +169,7 @@ function kl_divergence(psdd_node1::StructPlainSumNode, psdd_node2::StructPlainSu
     end
 end
 
-function kl_divergence(psdd_node1::StructPlainProbLiteralNode, psdd_node2::StructPlainProbLiteralNode,
+function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     # Check if literals are over same variables in vtree
    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
@@ -182,7 +182,7 @@ function kl_divergence(psdd_node1::StructPlainProbLiteralNode, psdd_node2::Struc
     end
 end
 
-function kl_divergence(psdd_node1::StructPlainSumNode, psdd_node2::StructPlainProbLiteralNode,
+function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
@@ -203,7 +203,7 @@ function kl_divergence(psdd_node1::StructPlainSumNode, psdd_node2::StructPlainPr
     end
 end
 
-function kl_divergence(psdd_node1::StructPlainProbLiteralNode, psdd_node2::StructPlainSumNode,
+function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructSumNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
 
diff --git a/src/plain_prob_nodes.jl b/src/plain_prob_nodes.jl
index a0892710..3403ecee 100644
--- a/src/plain_prob_nodes.jl
+++ b/src/plain_prob_nodes.jl
@@ -86,9 +86,6 @@ end
 compile(::Type{ProbCircuit}, args...) =
     compile(PlainProbCircuit, args...)
 
-compile(::Type{<:PlainProbCircuit}, ::Bool) =
-    error("Probabilistic circuits do not have constant leafs.")
-
 compile(::Type{<:PlainProbCircuit}, l::Lit) =
     PlainProbLiteralNode(l)
 
diff --git a/src/queries.jl b/src/queries.jl
index 91b0f2e7..190c536a 100644
--- a/src/queries.jl
+++ b/src/queries.jl
@@ -12,7 +12,7 @@ function log_likelihood_per_instance(pc::ProbCircuit, data)
     indices = init_array(Bool, num_examples(data))::BitVector
     
     ll(n::ProbCircuit) = ()
-    ll(n::Union{PlainSumNode, StructPlainSumNode}) = begin
+    ll(n::Union{PlainSumNode, StructSumNode}) = begin
         if num_children(n) != 1 # other nodes have no effect on likelihood
             foreach(children(n), n.log_thetas) do c, log_theta
                 indices = get_downflow(n, c)
@@ -50,7 +50,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
     ans = falses(num_examples(evidence), num_features(evidence))
     active_samples = trues(num_examples(evidence))
 
-    function mpe_simulate(node::Union{PlainProbLiteralNode, StructPlainProbLiteralNode}, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{PlainProbLiteralNode, StructProbLiteralNode}, active_samples::BitVector, result::BitMatrix)
         if ispositive(node)
             result[active_samples, variable(node)] .= 1
         else
@@ -58,7 +58,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
         end
     end
     
-    function mpe_simulate(node::Union{PlainSumNode, StructPlainSumNode}, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{PlainSumNode, StructSumNode}, active_samples::BitVector, result::BitMatrix)
         prs = zeros(length(children(node)), size(active_samples)[1] )
         @simd  for i=1:length(children(node))
             prs[i,:] .= get_exp_upflow(children(node)[i]) .+ (node.log_thetas[i])
@@ -72,7 +72,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
         end
     end
     
-    function mpe_simulate(node::Union{PlainMulNode, StructPlainMulNode}, active_samples::BitVector, result::BitMatrix)
+    function mpe_simulate(node::Union{PlainMulNode, StructMulNode}, active_samples::BitVector, result::BitMatrix)
         for child in children(node)
             mpe_simulate(child, active_samples, result)
         end
@@ -92,16 +92,16 @@ Sample from a PSDD without any evidence
 """
 function sample(circuit::ProbCircuit)::AbstractVector{Bool}
 
-    simulate(node::Union{PlainProbLiteralNode, StructPlainProbLiteralNode}) = begin
+    simulate(node::Union{PlainProbLiteralNode, StructProbLiteralNode}) = begin
         inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
-    simulate(node::Union{PlainSumNode, StructPlainSumNode}) = begin
+    simulate(node::Union{PlainSumNode, StructSumNode}) = begin
         idx = sample(exp.(node.log_thetas))
         simulate(children(node)[idx])
     end
 
-    simulate(node::Union{PlainMulNode, StructPlainMulNode}) = foreach(simulate, children(node))
+    simulate(node::Union{PlainMulNode, StructMulNode}) = foreach(simulate, children(node))
 
     inst = Dict{Var,Int64}()
     simulate(circuit)
@@ -121,17 +121,17 @@ function sample(circuit::ProbCircuit, evidence)::AbstractVector{Bool}
 
     @assert num_examples(evidence) == 1 "evidence have to be one example"
     
-    simulate(node::Union{PlainProbLiteralNode, StructPlainProbLiteralNode}) = begin
+    simulate(node::Union{PlainProbLiteralNode, StructProbLiteralNode}) = begin
         inst[variable(node)] = ispositive(node) ? 1 : 0
     end
     
-    function simulate(node::Union{PlainSumNode, StructPlainSumNode})
+    function simulate(node::Union{PlainSumNode, StructSumNode})
         prs = [get_exp_upflow(ch)[1] for ch in children(node)] # #evidence == 1
         idx = sample(exp.(node.log_thetas .+ prs))
         simulate(children(node)[idx])
     end
     
-    simulate(node::Union{PlainMulNode, StructPlainMulNode}) = foreach(simulate, children(node))
+    simulate(node::Union{PlainMulNode, StructMulNode}) = foreach(simulate, children(node))
 
     evaluate_exp(circuit, evidence)
 
diff --git a/src/structured_prob_nodes.jl b/src/structured_prob_nodes.jl
index cd0f9fc6..f1817ee5 100644
--- a/src/structured_prob_nodes.jl
+++ b/src/structured_prob_nodes.jl
@@ -1,5 +1,5 @@
-export ProbCircuit, StructProbCircuit,  StructPlainProbLeafNode, StructPlainProbInnerNode,
-    StructPlainProbLiteralNode, StructPlainMulNode, StructPlainSumNode, check_parameter_integrity
+export ProbCircuit, StructProbCircuit, StructProbLeafNode, StructProbInnerNode,
+    StructProbLiteralNode, StructMulNode, StructSumNode, check_parameter_integrity
 
 #####################
 # Prob circuits that are structured,
@@ -7,37 +7,34 @@ export ProbCircuit, StructProbCircuit,  StructPlainProbLeafNode, StructPlainProb
 #####################
 
 "Root of the plain structure probabilistic circuit node hierarchy"
-abstract type StructProbCircuit <: StructLogicCircuit end
-
-"Root of the probabilistic circuit node hierarchy"
-const ProbCircuit = Union{StructProbCircuit, PlainProbCircuit}
+abstract type StructProbCircuit <: ProbCircuit end
 
 "A plain structured probabilistic leaf node"
-abstract type StructPlainProbLeafNode <: StructProbCircuit end
+abstract type StructProbLeafNode <: StructProbCircuit end
 
 "A plain structured probabilistic inner node"
-abstract type StructPlainProbInnerNode <: StructProbCircuit end
+abstract type StructProbInnerNode <: StructProbCircuit end
 
 "A plain structured probabilistic literal leaf node, representing the positive or negative literal of its variable"
-mutable struct StructPlainProbLiteralNode <: StructPlainProbLeafNode
+mutable struct StructProbLiteralNode <: StructProbLeafNode
     literal::Lit
     vtree::Vtree
     data
     counter::UInt32
-    StructPlainProbLiteralNode(l,v) = begin
+    StructProbLiteralNode(l,v) = begin
         @assert lit2var(l) ∈ v 
         new(l, v, nothing, 0)
     end
 end
 
 "A plain structured probabilistic conjunction node"
-mutable struct StructPlainMulNode <: StructPlainProbInnerNode
+mutable struct StructMulNode <: StructProbInnerNode
     prime::StructProbCircuit
     sub::StructProbCircuit
     vtree::Vtree
     data
     counter::UInt32
-    StructPlainMulNode(p,s,v) = begin
+    StructMulNode(p,s,v) = begin
         @assert isinner(v) "Structured conjunctions must respect inner vtree node"
         @assert varsubset_left(vtree(p),v) "$p does not go left in $v"
         @assert varsubset_right(vtree(s),v) "$s does not go right in $v"
@@ -46,13 +43,14 @@ mutable struct StructPlainMulNode <: StructPlainProbInnerNode
 end
 
 "A plain structured probabilistic disjunction node"
-mutable struct StructPlainSumNode <: StructPlainProbInnerNode
-    children::Vector{<:StructProbCircuit}
+mutable struct StructSumNode <: StructProbInnerNode
+    children::Vector{StructProbCircuit}
     log_thetas::Vector{Float64}
     vtree::Vtree # could be leaf or inner
     data
     counter::UInt32
-    StructPlainSumNode(c, v) = new(c, init_array(Float64, length(c)), v, nothing, 0)
+    StructSumNode(c, v) = 
+        new(c, init_array(Float64, length(c)), v, nothing, 0)
 end
 
 #####################
@@ -60,115 +58,76 @@ end
 #####################
 
 import LogicCircuits.GateType # make available for extension
-@inline GateType(::Type{<:StructPlainProbLiteralNode}) = LiteralGate()
-@inline GateType(::Type{<:StructPlainMulNode}) = ⋀Gate()
-@inline GateType(::Type{<:StructPlainSumNode}) = ⋁Gate()
+@inline GateType(::Type{<:StructProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:StructMulNode}) = ⋀Gate()
+@inline GateType(::Type{<:StructSumNode}) = ⋁Gate()
 
 #####################
 # methods
 #####################
 
-import LogicCircuits: children, vtree, vtree_safe # make available for extension
-@inline children(n::StructPlainSumNode) = n.children
-@inline children(n::StructPlainMulNode) = [n.prime,n.sub]
+import LogicCircuits: children, vtree, vtree_safe, respects_vtree # make available for extension
+@inline children(n::StructSumNode) = n.children
+@inline children(n::StructMulNode) = [n.prime,n.sub]
 
 "Get the vtree corresponding to the argument, or nothing if the node has no vtree"
 @inline vtree(n::StructProbCircuit) = n.vtree
-@inline vtree_safe(n::StructPlainProbInnerNode) = vtree(n)
-@inline vtree_safe(n::StructPlainProbLiteralNode) = vtree(n)
+@inline vtree_safe(n::StructProbInnerNode) = vtree(n)
+@inline vtree_safe(n::StructProbLiteralNode) = vtree(n)
 
-import ..Utils: num_parameters
-@inline num_parameters(c::StructProbCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
+# ProbCircuit has a default argument for respects: its root's vtree
+respects_vtree(circuit::StructProbCircuit) = 
+    respects_vtree(circuit, vtree(circuit))
+
+@inline num_parameters_node(n::StructSumNode) = num_children(n)
 
 #####################
-# constructors and conversions
+# constructors and compilation
 #####################
 
-function StructProbCircuit(circuit::PlainStructLogicCircuit)::StructProbCircuit
-    f_con(n) = error("Cannot construct a struct probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = StructPlainProbLiteralNode(literal(n), vtree(n))
-    f_a(n, cn) = begin
-        @assert length(cn)==2
-        StructPlainMulNode(cn[1], cn[2], vtree(n))
-    end
-    f_o(n, cn) = StructPlainSumNode(cn, vtree(n))
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, StructProbCircuit)
-end 
-
-function PlainStructLogicCircuit(circuit::StructProbCircuit)::PlainStructLogicCircuit
-    f_con(n) = error("Cannot construct a struct probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = PlainStructLiteralNode(literal(n), vtree(n))
-    f_a(n, cn) = begin
-        @assert length(cn)==2
-        PlainStruct⋀Node(cn[1], cn[2], vtree(n))
-    end
-    f_o(n, cn) = PlainStruct⋁Node(cn, vtree(n))
-    foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, PlainStructLogicCircuit)
-end
-
-@inline ProbCircuit(circuit::PlainStructLogicCircuit) = StructProbCircuit(circuit)
-
-@inline ProbCircuit(circuit::PlainLogicCircuit) = PlainProbCircuit(circuit)
-
-import LogicCircuits: conjoin, disjoin, compile # make available for extension
-
-conjoin(arguments::Vector{<:StructProbCircuit};
+multiply(arguments::Vector{<:StructProbCircuit};
         reuse=nothing, use_vtree=nothing) =
-        conjoin(arguments...; reuse, use_vtree)
+        multiply(arguments...; reuse, use_vtree)
 
-function conjoin(a1::StructProbCircuit,  
+function multiply(a1::StructProbCircuit,  
                  a2::StructProbCircuit;
                  reuse=nothing, use_vtree=nothing) 
-    reuse isa StructPlainMulNode && reuse.prime == a1 && reuse.sub == a2 && return reuse
+    reuse isa StructMulNode && reuse.prime == a1 && reuse.sub == a2 && return reuse
     !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
     !(use_vtree isa Vtree) && (use_vtree = find_inode(vtree_safe(a1), vtree_safe(a2)))
-    return StructPlainMulNode(a1, a2, use_vtree)
+    return StructMulNode(a1, a2, use_vtree)
 end
 
-# ProbCircuit has a default argument for respects: its root's vtree
-respects_vtree(circuit::ProbCircuit) = 
-    respects_vtree(circuit, vtree(circuit))
-
-@inline disjoin(xs::StructProbCircuit...) = disjoin(collect(xs))
-
-function disjoin(arguments::Vector{<:StructProbCircuit};
+function summate(arguments::Vector{<:StructProbCircuit};
                  reuse=nothing, use_vtree=nothing)
     @assert length(arguments) > 0
-    reuse isa StructPlainSumNode && reuse.children == arguments && return reuse
+    reuse isa StructSumNode && reuse.children == arguments && return reuse
     !(use_vtree isa Vtree) && (reuse isa StructProbCircuit) &&  (use_vtree = reuse.vtree)
     !(use_vtree isa Vtree) && (use_vtree = mapreduce(vtree_safe, lca, arguments))
-    return StructPlainSumNode(arguments, use_vtree)
+    return StructSumNode(arguments, use_vtree)
 end
 
 # claim `StructProbCircuit` as the default `ProbCircuit` implementation that has a vtree
-compile(::Type{ProbCircuit}, args...) =
-    compile(StructProbCircuit, args...)
-
-compile(::Type{<:StructProbCircuit}, ::Vtree, b::Bool) =
-    compile(StructProbCircuit, b)
 
-# act as a place holder in `condition`
-using LogicCircuits: structfalse
+compile(n::StructProbCircuit, args...) = 
+    compile(typeof(n), root(vtree(n)), args...)
 
-compile(::Type{<:StructProbCircuit}, b::Bool) =
-    b ? structtrue : structfalse
+compile(::Type{<:StructProbCircuit}, ::Vtree, ::Bool) =
+    error("Probabilistic circuits do not have constant leafs.")
 
 compile(::Type{<:StructProbCircuit}, vtree::Vtree, l::Lit) =
-    PlainStructLiteralNode(l,find_leaf(lit2var(l),vtree))
+    StructProbLiteralNode(l,find_leaf(lit2var(l),vtree))
 
 
-function compile(::Type{<:StructProbCircuit}, vtree::Vtree, circuit::StructProbCircuit)
-    f_con(n) = error("ProbCircuit does not have a constant node")
+function compile(::Type{<:StructProbCircuit}, vtree::Vtree, circuit::LogicCircuit)
+    f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
     f_lit(n) = compile(StructProbCircuit, vtree, literal(n))
-    f_a(n, cns) = conjoin(cns...) # note: this will use the LCA as vtree node
-    f_o(n, cns) = disjoin(cns) # note: this will use the LCA as vtree node
+    f_a(n, cns) = multiply(cns...) # note: this will use the LCA as vtree node
+    f_o(n, cns) = summate(cns) # note: this will use the LCA as vtree node
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, StructProbCircuit)
 end
 
-
-function check_parameter_integrity(circuit::ProbCircuit)
-    for node in or_nodes(circuit)
-        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
-    end
-    true
+function fully_factorized_circuit(::Type{<:StructProbCircuit}, vtree::Vtree)
+    ff_logic_circuit = fully_factorized_circuit(PlainStructLogicCircuit, vtree)
+    compile(StructProbCircuit, vtree, ff_logic_circuit)
 end
diff --git a/test/plain_prob_nodes_tests.jl b/test/plain_prob_nodes_tests.jl
index eb43baec..1ace42ce 100644
--- a/test/plain_prob_nodes_tests.jl
+++ b/test/plain_prob_nodes_tests.jl
@@ -21,7 +21,8 @@ include("helper/plain_logic_circuits.jl")
     @test GateType(p1) isa ⋁Gate
     @test GateType(children(p1)[1]) isa ⋀Gate
     @test GateType(lit3) isa LiteralGate
-
+    @test length(mul_nodes(p1)) == 4
+    
     # methods
     @test num_parameters(p1) == 10
 
@@ -36,4 +37,6 @@ include("helper/plain_logic_circuits.jl")
     r1 = fully_factorized_circuit(ProbCircuit,10)
     @test num_parameters(r1) == 2*10+1
 
+    @test length(mul_nodes(r1)) == 1
+
 end
\ No newline at end of file
diff --git a/test/structured_prob_nodes_tests.jl b/test/structured_prob_nodes_tests.jl
new file mode 100644
index 00000000..2947c9f5
--- /dev/null
+++ b/test/structured_prob_nodes_tests.jl
@@ -0,0 +1,100 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+
+@testset "structured probabilistic circuit nodes" begin
+
+    vtree = PlainVtree(10, :balanced)
+    f = fully_factorized_circuit(StructProbCircuit, vtree)
+    @test f isa StructProbCircuit
+    @test num_nodes(f) == 20+10+9*2+1
+    @test num_edges(f) == 20+18+9+1
+    @test length(mul_nodes(f)) == 9
+    @test length(sum_nodes(f)) == 10+9+1
+
+    @test respects_vtree(f)
+    @test respects_vtree(f, PlainVtree(10, :balanced))
+    @test !respects_vtree(f, PlainVtree(5, :balanced))
+    @test !respects_vtree(f, PlainVtree(10, :rightlinear))
+    @test !respects_vtree(f, PlainVtree(10, :leftlinear))
+
+    @test variable(left_most_descendent(f)) == Var(1)
+    @test variable(right_most_descendent(f)) == Var(10)
+    @test ispositive(left_most_descendent(f))
+    @test isnegative(right_most_descendent(f))
+
+    @test literal((StructProbCircuit,vtree)(Lit(-5))) == Lit(-5)
+
+    @test_throws Exception multiply(StructProbCircuit[])
+    @test_throws Exception summate(StructProbCircuit[])
+
+    @test isdecomposable(f)
+
+    @test variables(f) == BitSet(1:10)
+    @test num_variables(f) == 10
+    @test issmooth(f)
+
+    @test f(DataFrame(BitArray([1 0 1 0 1 0 1 0 1 0;
+                    1 1 1 1 1 1 1 1 1 1;
+                    0 0 0 0 0 0 0 0 0 0;
+                    0 1 1 0 1 0 0 1 0 1]))) == BitVector([1,1,1,1])
+
+    plainf = PlainLogicCircuit(f) 
+    foreach(plainf) do n
+        @test n isa PlainLogicCircuit
+    end
+    @test plainf !== f
+    @test num_edges(plainf) == num_edges(f)
+    @test num_nodes(plainf) == num_nodes(f) 
+    @test length(and_nodes(plainf)) == 9
+    @test length(or_nodes(plainf)) == 10+9+1
+    @test model_count(plainf) == BigInt(2)^10
+    @test isempty(intersect(linearize(f),linearize(plainf)))
+
+    ref = StructProbCircuit(vtree,plainf)
+    foreach(ref) do n
+        @test n isa StructProbCircuit
+    end
+    @test plainf !== ref
+    @test f !== ref
+    @test f.vtree === ref.vtree
+    @test num_edges(ref) == num_edges(f)
+    @test num_nodes(ref) == num_nodes(f) 
+    @test length(and_nodes(ref)) == 9
+    @test length(or_nodes(ref)) == 10+9+1
+    @test model_count(ref) == BigInt(2)^10
+    @test isempty(intersect(linearize(f),linearize(ref)))
+
+    ref = StructProbCircuit(vtree,f)
+    foreach(ref) do n
+        @test n isa StructProbCircuit
+    end
+    @test plainf !== ref
+    @test f !== ref
+    @test f.vtree === ref.vtree
+    @test num_edges(ref) == num_edges(f)
+    @test num_nodes(ref) == num_nodes(f) 
+    @test length(and_nodes(ref)) == 9
+    @test length(or_nodes(ref)) == 10+9+1
+    @test model_count(ref) == BigInt(2)^10
+    @test isempty(intersect(linearize(f),linearize(ref)))
+
+    mgr = SddMgr(7, :balanced)
+    v = Dict([(i => compile(mgr, Lit(i))) for i=1:7])
+    c = (v[1] | !v[2] | v[3]) &
+        (v[2] | !v[7] | v[6]) &
+        (v[3] | !v[4] | v[5]) &
+        (v[1] | !v[4] | v[6])
+
+    c2 = StructLogicCircuit(mgr, c)
+    c2 = propagate_constants(c2; remove_unary=true)
+    
+    c3 = StructProbCircuit(mgr, c2)
+    foreach(c3) do n
+      @test n isa StructProbCircuit
+    end
+    @test num_edges(c3) == 69
+    @test num_variables(c3) == 7
+
+end
\ No newline at end of file

From 8b230e4db987e3ab4d519d9befd3c94d9335e172 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 30 Aug 2020 22:29:40 -0500
Subject: [PATCH 073/131] clean up dependencies

---
 Project.toml                        | 1 +
 src/{ => reasoning}/informations.jl | 0
 test/Project.toml                   | 4 ----
 3 files changed, 1 insertion(+), 4 deletions(-)
 rename src/{ => reasoning}/informations.jl (100%)

diff --git a/Project.toml b/Project.toml
index 7094194f..5152a47b 100644
--- a/Project.toml
+++ b/Project.toml
@@ -28,6 +28,7 @@ StatsFuns = "4c63d2b9-4356-54db-8cca-17b64c39e42c"
 BlossomV = "0.4"
 CUDA = "1.2"
 Clustering = "0.14"
+DataFrames = "0.21"
 DataStructures = "0.17"
 LightGraphs = "1.3"
 LogicCircuits = "0.1.1"
diff --git a/src/informations.jl b/src/reasoning/informations.jl
similarity index 100%
rename from src/informations.jl
rename to src/reasoning/informations.jl
diff --git a/test/Project.toml b/test/Project.toml
index 77513980..90671629 100644
--- a/test/Project.toml
+++ b/test/Project.toml
@@ -1,10 +1,6 @@
 [deps]
-DataStructures = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8"
 Distributed = "8ba89e20-285c-5b6f-9357-94700520ee1b"
 Jive = "ba5e3d4b-8524-549f-bc71-e76ad9e9deed"
-LightGraphs = "093fc24a-ae57-5d10-9952-331d41423f4d"
-LogicCircuits = "a7847b3b-b7f1-4dd5-83c3-60e0aa0f8599"
-MetaGraphs = "626554b9-1ddb-594c-aa3c-2596fe9399a5"
 Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"

From aece7d02e547f3ae68e3b8b7e13ac83e32dae661 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Mon, 31 Aug 2020 02:12:17 -0500
Subject: [PATCH 074/131]  likelihood computation on CPU

---
 src/LoadSave/circuit_line_compiler.jl         |   4 +-
 src/LoadSave/circuit_savers.jl                |   6 +-
 src/ProbabilisticCircuits.jl                  |   3 +-
 src/abstract_prob_nodes.jl                    |   7 +-
 src/exp_flows.jl                              | 219 ------------------
 src/mixtures/em.jl                            |  10 +-
 src/mixtures/shared_prob_nodes.jl             |   4 +-
 src/parameters.jl                             |  14 +-
 src/plain_prob_nodes.jl                       |   2 +-
 src/{reasoning => queries}/expectation.jl     |  71 +++++-
 .../expected_flows.jl}                        |   2 +-
 src/queries/expected_flows2.jl                | 217 +++++++++++++++++
 .../information.jl}                           |  93 ++------
 src/queries/likelihood.jl                     | 123 ++++++++++
 src/{ => queries}/queries.jl                  |  35 +--
 src/structured_prob_nodes.jl                  |   2 +-
 test/broken/LoadSave/circuit_loaders_tests.jl |  18 +-
 test/broken/StructureLearner/init_tests.jl    |   2 +-
 18 files changed, 466 insertions(+), 366 deletions(-)
 delete mode 100644 src/exp_flows.jl
 rename src/{reasoning => queries}/expectation.jl (77%)
 rename src/{reasoning/exp_flow_circuits.jl => queries/expected_flows.jl} (99%)
 create mode 100644 src/queries/expected_flows2.jl
 rename src/{reasoning/informations.jl => queries/information.jl} (66%)
 create mode 100644 src/queries/likelihood.jl
 rename src/{ => queries}/queries.jl (78%)

diff --git a/src/LoadSave/circuit_line_compiler.jl b/src/LoadSave/circuit_line_compiler.jl
index a0d09d7e..2aca9f95 100644
--- a/src/LoadSave/circuit_line_compiler.jl
+++ b/src/LoadSave/circuit_line_compiler.jl
@@ -62,11 +62,11 @@ function decorate_prob(lines::CircuitFormatLines, logic_circuit::LogicCircuit, i
     function compile(ln::WeightedNamedConstantLine)
         @assert lnconstant(ln) == true
         root = id2probnode(ln.node_id)
-        root.log_thetas .= [ln.weight, log1p(-exp(ln.weight))]
+        root.log_probs .= [ln.weight, log1p(-exp(ln.weight))]
     end
     function compile(ln::DecisionLine{<:PSDDElement})
         root = id2probnode(ln.node_id)
-        root.log_thetas .= [x.weight for x in ln.elements]
+        root.log_probs .= [x.weight for x in ln.elements]
     end
 
     foreach(compile, lines)
diff --git a/src/LoadSave/circuit_savers.jl b/src/LoadSave/circuit_savers.jl
index 180e54a2..fd22fc52 100644
--- a/src/LoadSave/circuit_savers.jl
+++ b/src/LoadSave/circuit_savers.jl
@@ -27,9 +27,9 @@ istrue_node(n)::Bool =
 
 function decompile(n::StructSumNode, node2id, vtree2id)::Union{WeightedNamedConstantLine, DecisionLine{PSDDElement}} 
     if istrue_node(n)
-        WeightedNamedConstantLine(node2id[n], vtree2id[n.vtree], lit2var(children(n)[1].literal), n.log_thetas[1]) # TODO
+        WeightedNamedConstantLine(node2id[n], vtree2id[n.vtree], lit2var(children(n)[1].literal), n.log_probs[1]) # TODO
     else
-        DecisionLine(node2id[n], vtree2id[n.vtree], UInt32(num_children(n)), map(x -> make_element(x[1], x[2], node2id), zip(children(n), n.log_thetas)))
+        DecisionLine(node2id[n], vtree2id[n.vtree], UInt32(num_children(n)), map(x -> make_element(x[1], x[2], node2id), zip(children(n), n.log_probs)))
     end
 end
 
@@ -158,7 +158,7 @@ function save_as_dot(circuit::ProbCircuit, file::String)
                 write(f, "$(node_cache[n]) -> $(node_cache[c])\n")
             end
         elseif n isa Prob⋁
-            for (c, p) in zip(children(n), exp.(n.log_thetas))
+            for (c, p) in zip(children(n), exp.(n.log_probs))
                 prob = @sprintf "%0.1f" p
                 write(f, "$(node_cache[n]) -> $(node_cache[c]) [label=\"$prob\"]\n")
             end
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 83b3588d..6aa05804 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -13,9 +13,10 @@ include("Utils/Utils.jl")
 include("abstract_prob_nodes.jl")
 include("plain_prob_nodes.jl")
 include("parameters.jl")
-
 include("structured_prob_nodes.jl")
 
+include("queries/likelihood.jl")
+
 # include("exp_flows.jl")
 # include("queries.jl")
 # include("informations.jl")
diff --git a/src/abstract_prob_nodes.jl b/src/abstract_prob_nodes.jl
index 4d9c0127..46e37c66 100644
--- a/src/abstract_prob_nodes.jl
+++ b/src/abstract_prob_nodes.jl
@@ -13,9 +13,12 @@ using LogicCircuits: LogicCircuit
 abstract type ProbCircuit <: LogicCircuit end
 
 #####################
-# node functions that need to be implemented for each type of circuit
+# node functions that need to be implemented for each type of probabilistic circuit
 #####################
 
+"Get the parameters associated with a sum node"
+params(n) = n.log_probs
+
 import LogicCircuits: children, compile # extend
 
 "Multiply nodes into a single circuit"
@@ -70,7 +73,7 @@ sum_nodes(c::ProbCircuit) = ⋁_nodes(c)
 
 function check_parameter_integrity(circuit::ProbCircuit)
     for node in sum_nodes(circuit)
-        @assert all(θ -> !isnan(θ), node.log_thetas) "There is a NaN in one of the log_thetas"
+        @assert all(θ -> !isnan(θ), node.log_probs) "There is a NaN in one of the log_probs"
     end
     true
 end
\ No newline at end of file
diff --git a/src/exp_flows.jl b/src/exp_flows.jl
deleted file mode 100644
index d356bdc3..00000000
--- a/src/exp_flows.jl
+++ /dev/null
@@ -1,219 +0,0 @@
-#TODO: reinstate in new framework
-
-# export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
-
-
-# using StatsFuns: logsumexp
-
-# # TODO move to LogicCircuits
-# # TODO downflow struct
-# using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
-
-# """
-# Get upflow from logic circuit
-# """
-# @inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
-# @inline get_upflow(elems::UpDownFlow1) = elems.upflow
-# @inline get_upflow(elems::UpFlow) = materialize(elems)
-
-# """
-# Get the node/edge flow from logic circuit
-# """
-# function get_downflow(n::LogicCircuit; root=nothing)::BitVector
-#     downflow(x::UpDownFlow1) = x.downflow
-#     downflow(x::UpDownFlow2) = begin
-#         ors = or_nodes(root)
-#         p = findall(p -> n in children(p), ors)
-#         @assert length(p) == 1
-#         get_downflow(ors[p[1]], n)
-#     end
-#     downflow(n.data)
-# end
-
-# function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
-#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-#     get_downflow(n) .& get_upflow(c)
-# end
-
-# #####################
-# # performance-critical queries related to circuit flows
-# #####################
-
-# "Container for circuit flows represented as a float vector"
-# const ExpUpFlow1 = Vector{Float64}
-
-# "Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
-# struct ExpUpFlow2
-#     prime_flow::Vector{Float64}
-#     sub_flow::Vector{Float64}
-# end
-
-# const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
-
-# @inline ExpUpFlow1(elems::ExpUpFlow1) = elems
-# @inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
-
-# function evaluate_exp(root::ProbCircuit, data;
-#                    nload = nload, nsave = nsave, reset=true)::Vector{Float64}
-#     n_ex::Int = num_examples(data)
-#     ϵ = 0.0
-
-#     @inline f_lit(n) = begin
-#         uf = convert(Vector{Int8}, feature_values(data, variable(n)))
-#         if ispositive(n)
-#             uf[uf.==-1] .= 1
-#         else
-#             uf .= 1 .- uf
-#             uf[uf.==2] .= 1
-#         end
-#         uf = convert(Vector{Float64}, uf)
-#         uf .= log.(uf .+ ϵ)
-#     end
-    
-#     @inline f_con(n) = begin
-#         uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
-#         uf .= log.(uf .+ ϵ)
-#     end
-    
-#     @inline fa(n, call) = begin
-#         if num_children(n) == 1
-#             return ExpUpFlow1(call(@inbounds children(n)[1]))
-#         else
-#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
-#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
-#             if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
-#                 return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
-#             end
-#             x = flowop(c1, c2, +)
-#             for c in children(n)[3:end]
-#                 accumulate(x, call(c), +)
-#             end
-#             return x
-#         end
-#     end
-    
-#     @inline fo(n, call) = begin
-#         if num_children(n) == 1
-#             return ExpUpFlow1(call(@inbounds children(n)[1]))
-#         else
-#             log_thetas = n.log_thetas
-#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
-#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
-#             x = flowop(c1, log_thetas[1], c2, log_thetas[2], logsumexp)
-#             for (i, c) in enumerate(children(n)[3:end])
-#                 accumulate(x, call(c), log_thetas[i+2], logsumexp)
-#             end
-#             return x
-#         end
-#     end
-    
-#     # ensure flow us Flow1 at the root, even when it's a conjunction
-#     root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
-#     return nsave(root, root_flow)
-# end
-
-# @inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
-#     op.(ExpUpFlow1(x), ExpUpFlow1(y))
-
-# @inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
-#     op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
-
-# import Base.accumulate
-# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
-#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
-
-# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
-#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
-
-
-# #####################
-# # downward pass
-# #####################
-
-# struct ExpUpDownFlow1
-#     upflow::ExpUpFlow1
-#     downflow::Vector{Float64}
-#     ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
-# end
-
-# const ExpUpDownFlow2 = ExpUpFlow2
-
-# const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
-
-
-# function compute_exp_flows(circuit::ProbCircuit, data)
-
-#     # upward pass
-#     @inline upflow!(n, v) = begin
-#         n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
-#         v
-#     end
-
-#     @inline upflow(n) = begin
-#         d = n.data::ExpUpDownFlow
-#         (d isa ExpUpDownFlow1) ? d.upflow : d
-#     end
-
-#     evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
-    
-#     # downward pass
-
-#     @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
-#     @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
-
-#     downflow(circuit) .= 0.0
-
-#     foreach_down(circuit; setcounter=false) do n
-#         if isinner(n) && !isfactorized(n)
-#             downflow_n = downflow(n)
-#             upflow_n = upflow(n)
-#             for ite in 1 : num_children(n)
-#                 c = children(n)[ite]
-#                 log_theta = is⋀gate(n) ? 0.0 : n.log_thetas[ite]
-#                 if isfactorized(c)
-#                     upflow2_c = c.data::ExpUpDownFlow2
-#                     # propagate one level further down
-#                     for i = 1:2
-#                         downflow_c = downflow(@inbounds children(c)[i])
-#                         accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
-#                         .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
-#                     end
-#                 else
-#                     upflow1_c = (c.data::ExpUpDownFlow1).upflow
-#                     downflow_c = downflow(c)
-#                     accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
-#                 end
-#             end 
-#         end
-#         nothing
-#     end
-#     nothing
-# end
-
-
-# """
-# Get upflow of a probabilistic circuit
-# """
-# @inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
-# @inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
-# @inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
-
-# """
-# Get the node/edge downflow from probabilistic circuit
-# """
-# function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
-#     downflow(x::ExpUpDownFlow1) = x.downflow
-#     downflow(x::ExpUpDownFlow2) = begin
-#         ors = or_nodes(root)
-#         p = findall(p -> n in children(p), ors)
-#         @assert length(p) == 1
-#         get_exp_downflow(ors[p[1]], n)
-#     end
-#     downflow(n.data)
-# end
-
-# function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
-#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-#     log_theta = n.log_thetas[findfirst(x -> x == c, children(n))]
-#     return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
-# end
\ No newline at end of file
diff --git a/src/mixtures/em.jl b/src/mixtures/em.jl
index ddb1d518..fb0aa461 100644
--- a/src/mixtures/em.jl
+++ b/src/mixtures/em.jl
@@ -72,7 +72,7 @@ function log_likelihood_per_instance_per_component(pc::SharedProbCircuit, data)
         if num_children(n) != 1 # other nodes have no effect on likelihood
             for i in 1 : num_children(n)
                 c = children(n)[i]
-                log_theta = reshape(n.log_thetas[i, :], 1, num_mix)
+                log_theta = reshape(n.log_probs[i, :], 1, num_mix)
                 indices = get_downflow(n, c)
                 view(log_likelihoods, indices::BitVector, :) .+=  log_theta # see MixedProductKernelBenchmark.jl
             end
@@ -87,15 +87,15 @@ function estimate_parameters_cached(pc::SharedProbCircuit, example_weights; pseu
     foreach(pc) do pn
         if is⋁gate(pn)
             if num_children(pn) == 1
-                pn.log_thetas .= 0.0
+                pn.log_probs .= 0.0
             else
                 smoothed_flow = Float64.(sum(example_weights[get_downflow(pn), :], dims=1)) .+ pseudocount
                 uniform_pseudocount = pseudocount / num_children(pn)
                 children_flows = vcat(map(c -> sum(example_weights[get_downflow(pn, c), :], dims=1), children(pn))...)
-                @. pn.log_thetas = log((children_flows + uniform_pseudocount) / smoothed_flow)
-                @assert all(sum(exp.(pn.log_thetas), dims=1) .≈ 1.0) "Parameters do not sum to one locally"
+                @. pn.log_probs = log((children_flows + uniform_pseudocount) / smoothed_flow)
+                @assert all(sum(exp.(pn.log_probs), dims=1) .≈ 1.0) "Parameters do not sum to one locally"
                 # normalize away any leftover error
-                pn.log_thetas .-= logsumexp(pn.log_thetas, dims=1)
+                pn.log_probs .-= logsumexp(pn.log_probs, dims=1)
             end
         end
     end
diff --git a/src/mixtures/shared_prob_nodes.jl b/src/mixtures/shared_prob_nodes.jl
index e1af2011..9f0f9821 100644
--- a/src/mixtures/shared_prob_nodes.jl
+++ b/src/mixtures/shared_prob_nodes.jl
@@ -45,7 +45,7 @@ A probabilistic disjunction node (Or node)
 """
 mutable struct SharedPlainSumNode <: SharedPlainProbInnerNode
     children::Vector{<:SharedProbCircuit}
-    log_thetas::Matrix{Float64}
+    log_probs::Matrix{Float64}
     data
     counter::UInt32
     SharedPlainSumNode(children, n_mixture) = begin
@@ -78,4 +78,4 @@ end
 import LogicCircuits: children # make available for extension
 
 @inline children(n::SharedPlainProbInnerNode) = n.children
-@inline num_components(n::SharedProbCircuit) = size(n.log_thetas)[2]
+@inline num_components(n::SharedProbCircuit) = size(n.log_probs)[2]
diff --git a/src/parameters.jl b/src/parameters.jl
index e8e144f5..646763e1 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -9,7 +9,7 @@ Maximum likilihood estimation of parameters given data
 """
 function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
-    bc = BitCircuit(pc, data; reset=false, on_gpu = isgpu(data))
+    bc = BitCircuit(pc, data; reset=false, gpu = isgpu(data))
     on_node, on_edge, get_params = if isgpu(data)
         estimate_parameters_gpu(bc, pseudocount)
     else
@@ -20,14 +20,14 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     foreach_reset(pc) do pn
         if is⋁gate(pn)
             if num_children(pn) == 1
-                pn.log_thetas .= zero(Float64)
+                pn.log_probs .= zero(Float64)
             else
                 id = (pn.data::⋁NodeId).node_id
                 @inbounds els_start = bc.nodes[1,id]
                 @inbounds els_end = bc.nodes[2,id]
-                @inbounds @views pn.log_thetas .= params[els_start:els_end]
-                @assert isapprox(sum(exp.(pn.log_thetas)), 1.0, atol=1e-6) "Parameters do not sum to one locally: $(sum(exp.(pn.log_thetas))); $(pn.log_thetas)"
-                pn.log_thetas .-= logsumexp(pn.log_thetas) # normalize away any leftover error
+                @inbounds @views pn.log_probs .= params[els_start:els_end]
+                @assert isapprox(sum(exp.(pn.log_probs)), 1.0, atol=1e-6) "Parameters do not sum to one locally: $(sum(exp.(pn.log_probs))); $(pn.log_probs)"
+                pn.log_probs .-= logsumexp(pn.log_probs) # normalize away any leftover error
             end
         end
     end
@@ -112,9 +112,9 @@ function uniform_parameters(pc::ProbCircuit)
     foreach(pc) do pn
         if is⋁gate(pn)
             if num_children(pn) == 1
-                pn.log_thetas .= 0.0
+                pn.log_probs .= 0.0
             else
-                pn.log_thetas .= log.(ones(Float64, num_children(pn)) ./ num_children(pn))
+                pn.log_probs .= log.(ones(Float64, num_children(pn)) ./ num_children(pn))
             end
         end
     end
diff --git a/src/plain_prob_nodes.jl b/src/plain_prob_nodes.jl
index 3403ecee..c37cf49e 100644
--- a/src/plain_prob_nodes.jl
+++ b/src/plain_prob_nodes.jl
@@ -36,7 +36,7 @@ end
 "A probabilistic disjunction node (summation node)"
 mutable struct PlainSumNode <: PlainProbInnerNode
     children::Vector{PlainProbCircuit}
-    log_thetas::Vector{Float64}
+    log_probs::Vector{Float64}
     data
     counter::UInt32
     PlainSumNode(c) = begin
diff --git a/src/reasoning/expectation.jl b/src/queries/expectation.jl
similarity index 77%
rename from src/reasoning/expectation.jl
rename to src/queries/expectation.jl
index 9bc70047..6d241d04 100644
--- a/src/reasoning/expectation.jl
+++ b/src/queries/expectation.jl
@@ -1,4 +1,67 @@
-export Expectation, ExpectationUpward, Moment
+export pr_constraint, Expectation, ExpectationUpward, Moment
+
+
+const StrutCircuit = Union{ProbCircuit, StructLogicCircuit}
+const PRCache = Dict{Tuple{ProbCircuit, StrutCircuit}, Float64}
+
+# Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
+# spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
+
+"""
+Calculate the probability of the logic formula given by sdd for the psdd
+"""
+function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
+    cache::PRCache=PRCache())::Float64
+    
+    # Cache hit
+    if (psdd_node, sdd_node) in keys(cache) 
+        return cache[psdd_node, sdd_node]
+    
+    # Boundary cases
+    elseif psdd_node isa StructProbLiteralNode
+        # Both are literals, just check whether they agrees with each other 
+        if isliteralgate(sdd_node)
+            if literal(psdd_node) == literal(sdd_node)
+                return get!(cache, (psdd_node, sdd_node), 1.0)
+            else
+                return get!(cache, (psdd_node, sdd_node), 0.0)
+            end
+        else
+            pr_constraint(psdd_node, children(sdd_node)[1], cache)
+            if length(children(sdd_node)) > 1
+                pr_constraint(psdd_node, children(sdd_node)[2], cache)
+                return get!(cache, (psdd_node, sdd_node), 1.0)
+            else
+                return get!(cache, (psdd_node, sdd_node),
+                    literal(children(sdd_node)[1]) == literal(psdd_node) ? 1.0 : 0.0)
+            end
+        end
+    
+    # The psdd is true
+    elseif children(psdd_node)[1] isa StructProbLiteralNode 
+        theta = exp(psdd_node.log_probs[1])
+        return get!(cache, (psdd_node, sdd_node),
+            theta * pr_constraint(children(psdd_node)[1], sdd_node, cache) +
+            (1.0 - theta) * pr_constraint(children(psdd_node)[2], sdd_node, cache))
+    
+    # Both psdds are not trivial
+    else 
+        prob = 0.0
+        for (prob⋀_node, log_theta) in zip(children(psdd_node), psdd_node.log_probs)
+            p = children(prob⋀_node)[1]
+            s = children(prob⋀_node)[2]
+
+            theta = exp(log_theta)
+            for sdd⋀_node in children(sdd_node)
+                r = children(sdd⋀_node)[1]
+                t = children(sdd⋀_node)[2]
+                prob += theta * pr_constraint(p, r, cache) * pr_constraint(s, t, cache)
+            end
+        end
+        return get!(cache, (psdd_node, sdd_node), prob)
+    end
+end
+
 
 ExpCacheDict = Dict{Pair{ProbCircuit, LogisticCircuit}, Array{Float64, 2}}
 MomentCacheDict = Dict{Tuple{ProbCircuit, LogisticCircuit, Int64}, Array{Float64, 2}}
@@ -98,7 +161,7 @@ end
 function exp_f(n::PlainSumNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
-        pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
+        pthetas = [exp(n.log_probs[i]) for i in 1:num_children(n)]
         @fastmath @simd for i in 1:num_children(n)
             @simd for j in 1:num_children(m)
                 value .+= (pthetas[i] .* exp_f(children(n)[i], children(m)[j], data, cache))
@@ -168,7 +231,7 @@ end
 function exp_fg(n::PlainSumNode, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         value = zeros(classes(m) , num_examples(data) )
-        pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
+        pthetas = [exp(n.log_probs[i]) for i in 1:num_children(n)]
         @fastmath @simd for i in 1:num_children(n)
             for j in 1:num_children(m)
                 value .+= (pthetas[i] .* m.thetas[j,:]) .* exp_f(children(n)[i], children(m)[j], data, cache)
@@ -223,7 +286,7 @@ function moment_fg(n::PlainSumNode, m::Logistic⋁Node, data, moment::Int, cache
 
     get!(cache.fg, (n, m, moment)) do
         value = zeros(classes(m) , num_examples(data) )
-        pthetas = [exp(n.log_thetas[i]) for i in 1:num_children(n)]
+        pthetas = [exp(n.log_probs[i]) for i in 1:num_children(n)]
         @fastmath @simd for i in 1:num_children(n)
             for j in 1:num_children(m)
                 for z in 0:moment
diff --git a/src/reasoning/exp_flow_circuits.jl b/src/queries/expected_flows.jl
similarity index 99%
rename from src/reasoning/exp_flow_circuits.jl
rename to src/queries/expected_flows.jl
index eef7575b..aab0ae9e 100644
--- a/src/reasoning/exp_flow_circuits.jl
+++ b/src/queries/expected_flows.jl
@@ -97,7 +97,7 @@ function exp_pass_up_node(node::ExpFlowNode{E}, data) where E
 
     if node.p_origin isa PlainSumNode && node.f_origin isa Logistic⋁Node
         #todo this ordering might be different than the ExpFlowNode children
-        pthetas = [exp(node.p_origin.log_thetas[i])
+        pthetas = [exp(node.p_origin.log_probs[i])
                     for i in 1:length(children(node.p_origin)) for j in 1:length(children(node.f_origin))]
         fthetas = [node.f_origin.thetas[j,:] # only taking the first class for now
             for i in 1:length(node.p_origin.children) for j in 1:length(node.f_origin.children)]
diff --git a/src/queries/expected_flows2.jl b/src/queries/expected_flows2.jl
new file mode 100644
index 00000000..9c2d3bdd
--- /dev/null
+++ b/src/queries/expected_flows2.jl
@@ -0,0 +1,217 @@
+export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
+
+
+using StatsFuns: logsumexp
+
+# TODO move to LogicCircuits
+# TODO downflow struct
+using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
+
+"""
+Get upflow from logic circuit
+"""
+@inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
+@inline get_upflow(elems::UpDownFlow1) = elems.upflow
+@inline get_upflow(elems::UpFlow) = materialize(elems)
+
+"""
+Get the node/edge flow from logic circuit
+"""
+function get_downflow(n::LogicCircuit; root=nothing)::BitVector
+    downflow(x::UpDownFlow1) = x.downflow
+    downflow(x::UpDownFlow2) = begin
+        ors = or_nodes(root)
+        p = findall(p -> n in children(p), ors)
+        @assert length(p) == 1
+        get_downflow(ors[p[1]], n)
+    end
+    downflow(n.data)
+end
+
+function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
+    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+    get_downflow(n) .& get_upflow(c)
+end
+
+#####################
+# performance-critical queries related to circuit flows
+#####################
+
+"Container for circuit flows represented as a float vector"
+const ExpUpFlow1 = Vector{Float64}
+
+"Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
+struct ExpUpFlow2
+    prime_flow::Vector{Float64}
+    sub_flow::Vector{Float64}
+end
+
+const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
+
+@inline ExpUpFlow1(elems::ExpUpFlow1) = elems
+@inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
+
+function evaluate_exp(root::ProbCircuit, data;
+                   nload = nload, nsave = nsave, reset=true)::Vector{Float64}
+    n_ex::Int = num_examples(data)
+    ϵ = 0.0
+
+    @inline f_lit(n) = begin
+        uf = convert(Vector{Int8}, feature_values(data, variable(n)))
+        if ispositive(n)
+            uf[uf.==-1] .= 1
+        else
+            uf .= 1 .- uf
+            uf[uf.==2] .= 1
+        end
+        uf = convert(Vector{Float64}, uf)
+        uf .= log.(uf .+ ϵ)
+    end
+    
+    @inline f_con(n) = begin
+        uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
+        uf .= log.(uf .+ ϵ)
+    end
+    
+    @inline fa(n, call) = begin
+        if num_children(n) == 1
+            return ExpUpFlow1(call(@inbounds children(n)[1]))
+        else
+            c1 = call(@inbounds children(n)[1])::ExpUpFlow
+            c2 = call(@inbounds children(n)[2])::ExpUpFlow
+            if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
+                return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
+            end
+            x = flowop(c1, c2, +)
+            for c in children(n)[3:end]
+                accumulate(x, call(c), +)
+            end
+            return x
+        end
+    end
+    
+    @inline fo(n, call) = begin
+        if num_children(n) == 1
+            return ExpUpFlow1(call(@inbounds children(n)[1]))
+        else
+            log_probs = n.log_probs
+            c1 = call(@inbounds children(n)[1])::ExpUpFlow
+            c2 = call(@inbounds children(n)[2])::ExpUpFlow
+            x = flowop(c1, log_probs[1], c2, log_probs[2], logsumexp)
+            for (i, c) in enumerate(children(n)[3:end])
+                accumulate(x, call(c), log_probs[i+2], logsumexp)
+            end
+            return x
+        end
+    end
+    
+    # ensure flow us Flow1 at the root, even when it's a conjunction
+    root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
+    return nsave(root, root_flow)
+end
+
+@inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
+    op.(ExpUpFlow1(x), ExpUpFlow1(y))
+
+@inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
+    op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
+
+import Base.accumulate
+@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
+    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
+
+@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
+    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
+
+
+#####################
+# downward pass
+#####################
+
+struct ExpUpDownFlow1
+    upflow::ExpUpFlow1
+    downflow::Vector{Float64}
+    ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
+end
+
+const ExpUpDownFlow2 = ExpUpFlow2
+
+const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
+
+
+function compute_exp_flows(circuit::ProbCircuit, data)
+
+    # upward pass
+    @inline upflow!(n, v) = begin
+        n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
+        v
+    end
+
+    @inline upflow(n) = begin
+        d = n.data::ExpUpDownFlow
+        (d isa ExpUpDownFlow1) ? d.upflow : d
+    end
+
+    evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
+    
+    # downward pass
+
+    @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
+    @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
+
+    downflow(circuit) .= 0.0
+
+    foreach_down(circuit; setcounter=false) do n
+        if isinner(n) && !isfactorized(n)
+            downflow_n = downflow(n)
+            upflow_n = upflow(n)
+            for ite in 1 : num_children(n)
+                c = children(n)[ite]
+                log_theta = is⋀gate(n) ? 0.0 : n.log_probs[ite]
+                if isfactorized(c)
+                    upflow2_c = c.data::ExpUpDownFlow2
+                    # propagate one level further down
+                    for i = 1:2
+                        downflow_c = downflow(@inbounds children(c)[i])
+                        accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
+                        .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
+                    end
+                else
+                    upflow1_c = (c.data::ExpUpDownFlow1).upflow
+                    downflow_c = downflow(c)
+                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
+                end
+            end 
+        end
+        nothing
+    end
+    nothing
+end
+
+
+"""
+Get upflow of a probabilistic circuit
+"""
+@inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
+@inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
+@inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
+
+"""
+Get the node/edge downflow from probabilistic circuit
+"""
+function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
+    downflow(x::ExpUpDownFlow1) = x.downflow
+    downflow(x::ExpUpDownFlow2) = begin
+        ors = or_nodes(root)
+        p = findall(p -> n in children(p), ors)
+        @assert length(p) == 1
+        get_exp_downflow(ors[p[1]], n)
+    end
+    downflow(n.data)
+end
+
+function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
+    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+    log_theta = n.log_probs[findfirst(x -> x == c, children(n))]
+    return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
+end
\ No newline at end of file
diff --git a/src/reasoning/informations.jl b/src/queries/information.jl
similarity index 66%
rename from src/reasoning/informations.jl
rename to src/queries/information.jl
index 67d0f3af..e87d2f59 100644
--- a/src/reasoning/informations.jl
+++ b/src/queries/information.jl
@@ -1,67 +1,6 @@
-export pr_constraint, kl_divergence
+export kl_divergence
 
-const StrutCircuit = Union{ProbCircuit, StructLogicCircuit}
 const KLDCache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}
-const PRCache = Dict{Tuple{ProbCircuit, StrutCircuit}, Float64}
-
-# Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
-# spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
-
-"""
-Calculate the probability of the logic formula given by sdd for the psdd
-"""
-function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
-    cache::PRCache=PRCache())::Float64
-    
-    # Cache hit
-    if (psdd_node, sdd_node) in keys(cache) 
-        return cache[psdd_node, sdd_node]
-    
-    # Boundary cases
-    elseif psdd_node isa StructProbLiteralNode
-        # Both are literals, just check whether they agrees with each other 
-        if isliteralgate(sdd_node)
-            if literal(psdd_node) == literal(sdd_node)
-                return get!(cache, (psdd_node, sdd_node), 1.0)
-            else
-                return get!(cache, (psdd_node, sdd_node), 0.0)
-            end
-        else
-            pr_constraint(psdd_node, children(sdd_node)[1], cache)
-            if length(children(sdd_node)) > 1
-                pr_constraint(psdd_node, children(sdd_node)[2], cache)
-                return get!(cache, (psdd_node, sdd_node), 1.0)
-            else
-                return get!(cache, (psdd_node, sdd_node),
-                    literal(children(sdd_node)[1]) == literal(psdd_node) ? 1.0 : 0.0)
-            end
-        end
-    
-    # The psdd is true
-    elseif children(psdd_node)[1] isa StructProbLiteralNode 
-        theta = exp(psdd_node.log_thetas[1])
-        return get!(cache, (psdd_node, sdd_node),
-            theta * pr_constraint(children(psdd_node)[1], sdd_node, cache) +
-            (1.0 - theta) * pr_constraint(children(psdd_node)[2], sdd_node, cache))
-    
-    # Both psdds are not trivial
-    else 
-        prob = 0.0
-        for (prob⋀_node, log_theta) in zip(children(psdd_node), psdd_node.log_thetas)
-            p = children(prob⋀_node)[1]
-            s = children(prob⋀_node)[2]
-
-            theta = exp(log_theta)
-            for sdd⋀_node in children(sdd_node)
-                r = children(sdd⋀_node)[1]
-                t = children(sdd⋀_node)[2]
-                prob += theta * pr_constraint(p, r, cache) * pr_constraint(s, t, cache)
-            end
-        end
-        return get!(cache, (psdd_node, sdd_node), prob)
-    end
-end
-
 
 """"
 Calculate entropy of the distribution of the input psdd."
@@ -73,11 +12,11 @@ function entropy(psdd_node::StructSumNode, psdd_entropy_cache::Dict{ProbCircuit,
         return psdd_entropy_cache[psdd_node]
     elseif children(psdd_node)[1] isa StructProbLiteralNode
         return get!(psdd_entropy_cache, psdd_node,
-            - exp(psdd_node.log_thetas[1]) * psdd_node.log_thetas[1] -
-            exp(psdd_node.log_thetas[2]) * psdd_node.log_thetas[2])
+            - exp(psdd_node.log_probs[1]) * psdd_node.log_probs[1] -
+            exp(psdd_node.log_probs[2]) * psdd_node.log_probs[2])
     else
         local_entropy = 0.0
-        for (prob⋀_node, log_prob) in zip(children(psdd_node), psdd_node.log_thetas)
+        for (prob⋀_node, log_prob) in zip(children(psdd_node), psdd_node.log_probs)
             p = children(prob⋀_node)[1]
             s = children(prob⋀_node)[2]
 
@@ -113,11 +52,11 @@ function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructSumNode,
             kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
             if literal(children(psdd_node1)[1]) == literal(psdd_node2)
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
+                    psdd_node1.log_probs[1] * exp(psdd_node1.log_probs[1])
                 )
             else
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    psdd_node1.log_thetas[2] * exp(psdd_node1.log_thetas[2])
+                    psdd_node1.log_probs[2] * exp(psdd_node1.log_probs[2])
                 )
             end
         else
@@ -130,13 +69,13 @@ function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructSumNode,
             # There are two possible matches
             if literal(children(psdd_node1)[1]) == literal(children(psdd_node2)[1])
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    exp(psdd_node1.log_thetas[1]) * (psdd_node1.log_thetas[1] - psdd_node2.log_thetas[1]) +
-                    exp(psdd_node1.log_thetas[2]) * (psdd_node1.log_thetas[2] - psdd_node2.log_thetas[2])
+                    exp(psdd_node1.log_probs[1]) * (psdd_node1.log_probs[1] - psdd_node2.log_probs[1]) +
+                    exp(psdd_node1.log_probs[2]) * (psdd_node1.log_probs[2] - psdd_node2.log_probs[2])
                 )
             else
                 return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    exp(psdd_node1.log_thetas[1]) * (psdd_node1.log_thetas[1] - psdd_node2.log_thetas[2]) +
-                    exp(psdd_node1.log_thetas[2]) * (psdd_node1.log_thetas[2] - psdd_node2.log_thetas[1])
+                    exp(psdd_node1.log_probs[1]) * (psdd_node1.log_probs[1] - psdd_node2.log_probs[2]) +
+                    exp(psdd_node1.log_probs[2]) * (psdd_node1.log_probs[2] - psdd_node2.log_probs[1])
                 )
             end
         end
@@ -144,8 +83,8 @@ function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructSumNode,
         kld = 0.0
 
         # loop through every combination of prim and sub
-        for (prob⋀_node1, log_theta1) in zip(children(psdd_node1), psdd_node1.log_thetas)
-            for (prob⋀_node2, log_theta2) in zip(children(psdd_node2), psdd_node2.log_thetas)
+        for (prob⋀_node1, log_theta1) in zip(children(psdd_node1), psdd_node1.log_probs)
+            for (prob⋀_node2, log_theta2) in zip(children(psdd_node2), psdd_node2.log_probs)
                 p = children(prob⋀_node1)[1]
                 s = children(prob⋀_node1)[2]
 
@@ -193,11 +132,11 @@ function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructProbLiteralN
         kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
         if literal(children(psdd_node1)[1]) == literal(psdd_node2)
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                psdd_node1.log_thetas[1] * exp(psdd_node1.log_thetas[1])
+                psdd_node1.log_probs[1] * exp(psdd_node1.log_probs[1])
             )
         else
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                psdd_node1.log_thetas[2] * exp(psdd_node1.log_thetas[2])
+                psdd_node1.log_probs[2] * exp(psdd_node1.log_probs[2])
             )
         end
     end
@@ -214,11 +153,11 @@ function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructSumN
         kl_divergence(psdd_node1, children(psdd_node2)[2], kl_divergence_cache, pr_constraint_cache)
         if literal(psdd_node1) == literal(children(psdd_node2)[1])
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                -psdd_node2.log_thetas[1]
+                -psdd_node2.log_probs[1]
             )
         else
             return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                -psdd_node2.log_thetas[2]
+                -psdd_node2.log_probs[2]
             )
         end
     end
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
new file mode 100644
index 00000000..f6466e95
--- /dev/null
+++ b/src/queries/likelihood.jl
@@ -0,0 +1,123 @@
+export EVI, log_likelihood_per_instance, log_likelihood, log_likelihood_avg
+
+"""
+Complete evidence queries
+"""
+# function log_likelihood_per_instance(pc::ProbCircuit, data)
+#     @assert isbinarydata(data) "Can only calculate EVI on Bool data"
+    
+#     compute_flows(pc, data)
+#     log_likelihoods = zeros(Float64, num_examples(data))
+#     indices = init_array(Bool, num_examples(data))::BitVector
+    
+#     ll(n::ProbCircuit) = ()
+#     ll(n::Union{PlainSumNode, StructSumNode}) = begin
+#         if num_children(n) != 1 # other nodes have no effect on likelihood
+#             foreach(children(n), n.log_probs) do c, log_theta
+#                 indices = get_downflow(n, c)
+#                 view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
+#             end
+#          end
+#     end
+
+#     foreach(ll, pc)
+#     log_likelihoods
+# end
+
+function bitcircuit_with_params(pc, data)
+    params::Vector{Float64} = Vector{Float64}()
+    on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
+        if isnothing(n) # this decision node is not part of the PC
+            # @assert first_element == last_element
+            push!(params, 0.0)
+        else
+            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
+            append!(params, n.log_probs)
+        end
+    end
+    bc = BitCircuit(pc, data; gpu = isgpu(data), on_decision)
+    params = isgpu(data) ? to_gpu(params) : params
+    (bc, params)
+end
+
+function log_likelihood_per_instance(pc::ProbCircuit, data)
+    @assert isbinarydata(data) "Probabilistic circuit likelihoods are for binary data only"
+    bc, params = bitcircuit_with_params(pc, data)
+    if isgpu(data)
+        log_likelihood_per_instance_gpu(bc, data, params)
+    else
+        log_likelihood_per_instance_cpu(bc, data, params)
+    end
+end
+
+function log_likelihood_per_instance_cpu(bc, data, params)
+    n_ex::Int = num_examples(data)
+    ll::Vector{Float64} = zeros(Float64, n_ex)
+    ll_lock::Threads.ReentrantLock = Threads.ReentrantLock()
+    
+    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
+        if els_start != els_end
+            lock(ll_lock) do # TODO: move lock to inner loop?
+                for i = 1:size(flows,1)
+                    @inbounds edge_flow = values[i, p] & values[i, s] & flows[i, dec_id]
+                    first_true_bit = trailing_zeros(edge_flow)+1
+                    last_true_bit = 64-leading_zeros(edge_flow)
+                    @simd for j= first_true_bit:last_true_bit
+                        ex_id = ((i-1) << 6) + j
+                        if get_bit(edge_flow, j)
+                            @inbounds ll[ex_id] += params[el_id]
+                        end
+                    end
+                end
+            end
+        end
+        nothing
+    end
+
+    compute_values_flows(bc, data; on_edge)
+    return ll
+end
+
+function log_likelihood_per_instance_gpu(bc, pseudocount)
+    # node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
+    # edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
+    # params::CuVector{Float64} = CuVector{Float64}(undef, num_elements(bc))
+    # # need to manually cudaconvert closure variables
+    # node_counts_device = CUDA.cudaconvert(node_counts)
+    # edge_counts_device = CUDA.cudaconvert(edge_counts)
+    # params_device = CUDA.cudaconvert(params)
+    
+    # @inline function on_node(flows, values, dec_id, els_start, els_end, ex_id)
+    #     if els_start != els_end
+    #         @inbounds c::Int32 = count_ones(flows[ex_id, dec_id]) # cast for @atomic to be happy
+    #         CUDA.@atomic node_counts_device[dec_id] += c
+    #     end
+    #     if isone(ex_id) # only do this once
+    #         for i=els_start:els_end
+    #             params_device[i] = pseudocount/(els_end-els_start+1)
+    #         end
+    #     end
+    #     nothing
+    # end
+    
+    # @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
+    #     if els_start != els_end
+    #         c::Int32 = count_ones(edge_flow) # cast for @atomic to be happy
+    #         CUDA.@atomic edge_counts_device[el_id] += c
+    #     end
+    #     nothing
+    # end
+
+    # function get_params()
+    #     parent_counts = @views node_counts[bc.elements[1,:]]
+    #     params .= log.(params .+ edge_counts) .- log.(parent_counts .+ pseudocount)
+    #     to_cpu(params)
+    # end
+
+    # return (on_node, on_edge, get_params)
+end
+
+EVI = log_likelihood_per_instance
+
+log_likelihood(pc, data) = sum(log_likelihood_per_instance(pc, data))
+log_likelihood_avg(pc, data) = log_likelihood(pc, data)/num_examples(data)
\ No newline at end of file
diff --git a/src/queries.jl b/src/queries/queries.jl
similarity index 78%
rename from src/queries.jl
rename to src/queries/queries.jl
index 190c536a..e181dc53 100644
--- a/src/queries.jl
+++ b/src/queries/queries.jl
@@ -1,33 +1,6 @@
-export EVI, log_likelihood_per_instance, MAR, marginal_log_likelihood_per_instance, 
+export MAR, marginal_log_likelihood_per_instance, 
 MPE, MAP, sample
 
-"""
-Complete evidence queries
-"""
-function log_likelihood_per_instance(pc::ProbCircuit, data)
-    @assert isbinarydata(data) "Can only calculate EVI on Bool data"
-    
-    compute_flows(pc, data)
-    log_likelihoods = zeros(Float64, num_examples(data))
-    indices = init_array(Bool, num_examples(data))::BitVector
-    
-    ll(n::ProbCircuit) = ()
-    ll(n::Union{PlainSumNode, StructSumNode}) = begin
-        if num_children(n) != 1 # other nodes have no effect on likelihood
-            foreach(children(n), n.log_thetas) do c, log_theta
-                indices = get_downflow(n, c)
-                view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
-            end
-         end
-    end
-
-    foreach(ll, pc)
-    log_likelihoods
-end
-
-EVI = log_likelihood_per_instance
-
-
 """
 Marginal queries
 """
@@ -61,7 +34,7 @@ function MPE(pc::ProbCircuit, evidence)::BitMatrix
     function mpe_simulate(node::Union{PlainSumNode, StructSumNode}, active_samples::BitVector, result::BitMatrix)
         prs = zeros(length(children(node)), size(active_samples)[1] )
         @simd  for i=1:length(children(node))
-            prs[i,:] .= get_exp_upflow(children(node)[i]) .+ (node.log_thetas[i])
+            prs[i,:] .= get_exp_upflow(children(node)[i]) .+ (node.log_probs[i])
         end
     
         max_child_ids = [a[1] for a in argmax(prs, dims = 1) ]
@@ -97,7 +70,7 @@ function sample(circuit::ProbCircuit)::AbstractVector{Bool}
     end
     
     simulate(node::Union{PlainSumNode, StructSumNode}) = begin
-        idx = sample(exp.(node.log_thetas))
+        idx = sample(exp.(node.log_probs))
         simulate(children(node)[idx])
     end
 
@@ -127,7 +100,7 @@ function sample(circuit::ProbCircuit, evidence)::AbstractVector{Bool}
     
     function simulate(node::Union{PlainSumNode, StructSumNode})
         prs = [get_exp_upflow(ch)[1] for ch in children(node)] # #evidence == 1
-        idx = sample(exp.(node.log_thetas .+ prs))
+        idx = sample(exp.(node.log_probs .+ prs))
         simulate(children(node)[idx])
     end
     
diff --git a/src/structured_prob_nodes.jl b/src/structured_prob_nodes.jl
index f1817ee5..f88a1311 100644
--- a/src/structured_prob_nodes.jl
+++ b/src/structured_prob_nodes.jl
@@ -45,7 +45,7 @@ end
 "A plain structured probabilistic disjunction node"
 mutable struct StructSumNode <: StructProbInnerNode
     children::Vector{StructProbCircuit}
-    log_thetas::Vector{Float64}
+    log_probs::Vector{Float64}
     vtree::Vtree # could be leaf or inner
     data
     counter::UInt32
diff --git a/test/broken/LoadSave/circuit_loaders_tests.jl b/test/broken/LoadSave/circuit_loaders_tests.jl
index 8110ef46..1829c16b 100644
--- a/test/broken/LoadSave/circuit_loaders_tests.jl
+++ b/test/broken/LoadSave/circuit_loaders_tests.jl
@@ -14,18 +14,18 @@ using ProbabilisticCircuits
    # Testing Read Parameters
    EPS = 1e-7
    or1 = children(children(prob_circuit)[1])[2]
-   @test abs(or1.log_thetas[1] - (-1.6094379124341003)) < EPS
-   @test abs(or1.log_thetas[2] - (-1.2039728043259361)) < EPS
-   @test abs(or1.log_thetas[3] - (-0.916290731874155)) < EPS
-   @test abs(or1.log_thetas[4] - (-2.3025850929940455)) < EPS
+   @test abs(or1.log_probs[1] - (-1.6094379124341003)) < EPS
+   @test abs(or1.log_probs[2] - (-1.2039728043259361)) < EPS
+   @test abs(or1.log_probs[3] - (-0.916290731874155)) < EPS
+   @test abs(or1.log_probs[4] - (-2.3025850929940455)) < EPS
 
    or2 = children(children(prob_circuit)[1])[1]
-   @test abs(or2.log_thetas[1] - (-2.3025850929940455)) < EPS
-   @test abs(or2.log_thetas[2] - (-2.3025850929940455)) < EPS
-   @test abs(or2.log_thetas[3] - (-2.3025850929940455)) < EPS
-   @test abs(or2.log_thetas[4] - (-0.35667494393873245)) < EPS
+   @test abs(or2.log_probs[1] - (-2.3025850929940455)) < EPS
+   @test abs(or2.log_probs[2] - (-2.3025850929940455)) < EPS
+   @test abs(or2.log_probs[3] - (-2.3025850929940455)) < EPS
+   @test abs(or2.log_probs[4] - (-0.35667494393873245)) < EPS
 
-   @test abs(prob_circuit.log_thetas[1] - (0.0)) < EPS
+   @test abs(prob_circuit.log_probs[1] - (0.0)) < EPS
 end
 
 psdd_files = ["little_4var.psdd", "msnbc-yitao-a.psdd", "msnbc-yitao-b.psdd", "msnbc-yitao-c.psdd", "msnbc-yitao-d.psdd", "msnbc-yitao-e.psdd", "mnist-antonio.psdd"]
diff --git a/test/broken/StructureLearner/init_tests.jl b/test/broken/StructureLearner/init_tests.jl
index b8063df3..eb38727a 100644
--- a/test/broken/StructureLearner/init_tests.jl
+++ b/test/broken/StructureLearner/init_tests.jl
@@ -20,7 +20,7 @@
 #     @test num_parameters(pc) == 74 
 
 #     # test below has started to fail -- unclear whether that is a bug or randomness...?
-#     # @test pc[28].log_thetas[1] ≈ -1.1870882896239272 atol=1.0e-7
+#     # @test pc[28].log_probs[1] ≈ -1.1870882896239272 atol=1.0e-7
 
 #     # is structured decomposable 
 #     for (n, vars) in variables_by_node(pc)

From f9fc54f9dfee340817e385ce23bbe07587b0feca Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Wed, 2 Sep 2020 00:38:59 -0500
Subject: [PATCH 075/131] chore: formats

---
 src/Logistic/logistic_nodes.jl    | 16 ++++++---------
 src/Logistic/parameter_circuit.jl | 33 +++++++++++++++++++------------
 src/Probabilistic/prob_nodes.jl   |  6 ++++--
 3 files changed, 30 insertions(+), 25 deletions(-)

diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index 632867d8..f480879f 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -1,12 +1,8 @@
 export 
     LogisticCircuit, 
-    LogisticLeafNode, 
-    LogisticInnerNode, 
-    LogisticLiteral,
-    Logistic⋀Node,
-    Logistic⋁Node,
-    classes,
-    num_parameters_perclass
+    LogisticLeafNode, LogisticInnerNode, 
+    LogisticLiteral, Logistic⋀Node, Logistic⋁Node,
+    num_classes, num_parameters_per_class
     
 #####################
 # Infrastructure for logistic circuit nodes
@@ -54,7 +50,7 @@ A logistic disjunction node (Or node)
 """
 mutable struct Logistic⋁Node <: LogisticInnerNode
     children::Vector{<:LogisticCircuit}
-    thetas::Array{Float32, 2}
+    thetas::Matrix{Float32}
     data
     counter::UInt32
     Logistic⋁Node(children, class::Int) = begin
@@ -77,11 +73,11 @@ import LogicCircuits.GateType # make available for extension
 
 import LogicCircuits: children # make available for extension
 @inline children(n::LogisticInnerNode) = n.children
-@inline classes(n::Logistic⋁Node) = size(n.thetas)[2]
+@inline num_classes(n::Logistic⋁Node) = size(n.thetas)[2]
 
 import ..Utils: num_parameters
 @inline num_parameters(c::LogisticCircuit) = sum(n -> num_children(n) * classes(n), ⋁_nodes(c))
-@inline num_parameters_perclass(c::LogisticCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
+@inline num_parameters_per_class(c::LogisticCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
 
 #####################
 # constructors and conversions
diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index 91da4bb7..dc338e77 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -90,6 +90,8 @@ struct CuLayeredParameterCircuit
     CuLayeredParameterCircuit(l::LayeredParameterCircuit) = new(CuLayeredBitCircuit(l.layered_circuit), map(CuMatrix, l.layered_parameters))
 end
 
+
+
 function class_likelihood(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cp=nothing)
     cw, flow, v = class_weights(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
     one = Float32(1.0)
@@ -141,8 +143,8 @@ function calculate_class_weights_layer_kernel_cuda(cw, v, flow, decisions, eleme
                 last_elem = @inbounds decisions[3, i]
                 n_down = @inbounds flow[j, decision_id]
                 for e = first_elem:last_elem
-                    e1 = @inbounds elements[1,first_elem]
-                    e2 = @inbounds elements[2,first_elem]
+                    e1 = @inbounds elements[1, first_elem]
+                    e2 = @inbounds elements[2, first_elem]
                     e_up = @inbounds (v[j, e1] * v[j, e2])
                     edge_flow = e_up / n_up * n_down
                     # following needs to be memory safe
@@ -157,6 +159,8 @@ function calculate_class_weights_layer_kernel_cuda(cw, v, flow, decisions, eleme
     return nothing
 end
 
+
+
 function one_hot(labels::Vector, nc::Integer)    
     ne = length(labels) 
     one_hot_labels = zeros(Float32, ne, nc)
@@ -167,26 +171,26 @@ function one_hot(labels::Vector, nc::Integer)
 end
 
 function learn_parameters(circuit::CuLayeredParameterCircuit, nc::Integer, data::CuMatrix{Float32}, labels::CuMatrix{Float32}, reuse_up=nothing, reuse_down=nothing, reuse_cp=nothing, num_epochs=20, step_size=0.0001)
-    cp, node_flow, edge_flow, v = class_likelihood(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
-    update_parameters(circuit, labels, cp, edge_flow, step_size)
+    cp, flow, v = class_likelihood(circuit, nc, data, reuse_up, reuse_down, reuse_cp)
+    update_parameters(circuit, labels, cp, flow, step_size)
     for _ = 2:num_epochs
-        cp, node_flow, edge_flow, v = class_likelihood(circuit, nc, data, v, (node_flow, edge_flow), cp)
-        update_parameters(circuit, labels, cp, edge_flow, step_size)
+        cp, flow, v = class_likelihood(circuit, nc, data, v, flow, cp)
+        update_parameters(circuit, labels, cp, v, flow, step_size)
     end
     return nothing
 end
 
-function update_parameters(circuit::CuLayeredParameterCircuit, labels, cp, flow, step_size=0.0001)
+function update_parameters(circuit::CuLayeredParameterCircuit, labels, cp, v, flow, step_size=0.0001)
     _, nc = size(labels)
     step_size = Float32(step_size)
-    class_per_thread = 1
     CUDA.@sync for i = 1:length(circuit.layered_circuit.layers)
         circuit_layer = circuit.layered_circuit.layers[i]
         flow_layer = flow[i]
         parameter_layer = circuit.layered_parameters[i]
         ndl = num_decisions(circuit_layer)
-        num_threads = balance_threads(ndl, nc / class_per_thread, 8)
-        num_blocks = ceil(Int, ndl / num_threads[1]), ceil(Int, ndl / num_threads[2] / class_per_thread)
+        num_threads = balance_threads(ndl, nc, 6)
+        num_threads = num_threads[1], num_threads[2], 
+        num_blocks = ceil(Int, ndl / num_threads[1]), ceil(Int, nc / num_threads[2]), 4
         @cuda threads=num_threads blocks=num_blocks update_parameters_layer_kernel_cuda(labels, cp, flow_layer, circuit_layer.decisions, parameter_layer, step_size)
     end
     return nothing
@@ -195,8 +199,10 @@ end
 function update_parameters_layer_kernel_cuda(labels, cp, flow, decisions, parameters, step_size)
     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
     index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+    index_z = (blockIdx().z - 1) * blockDim().z + threadIdx().z
     stride_x = blockDim().x * gridDim().x
     stride_y = blockDim().y * gridDim().y
+    stride_z = blockDim().z * gridDim().z
     ne, nc = size(labels)
     _, num_decisions = size(decisions)
     
@@ -205,9 +211,10 @@ function update_parameters_layer_kernel_cuda(labels, cp, flow, decisions, parame
             first_elem = @inbounds decisions[2, i]
             last_elem = @inbounds decisions[3, i]
             for e = first_elem:last_elem
-                for j = 1:ne
-                    u = @inbounds flow[j, e] * (cp[j, class] - labels[j, class]) * step_size
-                    # following are memory safe
+                for j = index_z:stride_z:ne
+                    edge_flow = e_up / n_up * n_down
+                    u = @inbounds edge_flow * (cp[j, class] - labels[j, class]) * step_size
+                    # following needs to be memory safe
                     @inbounds parameters[class, e] -= u 
                 end
             end
diff --git a/src/Probabilistic/prob_nodes.jl b/src/Probabilistic/prob_nodes.jl
index f002baea..4cb10f16 100644
--- a/src/Probabilistic/prob_nodes.jl
+++ b/src/Probabilistic/prob_nodes.jl
@@ -1,5 +1,7 @@
-export PlainProbCircuit, ProbLeafNode, ProbInnerNode, ProbLiteralNode, Prob⋀Node, 
-Prob⋁Node
+export 
+    PlainProbCircuit,
+    ProbLeafNode, ProbInnerNode, 
+    ProbLiteralNode, Prob⋀Node, Prob⋁Node
 
 #####################
 # Infrastructure for probabilistic circuit nodes

From 61bb161a49b3d5d7a53b0f72fe038f627ba815ef Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 2 Sep 2020 01:15:04 -0500
Subject: [PATCH 076/131] fixes to BitCircuits on GPU

---
 src/abstract_prob_nodes.jl |   2 +-
 src/parameters.jl          |  35 +++++++------
 src/queries/likelihood.jl  | 100 +++++++++++++------------------------
 3 files changed, 54 insertions(+), 83 deletions(-)

diff --git a/src/abstract_prob_nodes.jl b/src/abstract_prob_nodes.jl
index 46e37c66..0f091a6a 100644
--- a/src/abstract_prob_nodes.jl
+++ b/src/abstract_prob_nodes.jl
@@ -3,7 +3,7 @@ export ProbCircuit,
     num_parameters,
     mul_nodes, sum_nodes
 
-using LogicCircuits: LogicCircuit
+using LogicCircuits
 
 #####################
 # Abstract probabilistic circuit nodes
diff --git a/src/parameters.jl b/src/parameters.jl
index 646763e1..257b2961 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -9,14 +9,12 @@ Maximum likilihood estimation of parameters given data
 """
 function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
-    bc = BitCircuit(pc, data; reset=false, gpu = isgpu(data))
-    on_node, on_edge, get_params = if isgpu(data)
-        estimate_parameters_gpu(bc, pseudocount)
+    bc = BitCircuit(pc, data; reset=false)
+    params::Vector{Float64} = if isgpu(data)
+        estimate_parameters_gpu(to_gpu(bc), data, pseudocount)
     else
-        estimate_parameters_cpu(bc, pseudocount)
+        estimate_parameters_cpu(bc, data, pseudocount)
     end
-    compute_values_flows(bc, data; on_node, on_edge)
-    params::Vector{Float64} = get_params()
     foreach_reset(pc) do pn
         if is⋁gate(pn)
             if num_children(pn) == 1
@@ -34,7 +32,7 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     params
 end
 
-function estimate_parameters_cpu(bc, pseudocount)
+function estimate_parameters_cpu(bc, data, pseudocount)
     # no need to synchronize, since each computation is unique to a decision node
     node_counts::Vector{UInt} = Vector{UInt}(undef, num_nodes(bc))
     log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
@@ -61,12 +59,11 @@ function estimate_parameters_cpu(bc, pseudocount)
         nothing
     end
 
-    get_params() = log_params
-
-    return (on_node, on_edge, get_params)
+    compute_values_flows(bc, data; on_node, on_edge)
+    return log_params
 end
 
-function estimate_parameters_gpu(bc, pseudocount)
+function estimate_parameters_gpu(bc, data, pseudocount)
     node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
     edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
     params::CuVector{Float64} = CuVector{Float64}(undef, num_elements(bc))
@@ -82,7 +79,7 @@ function estimate_parameters_gpu(bc, pseudocount)
         end
         if isone(ex_id) # only do this once
             for i=els_start:els_end
-                params_device[i] = pseudocount/(els_end-els_start+1)
+                @inbounds params_device[i] = pseudocount/(els_end-els_start+1)
             end
         end
         nothing
@@ -96,13 +93,15 @@ function estimate_parameters_gpu(bc, pseudocount)
         nothing
     end
 
-    function get_params()
-        parent_counts = @views node_counts[bc.elements[1,:]]
-        params .= log.(params .+ edge_counts) .- log.(parent_counts .+ pseudocount)
-        to_cpu(params)
-    end
+    v, f = compute_values_flows(bc, data; on_node, on_edge)
+    # TODO: manually garbage collect v,f
 
-    return (on_node, on_edge, get_params)
+    # TODO: reinstate following implementation once https://github.com/JuliaGPU/GPUArrays.jl/issues/313 is fixed and released
+    # parent_counts = @views node_counts[bc.elements[1,:]]
+    @inbounds parents = bc.elements[1,:]
+    @inbounds parent_counts = node_counts[parents]
+    params .= log.(params .+ edge_counts) .- log.(parent_counts .+ pseudocount)
+    return to_cpu(params)
 end
 
 """
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index f6466e95..5f7a2f3e 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -1,29 +1,8 @@
 export EVI, log_likelihood_per_instance, log_likelihood, log_likelihood_avg
 
 """
-Complete evidence queries
+Construct a `BitCircuit` while storing edge parameters in a separate array
 """
-# function log_likelihood_per_instance(pc::ProbCircuit, data)
-#     @assert isbinarydata(data) "Can only calculate EVI on Bool data"
-    
-#     compute_flows(pc, data)
-#     log_likelihoods = zeros(Float64, num_examples(data))
-#     indices = init_array(Bool, num_examples(data))::BitVector
-    
-#     ll(n::ProbCircuit) = ()
-#     ll(n::Union{PlainSumNode, StructSumNode}) = begin
-#         if num_children(n) != 1 # other nodes have no effect on likelihood
-#             foreach(children(n), n.log_probs) do c, log_theta
-#                 indices = get_downflow(n, c)
-#                 view(log_likelihoods, indices::BitVector) .+=  log_theta # see MixedProductKernelBenchmark.jl
-#             end
-#          end
-#     end
-
-#     foreach(ll, pc)
-#     log_likelihoods
-# end
-
 function bitcircuit_with_params(pc, data)
     params::Vector{Float64} = Vector{Float64}()
     on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
@@ -35,24 +14,25 @@ function bitcircuit_with_params(pc, data)
             append!(params, n.log_probs)
         end
     end
-    bc = BitCircuit(pc, data; gpu = isgpu(data), on_decision)
-    params = isgpu(data) ? to_gpu(params) : params
+    bc = BitCircuit(pc, data; on_decision)
     (bc, params)
 end
 
+"""
+Compute the likelihood of the PC given each individual instance in the data
+"""
 function log_likelihood_per_instance(pc::ProbCircuit, data)
     @assert isbinarydata(data) "Probabilistic circuit likelihoods are for binary data only"
     bc, params = bitcircuit_with_params(pc, data)
     if isgpu(data)
-        log_likelihood_per_instance_gpu(bc, data, params)
+        log_likelihood_per_instance_gpu(to_gpu(bc), data, to_gpu(params))
     else
         log_likelihood_per_instance_cpu(bc, data, params)
     end
 end
 
 function log_likelihood_per_instance_cpu(bc, data, params)
-    n_ex::Int = num_examples(data)
-    ll::Vector{Float64} = zeros(Float64, n_ex)
+    ll::Vector{Float64} = zeros(Float64, num_examples(data))
     ll_lock::Threads.ReentrantLock = Threads.ReentrantLock()
     
     @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
@@ -62,7 +42,7 @@ function log_likelihood_per_instance_cpu(bc, data, params)
                     @inbounds edge_flow = values[i, p] & values[i, s] & flows[i, dec_id]
                     first_true_bit = trailing_zeros(edge_flow)+1
                     last_true_bit = 64-leading_zeros(edge_flow)
-                    @simd for j= first_true_bit:last_true_bit
+                    @simd for j = first_true_bit:last_true_bit
                         ex_id = ((i-1) << 6) + j
                         if get_bit(edge_flow, j)
                             @inbounds ll[ex_id] += params[el_id]
@@ -78,46 +58,38 @@ function log_likelihood_per_instance_cpu(bc, data, params)
     return ll
 end
 
-function log_likelihood_per_instance_gpu(bc, pseudocount)
-    # node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
-    # edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
-    # params::CuVector{Float64} = CuVector{Float64}(undef, num_elements(bc))
-    # # need to manually cudaconvert closure variables
-    # node_counts_device = CUDA.cudaconvert(node_counts)
-    # edge_counts_device = CUDA.cudaconvert(edge_counts)
-    # params_device = CUDA.cudaconvert(params)
-    
-    # @inline function on_node(flows, values, dec_id, els_start, els_end, ex_id)
-    #     if els_start != els_end
-    #         @inbounds c::Int32 = count_ones(flows[ex_id, dec_id]) # cast for @atomic to be happy
-    #         CUDA.@atomic node_counts_device[dec_id] += c
-    #     end
-    #     if isone(ex_id) # only do this once
-    #         for i=els_start:els_end
-    #             params_device[i] = pseudocount/(els_end-els_start+1)
-    #         end
-    #     end
-    #     nothing
-    # end
-    
-    # @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
-    #     if els_start != els_end
-    #         c::Int32 = count_ones(edge_flow) # cast for @atomic to be happy
-    #         CUDA.@atomic edge_counts_device[el_id] += c
-    #     end
-    #     nothing
-    # end
-
-    # function get_params()
-    #     parent_counts = @views node_counts[bc.elements[1,:]]
-    #     params .= log.(params .+ edge_counts) .- log.(parent_counts .+ pseudocount)
-    #     to_cpu(params)
-    # end
+function log_likelihood_per_instance_gpu(bc, data, params)
+    ll::CuVector{Int32} = CUDA.zeros(Float64, num_examples(data))
+    ll_device = CUDA.cudaconvert(ll)
+        
+    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
+        if els_start != els_end
+            first_true_bit = trailing_zeros(edge_flow)+1
+            last_true_bit = 64-leading_zeros(edge_flow)
+            for j = first_true_bit:last_true_bit
+                ex_id = ((i-1) << 6) + j
+                if get_bit(edge_flow, j)
+                    CUDA.@atomic ll_device[ex_id] += params[el_id]
+                end
+            end
+        end
+        nothing
+    end
 
-    # return (on_node, on_edge, get_params)
+    return ll
 end
 
+"""
+Complete evidence queries
+"""
 EVI = log_likelihood_per_instance
 
+"""
+Compute the likelihood of the PC given the data
+"""
 log_likelihood(pc, data) = sum(log_likelihood_per_instance(pc, data))
+
+"""
+Compute the likelihood of the PC given the data, averaged over all instances in the data
+"""
 log_likelihood_avg(pc, data) = log_likelihood(pc, data)/num_examples(data)
\ No newline at end of file

From 52204da8643da7bf5de33c130c88e12f7e868765 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 2 Sep 2020 01:59:25 -0500
Subject: [PATCH 077/131] fix GPU likelihood computation

---
 src/queries/likelihood.jl | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index 5f7a2f3e..989af930 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -59,22 +59,25 @@ function log_likelihood_per_instance_cpu(bc, data, params)
 end
 
 function log_likelihood_per_instance_gpu(bc, data, params)
-    ll::CuVector{Int32} = CUDA.zeros(Float64, num_examples(data))
+    params_device = CUDA.cudaconvert(params)
+    ll::CuVector{Float64} = CUDA.zeros(Float64, num_examples(data))
     ll_device = CUDA.cudaconvert(ll)
         
-    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
+    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, chunk_id, edge_flow)
         if els_start != els_end
-            first_true_bit = trailing_zeros(edge_flow)+1
+            first_true_bit = 1+trailing_zeros(edge_flow)
             last_true_bit = 64-leading_zeros(edge_flow)
             for j = first_true_bit:last_true_bit
-                ex_id = ((i-1) << 6) + j
+                ex_id = ((chunk_id-1) << 6) + j
                 if get_bit(edge_flow, j)
-                    CUDA.@atomic ll_device[ex_id] += params[el_id]
+                    CUDA.@atomic ll_device[ex_id] += params_device[el_id]
                 end
             end
         end
         nothing
     end
+    
+    compute_values_flows(bc, data; on_edge)
 
     return ll
 end

From 18e1d1d4aeeac717c5ef6cbdd598fdecb3ccfcd6 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 2 Sep 2020 02:15:27 -0500
Subject: [PATCH 078/131] manually collect some CUDA gerbage

---
 src/parameters.jl         | 3 ++-
 src/queries/likelihood.jl | 6 ++++--
 2 files changed, 6 insertions(+), 3 deletions(-)

diff --git a/src/parameters.jl b/src/parameters.jl
index 257b2961..39ecd243 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -94,7 +94,8 @@ function estimate_parameters_gpu(bc, data, pseudocount)
     end
 
     v, f = compute_values_flows(bc, data; on_node, on_edge)
-    # TODO: manually garbage collect v,f
+    CUDA.unsafe_free!(v) # save the GC some effort
+    CUDA.unsafe_free!(f) # save the GC some effort
 
     # TODO: reinstate following implementation once https://github.com/JuliaGPU/GPUArrays.jl/issues/313 is fixed and released
     # parent_counts = @views node_counts[bc.elements[1,:]]
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index 989af930..cb338457 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -77,8 +77,10 @@ function log_likelihood_per_instance_gpu(bc, data, params)
         nothing
     end
     
-    compute_values_flows(bc, data; on_edge)
-
+    v, f = compute_values_flows(bc, data; on_edge)
+    CUDA.unsafe_free!(v) # save the GC some effort
+    CUDA.unsafe_free!(f) # save the GC some effort
+    
     return ll
 end
 

From b2e0fad6b8d68bee99c3e10f81efdafffaeafb57 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 2 Sep 2020 02:29:44 -0500
Subject: [PATCH 079/131] add tests for likelihood

---
 test/parameters_tests.jl | 19 ++++++++++++++++---
 1 file changed, 16 insertions(+), 3 deletions(-)

diff --git a/test/parameters_tests.jl b/test/parameters_tests.jl
index 3c05f660..5bebd138 100644
--- a/test/parameters_tests.jl
+++ b/test/parameters_tests.jl
@@ -7,10 +7,23 @@ using DataFrames: DataFrame
     
     dfb = DataFrame(BitMatrix([true false; true true; false true]))
     r = fully_factorized_circuit(ProbCircuit,num_features(dfb))
+    
     estimate_parameters(r,dfb; pseudocount=1.0)
+    @test log_likelihood_avg(r,dfb) ≈ LogicCircuits.Utils.fully_factorized_log_likelihood(dfb; pseudocount=1.0)
+
+    estimate_parameters(r,dfb; pseudocount=0.0)
+    @test log_likelihood_avg(r,dfb) ≈ LogicCircuits.Utils.fully_factorized_log_likelihood(dfb; pseudocount=0.0)
+
+    if CUDA.functional()
+
+        dfb_gpu = to_gpu(dfb)
+        
+        estimate_parameters(r,dfb_gpu; pseudocount=1.0)
+        @test log_likelihood_avg(r,dfb_gpu) ≈ LogicCircuits.Utils.fully_factorized_log_likelihood(dfb; pseudocount=1.0)
+
+        estimate_parameters(r,dfb_gpu; pseudocount=0.0)
+        @test log_likelihood_avg(r,dfb_gpu) ≈ LogicCircuits.Utils.fully_factorized_log_likelihood(dfb; pseudocount=0.0)
 
-    # TODO test identical likelihoods with
-    # ll1  = LogicCircuits.Utils.fully_factorized_log_likelihood(dfb; pseudocount=1)
-    # ll0 = LogicCircuits.Utils.fully_factorized_log_likelihood(dfb)
+    end
 
 end
\ No newline at end of file

From 0d27ede24f6817f063860b3bb1843ce30cb7a0fb Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 2 Sep 2020 23:19:25 -0500
Subject: [PATCH 080/131] ParamBitCircuit wrapper for parameterized bit circuit

---
 .../{expected_flows.jl => expectation2.jl}    |  0
 src/queries/likelihood.jl                     | 44 ++++++++++++-------
 test/parameters_tests.jl                      |  1 +
 3 files changed, 30 insertions(+), 15 deletions(-)
 rename src/queries/{expected_flows.jl => expectation2.jl} (100%)

diff --git a/src/queries/expected_flows.jl b/src/queries/expectation2.jl
similarity index 100%
rename from src/queries/expected_flows.jl
rename to src/queries/expectation2.jl
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index cb338457..061d1019 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -1,21 +1,35 @@
 export EVI, log_likelihood_per_instance, log_likelihood, log_likelihood_avg
 
+"A `BitCircuit` with parameters attached to the elements"
+struct ParamBitCircuit{V,M,W}
+    bitcircuit::BitCircuit{V,M}
+    params::W
+end
+
+import LogicCircuits: to_gpu, to_cpu #extend
+
+to_gpu(c::ParamBitCircuit) = 
+    ParamBitCircuit(to_gpu(c.bitcircuit), to_gpu(c.params))
+
+to_cpu(c::ParamBitCircuit) = 
+    ParamBitCircuit(to_cpu(c.bitcircuit), to_cpu(c.params))
+
 """
 Construct a `BitCircuit` while storing edge parameters in a separate array
 """
-function bitcircuit_with_params(pc, data)
-    params::Vector{Float64} = Vector{Float64}()
+function ParamBitCircuit(pc::ProbCircuit, data)
+    logprobs::Vector{Float64} = Vector{Float64}()
     on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
         if isnothing(n) # this decision node is not part of the PC
             # @assert first_element == last_element
-            push!(params, 0.0)
+            push!(logprobs, 0.0)
         else
-            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
-            append!(params, n.log_probs)
+            # @assert last_element-first_element+1 == length(n.log_probs) 
+            append!(logprobs, n.log_probs)
         end
     end
     bc = BitCircuit(pc, data; on_decision)
-    (bc, params)
+    ParamBitCircuit(bc, logprobs)
 end
 
 """
@@ -23,15 +37,15 @@ Compute the likelihood of the PC given each individual instance in the data
 """
 function log_likelihood_per_instance(pc::ProbCircuit, data)
     @assert isbinarydata(data) "Probabilistic circuit likelihoods are for binary data only"
-    bc, params = bitcircuit_with_params(pc, data)
+    bc = ParamBitCircuit(pc, data)
     if isgpu(data)
-        log_likelihood_per_instance_gpu(to_gpu(bc), data, to_gpu(params))
+        log_likelihood_per_instance_gpu(to_gpu(bc), data)
     else
-        log_likelihood_per_instance_cpu(bc, data, params)
+        log_likelihood_per_instance_cpu(bc, data)
     end
 end
 
-function log_likelihood_per_instance_cpu(bc, data, params)
+function log_likelihood_per_instance_cpu(bc, data)
     ll::Vector{Float64} = zeros(Float64, num_examples(data))
     ll_lock::Threads.ReentrantLock = Threads.ReentrantLock()
     
@@ -45,7 +59,7 @@ function log_likelihood_per_instance_cpu(bc, data, params)
                     @simd for j = first_true_bit:last_true_bit
                         ex_id = ((i-1) << 6) + j
                         if get_bit(edge_flow, j)
-                            @inbounds ll[ex_id] += params[el_id]
+                            @inbounds ll[ex_id] += bc.params[el_id]
                         end
                     end
                 end
@@ -54,12 +68,12 @@ function log_likelihood_per_instance_cpu(bc, data, params)
         nothing
     end
 
-    compute_values_flows(bc, data; on_edge)
+    compute_values_flows(bc.bitcircuit, data; on_edge)
     return ll
 end
 
-function log_likelihood_per_instance_gpu(bc, data, params)
-    params_device = CUDA.cudaconvert(params)
+function log_likelihood_per_instance_gpu(bc, data)
+    params_device = CUDA.cudaconvert(bc.params)
     ll::CuVector{Float64} = CUDA.zeros(Float64, num_examples(data))
     ll_device = CUDA.cudaconvert(ll)
         
@@ -77,7 +91,7 @@ function log_likelihood_per_instance_gpu(bc, data, params)
         nothing
     end
     
-    v, f = compute_values_flows(bc, data; on_edge)
+    v, f = compute_values_flows(bc.bitcircuit, data; on_edge)
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort
     
diff --git a/test/parameters_tests.jl b/test/parameters_tests.jl
index 5bebd138..650411a8 100644
--- a/test/parameters_tests.jl
+++ b/test/parameters_tests.jl
@@ -2,6 +2,7 @@ using Test
 using LogicCircuits
 using ProbabilisticCircuits
 using DataFrames: DataFrame
+using CUDA: CUDA
 
 @testset "MLE tests" begin
     

From 4e7ae1234878fe8b3eb35549adccd175ae437080 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Thu, 3 Sep 2020 01:59:15 -0500
Subject: [PATCH 081/131] [refactoring] logistic circuits: class probs based on
 bit_circuit

---
 src/Logistic/Logistic.jl        |   4 +-
 src/Logistic/logistic_nodes.jl  |   2 +-
 src/Logistic/queries.jl         | 201 +++++++++++++++++++-------------
 test/Logistic/logistic_tests.jl |  62 +++++-----
 4 files changed, 156 insertions(+), 113 deletions(-)

diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index cd45019e..d5b03b10 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -5,8 +5,8 @@ using ..Utils
 
 include("logistic_nodes.jl")
 include("queries.jl")
-include("parameter_circuit.jl")
-include("learn_parameters.jl")
+# include("parameter_circuit.jl")
+# include("learn_parameters.jl")
 
 # TODO structure learning
 
diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index f480879f..0232ca2b 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -50,7 +50,7 @@ A logistic disjunction node (Or node)
 """
 mutable struct Logistic⋁Node <: LogisticInnerNode
     children::Vector{<:LogisticCircuit}
-    thetas::Matrix{Float32}
+    thetas::Matrix{Float64}
     data
     counter::UInt32
     Logistic⋁Node(children, class::Int) = begin
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index f4324637..7ceba404 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -1,122 +1,165 @@
-export class_weights_per_instance, class_likelihood_per_instance, downflow, accuracy, predict_class, 
-    do_nothing_test, access_flow_test, dummy_calculation_test, dummy_calculation_test2
+export class_likelihood_per_instance, class_weights_per_instance
 
-using LogicCircuits: UpDownFlow1, UpDownFlow2, or_nodes
-using ..Probabilistic: get_downflow, get_upflow
+using CUDA
 using LoopVectorization: @avx, vifelse
 
 
+
 """
 Class Conditional Probability
 """
-# with flows computed (2.03 s (80704 allocations: 3.32 MiB))
-# 5.136 s (275778 allocations: 6.99 GiB) on mnist.circuit
-@inline function class_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
-    if !flows_computed
-        compute_flows(lc, data)
+
+function bitcircuit_with_params(lc, nc, data)
+    params::Vector{Vector{Float64}} = Vector{Vector{Float64}}()
+    on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
+        if isnothing(n)
+            # @assert first_element == last_element
+            push!(params, zeros(Float64, nc))
+        else
+            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
+            for theta in eachrow(n.thetas)
+                push!(params, theta)
+            end
+        end
     end
-    
-    weights = class_weights_per_instance(lc, classes, data; flows_computed=true)
-    @avx @. 1.0 / (1.0 + exp(-weights))
+    bc = BitCircuit(lc, data; on_decision)
+    (bc, permutedims(hcat(params...), (2, 1)))
 end
 
-@inline function class_weights_per_instance(lc::LogisticCircuit,  classes::Int, data; flows_computed=false)
-    if !flows_computed
-        compute_flows(lc, data)
-    end
-    
-    weights = zeros(num_examples(data), classes)
-    foreach(or_nodes(lc)) do ln
-        foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            flow = Float32.(downflow(ln, c))
-            @avx @. weights +=  flow * theta'
-        end        
-    end
-    
-    weights
+function class_likelihood_per_instance(lc::LogicCircuit, nc::Int, data)    
+    cw = class_weights_per_instance(lc, nc, data)
+    isgpu(data) ? (@. 1.0 / (1.0 + exp(-cw))) : (@. @avx 1.0 / (1.0 + exp(-cw)))
 end
 
-# 5.795 ms (72350 allocations: 6.58 MiB)
-@inline function do_nothing_test(lc::LogisticCircuit,  classes::Int, data)
-    likelihoods = zeros(num_examples(data), classes)
-    foreach(or_nodes(lc)) do ln
-        foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            nothing
-        end        
+function class_weights_per_instance(lc::LogisticCircuit, nc::Int, data)
+    bc, params = bitcircuit_with_params(lc, nc, data)
+    if isgpu(data)
+        class_weights_per_instance_gpu(to_gpu(bc), data, to_gpu(params))
+    else
+        class_weights_per_instance_cpu(bc, data, params)
     end
-    @avx @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
-    likelihoods
 end
 
-# 1.574 s (193840 allocations: 6.98 GiB)
-@inline function access_flow_test(lc::LogisticCircuit,  classes::Int, data)
-    foreach(or_nodes(lc)) do ln
-        foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            flow = Float32.(downflow(ln, c)) 
-        end        
+function class_weights_per_instance_cpu(bc, data, params)
+    ne::Int = num_examples(data)
+    nc::Int = size(params, 2)
+    cw::Matrix{Float64} = zeros(Float64, ne, nc)
+    cw_lock::Threads.ReentrantLock = Threads.ReentrantLock()
+ 
+    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
+        if els_start != els_end
+            lock(cw_lock) do # TODO: move lock to inner loop?
+                for i = 1:size(flows, 1)
+                    @inbounds edge_flow = values[i, p] & values[i, s] & flows[i, dec_id]
+                    first_true_bit = trailing_zeros(edge_flow) + 1
+                    last_true_bit = 64 - leading_zeros(edge_flow)
+                    @simd for j = first_true_bit:last_true_bit
+                        if get_bit(edge_flow, j)
+                            ex_id = ((i-1) << 6) + j
+                            for class = 1:size(cw, 2)
+                                @inbounds cw[ex_id, class] += params[el_id, class]
+                            end
+                        end
+                    end
+                end
+            end
+        end
+        nothing
     end
-    nothing
-end
 
-# 2.943 s (82272 allocations: 6.74 MiB)
-@inline function dummy_calculation_test(lc::LogisticCircuit,  classes::Int, data)
-    likelihoods = zeros(num_examples(data), classes)
-    foreach(or_nodes(lc)) do ln
-        foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            @avx @. likelihoods += likelihoods
-        end        
+    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
+        if els_start != els_end
+            lock(cw_lock) do # TODO: move lock to inner loop?
+                @avx for i = 1:size(flows, 1)
+                    @inbounds edge_flow = values[i, p] * values[i, s] / values[i, dec_id] * flows[i, dec_id]
+                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(Float32))
+                    for class = 1:size(cw, 2)
+                        @inbounds cw[i, class] += edge_flow * params[el_id, class]
+                    end
+                end
+            end
+        end
+        nothing
     end
-    @avx @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
-    likelihoods
-end
 
-# 4.790 s (193843 allocations: 6.99 GiB)
-@inline function dummy_calculation_test2(lc::LogisticCircuit,  classes::Int, data)
-    likelihoods = zeros(num_examples(data), classes)
-    foreach(or_nodes(lc)) do ln
-        foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            flow = Float32.(downflow(ln, c))
-            @avx @. likelihoods += likelihoods
-        end        
+    if isbinarydata(data)
+        compute_values_flows(bc, data; on_edge = on_edge_binary)
+    else
+        compute_values_flows(bc, data; on_edge = on_edge_float)
     end
-    @avx @. likelihoods = 1.0 / (1.0 + exp(-likelihoods))
-    likelihoods
+
+    return cw
 end
 
-@inline downflow(or_parent::Logistic⋁Node, c) = 
-    (c.data isa UpDownFlow1) ? c.data.downflow : flow_and(or_parent.data.downflow, c.data, or_parent.data.upflow)
+function class_weights_per_instance_gpu(bc, data, params)
+    ne::Int = num_examples(data)
+    nc::Int = size(params, 2)
+    cw::CuMatrix{Float64} = CUDA.zeros(Float64, num_examples(data), nc)
+    cw_device = CUDA.cudaconvert(cw)
+    params_device = CUDA.cudaconvert(params)
+
+    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, chunk_id, edge_flow)
+        if els_start != els_end
+            first_true_bit = 1+trailing_zeros(edge_flow)
+            last_true_bit = 64-leading_zeros(edge_flow)
+            for j = first_true_bit:last_true_bit
+                if get_bit(edge_flow, j)
+                    ex_id = ((chunk_id-1) << 6) + j
+                    for class = 1:size(cw_device, 2)
+                        CUDA.@atomic cw_device[ex_id, class] += params_device[el_id, class]
+                    end
+                end
+            end
+        end
+        nothing
+    end
 
-@inline flow_and(downflow_n::BitVector, c_flow::UpDownFlow2, upflow_n::BitVector) = 
-    @. downflow_n & c_flow.prime_flow & c_flow.sub_flow
+    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
+        if els_start != els_end
+            for class = 1:size(cw_device, 2)
+                CUDA.@atomic cw_device[ex_id, class] += edge_flow * params_device[el_id, class]
+            end
+        end
+        nothing
+    end
+    
+    if isbinarydata(data)
+        v,f = compute_values_flows(bc, data; on_edge = on_edge_binary)
+    else
+        @assert isfpdata(data) "Only floating point and binary data are supported"
+        v,f = compute_values_flows(bc, data; on_edge = on_edge_float)
+    end
+    CUDA.unsafe_free!(v) # save the GC some effort
+    CUDA.unsafe_free!(f) # save the GC some effort
 
-@inline flow_and(downflow_n::Vector{<:AbstractFloat}, c_flow::UpDownFlow2, upflow_n::Vector{<:AbstractFloat}) = 
-    @avx @. downflow_n * c_flow.prime_flow * make_finite(c_flow.sub_flow/upflow_n)
+    return cw
+end
 
-@inline make_finite(x::T) where T = vifelse(isfinite(x), x, zero(T))
 
 
 """
 Class Predictions
 """
-@inline function predict_class(lc::LogisticCircuit, classes::Int, data)
-    class_likelihoods = class_likelihood_per_instance(lc, classes, data)
+function predict_class(lc::LogisticCircuit, nc::Int, data)
+    class_likelihoods = class_likelihood_per_instance(lc, nc, data)
     predict_class(class_likelihoods)
 end
 
-@inline function predict_class(class_likelihoods::AbstractMatrix)
+function predict_class(class_likelihoods)
     _, mxindex = findmax(class_likelihoods; dims=2)
     dropdims(getindex.(mxindex, 2); dims=2)
 end
 
+
+
 """
 Prediction accuracy
 """
-@inline accuracy(predicted_class::Vector, labels) = 
-    Float64(sum(@. predicted_class == labels)) / length(labels)
+accuracy(lc::LogisticCircuit, nc::Int, data, labels) = 
+    accuracy(predict_class(lc, nc, data), labels)
 
-@inline accuracy(lc::LogisticCircuit, classes::Int, data, labels) = 
-    accuracy(predict_class(lc, classes, data), labels)
+accuracy(predicted_class, labels) = 
+    Float64(sum(@. predicted_class == labels)) / length(labels)
 
-@inline accuracy(class_likelihoods::AbstractMatrix, labels) = 
+accuracy(class_likelihoods, labels) = 
     accuracy(predict_class(class_likelihoods), labels)
-
diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
index a58ddc76..9a63f0aa 100644
--- a/test/Logistic/logistic_tests.jl
+++ b/test/Logistic/logistic_tests.jl
@@ -45,38 +45,38 @@ using ProbabilisticCircuits
     # check accuracy
     @test accuracy(logistic_circuit, CLASSES, data, true_labels) == 1.0
 
-    # check parameter updates
-    original_literal_parameters = Dict{Int, Vector{Float64}}()
-    foreach(logistic_circuit) do ln
-        if ln isa Logistic⋁Node
-            foreach(ln.children, eachrow(ln.thetas)) do c, theta
-                if c isa LogisticLiteral
-                    original_literal_parameters[c.literal] = copy(theta)
-                end
-            end
-        end
-    end
+    # # check parameter updates
+    # original_literal_parameters = Dict{Int, Vector{Float64}}()
+    # foreach(logistic_circuit) do ln
+    #     if ln isa Logistic⋁Node
+    #         foreach(ln.children, eachrow(ln.thetas)) do c, theta
+    #             if c isa LogisticLiteral
+    #                 original_literal_parameters[c.literal] = copy(theta)
+    #             end
+    #         end
+    #     end
+    # end
     
-    one_hot_labels = [0.0 1.0;
-                      1.0 0.0;
-                      0.0 1.0]
-    one_hot_labels = Float32.(one_hot_labels)
-    true_error = true_prob .- one_hot_labels
-    step_size = 0.1
-    learn_parameters(logistic_circuit, CLASSES, data, true_labels; num_epochs=1, step_size=step_size, flows_computed=true)
+    # one_hot_labels = [0.0 1.0;
+    #                   1.0 0.0;
+    #                   0.0 1.0]
+    # one_hot_labels = Float32.(one_hot_labels)
+    # true_error = true_prob .- one_hot_labels
+    # step_size = 0.1
+    # learn_parameters(logistic_circuit, CLASSES, data, true_labels; num_epochs=1, step_size=step_size, flows_computed=true)
     
-    foreach(logistic_circuit) do ln
-        if ln isa Logistic⋁Node
-            foreach(ln.children, eachrow(ln.thetas)) do c, theta
-                if c isa LogisticLiteral
-                    for class = 1:CLASSES
-                        true_update_amount = -step_size * sum(c.data.upflow .* true_error[:, class]) / size(true_error)[1]
-                        updated_amount = theta[class] - original_literal_parameters[c.literal][class]
-                        @test updated_amount ≈ true_update_amount atol=1e-7
-                    end
-                end
-            end
-        end
-    end
+    # foreach(logistic_circuit) do ln
+    #     if ln isa Logistic⋁Node
+    #         foreach(ln.children, eachrow(ln.thetas)) do c, theta
+    #             if c isa LogisticLiteral
+    #                 for class = 1:CLASSES
+    #                     true_update_amount = -step_size * sum(c.data.upflow .* true_error[:, class]) / size(true_error)[1]
+    #                     updated_amount = theta[class] - original_literal_parameters[c.literal][class]
+    #                     @test updated_amount ≈ true_update_amount atol=1e-7
+    #                 end
+    #             end
+    #         end
+    #     end
+    # end
 
 end
\ No newline at end of file

From a2cf964a6664b1d9ef9185f3e2459cf5309579af Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Thu, 3 Sep 2020 02:19:33 -0500
Subject: [PATCH 082/131] [fix] deps

---
 Project.toml | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/Project.toml b/Project.toml
index b34f52e6..c61156e4 100644
--- a/Project.toml
+++ b/Project.toml
@@ -14,6 +14,7 @@ LogicCircuits = "a7847b3b-b7f1-4dd5-83c3-60e0aa0f8599"
 LoopVectorization = "bdcacae8-1622-11e9-2a5c-532679323890"
 MetaGraphs = "626554b9-1ddb-594c-aa3c-2596fe9399a5"
 Metis = "2679e427-3c69-5b7f-982b-ece356f1e94b"
+MLDatasets = "eb30cadb-4394-5ae3-aed4-317e484a6458"
 Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
 Printf = "de0858da-6303-5e67-8744-51eddeeeb8d7"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
@@ -23,8 +24,6 @@ SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf"
 Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2"
 StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91"
 StatsFuns = "4c63d2b9-4356-54db-8cca-17b64c39e42c"
-LoopVectorization = "bdcacae8-1622-11e9-2a5c-532679323890"
-MLDatasets = "eb30cadb-4394-5ae3-aed4-317e484a6458"
 
 [compat]
 BlossomV = "0.4"
@@ -36,10 +35,10 @@ LightGraphs = "1.3"
 LogicCircuits = "0.1.1"
 MetaGraphs = "0.6"
 Metis = "1.0"
+MLDatasets = "0.4, 0.5"
 Reexport = "0.2"
 SimpleWeightedGraphs = "1.1"
 StatsBase = "0.33"
 StatsFuns = "0.9"
 LoopVectorization = "0.8.20"
-MLDatasets = "0.4, 0.5"
 julia = "1.5"

From c8e083d5dbfd4ecde33c2fa500168075187b46ab Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Thu, 3 Sep 2020 02:30:04 -0500
Subject: [PATCH 083/131] [tests] temporarily diable logistic tests

---
 test/Logistic/logistic_tests.jl | 62 ++++++++++++++++-----------------
 1 file changed, 31 insertions(+), 31 deletions(-)

diff --git a/test/Logistic/logistic_tests.jl b/test/Logistic/logistic_tests.jl
index 9a63f0aa..579176b3 100644
--- a/test/Logistic/logistic_tests.jl
+++ b/test/Logistic/logistic_tests.jl
@@ -7,43 +7,43 @@ using ProbabilisticCircuits
     # Uses a Logistic Circuit with 4 variables, and tests 3 of the configurations to 
     # match with python version.
     
-    CLASSES = 2
+    # CLASSES = 2
 
-    logistic_circuit = zoo_lc("little_4var.circuit", CLASSES)
-    @test logistic_circuit isa LogisticCircuit
+    # logistic_circuit = zoo_lc("little_4var.circuit", CLASSES)
+    # @test logistic_circuit isa LogisticCircuit
 
-    # check probabilities for binary samples
-    data = @. Bool([0 0 0 0; 0 1 1 0; 0 0 1 1])
-    # true_weight_func = [3.43147972 4.66740416; 
-    #                     4.27595352 2.83503504;
-    #                     3.67415087 4.93793472]
-    true_prob = [0.9686740008311808 0.9906908445371728;
-                 0.9862917392724188 0.9445399509069984; 
-                 0.9752568185086389 0.9928816444223209]
+    # # check probabilities for binary samples
+    # data = @. Bool([0 0 0 0; 0 1 1 0; 0 0 1 1])
+    # # true_weight_func = [3.43147972 4.66740416; 
+    # #                     4.27595352 2.83503504;
+    # #                     3.67415087 4.93793472]
+    # true_prob = [0.9686740008311808 0.9906908445371728;
+    #              0.9862917392724188 0.9445399509069984; 
+    #              0.9752568185086389 0.9928816444223209]
             
-    class_prob = class_likelihood_per_instance(logistic_circuit, CLASSES, data)
-    for i = 1:size(true_prob)[1]
-        for j = 1:CLASSES
-            @test true_prob[i,j] ≈ class_prob[i,j]
-        end
-    end
+    # class_prob = class_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    # for i = 1:size(true_prob)[1]
+    #     for j = 1:CLASSES
+    #         @test true_prob[i,j] ≈ class_prob[i,j]
+    #     end
+    # end
 
-    # check probabilities for float samples
-    data = Float32.(data)
-    class_prob = class_likelihood_per_instance(logistic_circuit, CLASSES, data)
-    for i = 1:size(true_prob)[1]
-        for j = 1:CLASSES
-            @test true_prob[i,j] ≈ class_prob[i,j]
-        end
-    end
+    # # check probabilities for float samples
+    # data = Float32.(data)
+    # class_prob = class_likelihood_per_instance(logistic_circuit, CLASSES, data)
+    # for i = 1:size(true_prob)[1]
+    #     for j = 1:CLASSES
+    #         @test true_prob[i,j] ≈ class_prob[i,j]
+    #     end
+    # end
 
-    # check predicted_classes
-    true_labels = [2, 1, 2]
-    predicted_classes = predict_class(logistic_circuit, CLASSES, data)
-    @test all(predicted_classes .== true_labels)
+    # # check predicted_classes
+    # true_labels = [2, 1, 2]
+    # predicted_classes = predict_class(logistic_circuit, CLASSES, data)
+    # @test all(predicted_classes .== true_labels)
     
-    # check accuracy
-    @test accuracy(logistic_circuit, CLASSES, data, true_labels) == 1.0
+    # # check accuracy
+    # @test accuracy(logistic_circuit, CLASSES, data, true_labels) == 1.0
 
     # # check parameter updates
     # original_literal_parameters = Dict{Int, Vector{Float64}}()

From b863b2ee7c044cda79c8d901da9e6aef469252ff Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Thu, 3 Sep 2020 02:30:22 -0500
Subject: [PATCH 084/131] [renaming] logistic circuits

---
 .../learn_parameters.jl                       |  0
 src/{logistic => Logistic}/logistic_nodes.jl  |  0
 .../parameter_circuit.jl                      |  0
 src/logistic/queries.jl                       | 24 -------------------
 4 files changed, 24 deletions(-)
 rename src/{logistic => Logistic}/learn_parameters.jl (100%)
 rename src/{logistic => Logistic}/logistic_nodes.jl (100%)
 rename src/{logistic => Logistic}/parameter_circuit.jl (100%)
 delete mode 100644 src/logistic/queries.jl

diff --git a/src/logistic/learn_parameters.jl b/src/Logistic/learn_parameters.jl
similarity index 100%
rename from src/logistic/learn_parameters.jl
rename to src/Logistic/learn_parameters.jl
diff --git a/src/logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
similarity index 100%
rename from src/logistic/logistic_nodes.jl
rename to src/Logistic/logistic_nodes.jl
diff --git a/src/logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
similarity index 100%
rename from src/logistic/parameter_circuit.jl
rename to src/Logistic/parameter_circuit.jl
diff --git a/src/logistic/queries.jl b/src/logistic/queries.jl
deleted file mode 100644
index a89b4984..00000000
--- a/src/logistic/queries.jl
+++ /dev/null
@@ -1,24 +0,0 @@
-#TODO: reinstate
-
-# export class_conditional_likelihood_per_instance
-
-# using ..Probabilistic: get_downflow, get_upflow
-# """
-# Class Conditional Probability
-# """
-# function class_conditional_likelihood_per_instance(lc::LogisticCircuit,  classes::Int, data)
-#     compute_flows(lc, data)
-#     likelihoods = zeros(num_examples(data), classes)
-#     foreach(lc) do ln
-#         if ln isa Logistic⋁Node
-#             # For each class. orig.thetas is 2D so used eachcol
-#             for (idx, thetaC) in enumerate(eachcol(ln.thetas))
-#                 foreach(children(ln), thetaC) do c, theta
-#                     likelihoods[:, idx] .+= Float64.(get_downflow(ln) .& get_upflow(c)) .* theta
-#                 end
-#             end
-#         end
-#     end
-#     likelihoods
-# end
-

From db0c6559d6368c07f048e91e582af04d77d90574 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Thu, 3 Sep 2020 02:58:21 -0500
Subject: [PATCH 085/131] [refactoring] param_bit_circuit

---
 src/ProbabilisticCircuits.jl |  3 +--
 src/param_bit_circuit.jl     | 18 ++++++++++++++++++
 src/queries/likelihood.jl    | 14 --------------
 3 files changed, 19 insertions(+), 16 deletions(-)
 create mode 100644 src/param_bit_circuit.jl

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 6aa05804..ce5a494f 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -12,6 +12,7 @@ include("Utils/Utils.jl")
 
 include("abstract_prob_nodes.jl")
 include("plain_prob_nodes.jl")
+include("param_bit_circuit.jl")
 include("parameters.jl")
 include("structured_prob_nodes.jl")
 
@@ -21,8 +22,6 @@ include("queries/likelihood.jl")
 # include("queries.jl")
 # include("informations.jl")
 
-# include("logistic/logistic_nodes.jl")
-# include("logistic/queries.jl")
 
 # include("reasoning/expectation.jl")
 # include("reasoning/exp_flow_circuits.jl")
diff --git a/src/param_bit_circuit.jl b/src/param_bit_circuit.jl
new file mode 100644
index 00000000..95eb487a
--- /dev/null
+++ b/src/param_bit_circuit.jl
@@ -0,0 +1,18 @@
+
+#####################
+# Paramter Bit Circuits
+#####################
+
+"A `BitCircuit` with parameters attached to the elements"
+struct ParamBitCircuit{V,M,W}
+    bitcircuit::BitCircuit{V,M}
+    params::W
+end
+
+import LogicCircuits: to_gpu, to_cpu #extend
+
+to_gpu(c::ParamBitCircuit) = 
+    ParamBitCircuit(to_gpu(c.bitcircuit), to_gpu(c.params))
+
+to_cpu(c::ParamBitCircuit) = 
+    ParamBitCircuit(to_cpu(c.bitcircuit), to_cpu(c.params))
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index 061d1019..55bd32a7 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -1,19 +1,5 @@
 export EVI, log_likelihood_per_instance, log_likelihood, log_likelihood_avg
 
-"A `BitCircuit` with parameters attached to the elements"
-struct ParamBitCircuit{V,M,W}
-    bitcircuit::BitCircuit{V,M}
-    params::W
-end
-
-import LogicCircuits: to_gpu, to_cpu #extend
-
-to_gpu(c::ParamBitCircuit) = 
-    ParamBitCircuit(to_gpu(c.bitcircuit), to_gpu(c.params))
-
-to_cpu(c::ParamBitCircuit) = 
-    ParamBitCircuit(to_cpu(c.bitcircuit), to_cpu(c.params))
-
 """
 Construct a `BitCircuit` while storing edge parameters in a separate array
 """

From 1b779715bb9902488bf2df87e336b00010fb80ab Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Fri, 4 Sep 2020 01:11:58 -0500
Subject: [PATCH 086/131] marginal upward pass

---
 src/ProbabilisticCircuits.jl   |   1 +
 src/parameters.jl              |   4 +-
 src/queries/expected_flows2.jl | 217 -------------------
 src/queries/likelihood.jl      |  12 +-
 src/queries/marginal_flow.jl   | 366 +++++++++++++++++++++++++++++++++
 5 files changed, 378 insertions(+), 222 deletions(-)
 delete mode 100644 src/queries/expected_flows2.jl
 create mode 100644 src/queries/marginal_flow.jl

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 6aa05804..e6088bdc 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -16,6 +16,7 @@ include("parameters.jl")
 include("structured_prob_nodes.jl")
 
 include("queries/likelihood.jl")
+include("queries/marginal_flow.jl")
 
 # include("exp_flows.jl")
 # include("queries.jl")
diff --git a/src/parameters.jl b/src/parameters.jl
index 39ecd243..492b0a90 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -59,7 +59,7 @@ function estimate_parameters_cpu(bc, data, pseudocount)
         nothing
     end
 
-    compute_values_flows(bc, data; on_node, on_edge)
+    satisfies_flows(bc, data; on_node, on_edge)
     return log_params
 end
 
@@ -93,7 +93,7 @@ function estimate_parameters_gpu(bc, data, pseudocount)
         nothing
     end
 
-    v, f = compute_values_flows(bc, data; on_node, on_edge)
+    v, f = satisfies_flows(bc, data; on_node, on_edge)
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort
 
diff --git a/src/queries/expected_flows2.jl b/src/queries/expected_flows2.jl
deleted file mode 100644
index 9c2d3bdd..00000000
--- a/src/queries/expected_flows2.jl
+++ /dev/null
@@ -1,217 +0,0 @@
-export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
-
-
-using StatsFuns: logsumexp
-
-# TODO move to LogicCircuits
-# TODO downflow struct
-using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
-
-"""
-Get upflow from logic circuit
-"""
-@inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
-@inline get_upflow(elems::UpDownFlow1) = elems.upflow
-@inline get_upflow(elems::UpFlow) = materialize(elems)
-
-"""
-Get the node/edge flow from logic circuit
-"""
-function get_downflow(n::LogicCircuit; root=nothing)::BitVector
-    downflow(x::UpDownFlow1) = x.downflow
-    downflow(x::UpDownFlow2) = begin
-        ors = or_nodes(root)
-        p = findall(p -> n in children(p), ors)
-        @assert length(p) == 1
-        get_downflow(ors[p[1]], n)
-    end
-    downflow(n.data)
-end
-
-function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
-    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-    get_downflow(n) .& get_upflow(c)
-end
-
-#####################
-# performance-critical queries related to circuit flows
-#####################
-
-"Container for circuit flows represented as a float vector"
-const ExpUpFlow1 = Vector{Float64}
-
-"Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
-struct ExpUpFlow2
-    prime_flow::Vector{Float64}
-    sub_flow::Vector{Float64}
-end
-
-const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
-
-@inline ExpUpFlow1(elems::ExpUpFlow1) = elems
-@inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
-
-function evaluate_exp(root::ProbCircuit, data;
-                   nload = nload, nsave = nsave, reset=true)::Vector{Float64}
-    n_ex::Int = num_examples(data)
-    ϵ = 0.0
-
-    @inline f_lit(n) = begin
-        uf = convert(Vector{Int8}, feature_values(data, variable(n)))
-        if ispositive(n)
-            uf[uf.==-1] .= 1
-        else
-            uf .= 1 .- uf
-            uf[uf.==2] .= 1
-        end
-        uf = convert(Vector{Float64}, uf)
-        uf .= log.(uf .+ ϵ)
-    end
-    
-    @inline f_con(n) = begin
-        uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
-        uf .= log.(uf .+ ϵ)
-    end
-    
-    @inline fa(n, call) = begin
-        if num_children(n) == 1
-            return ExpUpFlow1(call(@inbounds children(n)[1]))
-        else
-            c1 = call(@inbounds children(n)[1])::ExpUpFlow
-            c2 = call(@inbounds children(n)[2])::ExpUpFlow
-            if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
-                return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
-            end
-            x = flowop(c1, c2, +)
-            for c in children(n)[3:end]
-                accumulate(x, call(c), +)
-            end
-            return x
-        end
-    end
-    
-    @inline fo(n, call) = begin
-        if num_children(n) == 1
-            return ExpUpFlow1(call(@inbounds children(n)[1]))
-        else
-            log_probs = n.log_probs
-            c1 = call(@inbounds children(n)[1])::ExpUpFlow
-            c2 = call(@inbounds children(n)[2])::ExpUpFlow
-            x = flowop(c1, log_probs[1], c2, log_probs[2], logsumexp)
-            for (i, c) in enumerate(children(n)[3:end])
-                accumulate(x, call(c), log_probs[i+2], logsumexp)
-            end
-            return x
-        end
-    end
-    
-    # ensure flow us Flow1 at the root, even when it's a conjunction
-    root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
-    return nsave(root, root_flow)
-end
-
-@inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
-    op.(ExpUpFlow1(x), ExpUpFlow1(y))
-
-@inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
-    op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
-
-import Base.accumulate
-@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
-    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
-
-@inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
-    @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
-
-
-#####################
-# downward pass
-#####################
-
-struct ExpUpDownFlow1
-    upflow::ExpUpFlow1
-    downflow::Vector{Float64}
-    ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
-end
-
-const ExpUpDownFlow2 = ExpUpFlow2
-
-const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
-
-
-function compute_exp_flows(circuit::ProbCircuit, data)
-
-    # upward pass
-    @inline upflow!(n, v) = begin
-        n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
-        v
-    end
-
-    @inline upflow(n) = begin
-        d = n.data::ExpUpDownFlow
-        (d isa ExpUpDownFlow1) ? d.upflow : d
-    end
-
-    evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
-    
-    # downward pass
-
-    @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
-    @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
-
-    downflow(circuit) .= 0.0
-
-    foreach_down(circuit; setcounter=false) do n
-        if isinner(n) && !isfactorized(n)
-            downflow_n = downflow(n)
-            upflow_n = upflow(n)
-            for ite in 1 : num_children(n)
-                c = children(n)[ite]
-                log_theta = is⋀gate(n) ? 0.0 : n.log_probs[ite]
-                if isfactorized(c)
-                    upflow2_c = c.data::ExpUpDownFlow2
-                    # propagate one level further down
-                    for i = 1:2
-                        downflow_c = downflow(@inbounds children(c)[i])
-                        accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
-                        .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
-                    end
-                else
-                    upflow1_c = (c.data::ExpUpDownFlow1).upflow
-                    downflow_c = downflow(c)
-                    accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
-                end
-            end 
-        end
-        nothing
-    end
-    nothing
-end
-
-
-"""
-Get upflow of a probabilistic circuit
-"""
-@inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
-@inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
-@inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
-
-"""
-Get the node/edge downflow from probabilistic circuit
-"""
-function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
-    downflow(x::ExpUpDownFlow1) = x.downflow
-    downflow(x::ExpUpDownFlow2) = begin
-        ors = or_nodes(root)
-        p = findall(p -> n in children(p), ors)
-        @assert length(p) == 1
-        get_exp_downflow(ors[p[1]], n)
-    end
-    downflow(n.data)
-end
-
-function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
-    @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-    log_theta = n.log_probs[findfirst(x -> x == c, children(n))]
-    return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
-end
\ No newline at end of file
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index 061d1019..40d4abca 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -1,4 +1,4 @@
-export EVI, log_likelihood_per_instance, log_likelihood, log_likelihood_avg
+export ParamBitCircuit, EVI, log_likelihood_per_instance, log_likelihood, log_likelihood_avg
 
 "A `BitCircuit` with parameters attached to the elements"
 struct ParamBitCircuit{V,M,W}
@@ -6,6 +6,12 @@ struct ParamBitCircuit{V,M,W}
     params::W
 end
 
+import LogicCircuits: num_nodes, num_elements, num_features
+
+num_nodes(c::ParamBitCircuit) = num_nodes(c.bitcircuit)
+num_elements(c::ParamBitCircuit) = num_elements(c.bitcircuit)
+num_features(c::ParamBitCircuit) = num_features(c.bitcircuit)
+
 import LogicCircuits: to_gpu, to_cpu #extend
 
 to_gpu(c::ParamBitCircuit) = 
@@ -68,7 +74,7 @@ function log_likelihood_per_instance_cpu(bc, data)
         nothing
     end
 
-    compute_values_flows(bc.bitcircuit, data; on_edge)
+    satisfies_flows(bc.bitcircuit, data; on_edge)
     return ll
 end
 
@@ -91,7 +97,7 @@ function log_likelihood_per_instance_gpu(bc, data)
         nothing
     end
     
-    v, f = compute_values_flows(bc.bitcircuit, data; on_edge)
+    v, f = satisfies_flows(bc.bitcircuit, data; on_edge)
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort
     
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
new file mode 100644
index 00000000..349c75a1
--- /dev/null
+++ b/src/queries/marginal_flow.jl
@@ -0,0 +1,366 @@
+using StatsFuns: logsumexp, log1pexp
+
+using CUDA: CUDA, @cuda
+using DataFrames: DataFrame
+using LoopVectorization: @avx
+using LogicCircuits: balance_threads
+
+export marginal, marginal_all
+
+#####################
+# Circuit marginal evaluation
+#####################
+  
+# evaluate a probabilistic circuit as a function
+function (root::ProbCircuit)(data...)
+    marginal(root, data...)
+end
+
+"Evaluate marginals of the circuit bottom-up for a given input"
+marginal(root::ProbCircuit, data::Union{Real,Missing}...) =
+    marginal(root, collect(Union{Bool,Missing}, data))
+
+marginal(root::ProbCircuit, data::Union{Vector{Union{Bool,Missing}},CuVector{UInt8}}) =
+    marginal(root, DataFrame(reshape(data, 1, :)))[1]
+
+marginal(circuit::ProbCircuit, data::DataFrame) =
+    marginal(same_device(ParamBitCircuit(circuit, data), data) , data)
+
+function marginal(circuit::ParamBitCircuit, data::DataFrame)::AbstractVector
+    marginal_all(circuit,data)[:,end]
+end
+
+#####################
+# Circuit evaluation of *all* nodes in circuit
+#####################
+
+"Evaluate the probabilistic circuit bottom-up for a given input and return the marginal probability value of all nodes"
+function marginal_all(circuit::ParamBitCircuit, data, reuse=nothing)
+    @assert num_features(data) == num_features(circuit) 
+    @assert isbinarydata(data)
+    values = init_marginal(data, reuse, num_nodes(circuit))
+    marginal_layers(circuit, values)
+    return values
+end
+
+"Initialize values from the data (data frames)"
+function init_marginal(data, reuse, num_nodes)
+    flowtype = isgpu(data) ? CuMatrix{Float64} : Matrix{Float64}
+    values = similar!(reuse, flowtype, num_examples(data), num_nodes)
+    @views values[:,LogicCircuits.TRUE_BITS] .= log(one(Float64))
+    @views values[:,LogicCircuits.FALSE_BITS] .= log(zero(Float64))
+    # here we should use a custom CUDA kernel to extract Float marginals from bit vectors
+    # for now the lazy solution is to move everything to the CPU and do the work there...
+    data_cpu = to_cpu(data)
+    for i=1:num_features(data)
+        marg_pos::Vector{Float64} = log.(coalesce.(data_cpu[:,i], 1.0))
+        marg_neg::Vector{Float64} = log.(coalesce.(1.0 .- data_cpu[:,i], 1.0))
+        values[:,2+i] .= same_device(marg_pos, values)
+        values[:,2+num_features(data)+i] .= same_device(marg_neg, values)
+    end
+    return values
+end
+
+# upward pass helpers on CPU
+
+"Compute marginals on the CPU (SIMD & multi-threaded)"
+function marginal_layers(circuit::ParamBitCircuit, values::Matrix)
+    bc = circuit.bitcircuit
+    els = bc.elements
+    pars = circuit.params
+    for layer in bc.layers
+        Threads.@threads for dec_id in layer
+            j = @inbounds bc.nodes[1,dec_id]
+            els_end = @inbounds bc.nodes[2,dec_id]
+            if j == els_end
+                assign_marginal(values, dec_id, els[2,j], els[3,j], pars[j])
+                j += 1
+            else
+                assign_marginal(values, dec_id, els[2,j], els[3,j], els[2,j+1], els[3,j+1], pars[j], pars[j+1])
+                j += 2
+            end
+            while j <= els_end
+                accum_marginal(values, dec_id, els[2,j], els[3,j], pars[j])
+                j += 1
+            end
+        end
+    end
+end
+
+assign_marginal(v::Matrix{<:AbstractFloat}, i, e1p, e1s, p1) =
+    @views @. @avx v[:,i] = v[:,e1p] + v[:,e1s] + p1
+
+accum_marginal(v::Matrix{<:AbstractFloat}, i, e1p, e1s, p1) = begin
+    @avx for j=1:size(v,1)
+        @inbounds x = v[j,i]
+        @inbounds y = v[j,e1p] + v[j,e1s] + p1
+        Δ = ifelse(x == y, zero(Float64), abs(x - y))
+        @inbounds  v[j,i] = max(x, y) + log1p(exp(-Δ))
+    end
+end
+
+assign_marginal(v::Matrix{<:AbstractFloat}, i, e1p, e1s, e2p, e2s, p1, p2) = begin
+    @avx for j=1:size(v,1)
+        @inbounds x = v[j,e1p] + v[j,e1s] + p1
+        @inbounds y = v[j,e2p] + v[j,e2s] + p2
+        Δ = ifelse(x == y, zero(Float64), abs(x - y))
+        @inbounds  v[j,i] = max(x, y) + log1p(exp(-Δ))
+    end
+end
+
+# upward pass helpers on GPU
+
+"Compute marginals on the GPU"
+function marginal_layers(circuit::ParamBitCircuit, values::CuMatrix;  dec_per_thread = 8, log2_threads_per_block = 8)
+    bc = circuit.bitcircuit
+    CUDA.@sync for layer in bc.layers
+        num_examples = size(values, 1)
+        num_decision_sets = length(layer)/dec_per_thread
+        num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
+        num_blocks = (ceil(Int, num_examples/num_threads[1]), 
+                      ceil(Int, num_decision_sets/num_threads[2]))
+        @cuda threads=num_threads blocks=num_blocks marginal_layers_cuda(layer, bc.nodes, bc.elements, circuit.params, values)
+    end
+end
+
+"CUDA kernel for circuit evaluation"
+function marginal_layers_cuda(layer, nodes, elements, params, values)
+    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+    stride_x = blockDim().x * gridDim().x
+    stride_y = blockDim().y * gridDim().y
+    for j = index_x:stride_x:size(values,1)
+        for i = index_y:stride_y:length(layer)
+            decision_id = @inbounds layer[i]
+            k = @inbounds nodes[1,decision_id]
+            els_end = @inbounds nodes[2,decision_id]
+            @inbounds x = values[j, elements[2,k]] + values[j, elements[3,k]] + params[k]
+            while k < els_end
+                k += 1
+                @inbounds y = values[j, elements[2,k]] + values[j, elements[3,k]] + params[k]
+                Δ = ifelse(x == y, zero(Float64), CUDA.abs(x - y))
+                x = max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
+            end
+            values[j, decision_id] = x
+        end
+    end
+    return nothing
+end
+
+
+# export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
+
+
+
+# # TODO move to LogicCircuits
+# # TODO downflow struct
+# using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
+
+# """
+# Get upflow from logic circuit
+# """
+# @inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
+# @inline get_upflow(elems::UpDownFlow1) = elems.upflow
+# @inline get_upflow(elems::UpFlow) = materialize(elems)
+
+# """
+# Get the node/edge flow from logic circuit
+# """
+# function get_downflow(n::LogicCircuit; root=nothing)::BitVector
+#     downflow(x::UpDownFlow1) = x.downflow
+#     downflow(x::UpDownFlow2) = begin
+#         ors = or_nodes(root)
+#         p = findall(p -> n in children(p), ors)
+#         @assert length(p) == 1
+#         get_downflow(ors[p[1]], n)
+#     end
+#     downflow(n.data)
+# end
+
+# function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
+#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+#     get_downflow(n) .& get_upflow(c)
+# end
+
+# #####################
+# # performance-critical queries related to circuit flows
+# #####################
+
+# "Container for circuit flows represented as a float vector"
+# const ExpUpFlow1 = Vector{Float64}
+
+# "Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
+# struct ExpUpFlow2
+#     prime_flow::Vector{Float64}
+#     sub_flow::Vector{Float64}
+# end
+
+# const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
+
+# @inline ExpUpFlow1(elems::ExpUpFlow1) = elems
+# @inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
+
+# function evaluate_exp(root::ProbCircuit, data;
+#                    nload = nload, nsave = nsave, reset=true)::Vector{Float64}
+#     n_ex::Int = num_examples(data)
+#     ϵ = 0.0
+
+#     @inline f_lit(n) = begin
+#         uf = convert(Vector{Int8}, feature_values(data, variable(n)))
+#         if ispositive(n)
+#             uf[uf.==-1] .= 1
+#         else
+#             uf .= 1 .- uf
+#             uf[uf.==2] .= 1
+#         end
+#         uf = convert(Vector{Float64}, uf)
+#         uf .= log.(uf .+ ϵ)
+#     end
+    
+#     @inline f_con(n) = begin
+#         uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
+#         uf .= log.(uf .+ ϵ)
+#     end
+    
+#     @inline fa(n, call) = begin
+#         if num_children(n) == 1
+#             return ExpUpFlow1(call(@inbounds children(n)[1]))
+#         else
+#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
+#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
+#             if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
+#                 return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
+#             end
+#             x = flowop(c1, c2, +)
+#             for c in children(n)[3:end]
+#                 accumulate(x, call(c), +)
+#             end
+#             return x
+#         end
+#     end
+    
+#     @inline fo(n, call) = begin
+#         if num_children(n) == 1
+#             return ExpUpFlow1(call(@inbounds children(n)[1]))
+#         else
+#             log_probs = n.log_probs
+#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
+#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
+#             x = flowop(c1, log_probs[1], c2, log_probs[2], logsumexp)
+#             for (i, c) in enumerate(children(n)[3:end])
+#                 accumulate(x, call(c), log_probs[i+2], logsumexp)
+#             end
+#             return x
+#         end
+#     end
+    
+#     # ensure flow us Flow1 at the root, even when it's a conjunction
+#     root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
+#     return nsave(root, root_flow)
+# end
+
+# @inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
+#     op.(ExpUpFlow1(x), ExpUpFlow1(y))
+
+# @inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
+#     op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
+
+# import Base.accumulate
+# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
+#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
+
+# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
+#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
+
+
+# #####################
+# # downward pass
+# #####################
+
+# struct ExpUpDownFlow1
+#     upflow::ExpUpFlow1
+#     downflow::Vector{Float64}
+#     ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
+# end
+
+# const ExpUpDownFlow2 = ExpUpFlow2
+
+# const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
+
+
+# function compute_exp_flows(circuit::ProbCircuit, data)
+
+#     # upward pass
+#     @inline upflow!(n, v) = begin
+#         n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
+#         v
+#     end
+
+#     @inline upflow(n) = begin
+#         d = n.data::ExpUpDownFlow
+#         (d isa ExpUpDownFlow1) ? d.upflow : d
+#     end
+
+#     evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
+    
+#     # downward pass
+
+#     @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
+#     @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
+
+#     downflow(circuit) .= 0.0
+
+#     foreach_down(circuit; setcounter=false) do n
+#         if isinner(n) && !isfactorized(n)
+#             downflow_n = downflow(n)
+#             upflow_n = upflow(n)
+#             for ite in 1 : num_children(n)
+#                 c = children(n)[ite]
+#                 log_theta = is⋀gate(n) ? 0.0 : n.log_probs[ite]
+#                 if isfactorized(c)
+#                     upflow2_c = c.data::ExpUpDownFlow2
+#                     # propagate one level further down
+#                     for i = 1:2
+#                         downflow_c = downflow(@inbounds children(c)[i])
+#                         accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
+#                         .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
+#                     end
+#                 else
+#                     upflow1_c = (c.data::ExpUpDownFlow1).upflow
+#                     downflow_c = downflow(c)
+#                     accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
+#                 end
+#             end 
+#         end
+#         nothing
+#     end
+#     nothing
+# end
+
+
+# """
+# Get upflow of a probabilistic circuit
+# """
+# @inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
+# @inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
+# @inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
+
+# """
+# Get the node/edge downflow from probabilistic circuit
+# """
+# function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
+#     downflow(x::ExpUpDownFlow1) = x.downflow
+#     downflow(x::ExpUpDownFlow2) = begin
+#         ors = or_nodes(root)
+#         p = findall(p -> n in children(p), ors)
+#         @assert length(p) == 1
+#         get_exp_downflow(ors[p[1]], n)
+#     end
+#     downflow(n.data)
+# end
+
+# function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
+#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
+#     log_theta = n.log_probs[findfirst(x -> x == c, children(n))]
+#     return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
+# end
\ No newline at end of file

From db42ace794fcf548dc8a979aa01c95de326cd17f Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Fri, 4 Sep 2020 01:20:06 -0500
Subject: [PATCH 087/131] additional merge

---
 src/param_bit_circuit.jl | 26 ++++++++++++++++++++++----
 1 file changed, 22 insertions(+), 4 deletions(-)

diff --git a/src/param_bit_circuit.jl b/src/param_bit_circuit.jl
index 95eb487a..6f4a685e 100644
--- a/src/param_bit_circuit.jl
+++ b/src/param_bit_circuit.jl
@@ -1,7 +1,4 @@
-
-#####################
-# Paramter Bit Circuits
-#####################
+export ParamBitCircuit
 
 "A `BitCircuit` with parameters attached to the elements"
 struct ParamBitCircuit{V,M,W}
@@ -9,6 +6,12 @@ struct ParamBitCircuit{V,M,W}
     params::W
 end
 
+import LogicCircuits: num_nodes, num_elements, num_features
+
+num_nodes(c::ParamBitCircuit) = num_nodes(c.bitcircuit)
+num_elements(c::ParamBitCircuit) = num_elements(c.bitcircuit)
+num_features(c::ParamBitCircuit) = num_features(c.bitcircuit)
+
 import LogicCircuits: to_gpu, to_cpu #extend
 
 to_gpu(c::ParamBitCircuit) = 
@@ -16,3 +19,18 @@ to_gpu(c::ParamBitCircuit) =
 
 to_cpu(c::ParamBitCircuit) = 
     ParamBitCircuit(to_cpu(c.bitcircuit), to_cpu(c.params))
+
+function ParamBitCircuit(pc::ProbCircuit, data)
+    logprobs::Vector{Float64} = Vector{Float64}()
+    on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
+        if isnothing(n) # this decision node is not part of the PC
+            # @assert first_element == last_element
+            push!(logprobs, 0.0)
+        else
+            # @assert last_element-first_element+1 == length(n.log_probs) 
+            append!(logprobs, n.log_probs)
+        end
+    end
+    bc = BitCircuit(pc, data; on_decision)
+    ParamBitCircuit(bc, logprobs)
+end

From a3cdefacfac065faffae4543e2e7f5734a83653f Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 4 Sep 2020 21:10:45 -0500
Subject: [PATCH 088/131] [refactor] logistic circuits: parameter learning

---
 src/Logistic/Logistic.jl       |   4 +-
 src/Logistic/logistic_nodes.jl |  26 +++++++-
 src/Logistic/parameters.jl     | 116 +++++++++++++++++++++++++++++++++
 src/Logistic/queries.jl        |  66 ++++++++-----------
 4 files changed, 170 insertions(+), 42 deletions(-)
 create mode 100644 src/Logistic/parameters.jl

diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index d5b03b10..69afd0a4 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -1,12 +1,10 @@
 module Logistic
 
 using LogicCircuits
-using ..Utils
 
 include("logistic_nodes.jl")
 include("queries.jl")
-# include("parameter_circuit.jl")
-# include("learn_parameters.jl")
+include("parameters.jl")
 
 # TODO structure learning
 
diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index 0232ca2b..d22580b7 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -1,5 +1,5 @@
 export 
-    LogisticCircuit, 
+    LogisticCircuit, ParamBitCircuit,
     LogisticLeafNode, LogisticInnerNode, 
     LogisticLiteral, Logistic⋀Node, Logistic⋁Node,
     num_classes, num_parameters_per_class
@@ -79,6 +79,8 @@ import ..Utils: num_parameters
 @inline num_parameters(c::LogisticCircuit) = sum(n -> num_children(n) * classes(n), ⋁_nodes(c))
 @inline num_parameters_per_class(c::LogisticCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
 
+
+
 #####################
 # constructors and conversions
 #####################
@@ -90,3 +92,25 @@ function LogisticCircuit(circuit::LogicCircuit, classes::Int)
     f_o(n, cn) = Logistic⋁Node(cn, classes)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, LogisticCircuit)
 end
+
+
+
+"""
+Construct a `BitCircuit` while storing edge parameters in a separate array
+"""
+function ParamBitCircuit(lc::LogisticCircuit, nc, data)
+    thetas::Vector{Vector{Float64}} = Vector{Vector{Float64}}()
+    on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
+        if isnothing(n)
+            # @assert first_element == last_element
+            push!(thetas, zeros(Float64, nc))
+        else
+            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
+            for theta in eachrow(n.thetas)
+                push!(thetas, theta)
+            end
+        end
+    end
+    bc = BitCircuit(lc, data; on_decision)
+    ParamBitCircuit(bc, permutedims(hcat(params...), (2, 1)))
+end
\ No newline at end of file
diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
new file mode 100644
index 00000000..f13dceda
--- /dev/null
+++ b/src/Logistic/parameters.jl
@@ -0,0 +1,116 @@
+export learn_parameters
+
+using CUDA
+using LoopVectorization: @avx, vifelse
+
+"""
+Parameter learning through gradient descents
+"""
+function learn_parameters(lc::LogisticCircuit, nc::Int, data, labels; num_epochs=25, step_size=0.01)
+    bc = ParamBitCircuit(lc, nc, data)
+    labels = one_hot(labels, nc)
+    if isgpu(data)
+        for _ = 1:num_epochs
+            cl = class_likelihood_per_instance(bc, data)
+            update_parameters_gpu(to_gpu(bc), cl, to_gpu(labels), step_size)
+        end
+    else
+        for _ = 1:num_epochs
+            cl = class_likelihood_per_instance(bc, data)
+            update_parameters_cpu(bc, cw, labels, step_size)
+        end
+    end
+end
+
+function update_parameters_cpu(bc, cl, labels, step_size)
+    ne::Int = num_examples(data)
+    nc::Int = size(bc.params, 2)
+    params_lock::Threads.ReentrantLock = Threads.ReentrantLock()
+
+    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
+        lock(cw_lock) do # TODO: move lock to inner loop?
+            for i = 1:size(flows, 1)
+                @inbounds edge_flow = values[i, p] & values[i, s] & flows[i, dec_id]
+                first_true_bit = trailing_zeros(edge_flow) + 1
+                last_true_bit = 64 - leading_zeros(edge_flow)
+                @simd for j = first_true_bit:last_true_bit
+                    if get_bit(edge_flow, j)
+                        ex_id = ((i-1) << 6) + j
+                        for class = 1:nc
+                            @inbounds bc.params[el_id, class] -= (cl[ex_id, class] - labels[ex_id, class]) * step_size
+                        end
+                    end
+                end
+            end
+        end
+    end
+    
+    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
+        if els_start != els_end
+            lock(cw_lock) do # TODO: move lock to inner loop?
+                @avx for i = 1:size(flows, 1)
+                    @inbounds edge_flow = values[i, p] * values[i, s] / values[i, dec_id] * flows[i, dec_id]
+                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(Float32))
+                    for class = 1:nc
+                        @inbounds bc.parames[el_id, class] -= (cl[i, class] - labels[i, class]) * edge_flow * step_size
+                    end
+                end
+            end
+        end
+        nothing
+    end
+end
+
+function update_parameters_gpu(bc, cl, labels, step_size)
+    ne::Int = num_examples(data)
+    nc::Int = size(bc.params, 2)
+    cl_device = CUDA.cudaconvert(cl)
+    labels = CUDA.cudaconvert(labels)
+    params_device = CUDA.cudaconvert(bc.params)
+
+    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, chunk_id, edge_flow)
+        if els_start != els_end
+            first_true_bit = 1 + trailing_zeros(edge_flow)
+            last_true_bit = 64 - leading_zeros(edge_flow)
+            for j = first_true_bit:last_true_bit
+                if get_bit(edge_flow, j)
+                    ex_id = ((chunk_id-1) << 6) + j
+                    for class = 1:nc
+                        CUDA.@atomic params_device[el_id, class] -= (cl_device[ex_id, class] - labels[ex_id, class]) * step_size
+                    end
+            end
+        end
+        nothing 
+    end
+
+    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
+        if els_start != els_end
+            for class = 1:nc
+                CUDA.@atomic params_device[el_id, class] -= (cl_device[ex_id, class] - lables[ex_id, class]) * edge_flow * step_size
+            end
+        end      
+        nothing
+    end
+
+    if isbinarydata()
+        v,f = compute_values_flows(bc, data; on_edge = on_edge_binary) 
+    else
+        @assert isfpdata(data) "Only floating point and binary data are supported"
+        v,f = compute_values_flows(bc, data; on_edge = on_edge_float)
+    end
+    CUDA.unsafe_free!(v) # save the GC some effort
+    CUDA.unsafe_free!(f) # save the GC some effort
+
+    nothing
+end
+
+
+
+function one_hot(labels::Vector, nc::Integer)    
+    ne = length(labels) 
+    one_hot_labels = zeros(Float32, ne, nc)
+    for (i, j) in enumerate(labels)
+        one_hot_labels[i, j + 1] = 1.0
+    end
+    one_hot_labels
+end
\ No newline at end of file
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 7ceba404..5a177851 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -4,45 +4,35 @@ using CUDA
 using LoopVectorization: @avx, vifelse
 
 
-
 """
 Class Conditional Probability
 """
-
-function bitcircuit_with_params(lc, nc, data)
-    params::Vector{Vector{Float64}} = Vector{Vector{Float64}}()
-    on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
-        if isnothing(n)
-            # @assert first_element == last_element
-            push!(params, zeros(Float64, nc))
-        else
-            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
-            for theta in eachrow(n.thetas)
-                push!(params, theta)
-            end
-        end
-    end
-    bc = BitCircuit(lc, data; on_decision)
-    (bc, permutedims(hcat(params...), (2, 1)))
-end
-
 function class_likelihood_per_instance(lc::LogicCircuit, nc::Int, data)    
     cw = class_weights_per_instance(lc, nc, data)
     isgpu(data) ? (@. 1.0 / (1.0 + exp(-cw))) : (@. @avx 1.0 / (1.0 + exp(-cw)))
 end
 
+function class_likelihood_per_instance(bc, data)
+    cw = class_likelihood_per_instance(bc, data)
+    isgpu(data) ? (@. 1.0 / (1.0 + exp(-cw))) : (@. @avx 1.0 / (1.0 + exp(-cw)))
+end
+
 function class_weights_per_instance(lc::LogisticCircuit, nc::Int, data)
-    bc, params = bitcircuit_with_params(lc, nc, data)
+    bc = ParamBitCircuit(lc, nc, data)
+    class_weights_per_instance(bc, data)
+end
+
+function class_weights_per_instance(bc, data)
     if isgpu(data)
-        class_weights_per_instance_gpu(to_gpu(bc), data, to_gpu(params))
+        class_weights_per_instance_gpu(to_gpu(bc), data)
     else
-        class_weights_per_instance_cpu(bc, data, params)
+        class_weights_per_instance_cpu(bc, data)
     end
 end
 
-function class_weights_per_instance_cpu(bc, data, params)
+function class_weights_per_instance_cpu(bc, data)
     ne::Int = num_examples(data)
-    nc::Int = size(params, 2)
+    nc::Int = size(bc.params, 2)
     cw::Matrix{Float64} = zeros(Float64, ne, nc)
     cw_lock::Threads.ReentrantLock = Threads.ReentrantLock()
  
@@ -56,8 +46,8 @@ function class_weights_per_instance_cpu(bc, data, params)
                     @simd for j = first_true_bit:last_true_bit
                         if get_bit(edge_flow, j)
                             ex_id = ((i-1) << 6) + j
-                            for class = 1:size(cw, 2)
-                                @inbounds cw[ex_id, class] += params[el_id, class]
+                            for class = 1:nc
+                                @inbounds cw[ex_id, class] += bc.params[el_id, class]
                             end
                         end
                     end
@@ -73,8 +63,8 @@ function class_weights_per_instance_cpu(bc, data, params)
                 @avx for i = 1:size(flows, 1)
                     @inbounds edge_flow = values[i, p] * values[i, s] / values[i, dec_id] * flows[i, dec_id]
                     edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(Float32))
-                    for class = 1:size(cw, 2)
-                        @inbounds cw[i, class] += edge_flow * params[el_id, class]
+                    for class = 1:nc
+                        @inbounds cw[i, class] += edge_flow * bc.params[el_id, class]
                     end
                 end
             end
@@ -91,21 +81,21 @@ function class_weights_per_instance_cpu(bc, data, params)
     return cw
 end
 
-function class_weights_per_instance_gpu(bc, data, params)
+function class_weights_per_instance_gpu(bc, data)
     ne::Int = num_examples(data)
-    nc::Int = size(params, 2)
+    nc::Int = size(bc.params, 2)
     cw::CuMatrix{Float64} = CUDA.zeros(Float64, num_examples(data), nc)
     cw_device = CUDA.cudaconvert(cw)
-    params_device = CUDA.cudaconvert(params)
+    params_device = CUDA.cudaconvert(bc.params)
 
     @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, chunk_id, edge_flow)
         if els_start != els_end
-            first_true_bit = 1+trailing_zeros(edge_flow)
-            last_true_bit = 64-leading_zeros(edge_flow)
+            first_true_bit = 1 + trailing_zeros(edge_flow)
+            last_true_bit = 64 - leading_zeros(edge_flow)
             for j = first_true_bit:last_true_bit
                 if get_bit(edge_flow, j)
                     ex_id = ((chunk_id-1) << 6) + j
-                    for class = 1:size(cw_device, 2)
+                    for class = 1:nc
                         CUDA.@atomic cw_device[ex_id, class] += params_device[el_id, class]
                     end
                 end
@@ -116,7 +106,7 @@ function class_weights_per_instance_gpu(bc, data, params)
 
     @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
         if els_start != els_end
-            for class = 1:size(cw_device, 2)
+            for class = 1:nc
                 CUDA.@atomic cw_device[ex_id, class] += edge_flow * params_device[el_id, class]
             end
         end
@@ -155,11 +145,11 @@ end
 """
 Prediction accuracy
 """
-accuracy(lc::LogisticCircuit, nc::Int, data, labels) = 
+accuracy(lc::LogisticCircuit, nc::Int, data, labels::Vector) = 
     accuracy(predict_class(lc, nc, data), labels)
 
-accuracy(predicted_class, labels) = 
+accuracy(predicted_class::Vector, labels::Vector) = 
     Float64(sum(@. predicted_class == labels)) / length(labels)
 
-accuracy(class_likelihoods, labels) = 
+accuracy(class_likelihoods::Matrix, labels::Vector) = 
     accuracy(predict_class(class_likelihoods), labels)

From d5a0b09018e02ee415ec82c0f262311416df26de Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 4 Sep 2020 21:33:57 -0500
Subject: [PATCH 089/131] [fix] missing partial commit

---
 src/Logistic/logistic_nodes.jl |  2 +-
 src/Logistic/parameters.jl     | 13 ++++++++++++-
 2 files changed, 13 insertions(+), 2 deletions(-)

diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index d22580b7..099e51e7 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -1,5 +1,5 @@
 export 
-    LogisticCircuit, ParamBitCircuit,
+    LogisticCircuit,
     LogisticLeafNode, LogisticInnerNode, 
     LogisticLiteral, Logistic⋀Node, Logistic⋁Node,
     num_classes, num_parameters_per_class
diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
index f13dceda..5b548c52 100644
--- a/src/Logistic/parameters.jl
+++ b/src/Logistic/parameters.jl
@@ -59,8 +59,18 @@ function update_parameters_cpu(bc, cl, labels, step_size)
         end
         nothing
     end
+
+    if isbinarydata(data)
+        v,f = compute_values_flows(bc, data; on_edge = on_edge_binary) 
+    else
+        @assert isfpdata(data) "Only floating point and binary data are supported"
+        v,f = compute_values_flows(bc, data; on_edge = on_edge_float)
+    end
+
+    nothing
 end
 
+
 function update_parameters_gpu(bc, cl, labels, step_size)
     ne::Int = num_examples(data)
     nc::Int = size(bc.params, 2)
@@ -78,6 +88,7 @@ function update_parameters_gpu(bc, cl, labels, step_size)
                     for class = 1:nc
                         CUDA.@atomic params_device[el_id, class] -= (cl_device[ex_id, class] - labels[ex_id, class]) * step_size
                     end
+                end
             end
         end
         nothing 
@@ -92,7 +103,7 @@ function update_parameters_gpu(bc, cl, labels, step_size)
         nothing
     end
 
-    if isbinarydata()
+    if isbinarydata(data)
         v,f = compute_values_flows(bc, data; on_edge = on_edge_binary) 
     else
         @assert isfpdata(data) "Only floating point and binary data are supported"

From 74ecc195670f93fef0eb698d33bd938719da5e0e Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 4 Sep 2020 23:24:59 -0500
Subject: [PATCH 090/131] [fix] typo

---
 src/Logistic/logistic_nodes.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/Logistic/logistic_nodes.jl b/src/Logistic/logistic_nodes.jl
index 099e51e7..5d3f957e 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/Logistic/logistic_nodes.jl
@@ -112,5 +112,5 @@ function ParamBitCircuit(lc::LogisticCircuit, nc, data)
         end
     end
     bc = BitCircuit(lc, data; on_decision)
-    ParamBitCircuit(bc, permutedims(hcat(params...), (2, 1)))
+    ParamBitCircuit(bc, permutedims(hcat(thetas...), (2, 1)))
 end
\ No newline at end of file

From 7ededfbf7a3b5bd2a30f6f05ca9f18fac04452af Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Fri, 4 Sep 2020 23:56:42 -0500
Subject: [PATCH 091/131] [refactoring] move lc nodes out of submodule

---
 src/Logistic/Logistic.jl             |  2 +-
 src/Logistic/learn_parameters.jl     | 49 ----------------------------
 src/ProbabilisticCircuits.jl         |  6 +++-
 src/{Logistic => }/logistic_nodes.jl | 22 -------------
 src/param_bit_circuit.jl             | 21 ++++++++++++
 5 files changed, 27 insertions(+), 73 deletions(-)
 delete mode 100644 src/Logistic/learn_parameters.jl
 rename src/{Logistic => }/logistic_nodes.jl (76%)

diff --git a/src/Logistic/Logistic.jl b/src/Logistic/Logistic.jl
index 69afd0a4..e36fcb59 100644
--- a/src/Logistic/Logistic.jl
+++ b/src/Logistic/Logistic.jl
@@ -1,8 +1,8 @@
 module Logistic
 
 using LogicCircuits
+using ...ProbabilisticCircuits
 
-include("logistic_nodes.jl")
 include("queries.jl")
 include("parameters.jl")
 
diff --git a/src/Logistic/learn_parameters.jl b/src/Logistic/learn_parameters.jl
deleted file mode 100644
index 1bb8219c..00000000
--- a/src/Logistic/learn_parameters.jl
+++ /dev/null
@@ -1,49 +0,0 @@
-export learn_parameters
-
-using LogicCircuits: compute_flows, or_nodes
-using LoopVectorization: @avx
-
-"""
-Maximum likilihood estimation of parameters given data through gradient descent
-"""
-function learn_parameters(lc::LogisticCircuit, classes::Int, data, labels; num_epochs=30, step_size=0.1, flows_computed=false)
-
-    @inline function one_hot(labels::Vector, classes::Int)        
-        one_hot_labels = zeros(length(labels), classes)
-        for (i, j) in enumerate(labels)
-            one_hot_labels[i, j] = 1.0
-        end
-        one_hot_labels
-    end
-
-    one_hot_labels = one_hot(labels, classes)
-    if !flows_computed
-        compute_flows(lc, data)
-    end
-
-    for _ = 1:num_epochs
-        class_probs = class_likelihood_per_instance(lc, classes, data; flows_computed=true)
-        update_parameters(lc, class_probs, one_hot_labels)
-    end
-
-    nothing
-end
-
-
-@inline function update_parameters(lc::LogisticCircuit, class_probs, one_hot_labels; step_size=0.1)
-    num_samples = Float64(size(one_hot_labels)[1])
-    error = class_probs .- one_hot_labels
-    
-    foreach(or_nodes(lc)) do ln
-        foreach(eachrow(ln.thetas), children(ln)) do theta, c
-            flow = Float64.(downflow(ln, c))
-            @avx update_amount = flow' * error / num_samples * step_size
-            update_amount = dropdims(update_amount; dims=1)
-            @avx @. theta -= update_amount
-        end
-    end
-    
-    nothing
-end
-
-
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 01e6e11c..62e3fb4d 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -12,13 +12,17 @@ include("Utils/Utils.jl")
 
 include("abstract_prob_nodes.jl")
 include("plain_prob_nodes.jl")
+include("structured_prob_nodes.jl")
+include("logistic_nodes.jl")
 include("param_bit_circuit.jl")
 include("parameters.jl")
-include("structured_prob_nodes.jl")
 
 include("queries/likelihood.jl")
 include("queries/marginal_flow.jl")
 
+include("Logistic/Logistic.jl")
+@reexport using .Logistic
+
 # include("exp_flows.jl")
 # include("queries.jl")
 # include("informations.jl")
diff --git a/src/Logistic/logistic_nodes.jl b/src/logistic_nodes.jl
similarity index 76%
rename from src/Logistic/logistic_nodes.jl
rename to src/logistic_nodes.jl
index 5d3f957e..158bb685 100644
--- a/src/Logistic/logistic_nodes.jl
+++ b/src/logistic_nodes.jl
@@ -91,26 +91,4 @@ function LogisticCircuit(circuit::LogicCircuit, classes::Int)
     f_a(n, cn) = Logistic⋀Node(cn)
     f_o(n, cn) = Logistic⋁Node(cn, classes)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, LogisticCircuit)
-end
-
-
-
-"""
-Construct a `BitCircuit` while storing edge parameters in a separate array
-"""
-function ParamBitCircuit(lc::LogisticCircuit, nc, data)
-    thetas::Vector{Vector{Float64}} = Vector{Vector{Float64}}()
-    on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
-        if isnothing(n)
-            # @assert first_element == last_element
-            push!(thetas, zeros(Float64, nc))
-        else
-            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
-            for theta in eachrow(n.thetas)
-                push!(thetas, theta)
-            end
-        end
-    end
-    bc = BitCircuit(lc, data; on_decision)
-    ParamBitCircuit(bc, permutedims(hcat(thetas...), (2, 1)))
 end
\ No newline at end of file
diff --git a/src/param_bit_circuit.jl b/src/param_bit_circuit.jl
index 6f4a685e..ed143d38 100644
--- a/src/param_bit_circuit.jl
+++ b/src/param_bit_circuit.jl
@@ -20,6 +20,10 @@ to_gpu(c::ParamBitCircuit) =
 to_cpu(c::ParamBitCircuit) = 
     ParamBitCircuit(to_cpu(c.bitcircuit), to_cpu(c.params))
 
+
+"""
+Construct a `BitCircuit` while storing edge parameters in a separate array
+"""
 function ParamBitCircuit(pc::ProbCircuit, data)
     logprobs::Vector{Float64} = Vector{Float64}()
     on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
@@ -34,3 +38,20 @@ function ParamBitCircuit(pc::ProbCircuit, data)
     bc = BitCircuit(pc, data; on_decision)
     ParamBitCircuit(bc, logprobs)
 end
+
+function ParamBitCircuit(lc::LogisticCircuit, nc, data)
+    thetas::Vector{Vector{Float64}} = Vector{Vector{Float64}}()
+    on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
+        if isnothing(n)
+            # @assert first_element == last_element
+            push!(thetas, zeros(Float64, nc))
+        else
+            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
+            for theta in eachrow(n.thetas)
+                push!(thetas, theta)
+            end
+        end
+    end
+    bc = BitCircuit(lc, data; on_decision)
+    ParamBitCircuit(bc, permutedims(hcat(thetas...), (2, 1)))
+end

From c8d51a22f9eafc0050b9bddfd8679cd1d47aea5d Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Sat, 5 Sep 2020 00:04:27 -0500
Subject: [PATCH 092/131] [rename] api name changes

---
 src/Logistic/parameters.jl | 8 ++++----
 src/Logistic/queries.jl    | 8 ++++----
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
index 5b548c52..dbb19430 100644
--- a/src/Logistic/parameters.jl
+++ b/src/Logistic/parameters.jl
@@ -61,10 +61,10 @@ function update_parameters_cpu(bc, cl, labels, step_size)
     end
 
     if isbinarydata(data)
-        v,f = compute_values_flows(bc, data; on_edge = on_edge_binary) 
+        v,f = satisfies_flows(bc, data; on_edge = on_edge_binary) 
     else
         @assert isfpdata(data) "Only floating point and binary data are supported"
-        v,f = compute_values_flows(bc, data; on_edge = on_edge_float)
+        v,f = satisfies_flows(bc, data; on_edge = on_edge_float)
     end
 
     nothing
@@ -104,10 +104,10 @@ function update_parameters_gpu(bc, cl, labels, step_size)
     end
 
     if isbinarydata(data)
-        v,f = compute_values_flows(bc, data; on_edge = on_edge_binary) 
+        v,f = satisfies_flows(bc, data; on_edge = on_edge_binary) 
     else
         @assert isfpdata(data) "Only floating point and binary data are supported"
-        v,f = compute_values_flows(bc, data; on_edge = on_edge_float)
+        v,f = satisfies_flows(bc, data; on_edge = on_edge_float)
     end
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 5a177851..a0e65602 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -73,9 +73,9 @@ function class_weights_per_instance_cpu(bc, data)
     end
 
     if isbinarydata(data)
-        compute_values_flows(bc, data; on_edge = on_edge_binary)
+        satisfies_flows(bc, data; on_edge = on_edge_binary)
     else
-        compute_values_flows(bc, data; on_edge = on_edge_float)
+        satisfies_flows(bc, data; on_edge = on_edge_float)
     end
 
     return cw
@@ -114,10 +114,10 @@ function class_weights_per_instance_gpu(bc, data)
     end
     
     if isbinarydata(data)
-        v,f = compute_values_flows(bc, data; on_edge = on_edge_binary)
+        v,f = satisfies_flows(bc, data; on_edge = on_edge_binary)
     else
         @assert isfpdata(data) "Only floating point and binary data are supported"
-        v,f = compute_values_flows(bc, data; on_edge = on_edge_float)
+        v,f = satisfies_flows(bc, data; on_edge = on_edge_float)
     end
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort

From d17f264479ec23b1e9d4f458f3cd353c17f4d7e7 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 6 Sep 2020 01:10:54 -0500
Subject: [PATCH 093/131] fixes for CPU parameter estimation

---
 src/ProbabilisticCircuits.jl |   4 +-
 src/parameters.jl            |  36 ++--
 src/queries/marginal_flow.jl | 360 ++++++++++++++---------------------
 3 files changed, 170 insertions(+), 230 deletions(-)

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 01e6e11c..8b6012ae 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -16,8 +16,8 @@ include("param_bit_circuit.jl")
 include("parameters.jl")
 include("structured_prob_nodes.jl")
 
-include("queries/likelihood.jl")
-include("queries/marginal_flow.jl")
+# include("queries/likelihood.jl")
+# include("queries/marginal_flow.jl")
 
 # include("exp_flows.jl")
 # include("queries.jl")
diff --git a/src/parameters.jl b/src/parameters.jl
index 492b0a90..d977c451 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -20,7 +20,7 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
             if num_children(pn) == 1
                 pn.log_probs .= zero(Float64)
             else
-                id = (pn.data::⋁NodeId).node_id
+                id = (pn.data::⋁NodeIds).node_id
                 @inbounds els_start = bc.nodes[1,id]
                 @inbounds els_end = bc.nodes[2,id]
                 @inbounds @views pn.log_probs .= params[els_start:els_end]
@@ -37,29 +37,41 @@ function estimate_parameters_cpu(bc, data, pseudocount)
     node_counts::Vector{UInt} = Vector{UInt}(undef, num_nodes(bc))
     log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
 
-    @inline function on_node(flows, values, dec_id, els_start, els_end, locks)
-        if els_start != els_end
+    @inline function on_node(flows, values, dec_id)
+        if !has_single_child(bc.nodes, dec_id)
             @inbounds node_counts[dec_id] = sum(1:size(flows,1)) do i
                 count_ones(flows[i, dec_id]) 
             end
         end
-        nothing
+    end
+
+    @inline function estimate(el_id, parent, edge_count)
+        num_els = num_elements(bc.nodes, parent)
+        @inbounds log_params[el_id] = 
+            log((edge_count+pseudocount/num_els)
+                   /(node_counts[parent]+pseudocount))
     end
     
-    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
-        if els_start != els_end
+    @inline function on_edge(flows, values, dec_id, par, grandpa)
+        if !has_single_child(bc.nodes, grandpa)
             edge_count = sum(1:size(flows,1)) do i
-                @inbounds count_ones(values[i, p] & values[i, s] & flows[i, dec_id]) 
+                @inbounds count_ones(flows[i, grandpa]) 
             end
-            # TODO do the log before the division?
-            log_param = log((edge_count+pseudocount/(els_end-els_start+1))
-                            /(node_counts[dec_id]+pseudocount))
-            @inbounds log_params[el_id] = log_param
+            estimate(par, grandpa, edge_count)
+        end
+    end
+
+    @inline function on_edge(flows, values, dec_id, par, grandpa, sib_id)
+        if !has_single_child(bc.nodes, grandpa)
+            edge_count = sum(1:size(flows,1)) do i
+                @inbounds count_ones(values[i, dec_id] & values[i, sib_id] & flows[i, grandpa]) 
+            end
+            estimate(par, grandpa, edge_count)
         end
-        nothing
     end
 
     satisfies_flows(bc, data; on_node, on_edge)
+
     return log_params
 end
 
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index 349c75a1..ef23a059 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -148,219 +148,147 @@ function marginal_layers_cuda(layer, nodes, elements, params, values)
 end
 
 
-# export evaluate_exp, compute_exp_flows, get_downflow, get_upflow, get_exp_downflow, get_exp_upflow
-
-
-
-# # TODO move to LogicCircuits
-# # TODO downflow struct
-# using LogicCircuits: materialize, UpFlow, UpDownFlow, UpDownFlow1, UpDownFlow2
-
-# """
-# Get upflow from logic circuit
-# """
-# @inline get_upflow(n::LogicCircuit) = get_upflow(n.data)
-# @inline get_upflow(elems::UpDownFlow1) = elems.upflow
-# @inline get_upflow(elems::UpFlow) = materialize(elems)
-
-# """
-# Get the node/edge flow from logic circuit
-# """
-# function get_downflow(n::LogicCircuit; root=nothing)::BitVector
-#     downflow(x::UpDownFlow1) = x.downflow
-#     downflow(x::UpDownFlow2) = begin
-#         ors = or_nodes(root)
-#         p = findall(p -> n in children(p), ors)
-#         @assert length(p) == 1
-#         get_downflow(ors[p[1]], n)
-#     end
-#     downflow(n.data)
-# end
-
-# function get_downflow(n::LogicCircuit, c::LogicCircuit)::BitVector
-#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-#     get_downflow(n) .& get_upflow(c)
-# end
-
-# #####################
-# # performance-critical queries related to circuit flows
-# #####################
-
-# "Container for circuit flows represented as a float vector"
-# const ExpUpFlow1 = Vector{Float64}
-
-# "Container for circuit flows represented as an implicit conjunction of a prime and sub float vector (saves memory allocations in circuits with many binary conjunctions)"
-# struct ExpUpFlow2
-#     prime_flow::Vector{Float64}
-#     sub_flow::Vector{Float64}
-# end
-
-# const ExpUpFlow = Union{ExpUpFlow1,ExpUpFlow2}
-
-# @inline ExpUpFlow1(elems::ExpUpFlow1) = elems
-# @inline ExpUpFlow1(elems::ExpUpFlow2) = elems.prime_flow .+ elems.sub_flow
-
-# function evaluate_exp(root::ProbCircuit, data;
-#                    nload = nload, nsave = nsave, reset=true)::Vector{Float64}
-#     n_ex::Int = num_examples(data)
-#     ϵ = 0.0
-
-#     @inline f_lit(n) = begin
-#         uf = convert(Vector{Int8}, feature_values(data, variable(n)))
-#         if ispositive(n)
-#             uf[uf.==-1] .= 1
-#         else
-#             uf .= 1 .- uf
-#             uf[uf.==2] .= 1
-#         end
-#         uf = convert(Vector{Float64}, uf)
-#         uf .= log.(uf .+ ϵ)
-#     end
-    
-#     @inline f_con(n) = begin
-#         uf = istrue(n) ? ones(Float64, n_ex) : zeros(Float64, n_ex)
-#         uf .= log.(uf .+ ϵ)
-#     end
-    
-#     @inline fa(n, call) = begin
-#         if num_children(n) == 1
-#             return ExpUpFlow1(call(@inbounds children(n)[1]))
-#         else
-#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
-#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
-#             if num_children(n) == 2 && c1 isa ExpUpFlow1 && c2 isa ExpUpFlow1 
-#                 return ExpUpFlow2(c1, c2) # no need to allocate a new BitVector
-#             end
-#             x = flowop(c1, c2, +)
-#             for c in children(n)[3:end]
-#                 accumulate(x, call(c), +)
-#             end
-#             return x
-#         end
-#     end
-    
-#     @inline fo(n, call) = begin
-#         if num_children(n) == 1
-#             return ExpUpFlow1(call(@inbounds children(n)[1]))
-#         else
-#             log_probs = n.log_probs
-#             c1 = call(@inbounds children(n)[1])::ExpUpFlow
-#             c2 = call(@inbounds children(n)[2])::ExpUpFlow
-#             x = flowop(c1, log_probs[1], c2, log_probs[2], logsumexp)
-#             for (i, c) in enumerate(children(n)[3:end])
-#                 accumulate(x, call(c), log_probs[i+2], logsumexp)
-#             end
-#             return x
-#         end
-#     end
-    
-#     # ensure flow us Flow1 at the root, even when it's a conjunction
-#     root_flow = ExpUpFlow1(foldup(root, f_con, f_lit, fa, fo, ExpUpFlow; nload, nsave, reset))
-#     return nsave(root, root_flow)
-# end
-
-# @inline flowop(x::ExpUpFlow, y::ExpUpFlow, op)::ExpUpFlow1 =
-#     op.(ExpUpFlow1(x), ExpUpFlow1(y))
-
-# @inline flowop(x::ExpUpFlow, w1::Float64, y::ExpUpFlow, w2::Float64, op)::ExpUpFlow1 =
-#     op.(ExpUpFlow1(x) .+ w1, ExpUpFlow1(y) .+ w2)
-
-# import Base.accumulate
-# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, op) = 
-#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v)); nothing
-
-# @inline accumulate(x::ExpUpFlow1, v::ExpUpFlow, w::Float64, op) = 
-#     @inbounds @. x = op($ExpUpFlow1(x), $ExpUpFlow1(v) + w); nothing
-
-
-# #####################
-# # downward pass
-# #####################
-
-# struct ExpUpDownFlow1
-#     upflow::ExpUpFlow1
-#     downflow::Vector{Float64}
-#     ExpUpDownFlow1(upf::ExpUpFlow1) = new(upf, log.(zeros(Float64, length(upf)) .+ 1e-300))
-# end
-
-# const ExpUpDownFlow2 = ExpUpFlow2
-
-# const ExpUpDownFlow = Union{ExpUpDownFlow1, ExpUpDownFlow2}
-
-
-# function compute_exp_flows(circuit::ProbCircuit, data)
-
-#     # upward pass
-#     @inline upflow!(n, v) = begin
-#         n.data = (v isa ExpUpFlow1) ? ExpUpDownFlow1(v) : v
-#         v
-#     end
-
-#     @inline upflow(n) = begin
-#         d = n.data::ExpUpDownFlow
-#         (d isa ExpUpDownFlow1) ? d.upflow : d
-#     end
-
-#     evaluate_exp(circuit, data; nload=upflow, nsave=upflow!, reset=false)
-    
-#     # downward pass
-
-#     @inline downflow(n) = (n.data::ExpUpDownFlow1).downflow
-#     @inline isfactorized(n) = n.data::ExpUpDownFlow isa ExpUpDownFlow2
-
-#     downflow(circuit) .= 0.0
-
-#     foreach_down(circuit; setcounter=false) do n
-#         if isinner(n) && !isfactorized(n)
-#             downflow_n = downflow(n)
-#             upflow_n = upflow(n)
-#             for ite in 1 : num_children(n)
-#                 c = children(n)[ite]
-#                 log_theta = is⋀gate(n) ? 0.0 : n.log_probs[ite]
-#                 if isfactorized(c)
-#                     upflow2_c = c.data::ExpUpDownFlow2
-#                     # propagate one level further down
-#                     for i = 1:2
-#                         downflow_c = downflow(@inbounds children(c)[i])
-#                         accumulate(downflow_c, downflow_n .+ log_theta .+ upflow2_c.prime_flow 
-#                         .+ upflow2_c.sub_flow .- upflow_n, logsumexp)
-#                     end
-#                 else
-#                     upflow1_c = (c.data::ExpUpDownFlow1).upflow
-#                     downflow_c = downflow(c)
-#                     accumulate(downflow_c, downflow_n .+ log_theta .+ upflow1_c .- upflow_n, logsumexp)
-#                 end
-#             end 
-#         end
-#         nothing
-#     end
-#     nothing
-# end
-
-
-# """
-# Get upflow of a probabilistic circuit
-# """
-# @inline get_exp_upflow(pc::ProbCircuit) = get_exp_upflow(pc.data)
-# @inline get_exp_upflow(elems::ExpUpDownFlow1) = elems.upflow
-# @inline get_exp_upflow(elems::ExpUpFlow) = ExpUpFlow1(elems)
-
-# """
-# Get the node/edge downflow from probabilistic circuit
-# """
-# function get_exp_downflow(n::ProbCircuit; root=nothing)::Vector{Float64}
-#     downflow(x::ExpUpDownFlow1) = x.downflow
-#     downflow(x::ExpUpDownFlow2) = begin
-#         ors = or_nodes(root)
-#         p = findall(p -> n in children(p), ors)
-#         @assert length(p) == 1
-#         get_exp_downflow(ors[p[1]], n)
-#     end
-#     downflow(n.data)
-# end
-
-# function get_exp_downflow(n::ProbCircuit, c::ProbCircuit)::Vector{Float64}
-#     @assert !is⋁gate(c) && is⋁gate(n) && c in children(n)
-#     log_theta = n.log_probs[findfirst(x -> x == c, children(n))]
-#     return get_exp_downflow(n) .+ log_theta .+ get_exp_upflow(c) .- get_exp_upflow(n)
-# end
\ No newline at end of file
+
+#####################
+# Bit circuit values and flows (up and downward pass)
+#####################
+
+"Compute the value and flow of each node"
+function marginal_flows(circuit::ProbCircuit, data, 
+    reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop) 
+    bc = same_device(ProbBitCircuit(circuit, data), data)
+    marginal_flows(bc, data, reuse_values, reuse_flows; on_node, on_edge)
+end
+
+function marginal_flows(circuit::ParamBitCircuit, data, 
+            reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop)
+    values = marginal_all(circuit, data, reuse_values)
+    flows = marginal_flows_down(circuit, values, reuse_flows; on_node, on_edge)
+    return values, flows
+end
+
+#####################
+# Bit circuit flows downward pass
+#####################
+
+"When marginals at nodes have already been computed, do a downward pass computing the marginal flows at each node"
+function marginal_flows_down(circuit::ParamBitCircuit, values, reuse=nothing; on_node=noop, on_edge=noop)
+    flows = similar!(reuse, typeof(values), size(values)...)
+    init_marginal_flows(flows, values)
+    marginal_flows_down_layers(circuit, flows, values, on_node, on_edge)
+    return flows
+end
+
+function init_marginal_flows(flows::AbstractArray{F}, values::AbstractArray{F}) where F
+    flows .= zero(F)
+    @views flows[:,end] .= values[:,end] # set flow at root
+end
+
+# downward pass helpers on CPU
+
+function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::Matrix, values::Matrix, on_node, on_edge)
+    els = circuit.bitcircuit.elements
+    locks = [Threads.ReentrantLock() for i=1:num_nodes(circuit)]    
+    for layer in Iterators.reverse(circuit.bitcircuit.layers)
+        Threads.@threads for dec_id in layer
+            els_start = @inbounds circuit.bitcircuit.nodes[1,dec_id]
+            els_end = @inbounds circuit.bitcircuit.nodes[2,dec_id]
+            on_node(flows, values, dec_id, els_start, els_end, locks)
+            #TODO do something faster when els_start == els_end?
+            for j = els_start:els_end
+                p = els[2,j]
+                s = els[3,j]
+                θ = circuit.params[j]
+                accum_marginal_flow(flows, values, dec_id, p, s, θ, locks)
+                on_edge(flows, values, dec_id, j, p, s, els_start, els_end, locks)
+            end
+        end
+    end
+end
+
+function accum_marginal_flow(f::Matrix{<:AbstractFloat}, v, d, p, s, θ, locks)
+    # retrieve locks in index order to avoid deadlock
+    l1, l2 = order_asc(p,s)
+    lock(locks[l1]) do 
+        lock(locks[l2]) do 
+            # note: in future, if there is a need to scale to many more threads, it would be beneficial to avoid this synchronization by ordering downward pass layers by child id, not parent id, so that there is no contention when processing a single layer and no need for synchronization, as in the upward pass
+            @avx for j in 1:size(f,1)
+                edge_flow = v[j, p] + v[j, s] - v[j, d] + f[j, d] + θ
+                edge_flow = vifelse(isfinite(edge_flow), edge_flow, log(zero(Float32)))
+                x = f[j, p]
+                y = edge_flow
+                Δ = ifelse(x == y, zero(Float64), abs(x - y))
+                @inbounds f[j,p] = max(x, y) + log1p(exp(-Δ))
+                x = f[j, s]
+                Δ = ifelse(x == y, zero(Float64), abs(x - y))
+                @inbounds f[j,s] = max(x, y) + log1p(exp(-Δ))
+            end
+        end
+    end
+end
+
+
+# downward pass helpers on GPU
+
+"Pass flows down the layers of a bit circuit on the GPU"
+function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::CuMatrix, values::CuMatrix, on_node, on_edge; 
+            dec_per_thread = 4, log2_threads_per_block = 8)
+    bc = circuit.bitcircuit
+    CUDA.@sync for layer in Iterators.reverse(bc.layers)
+        num_examples = size(values, 1)
+        num_decision_sets = length(layer)/dec_per_thread
+        num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
+        num_blocks = (ceil(Int, num_examples/num_threads[1]), 
+                      ceil(Int, num_decision_sets/num_threads[2])) 
+        @cuda threads=num_threads blocks=num_blocks marginal_flows_down_layers_cuda(layer, bc.nodes, bc.elements, circuit.params, flows, values, on_node, on_edge)
+    end
+end
+
+"CUDA kernel for passing flows down circuit"
+function marginal_flows_down_layers_cuda(layer, nodes, elements, params, flows, values, on_node, on_edge)
+    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+    stride_x = blockDim().x * gridDim().x
+    stride_y = blockDim().y * gridDim().y
+    for k = index_x:stride_x:size(values,1)
+        for i = index_y:stride_y:length(layer) #TODO swap loops??
+            dec_id = @inbounds layer[i]
+            els_start = @inbounds nodes[1,dec_id]
+            els_end = @inbounds nodes[2,dec_id]
+            n_up = @inbounds values[k, dec_id]
+            on_node(flows, values, dec_id, els_start, els_end, k)
+            if !iszero(n_up) # on_edge will only get called when edge flows are non-zero
+                n_down = @inbounds flows[k, dec_id]
+                #TODO do something faster when els_start == els_end?
+                for j = els_start:els_end
+                    p = @inbounds elements[2,j]
+                    s = @inbounds elements[3,j]
+                    @inbounds edge_flow = values[k, p] + values[k, s] - n_up + n_down + params[j]
+                    # following needs to be memory safe, hence @atomic
+
+                    @inbounds y = values[j, elements[2,k]] + values[j, elements[3,k]] + params[k]
+                    Δ = ifelse(x == y, zero(Float64), CUDA.abs(x - y))
+                    x = max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
+
+                    
+                    accum_flow(flows, k, p, edge_flow)
+                    accum_flow(flows, k, s, edge_flow)
+
+
+                    
+                    on_edge(flows, values, dec_id, j, p, s, els_start, els_end, k, edge_flow)
+                end
+            end
+        end
+    end
+    return nothing
+end
+
+compute_edge_flow(p_up::AbstractFloat, s_up, n_up, n_down) = p_up * s_up / n_up * n_down
+compute_edge_flow(p_up::Unsigned, s_up, n_up, n_down) = p_up & s_up & n_down
+
+accum_flow(flows, j, e, edge_flow::AbstractFloat) = 
+    CUDA.@atomic flows[j, e] += edge_flow #atomic is automatically inbounds
+
+accum_flow(flows, j, e, edge_flow::Unsigned) = 
+    CUDA.@atomic flows[j, e] |= edge_flow #atomic is automatically inbounds

From 350ddfcb0dd45235095b4e52f9709af33a590adc Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 6 Sep 2020 14:52:16 -0500
Subject: [PATCH 094/131] fixed parameter estimation

---
 Project.toml      |  6 ++--
 src/parameters.jl | 78 ++++++++++++++++++++---------------------------
 2 files changed, 36 insertions(+), 48 deletions(-)

diff --git a/Project.toml b/Project.toml
index c61156e4..7b255547 100644
--- a/Project.toml
+++ b/Project.toml
@@ -12,9 +12,9 @@ LightGraphs = "093fc24a-ae57-5d10-9952-331d41423f4d"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 LogicCircuits = "a7847b3b-b7f1-4dd5-83c3-60e0aa0f8599"
 LoopVectorization = "bdcacae8-1622-11e9-2a5c-532679323890"
+MLDatasets = "eb30cadb-4394-5ae3-aed4-317e484a6458"
 MetaGraphs = "626554b9-1ddb-594c-aa3c-2596fe9399a5"
 Metis = "2679e427-3c69-5b7f-982b-ece356f1e94b"
-MLDatasets = "eb30cadb-4394-5ae3-aed4-317e484a6458"
 Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
 Printf = "de0858da-6303-5e67-8744-51eddeeeb8d7"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
@@ -33,12 +33,12 @@ DataFrames = "0.21"
 DataStructures = "0.17"
 LightGraphs = "1.3"
 LogicCircuits = "0.1.1"
+LoopVectorization = "0.8.20"
+MLDatasets = "0.4, 0.5"
 MetaGraphs = "0.6"
 Metis = "1.0"
-MLDatasets = "0.4, 0.5"
 Reexport = "0.2"
 SimpleWeightedGraphs = "1.1"
 StatsBase = "0.33"
 StatsFuns = "0.9"
-LoopVectorization = "0.8.20"
 julia = "1.5"
diff --git a/src/parameters.jl b/src/parameters.jl
index d977c451..3f115367 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -10,7 +10,7 @@ Maximum likilihood estimation of parameters given data
 function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     @assert isbinarydata(data) "Probabilistic circuit parameter estimation for binary data only"
     bc = BitCircuit(pc, data; reset=false)
-    params::Vector{Float64} = if isgpu(data)
+    params = if isgpu(data)
         estimate_parameters_gpu(to_gpu(bc), data, pseudocount)
     else
         estimate_parameters_cpu(bc, data, pseudocount)
@@ -38,39 +38,34 @@ function estimate_parameters_cpu(bc, data, pseudocount)
     log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
 
     @inline function on_node(flows, values, dec_id)
-        if !has_single_child(bc.nodes, dec_id)
-            @inbounds node_counts[dec_id] = sum(1:size(flows,1)) do i
+        # if !has_single_child(bc.nodes, dec_id)
+            node_counts[dec_id] = sum(1:size(flows,1)) do i
                 count_ones(flows[i, dec_id]) 
             end
-        end
+        # end
     end
 
-    @inline function estimate(el_id, parent, edge_count)
-        num_els = num_elements(bc.nodes, parent)
-        @inbounds log_params[el_id] = 
+    @inline function estimate(element, decision, edge_count)
+        num_els = num_elements(bc.nodes, decision)
+        log_params[element] = 
             log((edge_count+pseudocount/num_els)
-                   /(node_counts[parent]+pseudocount))
-    end
-    
-    @inline function on_edge(flows, values, dec_id, par, grandpa)
-        if !has_single_child(bc.nodes, grandpa)
-            edge_count = sum(1:size(flows,1)) do i
-                @inbounds count_ones(flows[i, grandpa]) 
-            end
-            estimate(par, grandpa, edge_count)
-        end
+                   /(node_counts[decision]+pseudocount))
     end
 
-    @inline function on_edge(flows, values, dec_id, par, grandpa, sib_id)
-        if !has_single_child(bc.nodes, grandpa)
-            edge_count = sum(1:size(flows,1)) do i
-                @inbounds count_ones(values[i, dec_id] & values[i, sib_id] & flows[i, grandpa]) 
+    @inline function on_edge(flows, values, prime, sub, element, grandpa, single_child)
+        edge_count = if single_child
+            sum(1:size(flows,1)) do i
+                count_ones(flows[i, grandpa]) 
+            end
+        else
+            sum(1:size(flows,1)) do i
+                count_ones(values[i, prime] & values[i, sub] & flows[i, grandpa]) 
             end
-            estimate(par, grandpa, edge_count)
         end
+        estimate(element, grandpa, edge_count)
     end
 
-    satisfies_flows(bc, data; on_node, on_edge)
+    v, f = satisfies_flows(bc, data; on_node, on_edge)
 
     return log_params
 end
@@ -78,42 +73,35 @@ end
 function estimate_parameters_gpu(bc, data, pseudocount)
     node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
     edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
-    params::CuVector{Float64} = CuVector{Float64}(undef, num_elements(bc))
     # need to manually cudaconvert closure variables
     node_counts_device = CUDA.cudaconvert(node_counts)
     edge_counts_device = CUDA.cudaconvert(edge_counts)
-    params_device = CUDA.cudaconvert(params)
     
-    @inline function on_node(flows, values, dec_id, els_start, els_end, ex_id)
-        if els_start != els_end
-            @inbounds c::Int32 = count_ones(flows[ex_id, dec_id]) # cast for @atomic to be happy
+    @inline function on_node(flows, values, dec_id, ex_id, flow)
+        # # # if els_start != els_end
+            c::Int32 = count_ones(flow) # cast for @atomic to be happy
             CUDA.@atomic node_counts_device[dec_id] += c
-        end
-        if isone(ex_id) # only do this once
-            for i=els_start:els_end
-                @inbounds params_device[i] = pseudocount/(els_end-els_start+1)
-            end
-        end
-        nothing
+        # # # end
     end
-    
-    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
-        if els_start != els_end
+
+    @inline function on_edge(flows, values, prime, sub, element, grandpa, ex_id, edge_flow, single_child)
+        # # # if els_start != els_end
             c::Int32 = count_ones(edge_flow) # cast for @atomic to be happy
-            CUDA.@atomic edge_counts_device[el_id] += c
-        end
-        nothing
+            CUDA.@atomic edge_counts_device[element] += c
+        # # # end
     end
 
     v, f = satisfies_flows(bc, data; on_node, on_edge)
+
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort
 
-    # TODO: reinstate following implementation once https://github.com/JuliaGPU/GPUArrays.jl/issues/313 is fixed and released
-    # parent_counts = @views node_counts[bc.elements[1,:]]
+    # TODO: reinstate simpler implementation once https://github.com/JuliaGPU/GPUArrays.jl/issues/313 is fixed and released
     @inbounds parents = bc.elements[1,:]
     @inbounds parent_counts = node_counts[parents]
-    params .= log.(params .+ edge_counts) .- log.(parent_counts .+ pseudocount)
+    @inbounds parent_elcount = bc.nodes[2,parents] .- bc.nodes[1,parents] .+ 1 
+    params = log.((edge_counts .+ (pseudocount ./ parent_elcount)) 
+                    ./ (parent_counts .+ pseudocount))
     return to_cpu(params)
 end
 
@@ -132,4 +120,4 @@ function uniform_parameters(pc::ProbCircuit)
     end
 end
 
-# TODO add em paramaters learning 
\ No newline at end of file
+# TODO add em parameter learning 
\ No newline at end of file

From 074c74295163e3af15f9e8526603563d1c124912 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 6 Sep 2020 15:18:39 -0500
Subject: [PATCH 095/131] fix likelihood computation

---
 src/ProbabilisticCircuits.jl |  2 +-
 src/parameters.jl            | 36 ++++++++++++++----------------------
 src/queries/likelihood.jl    | 16 ++++++++--------
 3 files changed, 23 insertions(+), 31 deletions(-)

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 8b6012ae..f7fbc191 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -16,7 +16,7 @@ include("param_bit_circuit.jl")
 include("parameters.jl")
 include("structured_prob_nodes.jl")
 
-# include("queries/likelihood.jl")
+include("queries/likelihood.jl")
 # include("queries/marginal_flow.jl")
 
 # include("exp_flows.jl")
diff --git a/src/parameters.jl b/src/parameters.jl
index 3f115367..39accebc 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -38,11 +38,9 @@ function estimate_parameters_cpu(bc, data, pseudocount)
     log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
 
     @inline function on_node(flows, values, dec_id)
-        # if !has_single_child(bc.nodes, dec_id)
-            node_counts[dec_id] = sum(1:size(flows,1)) do i
-                count_ones(flows[i, dec_id]) 
-            end
-        # end
+        node_counts[dec_id] = sum(1:size(flows,1)) do i
+            count_ones(flows[i, dec_id]) 
+        end
     end
 
     @inline function estimate(element, decision, edge_count)
@@ -53,16 +51,12 @@ function estimate_parameters_cpu(bc, data, pseudocount)
     end
 
     @inline function on_edge(flows, values, prime, sub, element, grandpa, single_child)
-        edge_count = if single_child
-            sum(1:size(flows,1)) do i
-                count_ones(flows[i, grandpa]) 
-            end
-        else
-            sum(1:size(flows,1)) do i
+        if !single_child
+            edge_count = sum(1:size(flows,1)) do i
                 count_ones(values[i, prime] & values[i, sub] & flows[i, grandpa]) 
             end
-        end
-        estimate(element, grandpa, edge_count)
+            estimate(element, grandpa, edge_count)
+        end # no need to estimate single child params, they are always prob 1
     end
 
     v, f = satisfies_flows(bc, data; on_node, on_edge)
@@ -77,18 +71,16 @@ function estimate_parameters_gpu(bc, data, pseudocount)
     node_counts_device = CUDA.cudaconvert(node_counts)
     edge_counts_device = CUDA.cudaconvert(edge_counts)
     
-    @inline function on_node(flows, values, dec_id, ex_id, flow)
-        # # # if els_start != els_end
-            c::Int32 = count_ones(flow) # cast for @atomic to be happy
-            CUDA.@atomic node_counts_device[dec_id] += c
-        # # # end
+    @inline function on_node(flows, values, dec_id, chunk_id, flow)
+        c::Int32 = CUDA.count_ones(flow) # cast for @atomic to be happy
+        CUDA.@atomic node_counts_device[dec_id] += c
     end
 
-    @inline function on_edge(flows, values, prime, sub, element, grandpa, ex_id, edge_flow, single_child)
-        # # # if els_start != els_end
-            c::Int32 = count_ones(edge_flow) # cast for @atomic to be happy
+    @inline function on_edge(flows, values, prime, sub, element, grandpa, chunk_id, edge_flow, single_child)
+        if !single_child
+            c::Int32 = CUDA.count_ones(edge_flow) # cast for @atomic to be happy
             CUDA.@atomic edge_counts_device[element] += c
-        # # # end
+        end
     end
 
     v, f = satisfies_flows(bc, data; on_node, on_edge)
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index 6c991ea9..9cb3d5fa 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -17,17 +17,17 @@ function log_likelihood_per_instance_cpu(bc, data)
     ll::Vector{Float64} = zeros(Float64, num_examples(data))
     ll_lock::Threads.ReentrantLock = Threads.ReentrantLock()
     
-    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
-        if els_start != els_end
-            lock(ll_lock) do # TODO: move lock to inner loop?
+    @inline function on_edge(flows, values, prime, sub, element, grandpa, single_child)
+        if !single_child
+            lock(ll_lock) do # TODO: move lock to inner loop? change to atomic float?
                 for i = 1:size(flows,1)
-                    @inbounds edge_flow = values[i, p] & values[i, s] & flows[i, dec_id]
+                    @inbounds edge_flow = values[i, prime] & values[i, sub] & flows[i, grandpa]
                     first_true_bit = trailing_zeros(edge_flow)+1
                     last_true_bit = 64-leading_zeros(edge_flow)
                     @simd for j = first_true_bit:last_true_bit
                         ex_id = ((i-1) << 6) + j
                         if get_bit(edge_flow, j)
-                            @inbounds ll[ex_id] += bc.params[el_id]
+                            @inbounds ll[ex_id] += bc.params[element]
                         end
                     end
                 end
@@ -45,14 +45,14 @@ function log_likelihood_per_instance_gpu(bc, data)
     ll::CuVector{Float64} = CUDA.zeros(Float64, num_examples(data))
     ll_device = CUDA.cudaconvert(ll)
         
-    @inline function on_edge(flows, values, dec_id, el_id, p, s, els_start, els_end, chunk_id, edge_flow)
-        if els_start != els_end
+    @inline function on_edge(flows, values, prime, sub, element, grandpa, chunk_id, edge_flow, single_child)
+        if !single_child
             first_true_bit = 1+trailing_zeros(edge_flow)
             last_true_bit = 64-leading_zeros(edge_flow)
             for j = first_true_bit:last_true_bit
                 ex_id = ((chunk_id-1) << 6) + j
                 if get_bit(edge_flow, j)
-                    CUDA.@atomic ll_device[ex_id] += params_device[el_id]
+                    CUDA.@atomic ll_device[ex_id] += params_device[element]
                 end
             end
         end

From a00d7dc77157afca9bc812bd11f5059f8298a7c2 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 6 Sep 2020 15:35:47 -0500
Subject: [PATCH 096/131] reinstate marginal pass up

---
 src/ProbabilisticCircuits.jl        |   2 +-
 src/queries/marginal_flow.jl        | 282 ++++++++++++++--------------
 test/structured_prob_nodes_tests.jl |   9 +-
 3 files changed, 146 insertions(+), 147 deletions(-)

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index f7fbc191..01e6e11c 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -17,7 +17,7 @@ include("parameters.jl")
 include("structured_prob_nodes.jl")
 
 include("queries/likelihood.jl")
-# include("queries/marginal_flow.jl")
+include("queries/marginal_flow.jl")
 
 # include("exp_flows.jl")
 # include("queries.jl")
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index ef23a059..707ba22f 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -68,7 +68,7 @@ function marginal_layers(circuit::ParamBitCircuit, values::Matrix)
     bc = circuit.bitcircuit
     els = bc.elements
     pars = circuit.params
-    for layer in bc.layers
+    for layer in bc.layers[2:end]
         Threads.@threads for dec_id in layer
             j = @inbounds bc.nodes[1,dec_id]
             els_end = @inbounds bc.nodes[2,dec_id]
@@ -113,7 +113,7 @@ end
 "Compute marginals on the GPU"
 function marginal_layers(circuit::ParamBitCircuit, values::CuMatrix;  dec_per_thread = 8, log2_threads_per_block = 8)
     bc = circuit.bitcircuit
-    CUDA.@sync for layer in bc.layers
+    CUDA.@sync for layer in bc.layers[2:end]
         num_examples = size(values, 1)
         num_decision_sets = length(layer)/dec_per_thread
         num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
@@ -147,148 +147,146 @@ function marginal_layers_cuda(layer, nodes, elements, params, values)
     return nothing
 end
 
-
-
-#####################
-# Bit circuit values and flows (up and downward pass)
-#####################
-
-"Compute the value and flow of each node"
-function marginal_flows(circuit::ProbCircuit, data, 
-    reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop) 
-    bc = same_device(ProbBitCircuit(circuit, data), data)
-    marginal_flows(bc, data, reuse_values, reuse_flows; on_node, on_edge)
-end
-
-function marginal_flows(circuit::ParamBitCircuit, data, 
-            reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop)
-    values = marginal_all(circuit, data, reuse_values)
-    flows = marginal_flows_down(circuit, values, reuse_flows; on_node, on_edge)
-    return values, flows
-end
-
-#####################
-# Bit circuit flows downward pass
-#####################
-
-"When marginals at nodes have already been computed, do a downward pass computing the marginal flows at each node"
-function marginal_flows_down(circuit::ParamBitCircuit, values, reuse=nothing; on_node=noop, on_edge=noop)
-    flows = similar!(reuse, typeof(values), size(values)...)
-    init_marginal_flows(flows, values)
-    marginal_flows_down_layers(circuit, flows, values, on_node, on_edge)
-    return flows
-end
-
-function init_marginal_flows(flows::AbstractArray{F}, values::AbstractArray{F}) where F
-    flows .= zero(F)
-    @views flows[:,end] .= values[:,end] # set flow at root
-end
-
-# downward pass helpers on CPU
-
-function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::Matrix, values::Matrix, on_node, on_edge)
-    els = circuit.bitcircuit.elements
-    locks = [Threads.ReentrantLock() for i=1:num_nodes(circuit)]    
-    for layer in Iterators.reverse(circuit.bitcircuit.layers)
-        Threads.@threads for dec_id in layer
-            els_start = @inbounds circuit.bitcircuit.nodes[1,dec_id]
-            els_end = @inbounds circuit.bitcircuit.nodes[2,dec_id]
-            on_node(flows, values, dec_id, els_start, els_end, locks)
-            #TODO do something faster when els_start == els_end?
-            for j = els_start:els_end
-                p = els[2,j]
-                s = els[3,j]
-                θ = circuit.params[j]
-                accum_marginal_flow(flows, values, dec_id, p, s, θ, locks)
-                on_edge(flows, values, dec_id, j, p, s, els_start, els_end, locks)
-            end
-        end
-    end
-end
-
-function accum_marginal_flow(f::Matrix{<:AbstractFloat}, v, d, p, s, θ, locks)
-    # retrieve locks in index order to avoid deadlock
-    l1, l2 = order_asc(p,s)
-    lock(locks[l1]) do 
-        lock(locks[l2]) do 
-            # note: in future, if there is a need to scale to many more threads, it would be beneficial to avoid this synchronization by ordering downward pass layers by child id, not parent id, so that there is no contention when processing a single layer and no need for synchronization, as in the upward pass
-            @avx for j in 1:size(f,1)
-                edge_flow = v[j, p] + v[j, s] - v[j, d] + f[j, d] + θ
-                edge_flow = vifelse(isfinite(edge_flow), edge_flow, log(zero(Float32)))
-                x = f[j, p]
-                y = edge_flow
-                Δ = ifelse(x == y, zero(Float64), abs(x - y))
-                @inbounds f[j,p] = max(x, y) + log1p(exp(-Δ))
-                x = f[j, s]
-                Δ = ifelse(x == y, zero(Float64), abs(x - y))
-                @inbounds f[j,s] = max(x, y) + log1p(exp(-Δ))
-            end
-        end
-    end
-end
-
-
-# downward pass helpers on GPU
-
-"Pass flows down the layers of a bit circuit on the GPU"
-function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::CuMatrix, values::CuMatrix, on_node, on_edge; 
-            dec_per_thread = 4, log2_threads_per_block = 8)
-    bc = circuit.bitcircuit
-    CUDA.@sync for layer in Iterators.reverse(bc.layers)
-        num_examples = size(values, 1)
-        num_decision_sets = length(layer)/dec_per_thread
-        num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
-        num_blocks = (ceil(Int, num_examples/num_threads[1]), 
-                      ceil(Int, num_decision_sets/num_threads[2])) 
-        @cuda threads=num_threads blocks=num_blocks marginal_flows_down_layers_cuda(layer, bc.nodes, bc.elements, circuit.params, flows, values, on_node, on_edge)
-    end
-end
-
-"CUDA kernel for passing flows down circuit"
-function marginal_flows_down_layers_cuda(layer, nodes, elements, params, flows, values, on_node, on_edge)
-    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
-    index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
-    stride_x = blockDim().x * gridDim().x
-    stride_y = blockDim().y * gridDim().y
-    for k = index_x:stride_x:size(values,1)
-        for i = index_y:stride_y:length(layer) #TODO swap loops??
-            dec_id = @inbounds layer[i]
-            els_start = @inbounds nodes[1,dec_id]
-            els_end = @inbounds nodes[2,dec_id]
-            n_up = @inbounds values[k, dec_id]
-            on_node(flows, values, dec_id, els_start, els_end, k)
-            if !iszero(n_up) # on_edge will only get called when edge flows are non-zero
-                n_down = @inbounds flows[k, dec_id]
-                #TODO do something faster when els_start == els_end?
-                for j = els_start:els_end
-                    p = @inbounds elements[2,j]
-                    s = @inbounds elements[3,j]
-                    @inbounds edge_flow = values[k, p] + values[k, s] - n_up + n_down + params[j]
-                    # following needs to be memory safe, hence @atomic
-
-                    @inbounds y = values[j, elements[2,k]] + values[j, elements[3,k]] + params[k]
-                    Δ = ifelse(x == y, zero(Float64), CUDA.abs(x - y))
-                    x = max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
+# #####################
+# # Bit circuit values and flows (up and downward pass)
+# #####################
+
+# "Compute the value and flow of each node"
+# function marginal_flows(circuit::ProbCircuit, data, 
+#     reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop) 
+#     bc = same_device(ProbBitCircuit(circuit, data), data)
+#     marginal_flows(bc, data, reuse_values, reuse_flows; on_node, on_edge)
+# end
+
+# function marginal_flows(circuit::ParamBitCircuit, data, 
+#             reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop)
+#     values = marginal_all(circuit, data, reuse_values)
+#     flows = marginal_flows_down(circuit, values, reuse_flows; on_node, on_edge)
+#     return values, flows
+# end
+
+# #####################
+# # Bit circuit flows downward pass
+# #####################
+
+# "When marginals at nodes have already been computed, do a downward pass computing the marginal flows at each node"
+# function marginal_flows_down(circuit::ParamBitCircuit, values, reuse=nothing; on_node=noop, on_edge=noop)
+#     flows = similar!(reuse, typeof(values), size(values)...)
+#     init_marginal_flows(flows, values)
+#     marginal_flows_down_layers(circuit, flows, values, on_node, on_edge)
+#     return flows
+# end
+
+# function init_marginal_flows(flows::AbstractArray{F}, values::AbstractArray{F}) where F
+#     flows .= zero(F)
+#     @views flows[:,end] .= values[:,end] # set flow at root
+# end
+
+# # downward pass helpers on CPU
+
+# function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::Matrix, values::Matrix, on_node, on_edge)
+#     els = circuit.bitcircuit.elements
+#     locks = [Threads.ReentrantLock() for i=1:num_nodes(circuit)]    
+#     for layer in Iterators.reverse(circuit.bitcircuit.layers)
+#         Threads.@threads for dec_id in layer
+#             els_start = @inbounds circuit.bitcircuit.nodes[1,dec_id]
+#             els_end = @inbounds circuit.bitcircuit.nodes[2,dec_id]
+#             on_node(flows, values, dec_id, els_start, els_end, locks)
+#             #TODO do something faster when els_start == els_end?
+#             for j = els_start:els_end
+#                 p = els[2,j]
+#                 s = els[3,j]
+#                 θ = circuit.params[j]
+#                 accum_marginal_flow(flows, values, dec_id, p, s, θ, locks)
+#                 on_edge(flows, values, dec_id, j, p, s, els_start, els_end, locks)
+#             end
+#         end
+#     end
+# end
+
+# function accum_marginal_flow(f::Matrix{<:AbstractFloat}, v, d, p, s, θ, locks)
+#     # retrieve locks in index order to avoid deadlock
+#     l1, l2 = order_asc(p,s)
+#     lock(locks[l1]) do 
+#         lock(locks[l2]) do 
+#             # note: in future, if there is a need to scale to many more threads, it would be beneficial to avoid this synchronization by ordering downward pass layers by child id, not parent id, so that there is no contention when processing a single layer and no need for synchronization, as in the upward pass
+#             @avx for j in 1:size(f,1)
+#                 edge_flow = v[j, p] + v[j, s] - v[j, d] + f[j, d] + θ
+#                 edge_flow = vifelse(isfinite(edge_flow), edge_flow, log(zero(Float32)))
+#                 x = f[j, p]
+#                 y = edge_flow
+#                 Δ = ifelse(x == y, zero(Float64), abs(x - y))
+#                 @inbounds f[j,p] = max(x, y) + log1p(exp(-Δ))
+#                 x = f[j, s]
+#                 Δ = ifelse(x == y, zero(Float64), abs(x - y))
+#                 @inbounds f[j,s] = max(x, y) + log1p(exp(-Δ))
+#             end
+#         end
+#     end
+# end
+
+
+# # downward pass helpers on GPU
+
+# "Pass flows down the layers of a bit circuit on the GPU"
+# function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::CuMatrix, values::CuMatrix, on_node, on_edge; 
+#             dec_per_thread = 4, log2_threads_per_block = 8)
+#     bc = circuit.bitcircuit
+#     CUDA.@sync for layer in Iterators.reverse(bc.layers)
+#         num_examples = size(values, 1)
+#         num_decision_sets = length(layer)/dec_per_thread
+#         num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
+#         num_blocks = (ceil(Int, num_examples/num_threads[1]), 
+#                       ceil(Int, num_decision_sets/num_threads[2])) 
+#         @cuda threads=num_threads blocks=num_blocks marginal_flows_down_layers_cuda(layer, bc.nodes, bc.elements, circuit.params, flows, values, on_node, on_edge)
+#     end
+# end
+
+# "CUDA kernel for passing flows down circuit"
+# function marginal_flows_down_layers_cuda(layer, nodes, elements, params, flows, values, on_node, on_edge)
+#     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+#     index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+#     stride_x = blockDim().x * gridDim().x
+#     stride_y = blockDim().y * gridDim().y
+#     for k = index_x:stride_x:size(values,1)
+#         for i = index_y:stride_y:length(layer) #TODO swap loops??
+#             dec_id = @inbounds layer[i]
+#             els_start = @inbounds nodes[1,dec_id]
+#             els_end = @inbounds nodes[2,dec_id]
+#             n_up = @inbounds values[k, dec_id]
+#             on_node(flows, values, dec_id, els_start, els_end, k)
+#             if !iszero(n_up) # on_edge will only get called when edge flows are non-zero
+#                 n_down = @inbounds flows[k, dec_id]
+#                 #TODO do something faster when els_start == els_end?
+#                 for j = els_start:els_end
+#                     p = @inbounds elements[2,j]
+#                     s = @inbounds elements[3,j]
+#                     @inbounds edge_flow = values[k, p] + values[k, s] - n_up + n_down + params[j]
+#                     # following needs to be memory safe, hence @atomic
+
+#                     @inbounds y = values[j, elements[2,k]] + values[j, elements[3,k]] + params[k]
+#                     Δ = ifelse(x == y, zero(Float64), CUDA.abs(x - y))
+#                     x = max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
 
                     
-                    accum_flow(flows, k, p, edge_flow)
-                    accum_flow(flows, k, s, edge_flow)
+#                     accum_flow(flows, k, p, edge_flow)
+#                     accum_flow(flows, k, s, edge_flow)
 
 
                     
-                    on_edge(flows, values, dec_id, j, p, s, els_start, els_end, k, edge_flow)
-                end
-            end
-        end
-    end
-    return nothing
-end
-
-compute_edge_flow(p_up::AbstractFloat, s_up, n_up, n_down) = p_up * s_up / n_up * n_down
-compute_edge_flow(p_up::Unsigned, s_up, n_up, n_down) = p_up & s_up & n_down
-
-accum_flow(flows, j, e, edge_flow::AbstractFloat) = 
-    CUDA.@atomic flows[j, e] += edge_flow #atomic is automatically inbounds
-
-accum_flow(flows, j, e, edge_flow::Unsigned) = 
-    CUDA.@atomic flows[j, e] |= edge_flow #atomic is automatically inbounds
+#                     on_edge(flows, values, dec_id, j, p, s, els_start, els_end, k, edge_flow)
+#                 end
+#             end
+#         end
+#     end
+#     return nothing
+# end
+
+# compute_edge_flow(p_up::AbstractFloat, s_up, n_up, n_down) = p_up * s_up / n_up * n_down
+# compute_edge_flow(p_up::Unsigned, s_up, n_up, n_down) = p_up & s_up & n_down
+
+# accum_flow(flows, j, e, edge_flow::AbstractFloat) = 
+#     CUDA.@atomic flows[j, e] += edge_flow #atomic is automatically inbounds
+
+# accum_flow(flows, j, e, edge_flow::Unsigned) = 
+#     CUDA.@atomic flows[j, e] |= edge_flow #atomic is automatically inbounds
diff --git a/test/structured_prob_nodes_tests.jl b/test/structured_prob_nodes_tests.jl
index 984fa65b..25374217 100644
--- a/test/structured_prob_nodes_tests.jl
+++ b/test/structured_prob_nodes_tests.jl
@@ -36,10 +36,11 @@ using DataFrames: DataFrame
     @test num_variables(f) == 10
     @test issmooth(f)
 
-    @test f(DataFrame(BitArray([1 0 1 0 1 0 1 0 1 0;
-                    1 1 1 1 1 1 1 1 1 1;
-                    0 0 0 0 0 0 0 0 0 0;
-                    0 1 1 0 1 0 0 1 0 1]))) == BitVector([1,1,1,1])
+    input = DataFrame(BitArray([1 0 1 0 1 0 1 0 1 0;
+                1 1 1 1 1 1 1 1 1 1;
+                0 0 0 0 0 0 0 0 0 0;
+                0 1 1 0 1 0 0 1 0 1]))
+    @test satisfies(f,input) == BitVector([1,1,1,1])
 
     plainf = PlainLogicCircuit(f) 
     foreach(plainf) do n

From e5c988c16a9b6ba9485506c31ce2c6c77fa5deab Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 6 Sep 2020 16:58:16 -0500
Subject: [PATCH 097/131] marginal flows on CPU

---
 src/param_bit_circuit.jl     |  32 +++---
 src/queries/marginal_flow.jl | 183 ++++++++++++++++++++++++++++++++++-
 2 files changed, 198 insertions(+), 17 deletions(-)

diff --git a/src/param_bit_circuit.jl b/src/param_bit_circuit.jl
index 6f4a685e..d5f6d4dc 100644
--- a/src/param_bit_circuit.jl
+++ b/src/param_bit_circuit.jl
@@ -6,20 +6,6 @@ struct ParamBitCircuit{V,M,W}
     params::W
 end
 
-import LogicCircuits: num_nodes, num_elements, num_features
-
-num_nodes(c::ParamBitCircuit) = num_nodes(c.bitcircuit)
-num_elements(c::ParamBitCircuit) = num_elements(c.bitcircuit)
-num_features(c::ParamBitCircuit) = num_features(c.bitcircuit)
-
-import LogicCircuits: to_gpu, to_cpu #extend
-
-to_gpu(c::ParamBitCircuit) = 
-    ParamBitCircuit(to_gpu(c.bitcircuit), to_gpu(c.params))
-
-to_cpu(c::ParamBitCircuit) = 
-    ParamBitCircuit(to_cpu(c.bitcircuit), to_cpu(c.params))
-
 function ParamBitCircuit(pc::ProbCircuit, data)
     logprobs::Vector{Float64} = Vector{Float64}()
     on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
@@ -34,3 +20,21 @@ function ParamBitCircuit(pc::ProbCircuit, data)
     bc = BitCircuit(pc, data; on_decision)
     ParamBitCircuit(bc, logprobs)
 end
+
+import LogicCircuits: num_nodes, num_elements, num_features
+
+num_nodes(c::ParamBitCircuit) = num_nodes(c.bitcircuit)
+num_elements(c::ParamBitCircuit) = num_elements(c.bitcircuit)
+num_features(c::ParamBitCircuit) = num_features(c.bitcircuit)
+
+import LogicCircuits: to_gpu, to_cpu, isgpu #extend
+
+to_gpu(c::ParamBitCircuit) = 
+    ParamBitCircuit(to_gpu(c.bitcircuit), to_gpu(c.params))
+
+to_cpu(c::ParamBitCircuit) = 
+    ParamBitCircuit(to_cpu(c.bitcircuit), to_cpu(c.params))
+
+
+isgpu(c::ParamBitCircuit) = 
+    isgpu(c.bitcircuit) && isgpu(c.params)
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index 707ba22f..82c4c9f1 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -5,7 +5,7 @@ using DataFrames: DataFrame
 using LoopVectorization: @avx
 using LogicCircuits: balance_threads
 
-export marginal, marginal_all
+export marginal, marginal_all, marginal_flows, marginal_flows_down
 
 #####################
 # Circuit marginal evaluation
@@ -94,7 +94,7 @@ accum_marginal(v::Matrix{<:AbstractFloat}, i, e1p, e1s, p1) = begin
     @avx for j=1:size(v,1)
         @inbounds x = v[j,i]
         @inbounds y = v[j,e1p] + v[j,e1s] + p1
-        Δ = ifelse(x == y, zero(Float64), abs(x - y))
+        Δ = ifelse(x == y, zero(eltype(v)), abs(x - y))
         @inbounds  v[j,i] = max(x, y) + log1p(exp(-Δ))
     end
 end
@@ -103,7 +103,7 @@ assign_marginal(v::Matrix{<:AbstractFloat}, i, e1p, e1s, e2p, e2s, p1, p2) = beg
     @avx for j=1:size(v,1)
         @inbounds x = v[j,e1p] + v[j,e1s] + p1
         @inbounds y = v[j,e2p] + v[j,e2s] + p2
-        Δ = ifelse(x == y, zero(Float64), abs(x - y))
+        Δ = ifelse(x == y, zero(eltype(v)), abs(x - y))
         @inbounds  v[j,i] = max(x, y) + log1p(exp(-Δ))
     end
 end
@@ -147,6 +147,183 @@ function marginal_layers_cuda(layer, nodes, elements, params, values)
     return nothing
 end
 
+
+#####################
+# Bit circuit marginals and flows (up and downward pass)
+#####################
+
+"Compute the marginal and flow of each node"
+function marginal_flows(circuit::ProbCircuit, data, 
+    reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop) 
+    bc = same_device(ParamBitCircuit(circuit, data), data)
+    marginal_flows(bc, data, reuse_values, reuse_flows; on_node, on_edge)
+end
+
+function marginal_flows(circuit::ParamBitCircuit, data, 
+            reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop)
+    @assert isgpu(data) == isgpu(circuit) "ParamBitCircuit and data need to be on the same device"
+    values = marginal_all(circuit, data, reuse_values)
+    flows = marginal_flows_down(circuit, values, reuse_flows; on_node, on_edge)
+    return values, flows
+end
+
+#####################
+# Bit circuit marginal flows downward pass
+#####################
+
+"When marginals of nodes have already been computed, do a downward pass computing the marginal flows at each node"
+function marginal_flows_down(circuit::ParamBitCircuit, values, reuse=nothing; on_node=noop, on_edge=noop)
+    flows = similar!(reuse, typeof(values), size(values)...)
+    flows .= 42
+    marginal_flows_down_layers(circuit, flows, values, on_node, on_edge)
+    return flows
+end
+
+# downward pass helpers on CPU
+
+"Evaluate marginals of the layers of a bit circuit on the CPU (SIMD & multi-threaded)"
+function marginal_flows_down_layers(pbc::ParamBitCircuit, flows::Matrix, values::Matrix, on_node, on_edge)
+    @assert flows !== values
+    circuit = pbc.bitcircuit 
+    els = circuit.elements   
+    for layer in Iterators.reverse(circuit.layers)
+        Threads.@threads for dec_id in layer
+            par_start = @inbounds circuit.nodes[3,dec_id]
+            if iszero(par_start)
+                if dec_id == num_nodes(circuit)
+                    # populate root flow from values
+                    @inbounds @views @. flows[:, dec_id] = values[:, dec_id]
+                end
+                # no parents, ignore (can happen for false/true node and root)
+            else
+                par_end = @inbounds circuit.nodes[4,dec_id]
+                for j = par_start:par_end
+                    par = @inbounds circuit.parents[j]
+                    grandpa = @inbounds els[1,par]
+                    sib_id = sibling(els, par, dec_id)
+                    single_child = has_single_child(circuit.nodes, grandpa)
+                    if single_child
+                        if j == par_start
+                            @inbounds @views @. flows[:, dec_id] = flows[:, grandpa]
+                        else
+                            accum_marg_flow(flows, dec_id, grandpa)
+                        end
+                    else
+                        θ = pbc.params[par]
+                        if j == par_start
+                            assign_marg_flow(flows, values, dec_id, grandpa, sib_id, θ)
+                        else
+                            accum_marg_flow(flows, values, dec_id, grandpa, sib_id, θ)
+                        end
+                    end
+                    # report edge flow only once:
+                    sib_id > dec_id && on_edge(flows, values, dec_id, sib_id, par, grandpa, single_child)
+                end
+            end
+            on_node(flows, values, dec_id)
+        end
+    end
+end 
+
+function assign_marg_flow(f::Matrix{<:AbstractFloat}, v, d, g, s, θ)
+    @inbounds @simd for j in 1:size(f,1) #@avx gives incorrect results
+        edge_flow = v[j, s] + v[j, d] - v[j, g] + f[j, g] + θ
+        edge_flow = ifelse(isnan(edge_flow), typemin(eltype(f)), edge_flow)
+        f[j, d] = edge_flow 
+    end
+    # @assert !any(isnan, f[:,d])
+end
+
+function accum_marg_flow(f::Matrix{<:AbstractFloat}, d, g)
+    @avx for j=1:size(f,1) #@avx gives incorrect results
+        x = f[j, d]
+        y = f[j, g]
+        Δ = ifelse(x == y, zero(eltype(f)), abs(x - y))
+        f[j, d] = max(x, y) + log1p(exp(-Δ))
+    end
+    # @assert !any(isnan, f[:,d])
+end
+
+function accum_marg_flow(f::Matrix{<:AbstractFloat}, v, d, g, s, θ)
+    @inbounds @simd for j=1:size(f,1) #@avx gives incorrect results
+        x = f[j, d]
+        y = v[j, s] + v[j, d] - v[j, g] + f[j, g] + θ
+        y = ifelse(isnan(y), typemin(eltype(f)), y)
+        Δ = ifelse(x == y, zero(eltype(f)), abs(x - y))
+        f[j, d] = max(x, y) + log1p(exp(-Δ))
+    end
+    # @assert !any(isnan, f[:,d])
+end
+
+# # # downward pass helpers on GPU
+
+# "Pass flows down the layers of a bit circuit on the GPU"
+# function satisfies_flows_down_layers(circuit::BitCircuit, flows::CuMatrix, values::CuMatrix, on_node, on_edge; 
+#             dec_per_thread = 8, log2_threads_per_block = 7)
+#     CUDA.@sync for layer in Iterators.reverse(circuit.layers)
+#         num_examples = size(values, 1)
+#         num_decision_sets = length(layer)/dec_per_thread
+#         num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
+#         num_blocks = (ceil(Int, num_examples/num_threads[1]), 
+#                       ceil(Int, num_decision_sets/num_threads[2])) 
+#         @cuda threads=num_threads blocks=num_blocks satisfies_flows_down_layers_cuda(layer, circuit.nodes, circuit.elements, circuit.parents, flows, values, on_node, on_edge)
+#     end
+# end
+
+# "CUDA kernel for passing flows down circuit"
+# function satisfies_flows_down_layers_cuda(layer, nodes, elements, parents, flows, values, on_node, on_edge)
+#     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+#     index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+#     stride_x = blockDim().x * gridDim().x
+#     stride_y = blockDim().y * gridDim().y
+#     for k = index_x:stride_x:size(values,1)
+#         for i = index_y:stride_y:length(layer)
+#             dec_id = @inbounds layer[i]
+#             if dec_id == size(nodes,2)
+#                 # populate root flow from values
+#                 flow = values[k, dec_id]
+#             else
+#                 par_start = @inbounds nodes[3,dec_id]
+#                 flow = zero(eltype(flows))
+#                 if !iszero(par_start)
+#                     par_end = @inbounds nodes[4,dec_id]
+#                     for j = par_start:par_end
+#                         par = @inbounds parents[j]
+#                         grandpa = @inbounds elements[1,par]
+#                         v_gp = @inbounds values[k, grandpa]
+#                         prime = elements[2,par]
+#                         sub = elements[3,par]
+#                         if !iszero(v_gp) # edge flow only gets reported when non-zero
+#                             f_gp = @inbounds flows[k, grandpa]
+#                             single_child = has_single_child(nodes, grandpa)
+#                             if single_child
+#                                 edge_flow = f_gp
+#                             else
+#                                 v_prime = @inbounds values[k, prime]
+#                                 v_sub = @inbounds values[k, sub]
+#                                 edge_flow = compute_edge_flow( v_prime, v_sub, v_gp, f_gp)  
+#                             end
+#                             flow = sum_flows(flow, edge_flow)
+#                             # report edge flow only once:
+#                             dec_id == prime && on_edge(flows, values, prime, sub, par, grandpa, k, edge_flow, single_child)
+#                         end
+#                     end
+#                 end
+#             end
+#             @inbounds flows[k, dec_id] = flow
+#             on_node(flows, values, dec_id, k, flow)
+#         end
+#     end
+#     return nothing
+# end
+
+# @inline sum_flows(a,b::AbstractFloat) = a + b
+# @inline sum_flows(a,b::Unsigned) = a | b
+
+# @inline compute_edge_flow(p_up::AbstractFloat, s_up, n_up, n_down) = p_up * s_up / n_up * n_down
+# @inline compute_edge_flow(p_up::Unsigned, s_up, n_up, n_down) = p_up & s_up & n_down
+
+
 # #####################
 # # Bit circuit values and flows (up and downward pass)
 # #####################

From bb901b65ea629220fe6bc24712093fa742fdb418 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 6 Sep 2020 17:40:30 -0500
Subject: [PATCH 098/131] marginal downward pass GPU

---
 src/queries/marginal_flow.jl | 303 ++++++++++-------------------------
 1 file changed, 82 insertions(+), 221 deletions(-)

diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index 82c4c9f1..bf501823 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -44,17 +44,17 @@ function marginal_all(circuit::ParamBitCircuit, data, reuse=nothing)
 end
 
 "Initialize values from the data (data frames)"
-function init_marginal(data, reuse, num_nodes)
-    flowtype = isgpu(data) ? CuMatrix{Float64} : Matrix{Float64}
+function init_marginal(data, reuse, num_nodes; Float=Float32)
+    flowtype = isgpu(data) ? CuMatrix{Float} : Matrix{Float}
     values = similar!(reuse, flowtype, num_examples(data), num_nodes)
-    @views values[:,LogicCircuits.TRUE_BITS] .= log(one(Float64))
-    @views values[:,LogicCircuits.FALSE_BITS] .= log(zero(Float64))
+    @views values[:,LogicCircuits.TRUE_BITS] .= log(one(Float))
+    @views values[:,LogicCircuits.FALSE_BITS] .= log(zero(Float))
     # here we should use a custom CUDA kernel to extract Float marginals from bit vectors
     # for now the lazy solution is to move everything to the CPU and do the work there...
     data_cpu = to_cpu(data)
     for i=1:num_features(data)
-        marg_pos::Vector{Float64} = log.(coalesce.(data_cpu[:,i], 1.0))
-        marg_neg::Vector{Float64} = log.(coalesce.(1.0 .- data_cpu[:,i], 1.0))
+        marg_pos::Vector{Float} = log.(coalesce.(data_cpu[:,i], one(Float)))
+        marg_neg::Vector{Float} = log.(coalesce.(1.0 .- data_cpu[:,i], one(Float)))
         values[:,2+i] .= same_device(marg_pos, values)
         values[:,2+num_features(data)+i] .= same_device(marg_neg, values)
     end
@@ -138,7 +138,7 @@ function marginal_layers_cuda(layer, nodes, elements, params, values)
             while k < els_end
                 k += 1
                 @inbounds y = values[j, elements[2,k]] + values[j, elements[3,k]] + params[k]
-                Δ = ifelse(x == y, zero(Float64), CUDA.abs(x - y))
+                Δ = ifelse(x == y, zero(eltype(values)), CUDA.abs(x - y))
                 x = max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
             end
             values[j, decision_id] = x
@@ -174,7 +174,6 @@ end
 "When marginals of nodes have already been computed, do a downward pass computing the marginal flows at each node"
 function marginal_flows_down(circuit::ParamBitCircuit, values, reuse=nothing; on_node=noop, on_edge=noop)
     flows = similar!(reuse, typeof(values), size(values)...)
-    flows .= 42
     marginal_flows_down_layers(circuit, flows, values, on_node, on_edge)
     return flows
 end
@@ -209,7 +208,7 @@ function marginal_flows_down_layers(pbc::ParamBitCircuit, flows::Matrix, values:
                             accum_marg_flow(flows, dec_id, grandpa)
                         end
                     else
-                        θ = pbc.params[par]
+                        θ = eltype(flows)(pbc.params[par])
                         if j == par_start
                             assign_marg_flow(flows, values, dec_id, grandpa, sib_id, θ)
                         else
@@ -255,215 +254,77 @@ function accum_marg_flow(f::Matrix{<:AbstractFloat}, v, d, g, s, θ)
     # @assert !any(isnan, f[:,d])
 end
 
-# # # downward pass helpers on GPU
-
-# "Pass flows down the layers of a bit circuit on the GPU"
-# function satisfies_flows_down_layers(circuit::BitCircuit, flows::CuMatrix, values::CuMatrix, on_node, on_edge; 
-#             dec_per_thread = 8, log2_threads_per_block = 7)
-#     CUDA.@sync for layer in Iterators.reverse(circuit.layers)
-#         num_examples = size(values, 1)
-#         num_decision_sets = length(layer)/dec_per_thread
-#         num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
-#         num_blocks = (ceil(Int, num_examples/num_threads[1]), 
-#                       ceil(Int, num_decision_sets/num_threads[2])) 
-#         @cuda threads=num_threads blocks=num_blocks satisfies_flows_down_layers_cuda(layer, circuit.nodes, circuit.elements, circuit.parents, flows, values, on_node, on_edge)
-#     end
-# end
-
-# "CUDA kernel for passing flows down circuit"
-# function satisfies_flows_down_layers_cuda(layer, nodes, elements, parents, flows, values, on_node, on_edge)
-#     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
-#     index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
-#     stride_x = blockDim().x * gridDim().x
-#     stride_y = blockDim().y * gridDim().y
-#     for k = index_x:stride_x:size(values,1)
-#         for i = index_y:stride_y:length(layer)
-#             dec_id = @inbounds layer[i]
-#             if dec_id == size(nodes,2)
-#                 # populate root flow from values
-#                 flow = values[k, dec_id]
-#             else
-#                 par_start = @inbounds nodes[3,dec_id]
-#                 flow = zero(eltype(flows))
-#                 if !iszero(par_start)
-#                     par_end = @inbounds nodes[4,dec_id]
-#                     for j = par_start:par_end
-#                         par = @inbounds parents[j]
-#                         grandpa = @inbounds elements[1,par]
-#                         v_gp = @inbounds values[k, grandpa]
-#                         prime = elements[2,par]
-#                         sub = elements[3,par]
-#                         if !iszero(v_gp) # edge flow only gets reported when non-zero
-#                             f_gp = @inbounds flows[k, grandpa]
-#                             single_child = has_single_child(nodes, grandpa)
-#                             if single_child
-#                                 edge_flow = f_gp
-#                             else
-#                                 v_prime = @inbounds values[k, prime]
-#                                 v_sub = @inbounds values[k, sub]
-#                                 edge_flow = compute_edge_flow( v_prime, v_sub, v_gp, f_gp)  
-#                             end
-#                             flow = sum_flows(flow, edge_flow)
-#                             # report edge flow only once:
-#                             dec_id == prime && on_edge(flows, values, prime, sub, par, grandpa, k, edge_flow, single_child)
-#                         end
-#                     end
-#                 end
-#             end
-#             @inbounds flows[k, dec_id] = flow
-#             on_node(flows, values, dec_id, k, flow)
-#         end
-#     end
-#     return nothing
-# end
-
-# @inline sum_flows(a,b::AbstractFloat) = a + b
-# @inline sum_flows(a,b::Unsigned) = a | b
-
-# @inline compute_edge_flow(p_up::AbstractFloat, s_up, n_up, n_down) = p_up * s_up / n_up * n_down
-# @inline compute_edge_flow(p_up::Unsigned, s_up, n_up, n_down) = p_up & s_up & n_down
-
-
-# #####################
-# # Bit circuit values and flows (up and downward pass)
-# #####################
-
-# "Compute the value and flow of each node"
-# function marginal_flows(circuit::ProbCircuit, data, 
-#     reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop) 
-#     bc = same_device(ProbBitCircuit(circuit, data), data)
-#     marginal_flows(bc, data, reuse_values, reuse_flows; on_node, on_edge)
-# end
-
-# function marginal_flows(circuit::ParamBitCircuit, data, 
-#             reuse_values=nothing, reuse_flows=nothing; on_node=noop, on_edge=noop)
-#     values = marginal_all(circuit, data, reuse_values)
-#     flows = marginal_flows_down(circuit, values, reuse_flows; on_node, on_edge)
-#     return values, flows
-# end
-
-# #####################
-# # Bit circuit flows downward pass
-# #####################
-
-# "When marginals at nodes have already been computed, do a downward pass computing the marginal flows at each node"
-# function marginal_flows_down(circuit::ParamBitCircuit, values, reuse=nothing; on_node=noop, on_edge=noop)
-#     flows = similar!(reuse, typeof(values), size(values)...)
-#     init_marginal_flows(flows, values)
-#     marginal_flows_down_layers(circuit, flows, values, on_node, on_edge)
-#     return flows
-# end
-
-# function init_marginal_flows(flows::AbstractArray{F}, values::AbstractArray{F}) where F
-#     flows .= zero(F)
-#     @views flows[:,end] .= values[:,end] # set flow at root
-# end
-
-# # downward pass helpers on CPU
-
-# function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::Matrix, values::Matrix, on_node, on_edge)
-#     els = circuit.bitcircuit.elements
-#     locks = [Threads.ReentrantLock() for i=1:num_nodes(circuit)]    
-#     for layer in Iterators.reverse(circuit.bitcircuit.layers)
-#         Threads.@threads for dec_id in layer
-#             els_start = @inbounds circuit.bitcircuit.nodes[1,dec_id]
-#             els_end = @inbounds circuit.bitcircuit.nodes[2,dec_id]
-#             on_node(flows, values, dec_id, els_start, els_end, locks)
-#             #TODO do something faster when els_start == els_end?
-#             for j = els_start:els_end
-#                 p = els[2,j]
-#                 s = els[3,j]
-#                 θ = circuit.params[j]
-#                 accum_marginal_flow(flows, values, dec_id, p, s, θ, locks)
-#                 on_edge(flows, values, dec_id, j, p, s, els_start, els_end, locks)
-#             end
-#         end
-#     end
-# end
-
-# function accum_marginal_flow(f::Matrix{<:AbstractFloat}, v, d, p, s, θ, locks)
-#     # retrieve locks in index order to avoid deadlock
-#     l1, l2 = order_asc(p,s)
-#     lock(locks[l1]) do 
-#         lock(locks[l2]) do 
-#             # note: in future, if there is a need to scale to many more threads, it would be beneficial to avoid this synchronization by ordering downward pass layers by child id, not parent id, so that there is no contention when processing a single layer and no need for synchronization, as in the upward pass
-#             @avx for j in 1:size(f,1)
-#                 edge_flow = v[j, p] + v[j, s] - v[j, d] + f[j, d] + θ
-#                 edge_flow = vifelse(isfinite(edge_flow), edge_flow, log(zero(Float32)))
-#                 x = f[j, p]
-#                 y = edge_flow
-#                 Δ = ifelse(x == y, zero(Float64), abs(x - y))
-#                 @inbounds f[j,p] = max(x, y) + log1p(exp(-Δ))
-#                 x = f[j, s]
-#                 Δ = ifelse(x == y, zero(Float64), abs(x - y))
-#                 @inbounds f[j,s] = max(x, y) + log1p(exp(-Δ))
-#             end
-#         end
-#     end
-# end
-
-
-# # downward pass helpers on GPU
-
-# "Pass flows down the layers of a bit circuit on the GPU"
-# function marginal_flows_down_layers(circuit::ParamBitCircuit, flows::CuMatrix, values::CuMatrix, on_node, on_edge; 
-#             dec_per_thread = 4, log2_threads_per_block = 8)
-#     bc = circuit.bitcircuit
-#     CUDA.@sync for layer in Iterators.reverse(bc.layers)
-#         num_examples = size(values, 1)
-#         num_decision_sets = length(layer)/dec_per_thread
-#         num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
-#         num_blocks = (ceil(Int, num_examples/num_threads[1]), 
-#                       ceil(Int, num_decision_sets/num_threads[2])) 
-#         @cuda threads=num_threads blocks=num_blocks marginal_flows_down_layers_cuda(layer, bc.nodes, bc.elements, circuit.params, flows, values, on_node, on_edge)
-#     end
-# end
-
-# "CUDA kernel for passing flows down circuit"
-# function marginal_flows_down_layers_cuda(layer, nodes, elements, params, flows, values, on_node, on_edge)
-#     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
-#     index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
-#     stride_x = blockDim().x * gridDim().x
-#     stride_y = blockDim().y * gridDim().y
-#     for k = index_x:stride_x:size(values,1)
-#         for i = index_y:stride_y:length(layer) #TODO swap loops??
-#             dec_id = @inbounds layer[i]
-#             els_start = @inbounds nodes[1,dec_id]
-#             els_end = @inbounds nodes[2,dec_id]
-#             n_up = @inbounds values[k, dec_id]
-#             on_node(flows, values, dec_id, els_start, els_end, k)
-#             if !iszero(n_up) # on_edge will only get called when edge flows are non-zero
-#                 n_down = @inbounds flows[k, dec_id]
-#                 #TODO do something faster when els_start == els_end?
-#                 for j = els_start:els_end
-#                     p = @inbounds elements[2,j]
-#                     s = @inbounds elements[3,j]
-#                     @inbounds edge_flow = values[k, p] + values[k, s] - n_up + n_down + params[j]
-#                     # following needs to be memory safe, hence @atomic
-
-#                     @inbounds y = values[j, elements[2,k]] + values[j, elements[3,k]] + params[k]
-#                     Δ = ifelse(x == y, zero(Float64), CUDA.abs(x - y))
-#                     x = max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
-
-                    
-#                     accum_flow(flows, k, p, edge_flow)
-#                     accum_flow(flows, k, s, edge_flow)
-
-
-                    
-#                     on_edge(flows, values, dec_id, j, p, s, els_start, els_end, k, edge_flow)
-#                 end
-#             end
-#         end
-#     end
-#     return nothing
-# end
-
-# compute_edge_flow(p_up::AbstractFloat, s_up, n_up, n_down) = p_up * s_up / n_up * n_down
-# compute_edge_flow(p_up::Unsigned, s_up, n_up, n_down) = p_up & s_up & n_down
-
-# accum_flow(flows, j, e, edge_flow::AbstractFloat) = 
-#     CUDA.@atomic flows[j, e] += edge_flow #atomic is automatically inbounds
-
-# accum_flow(flows, j, e, edge_flow::Unsigned) = 
-#     CUDA.@atomic flows[j, e] |= edge_flow #atomic is automatically inbounds
+# downward pass helpers on GPU
+
+"Pass marginal flows down the layers of a bit circuit on the GPU"
+function marginal_flows_down_layers(pbc::ParamBitCircuit, flows::CuMatrix, values::CuMatrix, 
+            on_node, on_edge; 
+            dec_per_thread = 8, log2_threads_per_block = 7)
+    bc = pbc.bitcircuit
+    CUDA.@sync for layer in Iterators.reverse(bc.layers)
+        num_examples = size(values, 1)
+        num_decision_sets = length(layer)/dec_per_thread
+        num_threads =  balance_threads(num_examples, num_decision_sets, log2_threads_per_block)
+        num_blocks = (ceil(Int, num_examples/num_threads[1]), 
+                      ceil(Int, num_decision_sets/num_threads[2])) 
+        @cuda threads=num_threads blocks=num_blocks marginal_flows_down_layers_cuda(layer, bc.nodes, bc.elements, bc.parents, pbc.params, flows, values, on_node, on_edge)
+    end
+end
+
+"CUDA kernel for passing marginal flows down circuit"
+function marginal_flows_down_layers_cuda(layer, nodes, elements, parents, params, flows, values, on_node, on_edge)
+    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+    stride_x = blockDim().x * gridDim().x
+    stride_y = blockDim().y * gridDim().y
+    for k = index_x:stride_x:size(values,1)
+        for i = index_y:stride_y:length(layer)
+            dec_id = @inbounds layer[i]
+            if dec_id == size(nodes,2)
+                # populate root flow from values
+                flow = values[k, dec_id]
+            else
+                par_start = @inbounds nodes[3,dec_id]
+                flow = typemin(eltype(flows)) # log(0)
+                if !iszero(par_start)
+                    par_end = @inbounds nodes[4,dec_id]
+                    for j = par_start:par_end
+                        par = @inbounds parents[j]
+                        grandpa = @inbounds elements[1,par]
+                        v_gp = @inbounds values[k, grandpa]
+                        prime = elements[2,par]
+                        sub = elements[3,par]
+                        θ = eltype(flows)(params[par])
+                        if !iszero(v_gp) # edge flow only gets reported when non-zero
+                            f_gp = @inbounds flows[k, grandpa]
+                            single_child = has_single_child(nodes, grandpa)
+                            if single_child
+                                edge_flow = f_gp
+                            else
+                                v_prime = @inbounds values[k, prime]
+                                v_sub = @inbounds values[k, sub]
+                                edge_flow = compute_marg_edge_flow(v_prime, v_sub, v_gp, f_gp, θ)
+                            end
+                            flow = sum_marg_flows(flow, edge_flow)
+                            # report edge flow only once:
+                            dec_id == prime && on_edge(flows, values, prime, sub, par, grandpa, k, edge_flow, single_child)
+                        end
+                    end
+                end
+            end
+            @inbounds flows[k, dec_id] = flow
+            on_node(flows, values, dec_id, k, flow)
+        end
+    end
+    return nothing
+end
+
+@inline function sum_marg_flows(x,y) 
+    Δ = ifelse(x == y, zero(x), CUDA.abs(x - y))
+    max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
+end
+
+@inline function compute_marg_edge_flow(p_up, s_up, n_up, n_down, θ)
+    x = p_up + s_up - n_up + n_down + θ
+    ifelse(isnan(x), typemin(n_down), x)
+end

From 47bf2eb73cb1d68a4be844cdf7ecd4bbeca97503 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 7 Sep 2020 05:14:53 -0500
Subject: [PATCH 099/131] [refactor] adapt to latest apis

---
 src/Logistic/parameters.jl | 76 ++++++++++++++++++++------------------
 src/Logistic/queries.jl    | 44 +++++++++++-----------
 2 files changed, 62 insertions(+), 58 deletions(-)

diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
index dbb19430..855bd12e 100644
--- a/src/Logistic/parameters.jl
+++ b/src/Logistic/parameters.jl
@@ -1,43 +1,47 @@
-export learn_parameters
+export learn_parameters, to_onehot
 
 using CUDA
 using LoopVectorization: @avx, vifelse
 
 """
 Parameter learning through gradient descents
+Note: data need to be DataFrame and Labels need to be in one-hot form.
 """
 function learn_parameters(lc::LogisticCircuit, nc::Int, data, labels; num_epochs=25, step_size=0.01)
     bc = ParamBitCircuit(lc, nc, data)
-    labels = one_hot(labels, nc)
     if isgpu(data)
+        @assert isgpu(labels) "Data and labels must be both stored in either GPU or CPU."
         for _ = 1:num_epochs
             cl = class_likelihood_per_instance(bc, data)
-            update_parameters_gpu(to_gpu(bc), cl, to_gpu(labels), step_size)
+            update_parameters_gpu(to_gpu(bc), data, labels, cl, step_size)
         end
     else
+        @assert !isgpu(labels) "Data and labels must be both stored in either GPU or CPU."
         for _ = 1:num_epochs
             cl = class_likelihood_per_instance(bc, data)
-            update_parameters_cpu(bc, cw, labels, step_size)
+            update_parameters_cpu(bc, data, labels, cl, step_size)
         end
     end
 end
 
-function update_parameters_cpu(bc, cl, labels, step_size)
+function update_parameters_cpu(bc, data, labels, cl, step_size)
     ne::Int = num_examples(data)
     nc::Int = size(bc.params, 2)
     params_lock::Threads.ReentrantLock = Threads.ReentrantLock()
 
-    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
-        lock(cw_lock) do # TODO: move lock to inner loop?
-            for i = 1:size(flows, 1)
-                @inbounds edge_flow = values[i, p] & values[i, s] & flows[i, dec_id]
-                first_true_bit = trailing_zeros(edge_flow) + 1
-                last_true_bit = 64 - leading_zeros(edge_flow)
-                @simd for j = first_true_bit:last_true_bit
-                    if get_bit(edge_flow, j)
-                        ex_id = ((i-1) << 6) + j
-                        for class = 1:nc
-                            @inbounds bc.params[el_id, class] -= (cl[ex_id, class] - labels[ex_id, class]) * step_size
+    @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, single_child)
+        if !single_child
+            lock(params_lock) do # TODO: move lock to inner loop?
+                for i = 1:size(flows, 1)
+                    @inbounds edge_flow = values[i, prime] & values[i, sub] & flows[i, grandpa]
+                    first_true_bit = trailing_zeros(edge_flow) + 1
+                    last_true_bit = 64 - leading_zeros(edge_flow)
+                    @simd for j = first_true_bit:last_true_bit
+                        ex_id = ((i - 1) << 6) + j
+                        if get_bit(edge_flow, j)
+                            for class = 1:nc
+                                @inbounds bc.params[element, class] -= (cl[ex_id, class] - labels[ex_id, class]) * step_size
+                            end
                         end
                     end
                 end
@@ -45,14 +49,14 @@ function update_parameters_cpu(bc, cl, labels, step_size)
         end
     end
     
-    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
-        if els_start != els_end
-            lock(cw_lock) do # TODO: move lock to inner loop?
+    @inline function on_edge_float(flows, values, prime, sub, element, grandpa, single_child)
+        if !single_child
+            lock(params_lock) do # TODO: move lock to inner loop?
                 @avx for i = 1:size(flows, 1)
-                    @inbounds edge_flow = values[i, p] * values[i, s] / values[i, dec_id] * flows[i, dec_id]
-                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(Float32))
+                    @inbounds edge_flow = values[i, prime] * values[i, sub] / values[i, grandpa] * flows[i, grandpa]
+                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(eltype(flows)))
                     for class = 1:nc
-                        @inbounds bc.parames[el_id, class] -= (cl[i, class] - labels[i, class]) * edge_flow * step_size
+                        @inbounds bc.parames[element, class] -= (cl[i, class] - labels[i, class]) * edge_flow * step_size
                     end
                 end
             end
@@ -61,32 +65,32 @@ function update_parameters_cpu(bc, cl, labels, step_size)
     end
 
     if isbinarydata(data)
-        v,f = satisfies_flows(bc, data; on_edge = on_edge_binary) 
+        v,f = satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_binary) 
     else
         @assert isfpdata(data) "Only floating point and binary data are supported"
-        v,f = satisfies_flows(bc, data; on_edge = on_edge_float)
+        v,f = satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_float)
     end
 
     nothing
 end
 
 
-function update_parameters_gpu(bc, cl, labels, step_size)
+function update_parameters_gpu(bc, data, labels, cl, step_size)
     ne::Int = num_examples(data)
     nc::Int = size(bc.params, 2)
     cl_device = CUDA.cudaconvert(cl)
-    labels = CUDA.cudaconvert(labels)
+    label_device = CUDA.cudaconvert(labels)
     params_device = CUDA.cudaconvert(bc.params)
 
-    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, chunk_id, edge_flow)
-        if els_start != els_end
+    @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, chunk_id, edge_flow, single_child)
+        if !single_child
             first_true_bit = 1 + trailing_zeros(edge_flow)
             last_true_bit = 64 - leading_zeros(edge_flow)
             for j = first_true_bit:last_true_bit
                 if get_bit(edge_flow, j)
-                    ex_id = ((chunk_id-1) << 6) + j
+                    ex_id = ((chunk_id - 1) << 6) + j
                     for class = 1:nc
-                        CUDA.@atomic params_device[el_id, class] -= (cl_device[ex_id, class] - labels[ex_id, class]) * step_size
+                        CUDA.@atomic params_device[el_id, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * step_size
                     end
                 end
             end
@@ -94,20 +98,20 @@ function update_parameters_gpu(bc, cl, labels, step_size)
         nothing 
     end
 
-    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
-        if els_start != els_end
+    @inline function on_edge_float(flows, values, prime, sub, element, grandpa, ex_id, edge_flow, single_child)
+        if !single_child
             for class = 1:nc
-                CUDA.@atomic params_device[el_id, class] -= (cl_device[ex_id, class] - lables[ex_id, class]) * edge_flow * step_size
+                CUDA.@atomic params_device[element, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * edge_flow * step_size
             end
         end      
         nothing
     end
 
     if isbinarydata(data)
-        v,f = satisfies_flows(bc, data; on_edge = on_edge_binary) 
+        v,f = satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_binary) 
     else
         @assert isfpdata(data) "Only floating point and binary data are supported"
-        v,f = satisfies_flows(bc, data; on_edge = on_edge_float)
+        v,f = satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_float)
     end
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort
@@ -117,7 +121,7 @@ end
 
 
 
-function one_hot(labels::Vector, nc::Integer)    
+function to_onehot(labels::Vector, nc::Integer)    
     ne = length(labels) 
     one_hot_labels = zeros(Float32, ne, nc)
     for (i, j) in enumerate(labels)
diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index a0e65602..05380e54 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -13,7 +13,7 @@ function class_likelihood_per_instance(lc::LogicCircuit, nc::Int, data)
 end
 
 function class_likelihood_per_instance(bc, data)
-    cw = class_likelihood_per_instance(bc, data)
+    cw = class_weights_per_instance(bc, data)
     isgpu(data) ? (@. 1.0 / (1.0 + exp(-cw))) : (@. @avx 1.0 / (1.0 + exp(-cw)))
 end
 
@@ -36,18 +36,18 @@ function class_weights_per_instance_cpu(bc, data)
     cw::Matrix{Float64} = zeros(Float64, ne, nc)
     cw_lock::Threads.ReentrantLock = Threads.ReentrantLock()
  
-    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
-        if els_start != els_end
+    @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, single_child)
+        if !single_child
             lock(cw_lock) do # TODO: move lock to inner loop?
                 for i = 1:size(flows, 1)
-                    @inbounds edge_flow = values[i, p] & values[i, s] & flows[i, dec_id]
+                    @inbounds edge_flow = values[i, prime] & values[i, sub] & flows[i, grandpa]
                     first_true_bit = trailing_zeros(edge_flow) + 1
                     last_true_bit = 64 - leading_zeros(edge_flow)
                     @simd for j = first_true_bit:last_true_bit
+                        ex_id = ((i - 1) << 6) + j
                         if get_bit(edge_flow, j)
-                            ex_id = ((i-1) << 6) + j
                             for class = 1:nc
-                                @inbounds cw[ex_id, class] += bc.params[el_id, class]
+                                @inbounds cw[ex_id, class] += bc.params[element, class]
                             end
                         end
                     end
@@ -57,14 +57,14 @@ function class_weights_per_instance_cpu(bc, data)
         nothing
     end
 
-    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, locks)
-        if els_start != els_end
+    @inline function on_edge_float(flows, values, prime, sub, element, grandpa, single_child)
+        if !single_child
             lock(cw_lock) do # TODO: move lock to inner loop?
                 @avx for i = 1:size(flows, 1)
-                    @inbounds edge_flow = values[i, p] * values[i, s] / values[i, dec_id] * flows[i, dec_id]
-                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(Float32))
+                    @inbounds edge_flow = values[i, prime] * values[i, sub] / values[i, grandpa] * flows[i, grandpa]
+                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(eltype(flows)))
                     for class = 1:nc
-                        @inbounds cw[i, class] += edge_flow * bc.params[el_id, class]
+                        @inbounds cw[i, class] += edge_flow * bc.params[element, class]
                     end
                 end
             end
@@ -73,9 +73,9 @@ function class_weights_per_instance_cpu(bc, data)
     end
 
     if isbinarydata(data)
-        satisfies_flows(bc, data; on_edge = on_edge_binary)
+        satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_binary)
     else
-        satisfies_flows(bc, data; on_edge = on_edge_float)
+        satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_float)
     end
 
     return cw
@@ -88,15 +88,15 @@ function class_weights_per_instance_gpu(bc, data)
     cw_device = CUDA.cudaconvert(cw)
     params_device = CUDA.cudaconvert(bc.params)
 
-    @inline function on_edge_binary(flows, values, dec_id, el_id, p, s, els_start, els_end, chunk_id, edge_flow)
-        if els_start != els_end
+    @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, chunk_id, edge_flow, single_child)
+        if !single_child
             first_true_bit = 1 + trailing_zeros(edge_flow)
             last_true_bit = 64 - leading_zeros(edge_flow)
             for j = first_true_bit:last_true_bit
+                ex_id = ((chunk_id - 1) << 6) + j
                 if get_bit(edge_flow, j)
-                    ex_id = ((chunk_id-1) << 6) + j
                     for class = 1:nc
-                        CUDA.@atomic cw_device[ex_id, class] += params_device[el_id, class]
+                        CUDA.@atomic cw_device[ex_id, class] += params_device[element, class]
                     end
                 end
             end
@@ -104,20 +104,20 @@ function class_weights_per_instance_gpu(bc, data)
         nothing
     end
 
-    @inline function on_edge_float(flows, values, dec_id, el_id, p, s, els_start, els_end, ex_id, edge_flow)
-        if els_start != els_end
+    @inline function on_edge_float(flows, values, prime, sub, element, grandpa, ex_id, edge_flow, single_child)
+        if !single_child
             for class = 1:nc
-                CUDA.@atomic cw_device[ex_id, class] += edge_flow * params_device[el_id, class]
+                CUDA.@atomic cw_device[ex_id, class] += edge_flow * params_device[element, class]
             end
         end
         nothing
     end
     
     if isbinarydata(data)
-        v,f = satisfies_flows(bc, data; on_edge = on_edge_binary)
+        v,f = satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_binary)
     else
         @assert isfpdata(data) "Only floating point and binary data are supported"
-        v,f = satisfies_flows(bc, data; on_edge = on_edge_float)
+        v,f = satisfies_flows(bc.bitcircuit, data; on_edge = on_edge_float)
     end
     CUDA.unsafe_free!(v) # save the GC some effort
     CUDA.unsafe_free!(f) # save the GC some effort

From 48c7e42e1c6193fa5fe585a3b41f7381ca6b508d Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Mon, 7 Sep 2020 18:32:11 -0500
Subject: [PATCH 100/131] [fix] typo

---
 src/Logistic/parameters.jl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
index 855bd12e..3e3d4972 100644
--- a/src/Logistic/parameters.jl
+++ b/src/Logistic/parameters.jl
@@ -90,7 +90,7 @@ function update_parameters_gpu(bc, data, labels, cl, step_size)
                 if get_bit(edge_flow, j)
                     ex_id = ((chunk_id - 1) << 6) + j
                     for class = 1:nc
-                        CUDA.@atomic params_device[el_id, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * step_size
+                        CUDA.@atomic params_device[element, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * step_size
                     end
                 end
             end

From 0e8f218c11576b01233eee36d954984f81fa7a9b Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Fri, 11 Sep 2020 17:36:16 -0700
Subject: [PATCH 101/131] em estimate parameter for cpu

---
 src/param_bit_circuit.jl     |  8 ++---
 src/parameters.jl            | 62 +++++++++++++++++++++++++++++++++---
 src/queries/marginal_flow.jl |  4 +--
 test/parameters_tests.jl     | 13 ++++++++
 4 files changed, 76 insertions(+), 11 deletions(-)

diff --git a/src/param_bit_circuit.jl b/src/param_bit_circuit.jl
index 5ba09551..33c2d512 100644
--- a/src/param_bit_circuit.jl
+++ b/src/param_bit_circuit.jl
@@ -6,7 +6,7 @@ struct ParamBitCircuit{V,M,W}
     params::W
 end
 
-function ParamBitCircuit(pc::ProbCircuit, data)
+function ParamBitCircuit(pc::ProbCircuit, data; reset=true)
     logprobs::Vector{Float64} = Vector{Float64}()
     on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
         if isnothing(n) # this decision node is not part of the PC
@@ -17,11 +17,11 @@ function ParamBitCircuit(pc::ProbCircuit, data)
             append!(logprobs, n.log_probs)
         end
     end
-    bc = BitCircuit(pc, data; on_decision)
+    bc = BitCircuit(pc, data; reset=reset, on_decision)
     ParamBitCircuit(bc, logprobs)
 end
 
-function ParamBitCircuit(lc::LogisticCircuit, nc, data)
+function ParamBitCircuit(lc::LogisticCircuit, nc, data; reset=true)
     thetas::Vector{Vector{Float64}} = Vector{Vector{Float64}}()
     on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
         if isnothing(n)
@@ -34,7 +34,7 @@ function ParamBitCircuit(lc::LogisticCircuit, nc, data)
             end
         end
     end
-    bc = BitCircuit(lc, data; on_decision)
+    bc = BitCircuit(lc, data; reset=reset, on_decision)
     ParamBitCircuit(bc, permutedims(hcat(thetas...), (2, 1)))
 end
 
diff --git a/src/parameters.jl b/src/parameters.jl
index 39accebc..6a96968a 100644
--- a/src/parameters.jl
+++ b/src/parameters.jl
@@ -1,4 +1,4 @@
-export estimate_parameters, uniform_parameters
+export estimate_parameters, uniform_parameters, estimate_parameters_em, test
 
 using StatsFuns: logsumexp
 using CUDA
@@ -15,6 +15,11 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
     else
         estimate_parameters_cpu(bc, data, pseudocount)
     end
+    estimate_parameters_cached!(pc, bc, params)
+    params
+end
+
+function estimate_parameters_cached!(pc, bc, params)
     foreach_reset(pc) do pn
         if is⋁gate(pn)
             if num_children(pn) == 1
@@ -29,10 +34,10 @@ function estimate_parameters(pc::ProbCircuit, data; pseudocount::Float64)
             end
         end
     end
-    params
+    nothing
 end
 
-function estimate_parameters_cpu(bc, data, pseudocount)
+function estimate_parameters_cpu(bc::BitCircuit, data, pseudocount)
     # no need to synchronize, since each computation is unique to a decision node
     node_counts::Vector{UInt} = Vector{UInt}(undef, num_nodes(bc))
     log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
@@ -64,7 +69,7 @@ function estimate_parameters_cpu(bc, data, pseudocount)
     return log_params
 end
 
-function estimate_parameters_gpu(bc, data, pseudocount)
+function estimate_parameters_gpu(bc::BitCircuit, data, pseudocount)
     node_counts::CuVector{Int32} = CUDA.zeros(Int32, num_nodes(bc))
     edge_counts::CuVector{Int32} = CUDA.zeros(Int32, num_elements(bc))
     # need to manually cudaconvert closure variables
@@ -112,4 +117,51 @@ function uniform_parameters(pc::ProbCircuit)
     end
 end
 
-# TODO add em parameter learning 
\ No newline at end of file
+"""
+Expectation maximization parameter learning given missing data
+"""
+function estimate_parameters_em(pc::ProbCircuit, data; pseudocount::Float64)
+    pbc = ParamBitCircuit(pc, data; reset=false)
+    params = if isgpu(data)
+        estimate_parameters_gpu(to_gpu(pbc), data, pseudocount)
+    else
+        estimate_parameters_cpu(pbc, data, pseudocount)
+    end
+    estimate_parameters_cached!(pc, pbc.bitcircuit, params)
+    params
+end
+
+function estimate_parameters_cpu(pbc::ParamBitCircuit, data, pseudocount)
+    # no need to synchronize, since each computation is unique to a decision node
+    bc = pbc.bitcircuit
+    node_counts::Vector{Float64} = Vector{Float64}(undef, num_nodes(bc))
+    log_params::Vector{Float64} = Vector{Float64}(undef, num_elements(bc))
+
+    @inline function on_node(flows, values, dec_id)
+        sum_flows = map(1:size(flows,1)) do i
+            flows[i, dec_id]
+        end
+        node_counts[dec_id] = logsumexp(sum_flows)
+    end
+
+    @inline function estimate(element, decision, edge_count)
+        num_els = num_elements(bc.nodes, decision)
+        log_params[element] = 
+            log((exp(edge_count)+pseudocount/num_els) / (exp(node_counts[decision])+pseudocount))
+    end
+
+    @inline function on_edge(flows, values, prime, sub, element, grandpa, single_child)
+        θ = eltype(flows)(pbc.params[element])
+        if !single_child
+            edge_flows = map(1:size(flows,1)) do i
+                values[i, prime] + values[i, sub] - values[i, grandpa] + flows[i, grandpa] + θ
+            end
+            edge_count = logsumexp(edge_flows)
+            estimate(element, grandpa, edge_count)
+        end # no need to estimate single child params, they are always prob 1
+    end
+
+    v, f = marginal_flows(pbc, data; on_node, on_edge)
+
+    return log_params
+end
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index bf501823..e55e0669 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -190,8 +190,8 @@ function marginal_flows_down_layers(pbc::ParamBitCircuit, flows::Matrix, values:
             par_start = @inbounds circuit.nodes[3,dec_id]
             if iszero(par_start)
                 if dec_id == num_nodes(circuit)
-                    # populate root flow from values
-                    @inbounds @views @. flows[:, dec_id] = values[:, dec_id]
+                    # marginal flow start from 0.0
+                    @inbounds @views @. flows[:, dec_id] = 0.0
                 end
                 # no parents, ignore (can happen for false/true node and root)
             else
diff --git a/test/parameters_tests.jl b/test/parameters_tests.jl
index 650411a8..23a93078 100644
--- a/test/parameters_tests.jl
+++ b/test/parameters_tests.jl
@@ -27,4 +27,17 @@ using CUDA: CUDA
 
     end
 
+end
+
+@testset "EM tests" begin
+    data = DataFrame([true missing])
+    vtree2 = PlainVtree(2, :balanced)
+    pc = fully_factorized_circuit(StructProbCircuit, vtree2).children[1]
+    uniform_parameters(pc)
+    pc.children[1].prime.log_probs .= log.([0.3, 0.7])
+    pc.children[1].sub.log_probs .= log.([0.4, 0.6])
+    pbc = ParamBitCircuit(pc, data)
+    estimate_parameters_em(pc, data; pseudocount=0.0)
+    @test all(pc.children[1].prime.log_probs .== log.([1.0, 0.0]))
+    @test pc.children[1].sub.log_probs[1] .≈ log.([0.4, 0.6])[1] atol=1e-6
 end
\ No newline at end of file

From 3ed182dd0ce224b5967cacd7758ee5a70a78fbf2 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 00:11:05 -0500
Subject: [PATCH 102/131] reinstate `LoadSave` module

---
 src/ProbabilisticCircuits.jl                  |   5 +-
 src/queries/likelihood.jl                     |   2 +-
 src/queries/marginal_flow.jl                  |   4 +-
 src/queries/{queries.jl => sample.jl}         |  60 +----
 src/structured_prob_nodes.jl                  |  10 +-
 .../LoadSave/circuit_loaders_tests.jl         |   0
 .../circuit_savers_tests.jl}                  |   0
 test/broken/Probabilistic/queries_tests.jl    | 214 ------------------
 test/queries/likelihood_tests.jl              |  33 +++
 test/queries/marginal_flow_tests.jl           |  75 ++++++
 test/queries/sample_test.jl                   |  73 ++++++
 11 files changed, 199 insertions(+), 277 deletions(-)
 rename src/queries/{queries.jl => sample.jl} (50%)
 rename test/{broken => }/LoadSave/circuit_loaders_tests.jl (100%)
 rename test/{broken/LoadSave/circuit_savers_test.jl => LoadSave/circuit_savers_tests.jl} (100%)
 delete mode 100644 test/broken/Probabilistic/queries_tests.jl
 create mode 100644 test/queries/likelihood_tests.jl
 create mode 100644 test/queries/marginal_flow_tests.jl
 create mode 100644 test/queries/sample_test.jl

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 62e3fb4d..c77e0806 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -19,6 +19,7 @@ include("parameters.jl")
 
 include("queries/likelihood.jl")
 include("queries/marginal_flow.jl")
+include("queries/sample.jl")
 
 include("Logistic/Logistic.jl")
 @reexport using .Logistic
@@ -40,7 +41,7 @@ include("Logistic/Logistic.jl")
 # include("structurelearner/learner.jl")
 
 
-# include("LoadSave/LoadSave.jl")
-# @reexport using .LoadSave
+include("LoadSave/LoadSave.jl")
+@reexport using .LoadSave
 
 end
diff --git a/src/queries/likelihood.jl b/src/queries/likelihood.jl
index 9cb3d5fa..aeb8a174 100644
--- a/src/queries/likelihood.jl
+++ b/src/queries/likelihood.jl
@@ -69,7 +69,7 @@ end
 """
 Complete evidence queries
 """
-EVI = log_likelihood_per_instance
+const EVI = log_likelihood_per_instance
 
 """
 Compute the likelihood of the PC given the data
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index e55e0669..019cae0f 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -5,7 +5,7 @@ using DataFrames: DataFrame
 using LoopVectorization: @avx
 using LogicCircuits: balance_threads
 
-export marginal, marginal_all, marginal_flows, marginal_flows_down
+export marginal, MAR, marginal_all, marginal_flows, marginal_flows_down
 
 #####################
 # Circuit marginal evaluation
@@ -30,6 +30,8 @@ function marginal(circuit::ParamBitCircuit, data::DataFrame)::AbstractVector
     marginal_all(circuit,data)[:,end]
 end
 
+const MAR = marginal
+
 #####################
 # Circuit evaluation of *all* nodes in circuit
 #####################
diff --git a/src/queries/queries.jl b/src/queries/sample.jl
similarity index 50%
rename from src/queries/queries.jl
rename to src/queries/sample.jl
index e181dc53..21c9d125 100644
--- a/src/queries/queries.jl
+++ b/src/queries/sample.jl
@@ -1,67 +1,11 @@
-export MAR, marginal_log_likelihood_per_instance, 
-MPE, MAP, sample
-
-"""
-Marginal queries
-"""
-function marginal_log_likelihood_per_instance(pc::ProbCircuit, data)
-    evaluate_exp(pc, data)
-end
-MAR = marginal_log_likelihood_per_instance
-
-
-"""
-Most Probable Explanation (MPE), aka MAP
-"""
-@inline function MAP(pc::ProbCircuit, evidence)::BitMatrix
-    MPE(pc, evidence)
-end
-
-function MPE(pc::ProbCircuit, evidence)::BitMatrix
-    mlls = marginal_log_likelihood_per_instance(pc, evidence)
-    
-    ans = falses(num_examples(evidence), num_features(evidence))
-    active_samples = trues(num_examples(evidence))
-
-    function mpe_simulate(node::Union{PlainProbLiteralNode, StructProbLiteralNode}, active_samples::BitVector, result::BitMatrix)
-        if ispositive(node)
-            result[active_samples, variable(node)] .= 1
-        else
-            result[active_samples, variable(node)] .= 0
-        end
-    end
-    
-    function mpe_simulate(node::Union{PlainSumNode, StructSumNode}, active_samples::BitVector, result::BitMatrix)
-        prs = zeros(length(children(node)), size(active_samples)[1] )
-        @simd  for i=1:length(children(node))
-            prs[i,:] .= get_exp_upflow(children(node)[i]) .+ (node.log_probs[i])
-        end
-    
-        max_child_ids = [a[1] for a in argmax(prs, dims = 1) ]
-        @simd for i=1:length(children(node))
-            # Only active for this child if it was the max for that sample
-            ids = convert(BitVector, active_samples .* (max_child_ids .== i)[1,:])
-            mpe_simulate(children(node)[i], ids, result)
-        end
-    end
-    
-    function mpe_simulate(node::Union{PlainMulNode, StructMulNode}, active_samples::BitVector, result::BitMatrix)
-        for child in children(node)
-            mpe_simulate(child, active_samples, result)
-        end
-    end
-
-    mpe_simulate(pc, active_samples, ans)
-    ans
-end
-
+export sample
 
 ##################
 # Sampling from a psdd
 ##################
 
 """
-Sample from a PSDD without any evidence
+Sample from a PC without any evidence
 """
 function sample(circuit::ProbCircuit)::AbstractVector{Bool}
 
diff --git a/src/structured_prob_nodes.jl b/src/structured_prob_nodes.jl
index f88a1311..6fbfca38 100644
--- a/src/structured_prob_nodes.jl
+++ b/src/structured_prob_nodes.jl
@@ -109,16 +109,24 @@ end
 
 # claim `StructProbCircuit` as the default `ProbCircuit` implementation that has a vtree
 
+compile(::Type{ProbCircuit}, a1::Union{Vtree, StructLogicCircuit}, args...) =
+    compile(StructProbCircuit, a1, args...)
+
 compile(n::StructProbCircuit, args...) = 
     compile(typeof(n), root(vtree(n)), args...)
 
+compile(::Type{<:StructProbCircuit}, c::StructLogicCircuit) =
+    compile(StructProbCircuit, root(vtree(c)), c)
+
+compile(::Type{<:StructLogicCircuit}, c::StructProbCircuit) =
+    compile(StructLogicCircuit, root(vtree(c)), c)
+
 compile(::Type{<:StructProbCircuit}, ::Vtree, ::Bool) =
     error("Probabilistic circuits do not have constant leafs.")
 
 compile(::Type{<:StructProbCircuit}, vtree::Vtree, l::Lit) =
     StructProbLiteralNode(l,find_leaf(lit2var(l),vtree))
 
-
 function compile(::Type{<:StructProbCircuit}, vtree::Vtree, circuit::LogicCircuit)
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
     f_lit(n) = compile(StructProbCircuit, vtree, literal(n))
diff --git a/test/broken/LoadSave/circuit_loaders_tests.jl b/test/LoadSave/circuit_loaders_tests.jl
similarity index 100%
rename from test/broken/LoadSave/circuit_loaders_tests.jl
rename to test/LoadSave/circuit_loaders_tests.jl
diff --git a/test/broken/LoadSave/circuit_savers_test.jl b/test/LoadSave/circuit_savers_tests.jl
similarity index 100%
rename from test/broken/LoadSave/circuit_savers_test.jl
rename to test/LoadSave/circuit_savers_tests.jl
diff --git a/test/broken/Probabilistic/queries_tests.jl b/test/broken/Probabilistic/queries_tests.jl
deleted file mode 100644
index 3e1af1f9..00000000
--- a/test/broken/Probabilistic/queries_tests.jl
+++ /dev/null
@@ -1,214 +0,0 @@
-#TODO: reinstate
-
-# using Test
-# using LogicCircuits
-# using ProbabilisticCircuits
-
-# @testset "Probability of Full Evidence" begin
-#     # Uses a PSDD with 4 variables, and tests 3 of the configurations to
-#     # match with python. Also tests all probabilities sum up to 1.
-
-#     EPS = 1e-7;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-#     @test prob_circuit isa ProbCircuit;
-
-#     # Step 1. Check Probabilities for 3 samples
-#     data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
-#     true_prob = [0.07; 0.03; 0.13999999999999999]
-
-#     calc_prob = log_likelihood_per_instance(prob_circuit, data)
-#     calc_prob = exp.(calc_prob)
-
-#     for i = 1:3
-#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
-#     end
-
-#     # Step 2. Add up all probabilities and see if they add up to one
-#     N = 4;
-#     data_all = generate_data_all(N)
-
-#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all)
-#     calc_prob_all = exp.(calc_prob_all)
-#     sum_prob_all = sum(calc_prob_all)
-
-#     @test 1 ≈ sum_prob_all atol = EPS;
-# end
-
-# @testset "Probability of partial Evidence (marginals)" begin
-#     EPS = 1e-7;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-
-#     data = Int8.([0 0 0 0; 0 1 1 0; 0 0 1 1;
-#                 0 0 0 -1; -1 1 0 -1; -1 -1 -1 -1; 0 -1 -1 -1])
-#     true_prob = [0.07; 0.03; 0.13999999999999999;
-#                     0.3499999999999; 0.1; 1.0; 0.8]
-
-#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data)
-#     calc_prob = exp.(calc_prob)
-
-#     for i = 1:length(true_prob)
-#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
-#     end
-# end
-
-# @testset "Marginal Pass Down" begin
-#     EPS = 1e-7;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-#     logic_circuit = PlainLogicCircuit(prob_circuit)
-
-#     N = 4
-#     data_full = Bool.(generate_data_all(N))
-
-#     # Comparing with down pass with fully obeserved data
-#     compute_flows(logic_circuit, data_full)
-#     compute_exp_flows(prob_circuit, data_full)
-
-#     lin_prob = linearize(prob_circuit)
-#     lin_logic = linearize(logic_circuit)
-#     for i in 1 : length(lin_prob)
-#         pn = lin_prob[i]
-#         ln = lin_logic[i]
-#         @test all(isapprox.(exp.(get_exp_downflow(pn; root=prob_circuit)), 
-#             get_downflow(ln; root=logic_circuit), atol=EPS))
-#     end
-
-#     # Validating one example with missing features done by hand
-#     data_partial = Int8.([-1 1 -1 1])
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-#     compute_exp_flows(prob_circuit, data_partial)
-
-#     # (node index, correct down_flow_value)
-#     true_vals = [(1, 0.5),
-#                 (2, 1.0),
-#                 (3, 0.5),
-#                 (4, 0.0),
-#                 (5, 0.0),
-#                 (6, 0.5),
-#                 (7, 0.5),
-#                 (8, 0.0),
-#                 (9, 1.0),
-#                 (10, 1/3),
-#                 (11, 1),
-#                 (12, 1/3),
-#                 (13, 0.0),
-#                 (14, 0.0),
-#                 (15, 2/3),
-#                 (16, 2/3),
-#                 (17, 0.0),
-#                 (18, 1.0),
-#                 (19, 1.0),
-#                 (20, 1.0)]
-#     lin = linearize(prob_circuit)
-    
-#     for ind_val in true_vals
-#         @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
-#     end
-# end
-
-# function test_mpe_brute_force(prob_circuit, evidence)
-#     EPS = 1e-9;
-#     result = MPE(prob_circuit, evidence);
-#     for idx = 1 : num_examples(evidence)
-#         marg = generate_all(evidence[idx,:])
-#         lls = log_likelihood_per_instance(prob_circuit, marg);
-#         brute_mpe = marg[argmax(lls), :]
-
-#         # Compare and validate p(result[idx]) == p(brute_mpe)
-#         comp_data = vcat(result[idx,:]',  brute_mpe')
-#         lls2 = log_likelihood_per_instance(prob_circuit, comp_data);
-
-#         @test lls2[1] ≈ lls2[2] atol= EPS
-#     end
-# end
-
-# @testset "MPE Brute Force Test Small (4 var)" begin
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-#     evidence = Int8.( [-1 0 0 0;
-#                                 0 -1 -1 0;
-#                                 1 1 1 -1;
-#                                 1 0 1 0;
-#                                 -1 -1 -1 1;
-#                                 -1 -1 -1 -1] )
-
-#     test_mpe_brute_force(prob_circuit, evidence)
-
-# end
-
-# @testset "MPE Brute Force Test Big (15 var)" begin
-#     N = 15
-#     COUNT = 10
-
-#     prob_circuit = zoo_psdd("exp-D15-N1000-C4.psdd");
-#     evidence = Int8.(rand( (-1,0,1), (COUNT, N)))
-
-#     test_mpe_brute_force(prob_circuit, evidence)
-# end
-
-# @testset "Sampling Test" begin
-#     EPS = 1e-2;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-
-#     N = 4;
-#     data_all = generate_data_all(N);
-
-#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all);
-#     calc_prob_all = exp.(calc_prob_all);
-
-#     using DataStructures
-#     hist = DefaultDict{AbstractString,Float64}(0.0)
-
-#     Nsamples = 1000 * 1000
-#     for i = 1:Nsamples
-#         cur = join(Int.(sample(prob_circuit)))
-#         hist[cur] += 1
-#     end
-
-#     for k in keys(hist)
-#         hist[k] /= Nsamples
-#     end
-
-#     for k in keys(hist)
-#         cur = parse(Int32, k, base=2) + 1 # cause Julia arrays start at 1 :(
-#         @test calc_prob_all[cur] ≈ hist[k] atol= EPS;
-#     end
-
-
-# end
-
-# using DataStructures
-# @testset "Sampling With Evidence" begin
-#     # TODO (pashak) this test should be improved by adding few more cases
-#     EPS = 1e-2;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-
-#     N = 4;
-#     data = Int8.([0 -1 0 -1])
-#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data);
-#     calc_prob = exp.(calc_prob);
-
-#     data_all = Int8.([0 0 0 0;
-#                     0 0 0 1;
-#                     0 1 0 0;
-#                     0 1 0 1;]);
-#     calc_prob_all = marginal_log_likelihood_per_instance(prob_circuit, data_all);
-#     calc_prob_all = exp.(calc_prob_all);
-
-#     calc_prob_all ./= calc_prob[1]
-
-#     hist = DefaultDict{AbstractString,Float64}(0.0)
-
-#     Nsamples = 1000 * 1000
-#     for i = 1:Nsamples
-#         cur = join(Int.(sample(prob_circuit, data)))
-#         hist[cur] += 1
-#     end
-
-#     for k in keys(hist)
-#         hist[k] /= Nsamples
-#     end
-
-#     for ind = 1:4
-#         cur = join(data_all[ind, :])
-#         @test calc_prob_all[ind] ≈ hist[cur] atol= EPS;
-#     end
-# end
\ No newline at end of file
diff --git a/test/queries/likelihood_tests.jl b/test/queries/likelihood_tests.jl
new file mode 100644
index 00000000..f3777eb1
--- /dev/null
+++ b/test/queries/likelihood_tests.jl
@@ -0,0 +1,33 @@
+# using Test
+# using LogicCircuits
+# using ProbabilisticCircuits
+
+# @testset "Likelihood" begin
+#     # Uses a PC with 4 variables, and tests 3 of the configurations to
+#     # match with python. Also tests all probabilities sum up to 1.
+
+#     EPS = 1e-7;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+#     @test prob_circuit isa ProbCircuit;
+
+#     # Step 1. Check Probabilities for 3 samples
+#     data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
+#     true_prob = [0.07; 0.03; 0.13999999999999999]
+
+#     calc_prob = log_likelihood_per_instance(prob_circuit, data)
+#     calc_prob = exp.(calc_prob)
+
+#     for i = 1:3
+#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
+#     end
+
+#     # Step 2. Add up all probabilities and see if they add up to one
+#     N = 4;
+#     data_all = generate_data_all(N)
+
+#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all)
+#     calc_prob_all = exp.(calc_prob_all)
+#     sum_prob_all = sum(calc_prob_all)
+
+#     @test 1 ≈ sum_prob_all atol = EPS;
+# end
\ No newline at end of file
diff --git a/test/queries/marginal_flow_tests.jl b/test/queries/marginal_flow_tests.jl
new file mode 100644
index 00000000..257fe4a6
--- /dev/null
+++ b/test/queries/marginal_flow_tests.jl
@@ -0,0 +1,75 @@
+# using Test
+# using LogicCircuits
+# using ProbabilisticCircuits
+
+# @testset "Probability of partial Evidence (marginals)" begin
+#     EPS = 1e-7;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+
+#     data = Int8.([0 0 0 0; 0 1 1 0; 0 0 1 1;
+#                 0 0 0 -1; -1 1 0 -1; -1 -1 -1 -1; 0 -1 -1 -1])
+#     true_prob = [0.07; 0.03; 0.13999999999999999;
+#                     0.3499999999999; 0.1; 1.0; 0.8]
+
+#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data)
+#     calc_prob = exp.(calc_prob)
+
+#     for i = 1:length(true_prob)
+#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
+#     end
+# end
+
+# @testset "Marginal Pass Down" begin
+#     EPS = 1e-7;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+#     logic_circuit = PlainLogicCircuit(prob_circuit)
+
+#     N = 4
+#     data_full = Bool.(generate_data_all(N))
+
+#     # Comparing with down pass with fully obeserved data
+#     compute_flows(logic_circuit, data_full)
+#     compute_exp_flows(prob_circuit, data_full)
+
+#     lin_prob = linearize(prob_circuit)
+#     lin_logic = linearize(logic_circuit)
+#     for i in 1 : length(lin_prob)
+#         pn = lin_prob[i]
+#         ln = lin_logic[i]
+#         @test all(isapprox.(exp.(get_exp_downflow(pn; root=prob_circuit)), 
+#             get_downflow(ln; root=logic_circuit), atol=EPS))
+#     end
+
+#     # Validating one example with missing features done by hand
+#     data_partial = Int8.([-1 1 -1 1])
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+#     compute_exp_flows(prob_circuit, data_partial)
+
+#     # (node index, correct down_flow_value)
+#     true_vals = [(1, 0.5),
+#                 (2, 1.0),
+#                 (3, 0.5),
+#                 (4, 0.0),
+#                 (5, 0.0),
+#                 (6, 0.5),
+#                 (7, 0.5),
+#                 (8, 0.0),
+#                 (9, 1.0),
+#                 (10, 1/3),
+#                 (11, 1),
+#                 (12, 1/3),
+#                 (13, 0.0),
+#                 (14, 0.0),
+#                 (15, 2/3),
+#                 (16, 2/3),
+#                 (17, 0.0),
+#                 (18, 1.0),
+#                 (19, 1.0),
+#                 (20, 1.0)]
+#     lin = linearize(prob_circuit)
+    
+#     for ind_val in true_vals
+#         @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
+#     end
+# end
+
diff --git a/test/queries/sample_test.jl b/test/queries/sample_test.jl
new file mode 100644
index 00000000..3b44c9c9
--- /dev/null
+++ b/test/queries/sample_test.jl
@@ -0,0 +1,73 @@
+# using Test
+# using LogicCircuits
+# using ProbabilisticCircuits
+
+
+# @testset "Sampling Test" begin
+#     EPS = 1e-2;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+
+#     N = 4;
+#     data_all = generate_data_all(N);
+
+#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all);
+#     calc_prob_all = exp.(calc_prob_all);
+
+#     using DataStructures
+#     hist = DefaultDict{AbstractString,Float64}(0.0)
+
+#     Nsamples = 1000 * 1000
+#     for i = 1:Nsamples
+#         cur = join(Int.(sample(prob_circuit)))
+#         hist[cur] += 1
+#     end
+
+#     for k in keys(hist)
+#         hist[k] /= Nsamples
+#     end
+
+#     for k in keys(hist)
+#         cur = parse(Int32, k, base=2) + 1 # cause Julia arrays start at 1 :(
+#         @test calc_prob_all[cur] ≈ hist[k] atol= EPS;
+#     end
+
+
+# end
+
+# using DataStructures
+# @testset "Sampling With Evidence" begin
+#     # TODO (pashak) this test should be improved by adding few more cases
+#     EPS = 1e-2;
+#     prob_circuit = zoo_psdd("little_4var.psdd");
+
+#     N = 4;
+#     data = Int8.([0 -1 0 -1])
+#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data);
+#     calc_prob = exp.(calc_prob);
+
+#     data_all = Int8.([0 0 0 0;
+#                     0 0 0 1;
+#                     0 1 0 0;
+#                     0 1 0 1;]);
+#     calc_prob_all = marginal_log_likelihood_per_instance(prob_circuit, data_all);
+#     calc_prob_all = exp.(calc_prob_all);
+
+#     calc_prob_all ./= calc_prob[1]
+
+#     hist = DefaultDict{AbstractString,Float64}(0.0)
+
+#     Nsamples = 1000 * 1000
+#     for i = 1:Nsamples
+#         cur = join(Int.(sample(prob_circuit, data)))
+#         hist[cur] += 1
+#     end
+
+#     for k in keys(hist)
+#         hist[k] /= Nsamples
+#     end
+
+#     for ind = 1:4
+#         cur = join(data_all[ind, :])
+#         @test calc_prob_all[ind] ≈ hist[cur] atol= EPS;
+#     end
+# end
\ No newline at end of file

From 158b31d0e39cd41b741e1a32b1233582c67f59ae Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 00:46:45 -0500
Subject: [PATCH 103/131] likelihood and marginal tests

---
 src/Utils/misc.jl                   |  6 ++--
 test/queries/likelihood_tests.jl    | 51 +++++++++++++++--------------
 test/queries/marginal_flow_tests.jl | 41 +++++++++++++----------
 test/queries/sample_test.jl         | 10 +++---
 4 files changed, 57 insertions(+), 51 deletions(-)

diff --git a/src/Utils/misc.jl b/src/Utils/misc.jl
index 642ba70e..abea1c69 100644
--- a/src/Utils/misc.jl
+++ b/src/Utils/misc.jl
@@ -37,8 +37,8 @@ end
 """
 Given some missing values generates all possible fillings
 """
-function generate_all(row::Array{Int8})
-    miss_count = count(row .== -1)
+function generate_all(row::Vector)
+    miss_count = count(ismissing, row)
     lits = length(row)
     result = Bool.(zeros(1 << miss_count, lits))
 
@@ -51,7 +51,7 @@ function generate_all(row::Array{Int8})
             result[mask+1,:] = cur
         end
     end
-    result
+    DataFrame(result)
 end
 
 """
diff --git a/test/queries/likelihood_tests.jl b/test/queries/likelihood_tests.jl
index f3777eb1..23a03f1e 100644
--- a/test/queries/likelihood_tests.jl
+++ b/test/queries/likelihood_tests.jl
@@ -1,33 +1,34 @@
-# using Test
-# using LogicCircuits
-# using ProbabilisticCircuits
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+using DataFrames: DataFrame
 
-# @testset "Likelihood" begin
-#     # Uses a PC with 4 variables, and tests 3 of the configurations to
-#     # match with python. Also tests all probabilities sum up to 1.
+@testset "Likelihood" begin
+    # Uses a PC with 4 variables, and tests 3 of the configurations to
+    # match with python. Also tests all probabilities sum up to 1.
 
-#     EPS = 1e-7;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-#     @test prob_circuit isa ProbCircuit;
+    EPS = 1e-7;
+    prob_circuit = zoo_psdd("little_4var.psdd");
+    @test prob_circuit isa ProbCircuit;
 
-#     # Step 1. Check Probabilities for 3 samples
-#     data = Bool.([0 0 0 0; 0 1 1 0; 0 0 1 1]);
-#     true_prob = [0.07; 0.03; 0.13999999999999999]
+    # Step 1. Check Probabilities for 3 samples
+    data = DataFrame(BitArray([0 0 0 0; 0 1 1 0; 0 0 1 1]));
+    true_prob = [0.07; 0.03; 0.13999999999999999]
 
-#     calc_prob = log_likelihood_per_instance(prob_circuit, data)
-#     calc_prob = exp.(calc_prob)
+    calc_prob = EVI(prob_circuit, data)
+    calc_prob = exp.(calc_prob)
 
-#     for i = 1:3
-#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
-#     end
+    for i = 1:3
+        @test true_prob[i] ≈ calc_prob[i] atol= EPS;
+    end
 
-#     # Step 2. Add up all probabilities and see if they add up to one
-#     N = 4;
-#     data_all = generate_data_all(N)
+    # Step 2. Add up all probabilities and see if they add up to one
+    N = 4;
+    data_all = generate_data_all(N)
 
-#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all)
-#     calc_prob_all = exp.(calc_prob_all)
-#     sum_prob_all = sum(calc_prob_all)
+    calc_prob_all = EVI(prob_circuit, data_all)
+    calc_prob_all = exp.(calc_prob_all)
+    sum_prob_all = sum(calc_prob_all)
 
-#     @test 1 ≈ sum_prob_all atol = EPS;
-# end
\ No newline at end of file
+    @test 1 ≈ sum_prob_all atol = EPS;
+end
\ No newline at end of file
diff --git a/test/queries/marginal_flow_tests.jl b/test/queries/marginal_flow_tests.jl
index 257fe4a6..3032490e 100644
--- a/test/queries/marginal_flow_tests.jl
+++ b/test/queries/marginal_flow_tests.jl
@@ -1,33 +1,38 @@
-# using Test
-# using LogicCircuits
-# using ProbabilisticCircuits
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
 
-# @testset "Probability of partial Evidence (marginals)" begin
-#     EPS = 1e-7;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
+@testset "Probability of partial Evidence (marginals)" begin
+    EPS = 1e-7;
+    prob_circuit = zoo_psdd("little_4var.psdd");
 
-#     data = Int8.([0 0 0 0; 0 1 1 0; 0 0 1 1;
-#                 0 0 0 -1; -1 1 0 -1; -1 -1 -1 -1; 0 -1 -1 -1])
-#     true_prob = [0.07; 0.03; 0.13999999999999999;
-#                     0.3499999999999; 0.1; 1.0; 0.8]
+    data = DataFrame([false false false false; 
+                      false true true false; 
+                      false false true true;
+                      false false false missing; 
+                      missing true false missing; 
+                      missing missing missing missing; 
+                      false missing missing missing])
+    true_prob = [0.07; 0.03; 0.13999999999999999;
+                    0.3499999999999; 0.1; 1.0; 0.8]
 
-#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data)
-#     calc_prob = exp.(calc_prob)
+    calc_prob = MAR(prob_circuit, data)
+    calc_prob = exp.(calc_prob)
 
-#     for i = 1:length(true_prob)
-#         @test true_prob[i] ≈ calc_prob[i] atol= EPS;
-#     end
-# end
+    for i = 1:length(true_prob)
+        @test true_prob[i] ≈ calc_prob[i] atol= EPS;
+    end
+end
 
 # @testset "Marginal Pass Down" begin
 #     EPS = 1e-7;
 #     prob_circuit = zoo_psdd("little_4var.psdd");
-#     logic_circuit = PlainLogicCircuit(prob_circuit)
 
 #     N = 4
-#     data_full = Bool.(generate_data_all(N))
+#     data_full = generate_data_all(N)
 
 #     # Comparing with down pass with fully obeserved data
+
 #     compute_flows(logic_circuit, data_full)
 #     compute_exp_flows(prob_circuit, data_full)
 
diff --git a/test/queries/sample_test.jl b/test/queries/sample_test.jl
index 3b44c9c9..bdd19212 100644
--- a/test/queries/sample_test.jl
+++ b/test/queries/sample_test.jl
@@ -10,7 +10,7 @@
 #     N = 4;
 #     data_all = generate_data_all(N);
 
-#     calc_prob_all = log_likelihood_per_instance(prob_circuit, data_all);
+#     calc_prob_all = EVI(prob_circuit, data_all);
 #     calc_prob_all = exp.(calc_prob_all);
 
 #     using DataStructures
@@ -42,14 +42,14 @@
 
 #     N = 4;
 #     data = Int8.([0 -1 0 -1])
-#     calc_prob = marginal_log_likelihood_per_instance(prob_circuit, data);
+#     calc_prob = MAR(prob_circuit, data);
 #     calc_prob = exp.(calc_prob);
 
-#     data_all = Int8.([0 0 0 0;
+#     data_all = DataFrame(BitArray([0 0 0 0;
 #                     0 0 0 1;
 #                     0 1 0 0;
-#                     0 1 0 1;]);
-#     calc_prob_all = marginal_log_likelihood_per_instance(prob_circuit, data_all);
+#                     0 1 0 1;]));
+#     calc_prob_all = MAR(prob_circuit, data_all);
 #     calc_prob_all = exp.(calc_prob_all);
 
 #     calc_prob_all ./= calc_prob[1]

From cc1938caf849c1420cc3e787ac4fef2269a94ded Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 03:05:55 -0500
Subject: [PATCH 104/131] more serious tests for marginals

---
 src/queries/marginal_flow.jl        |   9 +-
 test/queries/marginal_flow_tests.jl | 147 +++++++++++++++++-----------
 2 files changed, 94 insertions(+), 62 deletions(-)

diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index 019cae0f..2a200a05 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -37,6 +37,9 @@ const MAR = marginal
 #####################
 
 "Evaluate the probabilistic circuit bottom-up for a given input and return the marginal probability value of all nodes"
+marginal_all(circuit::ProbCircuit, data::DataFrame) =
+    marginal_all(same_device(ParamBitCircuit(circuit, data), data) , data)
+
 function marginal_all(circuit::ParamBitCircuit, data, reuse=nothing)
     @assert num_features(data) == num_features(circuit) 
     @assert isbinarydata(data)
@@ -193,7 +196,7 @@ function marginal_flows_down_layers(pbc::ParamBitCircuit, flows::Matrix, values:
             if iszero(par_start)
                 if dec_id == num_nodes(circuit)
                     # marginal flow start from 0.0
-                    @inbounds @views @. flows[:, dec_id] = 0.0
+                    @inbounds @views flows[:, dec_id] .= zero(eltype(flows))
                 end
                 # no parents, ignore (can happen for false/true node and root)
             else
@@ -283,8 +286,8 @@ function marginal_flows_down_layers_cuda(layer, nodes, elements, parents, params
         for i = index_y:stride_y:length(layer)
             dec_id = @inbounds layer[i]
             if dec_id == size(nodes,2)
-                # populate root flow from values
-                flow = values[k, dec_id]
+                # populate root flows
+                flow = zero(eltype(flows))
             else
                 par_start = @inbounds nodes[3,dec_id]
                 flow = typemin(eltype(flows)) # log(0)
diff --git a/test/queries/marginal_flow_tests.jl b/test/queries/marginal_flow_tests.jl
index 3032490e..573727cd 100644
--- a/test/queries/marginal_flow_tests.jl
+++ b/test/queries/marginal_flow_tests.jl
@@ -1,12 +1,17 @@
 using Test
 using LogicCircuits
 using ProbabilisticCircuits
+using DataFrames: DataFrame
+using CUDA
 
-@testset "Probability of partial Evidence (marginals)" begin
-    EPS = 1e-7;
+function cpu_gpu_agree(f, data; atol=1e-7)
+    CUDA.functional() && @test f(data) ≈ to_cpu(f(to_gpu(data))) atol=atol
+end
+
+@testset "Marginals" begin
     prob_circuit = zoo_psdd("little_4var.psdd");
 
-    data = DataFrame([false false false false; 
+    data_marg = DataFrame([false false false false; 
                       false true true false; 
                       false false true true;
                       false false false missing; 
@@ -16,65 +21,89 @@ using ProbabilisticCircuits
     true_prob = [0.07; 0.03; 0.13999999999999999;
                     0.3499999999999; 0.1; 1.0; 0.8]
 
-    calc_prob = MAR(prob_circuit, data)
-    calc_prob = exp.(calc_prob)
+    calc_prob = exp.(MAR(prob_circuit, data_marg))
+    @test true_prob ≈ calc_prob atol=1e-7
+
+    cpu_gpu_agree(data_marg) do d 
+        marginal_all(prob_circuit, d)
+    end
+
+    function test_complete_mar(data)
+        r1 = EVI(prob_circuit, data)
+        r2 = MAR(prob_circuit, data)
+        @test r1 ≈ r2 atol=1e-6
+    end
+
+    data_full = generate_data_all(num_variables(prob_circuit))
+    
+    test_complete_mar(data_full)
+    CUDA.functional() && test_complete_mar(to_gpu(data_full))
 
-    for i = 1:length(true_prob)
-        @test true_prob[i] ≈ calc_prob[i] atol= EPS;
+    cpu_gpu_agree(data_full) do d 
+        marginal_all(prob_circuit, d)
     end
+
 end
 
-# @testset "Marginal Pass Down" begin
-#     EPS = 1e-7;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-
-#     N = 4
-#     data_full = generate_data_all(N)
-
-#     # Comparing with down pass with fully obeserved data
-
-#     compute_flows(logic_circuit, data_full)
-#     compute_exp_flows(prob_circuit, data_full)
-
-#     lin_prob = linearize(prob_circuit)
-#     lin_logic = linearize(logic_circuit)
-#     for i in 1 : length(lin_prob)
-#         pn = lin_prob[i]
-#         ln = lin_logic[i]
-#         @test all(isapprox.(exp.(get_exp_downflow(pn; root=prob_circuit)), 
-#             get_downflow(ln; root=logic_circuit), atol=EPS))
-#     end
-
-#     # Validating one example with missing features done by hand
-#     data_partial = Int8.([-1 1 -1 1])
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-#     compute_exp_flows(prob_circuit, data_partial)
-
-#     # (node index, correct down_flow_value)
-#     true_vals = [(1, 0.5),
-#                 (2, 1.0),
-#                 (3, 0.5),
-#                 (4, 0.0),
-#                 (5, 0.0),
-#                 (6, 0.5),
-#                 (7, 0.5),
-#                 (8, 0.0),
-#                 (9, 1.0),
-#                 (10, 1/3),
-#                 (11, 1),
-#                 (12, 1/3),
-#                 (13, 0.0),
-#                 (14, 0.0),
-#                 (15, 2/3),
-#                 (16, 2/3),
-#                 (17, 0.0),
-#                 (18, 1.0),
-#                 (19, 1.0),
-#                 (20, 1.0)]
-#     lin = linearize(prob_circuit)
+@testset "Marginal flows" begin
     
-#     for ind_val in true_vals
-#         @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
-#     end
-# end
+    prob_circuit = zoo_psdd("little_4var.psdd");
+
+    function test_flows(data)
+        # Comparing with down pass with fully observed data
+
+        _, f1 = satisfies_flows(prob_circuit, Float64.(data))
+        _, f2 = marginal_flows(prob_circuit, data)
+
+        # note: while downward pass flows should be the same, 
+        # the upward pass is *not* supposed to be the same (parameters used vs not)
+        
+        f1 = to_cpu(f1[:,3:end]) # ignore true and false leaf
+        f2 = to_cpu(f2[:,3:end]) # ignore true and false leaf
+
+        @test f1 ≈ exp.(f2) atol=1e-6
+    end
+
+    data_full = generate_data_all(num_variables(prob_circuit))
+    
+    test_flows(data_full)
+    CUDA.functional() && test_flows(to_gpu(data_full))
+    
+    cpu_gpu_agree(data_full) do d 
+        _, f = marginal_flows(prob_circuit, d)
+        f[:,3:end] # ignore true and false leaf
+    end
+
+    # # Validating one example with missing features done by hand
+    # data_partial = Int8.([-1 1 -1 1])
+    # prob_circuit = zoo_psdd("little_4var.psdd");
+    # compute_exp_flows(prob_circuit, data_partial)
+
+    # # (node index, correct down_flow_value)
+    # true_vals = [(1, 0.5),
+    #             (2, 1.0),
+    #             (3, 0.5),
+    #             (4, 0.0),
+    #             (5, 0.0),
+    #             (6, 0.5),
+    #             (7, 0.5),
+    #             (8, 0.0),
+    #             (9, 1.0),
+    #             (10, 1/3),
+    #             (11, 1),
+    #             (12, 1/3),
+    #             (13, 0.0),
+    #             (14, 0.0),
+    #             (15, 2/3),
+    #             (16, 2/3),
+    #             (17, 0.0),
+    #             (18, 1.0),
+    #             (19, 1.0),
+    #             (20, 1.0)]
+    # lin = linearize(prob_circuit)
+    
+    # for ind_val in true_vals
+    #     @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
+    # end
+end
 

From bd7e5cb259be5dd5a443433bfd7f738b66669e30 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 03:13:43 -0500
Subject: [PATCH 105/131] more marginal flow tests

---
 test/queries/marginal_flow_tests.jl | 50 +++++++++++------------------
 1 file changed, 19 insertions(+), 31 deletions(-)

diff --git a/test/queries/marginal_flow_tests.jl b/test/queries/marginal_flow_tests.jl
index 573727cd..54705ae3 100644
--- a/test/queries/marginal_flow_tests.jl
+++ b/test/queries/marginal_flow_tests.jl
@@ -74,36 +74,24 @@ end
         f[:,3:end] # ignore true and false leaf
     end
 
-    # # Validating one example with missing features done by hand
-    # data_partial = Int8.([-1 1 -1 1])
-    # prob_circuit = zoo_psdd("little_4var.psdd");
-    # compute_exp_flows(prob_circuit, data_partial)
-
-    # # (node index, correct down_flow_value)
-    # true_vals = [(1, 0.5),
-    #             (2, 1.0),
-    #             (3, 0.5),
-    #             (4, 0.0),
-    #             (5, 0.0),
-    #             (6, 0.5),
-    #             (7, 0.5),
-    #             (8, 0.0),
-    #             (9, 1.0),
-    #             (10, 1/3),
-    #             (11, 1),
-    #             (12, 1/3),
-    #             (13, 0.0),
-    #             (14, 0.0),
-    #             (15, 2/3),
-    #             (16, 2/3),
-    #             (17, 0.0),
-    #             (18, 1.0),
-    #             (19, 1.0),
-    #             (20, 1.0)]
-    # lin = linearize(prob_circuit)
-    
-    # for ind_val in true_vals
-    #     @test exp(get_exp_downflow(lin[ind_val[1]]; root=prob_circuit)[1]) ≈ ind_val[2] atol= EPS
-    # end
+    # Validating one example with missing features done by hand
+    data_partial = DataFrame([missing true missing true;])
+    prob_circuit = zoo_psdd("little_4var.psdd");
+    _, f = marginal_flows(prob_circuit, data_partial)
+    f = exp.(f)
+
+    @test f[end] ≈ 1.0
+    @test f[end-1] ≈ 1.0
+    @test f[end-2] ≈ 1.0
+    @test f[end-4] ≈ 2/3
+    @test f[end-5] ≈ 0.0 atol=1e-7
+    @test f[end-6] ≈ 1/2
+    @test f[end-7] ≈ 1.0
+    @test f[end-8] ≈ 1/3
+    @test f[end-9] ≈ 1
+    @test f[end-10] ≈ 1/2
+
+    # correctness on gpu by transitivy with above test
+
 end
 

From 13e490e3e4e7cf5d8b1aedaea88ff228baea9c9f Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 03:25:54 -0500
Subject: [PATCH 106/131] likelihood tests gpu

---
 test/helper/gpu.jl                  |  4 ++++
 test/queries/likelihood_tests.jl    | 14 +++++++++-----
 test/queries/marginal_flow_tests.jl |  4 +---
 3 files changed, 14 insertions(+), 8 deletions(-)
 create mode 100644 test/helper/gpu.jl

diff --git a/test/helper/gpu.jl b/test/helper/gpu.jl
new file mode 100644
index 00000000..0b3cd75d
--- /dev/null
+++ b/test/helper/gpu.jl
@@ -0,0 +1,4 @@
+
+function cpu_gpu_agree(f, data; atol=1e-7)
+    CUDA.functional() && @test f(data) ≈ to_cpu(f(to_gpu(data))) atol=atol
+end
\ No newline at end of file
diff --git a/test/queries/likelihood_tests.jl b/test/queries/likelihood_tests.jl
index 23a03f1e..4ef2afba 100644
--- a/test/queries/likelihood_tests.jl
+++ b/test/queries/likelihood_tests.jl
@@ -3,11 +3,12 @@ using LogicCircuits
 using ProbabilisticCircuits
 using DataFrames: DataFrame
 
+include("../helper/gpu.jl")
+
 @testset "Likelihood" begin
     # Uses a PC with 4 variables, and tests 3 of the configurations to
     # match with python. Also tests all probabilities sum up to 1.
 
-    EPS = 1e-7;
     prob_circuit = zoo_psdd("little_4var.psdd");
     @test prob_circuit isa ProbCircuit;
 
@@ -18,9 +19,7 @@ using DataFrames: DataFrame
     calc_prob = EVI(prob_circuit, data)
     calc_prob = exp.(calc_prob)
 
-    for i = 1:3
-        @test true_prob[i] ≈ calc_prob[i] atol= EPS;
-    end
+    @test true_prob ≈ calc_prob atol=1e-7;
 
     # Step 2. Add up all probabilities and see if they add up to one
     N = 4;
@@ -30,5 +29,10 @@ using DataFrames: DataFrame
     calc_prob_all = exp.(calc_prob_all)
     sum_prob_all = sum(calc_prob_all)
 
-    @test 1 ≈ sum_prob_all atol = EPS;
+    @test 1 ≈ sum_prob_all atol = 1e-7;
+
+    cpu_gpu_agree(data_all) do d 
+        EVI(prob_circuit, d)
+    end
+    
 end
\ No newline at end of file
diff --git a/test/queries/marginal_flow_tests.jl b/test/queries/marginal_flow_tests.jl
index 54705ae3..0207cee5 100644
--- a/test/queries/marginal_flow_tests.jl
+++ b/test/queries/marginal_flow_tests.jl
@@ -4,9 +4,7 @@ using ProbabilisticCircuits
 using DataFrames: DataFrame
 using CUDA
 
-function cpu_gpu_agree(f, data; atol=1e-7)
-    CUDA.functional() && @test f(data) ≈ to_cpu(f(to_gpu(data))) atol=atol
-end
+include("../helper/gpu.jl")
 
 @testset "Marginals" begin
     prob_circuit = zoo_psdd("little_4var.psdd");

From 9266c9b134170e1e024929464175979ab13ebd15 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 13:44:32 -0500
Subject: [PATCH 107/131] cleanup of sampling

---
 src/logistic_nodes.jl       |  1 -
 src/queries/sample.jl       | 63 +++++++--------------------
 test/helper/gpu.jl          |  1 +
 test/queries/sample_test.jl | 87 ++++++++++---------------------------
 4 files changed, 38 insertions(+), 114 deletions(-)

diff --git a/src/logistic_nodes.jl b/src/logistic_nodes.jl
index 158bb685..cb7a2075 100644
--- a/src/logistic_nodes.jl
+++ b/src/logistic_nodes.jl
@@ -75,7 +75,6 @@ import LogicCircuits: children # make available for extension
 @inline children(n::LogisticInnerNode) = n.children
 @inline num_classes(n::Logistic⋁Node) = size(n.thetas)[2]
 
-import ..Utils: num_parameters
 @inline num_parameters(c::LogisticCircuit) = sum(n -> num_children(n) * classes(n), ⋁_nodes(c))
 @inline num_parameters_per_class(c::LogisticCircuit) = sum(n -> num_children(n), ⋁_nodes(c))
 
diff --git a/src/queries/sample.jl b/src/queries/sample.jl
index 21c9d125..ea0065d4 100644
--- a/src/queries/sample.jl
+++ b/src/queries/sample.jl
@@ -1,74 +1,41 @@
 export sample
 
-##################
-# Sampling from a psdd
-##################
+import Random: default_rng
 
 """
 Sample from a PC without any evidence
 """
-function sample(circuit::ProbCircuit)::AbstractVector{Bool}
-
-    simulate(node::Union{PlainProbLiteralNode, StructProbLiteralNode}) = begin
-        inst[variable(node)] = ispositive(node) ? 1 : 0
-    end
+function sample(circuit::ProbCircuit; rng = default_rng())::BitVector
     
-    simulate(node::Union{PlainSumNode, StructSumNode}) = begin
-        idx = sample(exp.(node.log_probs))
-        simulate(children(node)[idx])
-    end
-
-    simulate(node::Union{PlainMulNode, StructMulNode}) = foreach(simulate, children(node))
-
-    inst = Dict{Var,Int64}()
-    simulate(circuit)
-    len = length(keys(inst))
-    ans = Vector{Bool}()
-    for i = 1:len
-        push!(ans, inst[i])
-    end
-    ans
-end
-
-
-"""
-Sampling with Evidence from a psdd.
-"""
-function sample(circuit::ProbCircuit, evidence)::AbstractVector{Bool}
-
-    @assert num_examples(evidence) == 1 "evidence have to be one example"
+    inst = Dict{Var,Bool}()
     
-    simulate(node::Union{PlainProbLiteralNode, StructProbLiteralNode}) = begin
-        inst[variable(node)] = ispositive(node) ? 1 : 0
+    simulate(node) = simulate(node, GateType(node))
+    
+    simulate(node, ::LeafGate) = begin
+        inst[variable(node)] = ispositive(node)
     end
     
-    function simulate(node::Union{PlainSumNode, StructSumNode})
-        prs = [get_exp_upflow(ch)[1] for ch in children(node)] # #evidence == 1
-        idx = sample(exp.(node.log_probs .+ prs))
+    simulate(node, ::⋁Gate) = begin
+        idx = sample_index(exp.(node.log_probs); rng)
         simulate(children(node)[idx])
     end
-    
-    simulate(node::Union{PlainMulNode, StructMulNode}) = foreach(simulate, children(node))
 
-    evaluate_exp(circuit, evidence)
+    simulate(node, ::⋀Gate) = 
+        foreach(simulate, children(node))
 
-    inst = Dict{Var,Int64}()
     simulate(circuit)
+    
     len = length(keys(inst))
-    ans = Vector{Bool}()
-    for i = 1:len
-        push!(ans, inst[i])
-    end
-    ans
+    BitVector([inst[i] for i = 1:len])
 end
 
 
 """
 Uniformly sample based on the probability of the items and return the selected index
 """
-function sample(probs::AbstractVector{<:Number})::Int32
+function sample_index(probs::AbstractVector{<:Number}; rng = default_rng())::Int32
     z = sum(probs)
-    q = rand() * z
+    q = rand(rng) * z
     cur = 0.0
     for i = 1:length(probs)
         cur += probs[i]
diff --git a/test/helper/gpu.jl b/test/helper/gpu.jl
index 0b3cd75d..2c277f95 100644
--- a/test/helper/gpu.jl
+++ b/test/helper/gpu.jl
@@ -1,3 +1,4 @@
+using CUDA: CUDA
 
 function cpu_gpu_agree(f, data; atol=1e-7)
     CUDA.functional() && @test f(data) ≈ to_cpu(f(to_gpu(data))) atol=atol
diff --git a/test/queries/sample_test.jl b/test/queries/sample_test.jl
index bdd19212..fa10c285 100644
--- a/test/queries/sample_test.jl
+++ b/test/queries/sample_test.jl
@@ -1,73 +1,30 @@
-# using Test
-# using LogicCircuits
-# using ProbabilisticCircuits
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+using Random: MersenneTwister
 
+@testset "Sampling Test" begin
 
-# @testset "Sampling Test" begin
-#     EPS = 1e-2;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
+    rng = MersenneTwister(42)
 
-#     N = 4;
-#     data_all = generate_data_all(N);
+    prob_circuit = zoo_psdd("little_4var.psdd");
+    data_all = generate_data_all(num_variables(prob_circuit));
 
-#     calc_prob_all = EVI(prob_circuit, data_all);
-#     calc_prob_all = exp.(calc_prob_all);
+    calc_prob_all = EVI(prob_circuit, data_all)
 
-#     using DataStructures
-#     hist = DefaultDict{AbstractString,Float64}(0.0)
+    hist = Dict{BitVector,Int}()
 
-#     Nsamples = 1000 * 1000
-#     for i = 1:Nsamples
-#         cur = join(Int.(sample(prob_circuit)))
-#         hist[cur] += 1
-#     end
+    Nsamples = 10_0000
+    for i = 1:Nsamples
+        s = sample(prob_circuit; rng)
+        hist[s] = get(hist, s, 0) + 1
+    end
 
-#     for k in keys(hist)
-#         hist[k] /= Nsamples
-#     end
+    for i = 1:num_examples(data_all)
+        exact_prob = exp(calc_prob_all[i])
+        ex = BitVector(example(data_all,i))
+        estim_prob = get(hist, ex, 0) / Nsamples
+        @test exact_prob ≈ estim_prob atol=1e-2;
+    end
 
-#     for k in keys(hist)
-#         cur = parse(Int32, k, base=2) + 1 # cause Julia arrays start at 1 :(
-#         @test calc_prob_all[cur] ≈ hist[k] atol= EPS;
-#     end
-
-
-# end
-
-# using DataStructures
-# @testset "Sampling With Evidence" begin
-#     # TODO (pashak) this test should be improved by adding few more cases
-#     EPS = 1e-2;
-#     prob_circuit = zoo_psdd("little_4var.psdd");
-
-#     N = 4;
-#     data = Int8.([0 -1 0 -1])
-#     calc_prob = MAR(prob_circuit, data);
-#     calc_prob = exp.(calc_prob);
-
-#     data_all = DataFrame(BitArray([0 0 0 0;
-#                     0 0 0 1;
-#                     0 1 0 0;
-#                     0 1 0 1;]));
-#     calc_prob_all = MAR(prob_circuit, data_all);
-#     calc_prob_all = exp.(calc_prob_all);
-
-#     calc_prob_all ./= calc_prob[1]
-
-#     hist = DefaultDict{AbstractString,Float64}(0.0)
-
-#     Nsamples = 1000 * 1000
-#     for i = 1:Nsamples
-#         cur = join(Int.(sample(prob_circuit, data)))
-#         hist[cur] += 1
-#     end
-
-#     for k in keys(hist)
-#         hist[k] /= Nsamples
-#     end
-
-#     for ind = 1:4
-#         cur = join(data_all[ind, :])
-#         @test calc_prob_all[ind] ≈ hist[cur] atol= EPS;
-#     end
-# end
\ No newline at end of file
+end
\ No newline at end of file

From 7505e4d097550bf2b4de2a58eb319202af03d5e5 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 14:23:04 -0500
Subject: [PATCH 108/131] reinstate probability of constraint

---
 src/ProbabilisticCircuits.jl                  |   5 +-
 src/queries/expectation.jl                    |  62 --------
 src/queries/information.jl                    | 150 +++++++++---------
 src/queries/pr_constraint.jl                  |  66 ++++++++
 .../Probabilistic/informations_tests.jl       |  37 -----
 test/queries/pr_constrain_tests.jl            |  30 ++++
 6 files changed, 173 insertions(+), 177 deletions(-)
 create mode 100644 src/queries/pr_constraint.jl
 create mode 100644 test/queries/pr_constrain_tests.jl

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index c77e0806..85524c4a 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -20,14 +20,13 @@ include("parameters.jl")
 include("queries/likelihood.jl")
 include("queries/marginal_flow.jl")
 include("queries/sample.jl")
+include("queries/pr_constraint.jl")
+# include("queries/information.jl")
 
 include("Logistic/Logistic.jl")
 @reexport using .Logistic
 
 # include("exp_flows.jl")
-# include("queries.jl")
-# include("informations.jl")
-
 
 # include("reasoning/expectation.jl")
 # include("reasoning/exp_flow_circuits.jl")
diff --git a/src/queries/expectation.jl b/src/queries/expectation.jl
index 6d241d04..dd561aa7 100644
--- a/src/queries/expectation.jl
+++ b/src/queries/expectation.jl
@@ -1,68 +1,6 @@
 export pr_constraint, Expectation, ExpectationUpward, Moment
 
 
-const StrutCircuit = Union{ProbCircuit, StructLogicCircuit}
-const PRCache = Dict{Tuple{ProbCircuit, StrutCircuit}, Float64}
-
-# Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
-# spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
-
-"""
-Calculate the probability of the logic formula given by sdd for the psdd
-"""
-function pr_constraint(psdd_node::ProbCircuit, sdd_node::StrutCircuit,
-    cache::PRCache=PRCache())::Float64
-    
-    # Cache hit
-    if (psdd_node, sdd_node) in keys(cache) 
-        return cache[psdd_node, sdd_node]
-    
-    # Boundary cases
-    elseif psdd_node isa StructProbLiteralNode
-        # Both are literals, just check whether they agrees with each other 
-        if isliteralgate(sdd_node)
-            if literal(psdd_node) == literal(sdd_node)
-                return get!(cache, (psdd_node, sdd_node), 1.0)
-            else
-                return get!(cache, (psdd_node, sdd_node), 0.0)
-            end
-        else
-            pr_constraint(psdd_node, children(sdd_node)[1], cache)
-            if length(children(sdd_node)) > 1
-                pr_constraint(psdd_node, children(sdd_node)[2], cache)
-                return get!(cache, (psdd_node, sdd_node), 1.0)
-            else
-                return get!(cache, (psdd_node, sdd_node),
-                    literal(children(sdd_node)[1]) == literal(psdd_node) ? 1.0 : 0.0)
-            end
-        end
-    
-    # The psdd is true
-    elseif children(psdd_node)[1] isa StructProbLiteralNode 
-        theta = exp(psdd_node.log_probs[1])
-        return get!(cache, (psdd_node, sdd_node),
-            theta * pr_constraint(children(psdd_node)[1], sdd_node, cache) +
-            (1.0 - theta) * pr_constraint(children(psdd_node)[2], sdd_node, cache))
-    
-    # Both psdds are not trivial
-    else 
-        prob = 0.0
-        for (prob⋀_node, log_theta) in zip(children(psdd_node), psdd_node.log_probs)
-            p = children(prob⋀_node)[1]
-            s = children(prob⋀_node)[2]
-
-            theta = exp(log_theta)
-            for sdd⋀_node in children(sdd_node)
-                r = children(sdd⋀_node)[1]
-                t = children(sdd⋀_node)[2]
-                prob += theta * pr_constraint(p, r, cache) * pr_constraint(s, t, cache)
-            end
-        end
-        return get!(cache, (psdd_node, sdd_node), prob)
-    end
-end
-
-
 ExpCacheDict = Dict{Pair{ProbCircuit, LogisticCircuit}, Array{Float64, 2}}
 MomentCacheDict = Dict{Tuple{ProbCircuit, LogisticCircuit, Int64}, Array{Float64, 2}}
 
diff --git a/src/queries/information.jl b/src/queries/information.jl
index e87d2f59..d1c10ea4 100644
--- a/src/queries/information.jl
+++ b/src/queries/information.jl
@@ -1,81 +1,81 @@
 export kl_divergence
 
-const KLDCache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}
+const KLDCache = Dict{ProbCircuit, Float64}
 
 """"
-Calculate entropy of the distribution of the input psdd."
+Calculate entropy of the distribution of the input pc."
 """
 
 import ..Utils: entropy
-function entropy(psdd_node::StructSumNode, psdd_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
-    if psdd_node in keys(psdd_entropy_cache)
-        return psdd_entropy_cache[psdd_node]
-    elseif children(psdd_node)[1] isa StructProbLiteralNode
-        return get!(psdd_entropy_cache, psdd_node,
-            - exp(psdd_node.log_probs[1]) * psdd_node.log_probs[1] -
-            exp(psdd_node.log_probs[2]) * psdd_node.log_probs[2])
+function entropy(pc_node::StructSumNode, pc_entropy_cache::Dict{ProbCircuit, Float64}=Dict{ProbCircuit, Float64}())::Float64
+    if pc_node in keys(pc_entropy_cache)
+        return pc_entropy_cache[pc_node]
+    elseif children(pc_node)[1] isa StructProbLiteralNode
+        return get!(pc_entropy_cache, pc_node,
+            - exp(pc_node.log_probs[1]) * pc_node.log_probs[1] -
+            exp(pc_node.log_probs[2]) * pc_node.log_probs[2])
     else
         local_entropy = 0.0
-        for (prob⋀_node, log_prob) in zip(children(psdd_node), psdd_node.log_probs)
+        for (prob⋀_node, log_prob) in zip(children(pc_node), pc_node.log_probs)
             p = children(prob⋀_node)[1]
             s = children(prob⋀_node)[2]
 
-            local_entropy += exp(log_prob) * (entropy(p, psdd_entropy_cache) +
-                entropy(s, psdd_entropy_cache) - log_prob)
+            local_entropy += exp(log_prob) * (entropy(p, pc_entropy_cache) +
+                entropy(s, pc_entropy_cache) - log_prob)
         end
-        return get!(psdd_entropy_cache, psdd_node, local_entropy)
+        return get!(pc_entropy_cache, pc_node, local_entropy)
     end
 end
 
-function entropy(psdd_node::StructMulNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
-    return get!(psdd_entropy_cache, children(psdd_node)[1], entropy(children(psdd_node)[1], psdd_entropy_cache)) +
-        get!(psdd_entropy_cache, children(psdd_node)[2], entropy(children(psdd_node)[2], psdd_entropy_cache))
+function entropy(pc_node::StructMulNode, pc_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+    return get!(pc_entropy_cache, children(pc_node)[1], entropy(children(pc_node)[1], pc_entropy_cache)) +
+        get!(pc_entropy_cache, children(pc_node)[2], entropy(children(pc_node)[2], pc_entropy_cache))
 end
 
-function entropy(psdd_node::StructProbLiteralNode, psdd_entropy_cache::Dict{ProbCircuit, Float64})::Float64
-    return get!(psdd_entropy_cache, psdd_node, 0.0)
+function entropy(pc_node::StructProbLiteralNode, pc_entropy_cache::Dict{ProbCircuit, Float64})::Float64
+    return get!(pc_entropy_cache, pc_node, 0.0)
 end
 
-"Calculate KL divergence calculation for psdds that are not necessarily identical"
-function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructSumNode,
+"Calculate KL divergence calculation for pcs that are not necessarily identical"
+function kl_divergence(pc_node1::StructSumNode, pc_node2::StructSumNode,
         kl_divergence_cache::KLDCache=KLDCache(), pr_constraint_cache::PRCache=PRCache())
-    @assert !(psdd_node1 isa StructMulNode || psdd_node2 isa StructMulNode) "Prob⋀ not a valid PSDD node for KL-Divergence"
+    @assert !(pc_node1 isa StructMulNode || pc_node2 isa StructMulNode) "Prob⋀ not a valid pc node for KL-Divergence"
 
     # Check if both nodes are normalized for same vtree node
-    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
-
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[(psdd_node1, psdd_node2)]
-    elseif children(psdd_node1)[1] isa StructProbLiteralNode
-        if psdd_node2 isa StructProbLiteralNode
-            kl_divergence(children(psdd_node1)[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-            if literal(children(psdd_node1)[1]) == literal(psdd_node2)
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    psdd_node1.log_probs[1] * exp(psdd_node1.log_probs[1])
+    @assert variables(pc_node1) == variables(pc_node2) "Both nodes not normalized for same vtree node"
+
+    if (pc_node1, pc_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[(pc_node1, pc_node2)]
+    elseif children(pc_node1)[1] isa StructProbLiteralNode
+        if pc_node2 isa StructProbLiteralNode
+            kl_divergence(children(pc_node1)[1], pc_node2, kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(pc_node1)[2], pc_node2, kl_divergence_cache, pr_constraint_cache)
+            if literal(children(pc_node1)[1]) == literal(pc_node2)
+                return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                    pc_node1.log_probs[1] * exp(pc_node1.log_probs[1])
                 )
             else
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    psdd_node1.log_probs[2] * exp(psdd_node1.log_probs[2])
+                return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                    pc_node1.log_probs[2] * exp(pc_node1.log_probs[2])
                 )
             end
         else
             # The below four lines actually assign zero, but still we need to
             # call it.
-            kl_divergence(children(psdd_node1)[1], children(psdd_node2)[1], kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(children(psdd_node1)[1], children(psdd_node2)[2], kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(children(psdd_node1)[2], children(psdd_node2)[1], kl_divergence_cache, pr_constraint_cache)
-            kl_divergence(children(psdd_node1)[2], children(psdd_node2)[2], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(pc_node1)[1], children(pc_node2)[1], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(pc_node1)[1], children(pc_node2)[2], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(pc_node1)[2], children(pc_node2)[1], kl_divergence_cache, pr_constraint_cache)
+            kl_divergence(children(pc_node1)[2], children(pc_node2)[2], kl_divergence_cache, pr_constraint_cache)
             # There are two possible matches
-            if literal(children(psdd_node1)[1]) == literal(children(psdd_node2)[1])
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    exp(psdd_node1.log_probs[1]) * (psdd_node1.log_probs[1] - psdd_node2.log_probs[1]) +
-                    exp(psdd_node1.log_probs[2]) * (psdd_node1.log_probs[2] - psdd_node2.log_probs[2])
+            if literal(children(pc_node1)[1]) == literal(children(pc_node2)[1])
+                return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                    exp(pc_node1.log_probs[1]) * (pc_node1.log_probs[1] - pc_node2.log_probs[1]) +
+                    exp(pc_node1.log_probs[2]) * (pc_node1.log_probs[2] - pc_node2.log_probs[2])
                 )
             else
-                return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                    exp(psdd_node1.log_probs[1]) * (psdd_node1.log_probs[1] - psdd_node2.log_probs[2]) +
-                    exp(psdd_node1.log_probs[2]) * (psdd_node1.log_probs[2] - psdd_node2.log_probs[1])
+                return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                    exp(pc_node1.log_probs[1]) * (pc_node1.log_probs[1] - pc_node2.log_probs[2]) +
+                    exp(pc_node1.log_probs[2]) * (pc_node1.log_probs[2] - pc_node2.log_probs[1])
                 )
             end
         end
@@ -83,8 +83,8 @@ function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructSumNode,
         kld = 0.0
 
         # loop through every combination of prim and sub
-        for (prob⋀_node1, log_theta1) in zip(children(psdd_node1), psdd_node1.log_probs)
-            for (prob⋀_node2, log_theta2) in zip(children(psdd_node2), psdd_node2.log_probs)
+        for (prob⋀_node1, log_theta1) in zip(children(pc_node1), pc_node1.log_probs)
+            for (prob⋀_node2, log_theta2) in zip(children(pc_node2), pc_node2.log_probs)
                 p = children(prob⋀_node1)[1]
                 s = children(prob⋀_node1)[2]
 
@@ -104,60 +104,60 @@ function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructSumNode,
                 kld += p11 * p12 * p13 + theta1 * (p11 * p21 + p12 * p31)
             end
         end
-        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), kld)
+        return get!(kl_divergence_cache, (pc_node1, pc_node2), kld)
     end
 end
 
-function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructProbLiteralNode,
+function kl_divergence(pc_node1::StructProbLiteralNode, pc_node2::StructProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
     # Check if literals are over same variables in vtree
-   @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
+   @assert variables(pc_node1) == variables(pc_node2) "Both nodes not normalized for same vtree node"
 
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[psdd_node1, psdd_node2]
+    if (pc_node1, pc_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[pc_node1, pc_node2]
     else
         # In this case probability is 1, kl divergence is 0
-        return get!(kl_divergence_cache, (psdd_node1, psdd_node2), 0.0)
+        return get!(kl_divergence_cache, (pc_node1, pc_node2), 0.0)
     end
 end
 
-function kl_divergence(psdd_node1::StructSumNode, psdd_node2::StructProbLiteralNode,
+function kl_divergence(pc_node1::StructSumNode, pc_node2::StructProbLiteralNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
-    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
+    @assert variables(pc_node1) == variables(pc_node2) "Both nodes not normalized for same vtree node"
 
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[psdd_node1, psdd_node2]
+    if (pc_node1, pc_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[pc_node1, pc_node2]
     else
-        kl_divergence(children(psdd_node1)[1], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-        kl_divergence(children(psdd_node1)[2], psdd_node2, kl_divergence_cache, pr_constraint_cache)
-        if literal(children(psdd_node1)[1]) == literal(psdd_node2)
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                psdd_node1.log_probs[1] * exp(psdd_node1.log_probs[1])
+        kl_divergence(children(pc_node1)[1], pc_node2, kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(children(pc_node1)[2], pc_node2, kl_divergence_cache, pr_constraint_cache)
+        if literal(children(pc_node1)[1]) == literal(pc_node2)
+            return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                pc_node1.log_probs[1] * exp(pc_node1.log_probs[1])
             )
         else
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                psdd_node1.log_probs[2] * exp(psdd_node1.log_probs[2])
+            return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                pc_node1.log_probs[2] * exp(pc_node1.log_probs[2])
             )
         end
     end
 end
 
-function kl_divergence(psdd_node1::StructProbLiteralNode, psdd_node2::StructSumNode,
+function kl_divergence(pc_node1::StructProbLiteralNode, pc_node2::StructSumNode,
         kl_divergence_cache::KLDCache, pr_constraint_cache::PRCache)
-    @assert variables(psdd_node1) == variables(psdd_node2) "Both nodes not normalized for same vtree node"
+    @assert variables(pc_node1) == variables(pc_node2) "Both nodes not normalized for same vtree node"
 
-    if (psdd_node1, psdd_node2) in keys(kl_divergence_cache) # Cache hit
-        return kl_divergence_cache[psdd_node1, psdd_node2]
+    if (pc_node1, pc_node2) in keys(kl_divergence_cache) # Cache hit
+        return kl_divergence_cache[pc_node1, pc_node2]
     else
-        kl_divergence(psdd_node1, children(psdd_node2)[1], kl_divergence_cache, pr_constraint_cache)
-        kl_divergence(psdd_node1, children(psdd_node2)[2], kl_divergence_cache, pr_constraint_cache)
-        if literal(psdd_node1) == literal(children(psdd_node2)[1])
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                -psdd_node2.log_probs[1]
+        kl_divergence(pc_node1, children(pc_node2)[1], kl_divergence_cache, pr_constraint_cache)
+        kl_divergence(pc_node1, children(pc_node2)[2], kl_divergence_cache, pr_constraint_cache)
+        if literal(pc_node1) == literal(children(pc_node2)[1])
+            return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                -pc_node2.log_probs[1]
             )
         else
-            return get!(kl_divergence_cache, (psdd_node1, psdd_node2),
-                -psdd_node2.log_probs[2]
+            return get!(kl_divergence_cache, (pc_node1, pc_node2),
+                -pc_node2.log_probs[2]
             )
         end
     end
diff --git a/src/queries/pr_constraint.jl b/src/queries/pr_constraint.jl
new file mode 100644
index 00000000..bb04d9ff
--- /dev/null
+++ b/src/queries/pr_constraint.jl
@@ -0,0 +1,66 @@
+export pr_constraint, Expectation, ExpectationUpward, Moment
+
+#TODO relax some of these specific choices
+const StructCircuit = Union{ProbCircuit, StructLogicCircuit}
+const PRCache = Dict{Tuple{ProbCircuit, StructCircuit}, Float64}
+
+# Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
+# spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
+
+"""
+Calculate the probability of the logic formula given by LC for the PC
+"""
+function pr_constraint(pc_node::ProbCircuit, lc_node::StructCircuit,
+    cache::PRCache=PRCache())::Float64
+
+    # TODO require that both circuits have a vtree for safety. If they don't, then first convert them to have a vtree
+    
+    # Cache hit
+    if (pc_node, lc_node) in keys(cache) 
+        return cache[pc_node, lc_node]
+    
+    # Boundary cases
+    # TODO: make this more general-purpose, use `isliteralgate`
+    elseif pc_node isa StructProbLiteralNode
+        # Both are literals, just check whether they agrees with each other 
+        if isliteralgate(lc_node)
+            if literal(pc_node) == literal(lc_node)
+                return get!(cache, (pc_node, lc_node), 1.0)
+            else
+                return get!(cache, (pc_node, lc_node), 0.0)
+            end
+        else
+            pr_constraint(pc_node, children(lc_node)[1], cache)
+            if length(children(lc_node)) > 1
+                pr_constraint(pc_node, children(lc_node)[2], cache)
+                return get!(cache, (pc_node, lc_node), 1.0)
+            else
+                return get!(cache, (pc_node, lc_node),
+                    literal(children(lc_node)[1]) == literal(pc_node) ? 1.0 : 0.0)
+            end
+        end
+    
+    # The pc is true
+    elseif children(pc_node)[1] isa StructProbLiteralNode 
+        theta = exp(pc_node.log_probs[1])
+        return get!(cache, (pc_node, lc_node),
+            theta * pr_constraint(children(pc_node)[1], lc_node, cache) +
+            (1.0 - theta) * pr_constraint(children(pc_node)[2], lc_node, cache))
+    
+    # Both pcs are not trivial
+    else 
+        prob = 0.0
+        for (prob⋀_node, log_theta) in zip(children(pc_node), pc_node.log_probs)
+            p = children(prob⋀_node)[1]
+            s = children(prob⋀_node)[2]
+
+            theta = exp(log_theta)
+            for lc⋀_node in children(lc_node)
+                r = children(lc⋀_node)[1]
+                t = children(lc⋀_node)[2]
+                prob += theta * pr_constraint(p, r, cache) * pr_constraint(s, t, cache)
+            end
+        end
+        return get!(cache, (pc_node, lc_node), prob)
+    end
+end
\ No newline at end of file
diff --git a/test/broken/Probabilistic/informations_tests.jl b/test/broken/Probabilistic/informations_tests.jl
index f80f41c5..64e30164 100644
--- a/test/broken/Probabilistic/informations_tests.jl
+++ b/test/broken/Probabilistic/informations_tests.jl
@@ -48,40 +48,3 @@ using ProbabilisticCircuits
     @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
 
 end
-
-@testset "Pr constraint Query" begin
-    # two nodes
-    simplevtree = zoo_vtree_file("simple2.vtree")
-    pc, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.4.psdd"), simplevtree)
-
-    cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-
-    @test abs(pr_constraint(pc, pc, cache) - 1.0) < 1e-8
-    # @test abs(pr_constraint(pc[5], pc[3], cache) - 0.2) < 1e-8
-    # @test abs(pr_constraint(pc[5], pc[4], cache) - 0.8) < 1e-8
-
-    file_circuit = "little_4var.circuit"
-    file_vtree = "little_4var.vtree"
-    logic_circuit, vtree = load_struct_smooth_logic_circuit(
-                                zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
-
-    pc, _ = load_struct_prob_circuit(zoo_psdd_file("little_4var.psdd"), zoo_vtree_file("little_4var.vtree"))
-
-    @test abs(pr_constraint(pc, children(logic_circuit)[1], cache) - 1.0) < 1e-8
-
-    # Test with two psdds
-    pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
-    pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
-
-    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-    @test abs(pr_constraint(pc1, pc2, pr_constraint_cache) - 1.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[1], pc2[1]] - 1.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[1], pc2[2]] - 0.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[3], pc2[4]] - 1.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[3], pc2[5]] - 0.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[9], pc2[8]] - 1.0) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[5], pc2[4]] - 0.2) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[5], pc2[5]] - 0.8) < 1e-8
-    # @test abs(pr_constraint_cache[pc1[2], pc2[3]] - 1.0) < 1e-8
-end
diff --git a/test/queries/pr_constrain_tests.jl b/test/queries/pr_constrain_tests.jl
new file mode 100644
index 00000000..d3eb6cb8
--- /dev/null
+++ b/test/queries/pr_constrain_tests.jl
@@ -0,0 +1,30 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+@testset "Probability of constraint" begin
+
+    # two nodes
+    simplevtree = zoo_vtree_file("simple2.vtree")
+    pc, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.4.psdd"), simplevtree)
+
+  
+    @test pr_constraint(pc, pc) ≈ 1.0
+
+    file_circuit = "little_4var.circuit"
+    file_vtree = "little_4var.vtree"
+    logic_circuit, vtree = load_struct_smooth_logic_circuit(
+                                zoo_lc_file(file_circuit), zoo_vtree_file(file_vtree))
+
+    pc, _ = load_struct_prob_circuit(zoo_psdd_file("little_4var.psdd"), zoo_vtree_file("little_4var.vtree"))
+
+    @test pr_constraint(pc, children(logic_circuit)[1]) ≈ 1.0
+
+    # Test with two psdds
+    pc1, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.5.psdd"), simplevtree)
+    pc2, vtree = load_struct_prob_circuit(zoo_psdd_file("simple2.6.psdd"), simplevtree)
+
+    @test pr_constraint(pc1, pc2) ≈ 1
+
+end

From 7c4e8108d1fa838524d0f225c900ff037b7d908f Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 14:46:55 -0500
Subject: [PATCH 109/131] reinstate entropy and kl divergence

---
 src/ProbabilisticCircuits.jl                  |  2 +-
 src/Utils/Utils.jl                            |  2 +-
 src/Utils/{informations.jl => information.jl} |  1 +
 src/queries/information.jl                    |  2 +-
 src/queries/pr_constraint.jl                  |  9 ++--
 .../Probabilistic/informations_tests.jl       | 50 -------------------
 test/queries/informations_tests.jl            | 20 ++++++++
 test/queries/marginal_flow_tests.jl           |  4 +-
 ...strain_tests.jl => pr_constraint_tests.jl} |  0
 9 files changed, 30 insertions(+), 60 deletions(-)
 rename src/Utils/{informations.jl => information.jl} (99%)
 delete mode 100644 test/broken/Probabilistic/informations_tests.jl
 create mode 100644 test/queries/informations_tests.jl
 rename test/queries/{pr_constrain_tests.jl => pr_constraint_tests.jl} (100%)

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 85524c4a..80555de0 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -21,7 +21,7 @@ include("queries/likelihood.jl")
 include("queries/marginal_flow.jl")
 include("queries/sample.jl")
 include("queries/pr_constraint.jl")
-# include("queries/information.jl")
+include("queries/information.jl")
 
 include("Logistic/Logistic.jl")
 @reexport using .Logistic
diff --git a/src/Utils/Utils.jl b/src/Utils/Utils.jl
index b8ef7cac..6e12f494 100644
--- a/src/Utils/Utils.jl
+++ b/src/Utils/Utils.jl
@@ -5,6 +5,6 @@ that could be useful in any Julia project
 module Utils
 
 include("misc.jl")
-include("informations.jl")
+include("information.jl")
 
 end #module
diff --git a/src/Utils/informations.jl b/src/Utils/information.jl
similarity index 99%
rename from src/Utils/informations.jl
rename to src/Utils/information.jl
index d2933590..1b03b658 100644
--- a/src/Utils/informations.jl
+++ b/src/Utils/information.jl
@@ -82,6 +82,7 @@ end
 #####################
 # Entropy
 #####################
+
 function entropy(dis_cache::DisCache)
     D = dimension(dis_cache)
     px_log_px = @. xlogx(dis_cache.marginal)
diff --git a/src/queries/information.jl b/src/queries/information.jl
index d1c10ea4..127ea0a5 100644
--- a/src/queries/information.jl
+++ b/src/queries/information.jl
@@ -1,6 +1,6 @@
 export kl_divergence
 
-const KLDCache = Dict{ProbCircuit, Float64}
+const KLDCache = Dict{Tuple{ProbCircuit,ProbCircuit}, Float64}
 
 """"
 Calculate entropy of the distribution of the input pc."
diff --git a/src/queries/pr_constraint.jl b/src/queries/pr_constraint.jl
index bb04d9ff..ce581342 100644
--- a/src/queries/pr_constraint.jl
+++ b/src/queries/pr_constraint.jl
@@ -1,8 +1,6 @@
 export pr_constraint, Expectation, ExpectationUpward, Moment
 
-#TODO relax some of these specific choices
-const StructCircuit = Union{ProbCircuit, StructLogicCircuit}
-const PRCache = Dict{Tuple{ProbCircuit, StructCircuit}, Float64}
+const PRCache = Dict{Tuple{ProbCircuit, LogicCircuit}, Float64}
 
 # Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability
 # spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
@@ -10,10 +8,9 @@ const PRCache = Dict{Tuple{ProbCircuit, StructCircuit}, Float64}
 """
 Calculate the probability of the logic formula given by LC for the PC
 """
-function pr_constraint(pc_node::ProbCircuit, lc_node::StructCircuit,
-    cache::PRCache=PRCache())::Float64
+function pr_constraint(pc_node::StructProbCircuit, lc_node, cache::PRCache=PRCache())::Float64
 
-    # TODO require that both circuits have a vtree for safety. If they don't, then first convert them to have a vtree
+    # TODO require that both circuits have an equal vtree for safety. If they don't, then first convert them to have a vtree
     
     # Cache hit
     if (pc_node, lc_node) in keys(cache) 
diff --git a/test/broken/Probabilistic/informations_tests.jl b/test/broken/Probabilistic/informations_tests.jl
deleted file mode 100644
index 64e30164..00000000
--- a/test/broken/Probabilistic/informations_tests.jl
+++ /dev/null
@@ -1,50 +0,0 @@
-using Test
-using LogicCircuits
-using ProbabilisticCircuits
-
-# TODO reinstate after fix tests by replacing indexing circuit node
-
-@testset "Entropy and KLD" begin
-    pc1, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.1.psdd"), zoo_vtree_file("simple2.vtree"))
-    pc2, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.2.psdd"), zoo_vtree_file("simple2.vtree"))
-    pc3, vtree = load_struct_prob_circuit(
-                    zoo_psdd_file("simple2.3.psdd"), zoo_vtree_file("simple2.vtree"))
-   
-    # Entropy calculation test
-    @test abs(entropy(pc1) - 1.2899219826090118) < 1e-8
-    @test abs(entropy(pc2) - 0.9359472745536583) < 1e-8
-
-    # KLD Tests #
-    # KLD base tests
-    pr_constraint_cache = Dict{Tuple{ProbCircuit, Union{ProbCircuit, StructLogicCircuit}}, Float64}()
-    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
-
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[3], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[3], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[4], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[1], pc1[5], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Both nodes not normalized for same vtree node") kl_divergence(pc1[2], pc1[5], kl_divergence_cache, pr_constraint_cache)
-
-    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[1], pc1[6], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[7], pc1[2], kl_divergence_cache, pr_constraint_cache)
-    # @test_throws AssertionError("Prob⋀ not a valid PSDD node for KL-Divergence") kl_divergence(pc1[6], pc2[7], kl_divergence_cache, pr_constraint_cache)
-
-    # KLD calculation test
-    # @test abs(kl_divergence(pc1[1], pc2[1], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc1[1], pc1[2], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc1[1], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.9)) < 1e-8
-    # @test abs(kl_divergence(pc1[2], pc2[3], kl_divergence_cache, pr_constraint_cache) + log(0.1)) < 1e-8
-    # @test abs(kl_divergence(pc1[5], pc2[4], kl_divergence_cache, pr_constraint_cache) - 0.2 * log(0.2)) < 1e-8
-    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-    # @test abs(kl_divergence(pc1[5], pc2[5], kl_divergence_cache, pr_constraint_cache) - 0.8 * log(0.8)) < 1e-8
-    @test abs(kl_divergence(pc1, pc2) - 0.5672800167911778) < 1e-8
-
-    kl_divergence_cache = Dict{Tuple{ProbCircuit, ProbCircuit}, Float64}()
-    # @test abs(kl_divergence(pc2[4], pc3[5], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc2[4], pc3[4], kl_divergence_cache, pr_constraint_cache) - 0.0) < 1e-8
-    # @test abs(kl_divergence(pc2[3], pc3[3], kl_divergence_cache, pr_constraint_cache) - 0.9 * log(0.9 / 0.5) - 0.1 * log(0.1 / 0.5)) < 1e-8
-    @test abs(kl_divergence(pc2, pc3) - 0.38966506) < 1e-8
-
-end
diff --git a/test/queries/informations_tests.jl b/test/queries/informations_tests.jl
new file mode 100644
index 00000000..efc60de4
--- /dev/null
+++ b/test/queries/informations_tests.jl
@@ -0,0 +1,20 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+@testset "Entropy and KLD" begin
+
+    pc1, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.1.psdd"), zoo_vtree_file("simple2.vtree"))
+    pc2, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.2.psdd"), zoo_vtree_file("simple2.vtree"))
+    pc3, vtree = load_struct_prob_circuit(
+                    zoo_psdd_file("simple2.3.psdd"), zoo_vtree_file("simple2.vtree"))
+   
+    @test entropy(pc1) ≈ 1.2899219826090118
+    @test entropy(pc2) ≈ 0.9359472745536583
+
+    @test kl_divergence(pc1, pc2) ≈ 0.5672800167911778
+    @test kl_divergence(pc2, pc3) ≈ 0.38966506
+
+end
diff --git a/test/queries/marginal_flow_tests.jl b/test/queries/marginal_flow_tests.jl
index 0207cee5..4b0e6c12 100644
--- a/test/queries/marginal_flow_tests.jl
+++ b/test/queries/marginal_flow_tests.jl
@@ -50,7 +50,9 @@ end
     function test_flows(data)
         # Comparing with down pass with fully observed data
 
-        _, f1 = satisfies_flows(prob_circuit, Float64.(data))
+        data_f = CUDA.@allowscalar Float64.(data)
+
+        _, f1 = satisfies_flows(prob_circuit, data_f)
         _, f2 = marginal_flows(prob_circuit, data)
 
         # note: while downward pass flows should be the same, 
diff --git a/test/queries/pr_constrain_tests.jl b/test/queries/pr_constraint_tests.jl
similarity index 100%
rename from test/queries/pr_constrain_tests.jl
rename to test/queries/pr_constraint_tests.jl

From 0baa4ef487f6bbbc55a3eb9604e128a165f626fe Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 15:06:34 -0500
Subject: [PATCH 110/131] reinstate expectation code; untested

---
 src/ProbabilisticCircuits.jl                  |   2 +
 .../{expectation2.jl => expectation_graph.jl} |   0
 .../{expectation.jl => expectation_rec.jl}    |   2 +-
 src/queries/pr_constraint.jl                  |   2 +-
 test/broken/Reasoning/expectation_test.jl     | 144 ------------------
 test/broken/expectation_tests.jl              | 142 +++++++++++++++++
 6 files changed, 146 insertions(+), 146 deletions(-)
 rename src/queries/{expectation2.jl => expectation_graph.jl} (100%)
 rename src/queries/{expectation.jl => expectation_rec.jl} (99%)
 delete mode 100644 test/broken/Reasoning/expectation_test.jl
 create mode 100644 test/broken/expectation_tests.jl

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 80555de0..2b0ed0bd 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -22,6 +22,8 @@ include("queries/marginal_flow.jl")
 include("queries/sample.jl")
 include("queries/pr_constraint.jl")
 include("queries/information.jl")
+include("queries/expectation_rec.jl")
+include("queries/expectation_graph.jl")
 
 include("Logistic/Logistic.jl")
 @reexport using .Logistic
diff --git a/src/queries/expectation2.jl b/src/queries/expectation_graph.jl
similarity index 100%
rename from src/queries/expectation2.jl
rename to src/queries/expectation_graph.jl
diff --git a/src/queries/expectation.jl b/src/queries/expectation_rec.jl
similarity index 99%
rename from src/queries/expectation.jl
rename to src/queries/expectation_rec.jl
index dd561aa7..c6164bee 100644
--- a/src/queries/expectation.jl
+++ b/src/queries/expectation_rec.jl
@@ -1,4 +1,4 @@
-export pr_constraint, Expectation, ExpectationUpward, Moment
+export Expectation, ExpectationUpward, Moment
 
 
 ExpCacheDict = Dict{Pair{ProbCircuit, LogisticCircuit}, Array{Float64, 2}}
diff --git a/src/queries/pr_constraint.jl b/src/queries/pr_constraint.jl
index ce581342..c3183128 100644
--- a/src/queries/pr_constraint.jl
+++ b/src/queries/pr_constraint.jl
@@ -1,4 +1,4 @@
-export pr_constraint, Expectation, ExpectationUpward, Moment
+export pr_constraint
 
 const PRCache = Dict{Tuple{ProbCircuit, LogicCircuit}, Float64}
 
diff --git a/test/broken/Reasoning/expectation_test.jl b/test/broken/Reasoning/expectation_test.jl
deleted file mode 100644
index 0e498e88..00000000
--- a/test/broken/Reasoning/expectation_test.jl
+++ /dev/null
@@ -1,144 +0,0 @@
-#TODO: reinstate
-
-# using Test
-# using LogicCircuits
-# using ProbabilisticCircuits
-
-# function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int)
-#     EPS = 1e-7;
-#     COUNT = size(data)[1]
-#     # Compute True expectation brute force
-#     true_exp = zeros(COUNT, CLASSES)
-#     for i in 1:COUNT
-#         row = data[i, :]
-#         cur_data_all = generate_all(row)
-
-#         calc_p = log_likelihood_per_instance(pc, cur_data_all)
-#         calc_p = exp.(calc_p)
-
-#         calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
-#         true_exp[i, :] = sum(calc_p .* calc_f, dims=1)
-#         true_exp[i, :] ./= sum(calc_p) #p_observed
-#     end
-
-#     # Compute Circuit Expect
-#     calc_exp, cache = Expectation(pc, lc, data);
-#     for i = 1:COUNT
-#         for j = 1:CLASSES
-#             @test true_exp[i,j] ≈ calc_exp[i,j] atol= EPS;
-#         end
-#     end    
-#     # Compute Bottom Up Expectation
-#     calc_exp_2, exp_flow = ExpectationUpward(pc, lc, data);
-#     for i = 1:COUNT
-#         for j = 1:CLASSES
-#             @test true_exp[i,j] ≈ calc_exp_2[i,j] atol= EPS;
-#         end
-#     end
-# end
-
-# function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int, moment::Int)
-#     EPS = 1e-7;
-#     COUNT = size(data)[1]
-#     # Compute True moment brute force
-#     true_mom = zeros(COUNT, CLASSES)
-#     for i in 1:COUNT
-#         row = data[i, :]
-#         cur_data_all = generate_all(row)
-
-#         calc_p = log_likelihood_per_instance(pc, cur_data_all)
-#         calc_p = exp.(calc_p)
-
-#         calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
-#         true_mom[i, :] = sum(calc_p .* (calc_f .^ moment), dims=1)
-#         true_mom[i, :] ./= sum(calc_p) #p_observed
-#     end
-
-#     # Compute Circuit Moment
-#     calc_mom, cache = Moment(pc, lc, data, moment);
-#     for i = 1:COUNT
-#         for j = 1:CLASSES
-#             @test (true_mom[i,j] / (calc_mom[i,j] )) ≈ 1.0 atol= EPS;
-#         end
-#     end    
-# end
-
-
-# @testset "Expectation Brute Force Test Small (4 Var)" begin
-#     psdd_file       = "little_4var.psdd"
-#     logistic_file   = "little_4var.circuit"
-#     CLASSES = 2
-#     N = 4
-
-#     pc = zoo_psdd(psdd_file);
-#     lc = zoo_lc(logistic_file, CLASSES);
-#     data = Int8.([
-#                         0 0 0 0; 
-#                         0 1 1 0; 
-#                         0 0 1 1;
-#                         -1 -1 -1 -1;
-#                         -1 0 1 -1;
-#                         0 1 -1 1;
-#                         1 -1 0 -1;
-#                         -1 0 1 -1;
-#                         -1 -1 0 1;
-#                         -1 -1 -1 1;
-#                         -1 -1 -1 0;
-#                         ]);
-
-#     test_expectation_brute_force(pc, lc, data, CLASSES)
-# end
-
-
-# @testset "Expectation Brute Force Test Big (15 Var)" begin
-#     psdd_file       = "exp-D15-N1000-C4.psdd"
-#     logistic_file   = "exp-D15-N1000-C4.circuit"
-#     CLASSES = 4
-#     N = 15
-#     COUNT = 10
-
-#     pc = zoo_psdd(psdd_file);
-#     lc = zoo_lc(logistic_file, CLASSES);
-#     data = Int8.(rand( (-1,0,1), (COUNT, N) ))
-    
-#     test_expectation_brute_force(pc, lc, data, CLASSES)
-# end
-
-
-# @testset "Moment Brute Force Test Small (4 Var)" begin
-#     psdd_file       = "little_4var.psdd"
-#     logistic_file   = "little_4var.circuit";
-#     CLASSES = 2
-#     N = 4
-#     COUNT = 100
-
-#     pc = zoo_psdd(psdd_file);
-#     lc = zoo_lc(logistic_file, CLASSES);
-#     data = Int8.(rand( (-1,0,1), (COUNT, N) ))
-
-#     test_moment_brute_force(pc, lc, data, CLASSES, 1)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 2)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 3)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 4)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 10)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 15)
-# end
-
-# @testset "Moment Brute Force Test Big (15 Var)" begin
-#     psdd_file       = "exp-D15-N1000-C4.psdd"
-#     logistic_file   = "exp-D15-N1000-C4.circuit";
-#     CLASSES = 4
-#     N = 15
-#     COUNT = 10
-
-#     pc = zoo_psdd(psdd_file);
-#     lc = zoo_lc(logistic_file, CLASSES);
-#     data = Int8.(rand( (-1,0,1), (COUNT, N) ))
-
-#     test_moment_brute_force(pc, lc, data, CLASSES, 1)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 2)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 3)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 4)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 10)
-#     test_moment_brute_force(pc, lc, data, CLASSES, 15)
-# end
\ No newline at end of file
diff --git a/test/broken/expectation_tests.jl b/test/broken/expectation_tests.jl
new file mode 100644
index 00000000..c8aafc50
--- /dev/null
+++ b/test/broken/expectation_tests.jl
@@ -0,0 +1,142 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+
+function test_expectation_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int)
+    EPS = 1e-7;
+    COUNT = size(data)[1]
+    # Compute True expectation brute force
+    true_exp = zeros(COUNT, CLASSES)
+    for i in 1:COUNT
+        row = data[i, :]
+        cur_data_all = generate_all(row)
+
+        calc_p = log_likelihood_per_instance(pc, cur_data_all)
+        calc_p = exp.(calc_p)
+
+        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+        true_exp[i, :] = sum(calc_p .* calc_f, dims=1)
+        true_exp[i, :] ./= sum(calc_p) #p_observed
+    end
+
+    # Compute Circuit Expect
+    calc_exp, cache = Expectation(pc, lc, data);
+    for i = 1:COUNT
+        for j = 1:CLASSES
+            @test true_exp[i,j] ≈ calc_exp[i,j] atol= EPS;
+        end
+    end    
+    # Compute Bottom Up Expectation
+    calc_exp_2, exp_flow = ExpectationUpward(pc, lc, data);
+    for i = 1:COUNT
+        for j = 1:CLASSES
+            @test true_exp[i,j] ≈ calc_exp_2[i,j] atol= EPS;
+        end
+    end
+end
+
+function test_moment_brute_force(pc::ProbCircuit, lc::LogisticCircuit, data, CLASSES::Int, moment::Int)
+    EPS = 1e-7;
+    COUNT = size(data)[1]
+    # Compute True moment brute force
+    true_mom = zeros(COUNT, CLASSES)
+    for i in 1:COUNT
+        row = data[i, :]
+        cur_data_all = generate_all(row)
+
+        calc_p = log_likelihood_per_instance(pc, cur_data_all)
+        calc_p = exp.(calc_p)
+
+        calc_f = class_conditional_likelihood_per_instance(lc, CLASSES, cur_data_all)
+        true_mom[i, :] = sum(calc_p .* (calc_f .^ moment), dims=1)
+        true_mom[i, :] ./= sum(calc_p) #p_observed
+    end
+
+    # Compute Circuit Moment
+    calc_mom, cache = Moment(pc, lc, data, moment);
+    for i = 1:COUNT
+        for j = 1:CLASSES
+            @test (true_mom[i,j] / (calc_mom[i,j] )) ≈ 1.0 atol= EPS;
+        end
+    end    
+end
+
+
+@testset "Expectation Brute Force Test Small (4 Var)" begin
+    psdd_file       = "little_4var.psdd"
+    logistic_file   = "little_4var.circuit"
+    CLASSES = 2
+    N = 4
+
+    pc = zoo_psdd(psdd_file);
+    lc = zoo_lc(logistic_file, CLASSES);
+    data = Int8.([
+                        0 0 0 0; 
+                        0 1 1 0; 
+                        0 0 1 1;
+                        -1 -1 -1 -1;
+                        -1 0 1 -1;
+                        0 1 -1 1;
+                        1 -1 0 -1;
+                        -1 0 1 -1;
+                        -1 -1 0 1;
+                        -1 -1 -1 1;
+                        -1 -1 -1 0;
+                        ]);
+
+    test_expectation_brute_force(pc, lc, data, CLASSES)
+end
+
+
+@testset "Expectation Brute Force Test Big (15 Var)" begin
+    psdd_file       = "exp-D15-N1000-C4.psdd"
+    logistic_file   = "exp-D15-N1000-C4.circuit"
+    CLASSES = 4
+    N = 15
+    COUNT = 10
+
+    pc = zoo_psdd(psdd_file);
+    lc = zoo_lc(logistic_file, CLASSES);
+    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
+    
+    test_expectation_brute_force(pc, lc, data, CLASSES)
+end
+
+
+@testset "Moment Brute Force Test Small (4 Var)" begin
+    psdd_file       = "little_4var.psdd"
+    logistic_file   = "little_4var.circuit";
+    CLASSES = 2
+    N = 4
+    COUNT = 100
+
+    pc = zoo_psdd(psdd_file);
+    lc = zoo_lc(logistic_file, CLASSES);
+    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
+
+    test_moment_brute_force(pc, lc, data, CLASSES, 1)
+    test_moment_brute_force(pc, lc, data, CLASSES, 2)
+    test_moment_brute_force(pc, lc, data, CLASSES, 3)
+    test_moment_brute_force(pc, lc, data, CLASSES, 4)
+    test_moment_brute_force(pc, lc, data, CLASSES, 10)
+    test_moment_brute_force(pc, lc, data, CLASSES, 15)
+end
+
+@testset "Moment Brute Force Test Big (15 Var)" begin
+    psdd_file       = "exp-D15-N1000-C4.psdd"
+    logistic_file   = "exp-D15-N1000-C4.circuit";
+    CLASSES = 4
+    N = 15
+    COUNT = 10
+
+    pc = zoo_psdd(psdd_file);
+    lc = zoo_lc(logistic_file, CLASSES);
+    data = Int8.(rand( (-1,0,1), (COUNT, N) ))
+
+    test_moment_brute_force(pc, lc, data, CLASSES, 1)
+    test_moment_brute_force(pc, lc, data, CLASSES, 2)
+    test_moment_brute_force(pc, lc, data, CLASSES, 3)
+    test_moment_brute_force(pc, lc, data, CLASSES, 4)
+    test_moment_brute_force(pc, lc, data, CLASSES, 10)
+    test_moment_brute_force(pc, lc, data, CLASSES, 15)
+end
\ No newline at end of file

From db318026890595a8f0465c243c8907e6f88822fd Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 15:09:49 -0500
Subject: [PATCH 111/131] remove deprecated mixture code

---
 src/mixtures/deprecated/Bagging.jl |  61 -----------
 src/mixtures/todo/EMLearner.jl     | 160 ---------------------------
 src/mixtures/todo/Mixtures.jl      | 169 -----------------------------
 3 files changed, 390 deletions(-)
 delete mode 100644 src/mixtures/deprecated/Bagging.jl
 delete mode 100644 src/mixtures/todo/EMLearner.jl
 delete mode 100644 src/mixtures/todo/Mixtures.jl

diff --git a/src/mixtures/deprecated/Bagging.jl b/src/mixtures/deprecated/Bagging.jl
deleted file mode 100644
index 980fa4e2..00000000
--- a/src/mixtures/deprecated/Bagging.jl
+++ /dev/null
@@ -1,61 +0,0 @@
-import StatsBase
-
-function bootstrap_samples_ids(train_x::PlainXData, n_samples::Int
-                               #, rand_gen::AbstractRNG
-                               )
-    n_instances = num_examples(train_x)
-    ids = 1:n_instances
-    return [StatsBase.sample(
-        #rand_gen,
-        ids, n_instances, replace=true) for i in 1:n_samples]
-end
-    
-function train_bagging(# pcs::Vector{<:ProbCircuit},
-                        train_x::XBatches{Bool},
-                        n_components::Int64;
-                        init_models=nothing,
-                        mixture_weights,
-                        learn_base_estimator,
-                        base_estimator_params,
-                        logs)
-                        
-    @assert length(logs) == n_components "Dimension not match in train bagging."
-    # bootstrapping samples
-    bagging_samples = init_bagging_samples(train_x, n_components)
-    
-    # weights
-    weights = nothing
-    if mixture_weights == "uniform"
-        weights = ones(Float64, n_components) ./ n_components
-    else
-        throw(DomainError(mixture_weights, "Unrecognized mixture weight mode"))
-    end
-
-    if issomething(init_models)
-        @assert length(init_models) == n_components "Dimension not match in train bagging."
-        for i in 1 : n_components
-            learn_base_estimator(bagging_samples[i], init_models[i]; log=logs[i], base_estimator_params...)
-        end
-    
-    else
-        for i in 1 : n_components
-            learn_base_estimator(bagging_samples[i]; log=logs[i], base_estimator_params...)
-        end
-    end
-end
-
-function init_bagging_samples(train_x::XBatches{Bool}, num_bags::Int64)::Vector{XBatches{Bool}}
-    batch_size = max_batch_size(train_x)
-    
-    unbatched = unbatch(train_x)
-    m = feature_matrix(unbatched)
-    bagging_samples = Vector{XBatches{Bool}}()
-
-    bootstrapped_ids = bootstrap_samples_ids(unbatched, num_bags)
-
-    for i in 1 : num_bags
-        new_examples = PlainXData(m[bootstrapped_ids[i], :])
-        push!(bagging_samples, batch(new_examples, batch_size))
-    end
-    bagging_samples
-end
diff --git a/src/mixtures/todo/EMLearner.jl b/src/mixtures/todo/EMLearner.jl
deleted file mode 100644
index 738379cc..00000000
--- a/src/mixtures/todo/EMLearner.jl
+++ /dev/null
@@ -1,160 +0,0 @@
-"""
-Train a mixture of probabilistic circuits from data, starting with random example weights.
-"""
-function train_mixture( pcs::Vector{<:ProbCircuit},
-                        train_x::XBatches{Bool},
-                        pseudocount, num_iters;
-                        structure_learner=nothing, learnstruct_step = num_iters + 1, # structure learning
-                        logger=nothing, logging_step = 1 # logging or saving results
-                      )::AbstractFlatMixture
-
-
-    # create mixture model with uniform component weights
-    mixture_flow = init_mixture_with_flows(FlatMixture(pcs), train_x)
-
-    # reset aggregate statistics
-    reset_mixture_aggregate_flows(mixture_flow)
-
-    # do a quick maximization step
-    for batch in train_x
-        example_weights = random_example_weights(num_examples(batch), num_components(mixture_flow))
-        aggregate_flows(mixture_flow, batch, example_weights)
-    end
-    estimate_parameters(mixture_flow, component_weights(mixture_flow); pseudocount=pseudocount)
-
-    train_mixture(mixture_flow, train_x, pseudocount, num_iters; 
-                structure_learner=structure_learner, learnstruct_step=learnstruct_step, 
-                logger=logger, logging_step=logging_step)
-end
-
-"""
-Train a mixture model from data.
-Learning is initialized from the parameters stored in the given mixture.
-When a `structure_learner` is given, it will be called between EM steps to update circuit structures.
-"""
-function train_mixture( mixture::AbstractFlatMixture, # we start from component weights that are already given
-                        train_x::XBatches{Bool},
-                        pseudocount, num_iters;
-                        structure_learner=nothing, learnstruct_step = num_iters + 1, # structure learning
-                        logger=nothing, logging_step = 1 # logging or saving results
-                      )::AbstractFlatMixture
-    
-    @assert feature_type(train_x) == Bool "Can only learn probabilistic circuits on Bool data"
-
-    # initialize data structures
-    mixture_flow = init_mixture_with_flows(mixture, train_x)
-
-    if issomething(logger)
-        logger(mixture_flow)
-    end
-    
-    for i in 1:num_iters
-
-        # reset aggregate statistics
-        total_component_probability = ones(Float64, num_components(mixture_flow)) .* pseudocount ./ num_components(mixture_flow)
-        reset_mixture_aggregate_flows(mixture_flow)
-
-        # are we doing structure learning at the end of this iteration?
-        is_learnstruct_iter = issomething(structure_learner) && i % learnstruct_step == 0 
-
-        all_example_weights = Vector{Matrix{Float64}}()
-
-        # Expectation step (update example weights given mixture parameters)
-        # + collecting aggregate statistics for subsequent maximization step
-        for batch in train_x
-            log_p_of_x_and_c = log_likelihood_per_instance_component(mixture_flow, batch)
-            example_weights = component_weights_per_example(log_p_of_x_and_c)
-            
-            # copy the flows already computed by `log_likelihood_per_instance_component` into the underlying aggregate flow circuit
-            # this way the maximization step can use them to estimate new parameters
-            aggregate_flows_cached(mixture_flow, batch, example_weights)
-
-            # store the aggregated component probabilities such that the maximization step can re-estimate the component weights
-            total_component_probability .+= dropdims(sum(example_weights, dims=1), dims=1)
-
-            # cache the example weights for the structure learner at the end of this EM iteration
-            is_learnstruct_iter && push!(all_example_weights, example_weights)
-        end
-
-        # Maximization step (update mixture parameters given example weights (as stored in aggregate circuits))
-        estimate_parameters(mixture_flow, total_component_probability; pseudocount=pseudocount)
-
-        # Structural EM step
-        if is_learnstruct_iter
-            new_mixture_flow = structure_learner(mixture_flow, train_x, all_example_weights)
-            # mixture = replace_prob_circuits(mixture, new_pcs)
-            # re-initialize data structures
-            mixture_flow = init_mixture_with_flows(new_mixture_flow, train_x)
-        end
-
-        if i % logging_step == 0 && issomething(logger)
-            logger(mixture_flow)
-        end
-    end
-
-    return mixture_flow
-end
-
-"Ensure we have a FlatMixtureWithFlow where the flow circuits have aggregate flow circuits as origin"
-function init_mixture_with_flows(mixture::FlatMixtureWithFlow, ::XBatches{Bool})::FlatMixtureWithFlow 
-    if ! all(fc -> grand_origin(fc) isa AggregateFlowΔ, mixture.flowcircuits)
-        init_mixture_with_flows(origin(mixture))
-    else
-        mixture 
-    end
-end
-function init_mixture_with_flows(mixture::FlatMixture, train_x::XBatches{Bool})::FlatMixtureWithFlow
-    aggr_circuits = [AggregateFlowΔ(pc, Float64) for pc in components(mixture)]
-    flow_circuits = [FlowΔ(afc, max_batch_size(train_x), Bool, opts_accumulate_flows) for afc in aggr_circuits]
-    FlatMixtureWithFlow(mixture, flow_circuits)
-end
-
-function reset_mixture_aggregate_flows(mixture_flow::FlatMixtureWithFlow)
-    for fc in mixture_flow.flowcircuits
-        reset_aggregate_flows(grand_origin(fc))
-    end
-end
-
-"Compute the component weights for each example from likelihoods"
-function component_weights_per_example(log_p_of_x_and_c)
-    log_p_of_x = logaddexp(log_p_of_x_and_c, 2) # marginalize out components
-    log_p_of_given_x_query_c = mapslices(col -> col .- log_p_of_x, log_p_of_x_and_c, dims=[1])
-    p_of_given_x_query_c = exp.(log_p_of_given_x_query_c) # no more risk of underflow, so go to linear space
-    @assert sum(p_of_given_x_query_c) ≈ size(log_p_of_x_and_c, 1) # each row has proability 1
-    p_of_given_x_query_c
-end
-
-"Compute and aggregate flows for mixture components"
-function aggregate_flows(mixture_flow, batch, example_weights)
-    for i in 1:num_components(mixture_flow)
-        fc =  mixture_flow.flowcircuits[i]
-        wbatch = weighted_batch_for_component(batch, example_weights,i)
-        accumulate_aggr_flows_batch(fc, wbatch)
-    end
-end
-
-"Aggregate already-computed flows for mixture components"
-function aggregate_flows_cached(mixture_flow, batch, example_weights)
-    for i in 1:num_components(mixture_flow)
-        fc =  mixture_flow.flowcircuits[i]
-        wbatch = weighted_batch_for_component(batch, example_weights,i)
-        accumulate_aggr_flows_cached(fc, wbatch)
-    end
-end
-
-function estimate_parameters(mixture_flow, total_component_probability; pseudocount)
-    component_weights(mixture_flow) .= total_component_probability ./ sum(total_component_probability)
-    for fc in mixture_flow.flowcircuits
-        estimate_parameters_cached(grand_origin(fc); pseudocount=pseudocount)
-    end
-end
-
-"Get a new weighted batch for this component"
-weighted_batch_for_component(batch::PlainXData, example_weights, component_i)::WXData =
-    WXData(batch, example_weights[:,component_i])
-
-"Create random example weights that sum to one overall components"
-function random_example_weights(num_examples::Int, num_components::Int)::Matrix{Float64}
-    w = rand(Float64, num_examples, num_components)
-    w ./ sum(w;dims=2)
-end
\ No newline at end of file
diff --git a/src/mixtures/todo/Mixtures.jl b/src/mixtures/todo/Mixtures.jl
deleted file mode 100644
index 2337ccc9..00000000
--- a/src/mixtures/todo/Mixtures.jl
+++ /dev/null
@@ -1,169 +0,0 @@
-#####################
-# Probabilistic circuit mixtures
-#####################
-
-"A probabilistic mixture model"
-abstract type AbstractMixture end
-
-"A probabilistic mixture model whose components are not themselves mixtures"
-abstract type AbstractFlatMixture <: AbstractMixture end
-
-"A probabilistic mixture model whose components are themselves mixtures"
-abstract type AbstractMetaMixture <: AbstractMixture end
-
-"A probabilistic mixture model of probabilistic circuits"
-struct FlatMixture <: AbstractFlatMixture
-    weights::Vector{Float64}
-    components::Vector{<:ProbCircuit}
-    FlatMixture(w,c) = begin
-        @assert length(w) == length(c)
-        @assert sum(w) ≈ 1.0
-        new(w,c)
-    end
-end
-
-FlatMixture(c) = FlatMixture(uniform(length(c)),c)
-
-"A mixture with cached flow circuits for each component (which are assumed to be ProbCircuits)"
-struct FlatMixtureWithFlow <: AbstractFlatMixture
-    origin::FlatMixture
-    flowcircuits::Vector{<:FlowΔ}
-    FlatMixtureWithFlow(origin,fcs) = begin
-        @assert num_components(origin) == length(fcs)
-        foreach(components(origin), fcs) do or, fc
-            @assert or[end] === prob_origin(fc)[end]
-        end
-        new(origin,fcs)
-    end
-end
-
-FlatMixtureWithFlow(w,c,f) = FlatMixtureWithFlow(FlatMixture(w,c),f)
-
-"A probabilistic mixture model of mixture models"
-struct MetaMixture <: AbstractMetaMixture
-    weights::Vector{Float64}
-    components::Vector{<:AbstractMixture}
-    MetaMixture(w,c) = begin
-        @assert length(w) == length(c)
-        @assert sum(w) ≈ 1.0
-        new(w,c)
-    end
-end
-
-MetaMixture(c) = MetaMixture(uniform(length(c)),c)
-
-Mixture(w, c::Vector{<:AbstractMixture}) = MetaMixture(w, c)
-Mixture(w, c::Vector{<:ProbCircuit}) = FlatMixture(w, c)
-
-#####################
-# Functions
-#####################
-
-"Get the components in this mixture"
-@inline components(m::FlatMixture) = m.components
-@inline components(m::FlatMixtureWithFlow) = components(m.origin)
-@inline components(m::MetaMixture) = m.components
-
-"Get the component weights in this mixture"
-@inline component_weights(m::FlatMixture) = m.weights
-@inline component_weights(m::FlatMixtureWithFlow) = component_weights(m.origin)
-@inline component_weights(m::MetaMixture) = m.weights
-
-"Number of components in a mixture"
-@inline num_components(m::AbstractMixture)::Int = length(components(m))
-
-"Convert a given flat mixture into one with cached flows"
-ensure_with_flows(m::FlatMixture, size_hint::Int)::FlatMixtureWithFlow = begin
-    flowcircuits = [FlowΔ(pc, size_hint, Bool, opts_accumulate_flows) for pc in components(m)]
-    FlatMixtureWithFlow(m,flowcircuits)
-end
-ensure_with_flows(m::FlatMixtureWithFlow, ::Int)::FlatMixtureWithFlow = m
-
-replace_prob_circuits(m::FlatMixture, pcs::Vector{ProbCircuit}) =
-    FlatMixture(component_weights(m), pcs)
-
-# log_likelihood
-
-function log_likelihood(mixture::FlatMixture, batches::XBatches{Bool})::Float64
-    mwf = ensure_with_flows(mixture, max_batch_size(batches))
-    log_likelihood(mwf, batches)
-end
-
-function log_likelihood(mixture::FlatMixtureWithFlow, batches::XBatches{Bool})::Float64
-    # assume the per-batch call will compute a weighted sum over examples
-    sum(batch -> log_likelihood(mixture, batch), batches)
-end
-
-function log_likelihood(mixture::FlatMixtureWithFlow, batch::PlainXData{Bool})::Float64
-    sum(log_likelihood_per_instance(mixture, batch))
-end
-
-function log_likelihood(mixture::MetaMixture, batches::XBatches{Bool})::Float64
-    sum(batch -> log_likelihood(mixture, batch), batches)
-end
-
-function log_likelihood(mixture::MetaMixture, batch::PlainXData{Bool})::Float64
-    sum(log_likelihood_per_instance(mixture, batch))
-end
-
-# log_likelihood_per_instance (including mixture weight likelihood)
-
-function log_likelihood_per_instance(mixture::FlatMixture, batches::XBatches{Bool})::Vector{Float64}
-    mwf = ensure_with_flows(mixture, max_batch_size(batches))
-    log_likelihood_per_instance(mwf, batches)
-end
-
-function log_likelihood_per_instance(mixture::FlatMixtureWithFlow, batches::XBatches{Bool})::Vector{Float64}
-    mapreduce(b -> log_likelihood_per_instance(mixture, b), vcat, batches)
-end
-
-function log_likelihood_per_instance(mixture::FlatMixtureWithFlow, batch::PlainXData{Bool})::Vector{Float64}
-    log_p_of_x_and_c = log_likelihood_per_instance_component(mixture, batch)
-    logaddexp(log_p_of_x_and_c, 2)
-end
-
-function log_likelihood_per_instance(mixture::MetaMixture, batches::XBatches{Bool})::Vector{Float64}
-    mapreduce(b -> log_likelihood_per_instance(mixture, b), vcat, batches)
-end
-
-function log_likelihood_per_instance(mixture::MetaMixture, batches::PlainXData{Bool})::Vector{Float64}
-    log_p_of_x_and_c = log_likelihood_per_instance_component(mixture, batch)
-    logaddexp(log_p_of_x_and_c, 2)
-end
-
-# Log likelihoods per instance and component (including mixture weight likelihood)
-
-
-"Log likelihood per instance and component. A vector of matrices per batch where the first dimension is instance, second is components."
-function log_likelihood_per_instance_component(mixture::FlatMixtureWithFlow, batches::XBatches{Bool})::Vector{Matrix{Float64}}
-    [log_likelihood_per_instance_component(mixture, batch) for batch in batches]
-end
-
-"Log likelihood per instance and component. First dimension is instance, second is components."
-function log_likelihood_per_instance_component(mixture::FlatMixtureWithFlow, batch::PlainXData{Bool})::Matrix{Float64}
-    hcat(log_likelihood_per_component_instance(mixture, batch)...)
-end
-
-"Log likelihood per component and instance. Outer vector is components, inner vector is instances"
-function log_likelihood_per_component_instance(mixture::FlatMixtureWithFlow, batch::PlainXData{Bool})::Vector{Vector{Float64}}
-    map(mixture.flowcircuits, component_weights(mixture)) do fc, component_weight
-        log_likelihood_per_instance(fc, batch) .+ log(component_weight)
-    end
-end
-
-"Log likelihood per instance and component. A vector of matrices per batch where the first dimension is instance, second is components."
-function log_likelihood_per_instance_component(mixture::MetaMixture, batches::XBatches{Bool})::Vector{Matrix{Float64}}
-    [log_likelihood_per_instance_component(mixture, batch) for batch in batches]
-end
-
-"Log likelihood per instance and component. First dimension is instance, second is components."
-function log_likelihood_per_instance_component(mixture::MetaMixture, batch::PlainXData{Bool})::Matrix{Float64}
-    hcat(log_likelihood_per_component_instance(mixture, batch)...)
-end
-
-"Log likelihood per component and instance. Outer vector is components, inner vector is instances"
-function log_likelihood_per_component_instance(mixture::MetaMixture, batch::PlainXData{Bool})::Vector{Vector{Float64}}
-    map(mixture.components, component_weights(mixture)) do c, component_weight
-        log_likelihood_per_instance(c, batch) .+ log(component_weight)
-    end
-end
\ No newline at end of file

From d113f62cf45d0b7a1f6917448448d5eb318f7927 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sat, 12 Sep 2020 20:23:52 -0500
Subject: [PATCH 112/131] reinstate `SharedProbCircuit`

---
 src/ProbabilisticCircuits.jl      |  3 +-
 src/mixtures/shared_prob_nodes.jl | 88 +++++++++++++++++++++----------
 2 files changed, 60 insertions(+), 31 deletions(-)

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 2b0ed0bd..f693e75a 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -28,12 +28,11 @@ include("queries/expectation_graph.jl")
 include("Logistic/Logistic.jl")
 @reexport using .Logistic
 
-# include("exp_flows.jl")
+include("mixtures/shared_prob_nodes.jl")
 
 # include("reasoning/expectation.jl")
 # include("reasoning/exp_flow_circuits.jl")
 
-# include("mixtures/shared_prob_nodes.jl")
 # include("mixtures/em.jl")
 
 # include("structurelearner/chow_liu_tree.jl")
diff --git a/src/mixtures/shared_prob_nodes.jl b/src/mixtures/shared_prob_nodes.jl
index 9f0f9821..c2c3a651 100644
--- a/src/mixtures/shared_prob_nodes.jl
+++ b/src/mixtures/shared_prob_nodes.jl
@@ -1,55 +1,55 @@
-export SharedProbCircuit, SharedPlainProbLeafNode, SharedPlainProbInnerNode, SharedPlainProbLiteralNode,
-SharedPlainMulNode, SharedPlainSumNode, num_components
+export SharedProbCircuit, SharedProbLeafNode, SharedProbInnerNode, SharedProbLiteralNode,
+SharedMulNode, SharedSumNode, num_components
 
 #####################
 # Probabilistic circuits which share the same structure
 #####################
 
 """
-Root of the probabilistic circuit node hierarchy
+Root of the shared probabilistic circuit node hierarchy
 """
-abstract type SharedProbCircuit <: LogicCircuit end
+abstract type SharedProbCircuit <: ProbCircuit end
 
 """
-A probabilistic leaf node
+A shared probabilistic leaf node
 """
-abstract type SharedPlainProbLeafNode <: SharedProbCircuit end
+abstract type SharedProbLeafNode <: SharedProbCircuit end
 
 """
-A probabilistic inner node
+A shared probabilistic inner node
 """
-abstract type SharedPlainProbInnerNode <: SharedProbCircuit end
+abstract type SharedProbInnerNode <: SharedProbCircuit end
 
 """
-A probabilistic literal node
+A shared probabilistic literal node
 """
-mutable struct SharedPlainProbLiteralNode <: SharedPlainProbLeafNode
+mutable struct SharedProbLiteralNode <: SharedProbLeafNode
     literal::Lit
     data
     counter::UInt32
-    SharedPlainProbLiteralNode(l) = new(l, nothing, 0)
+    SharedProbLiteralNode(l) = new(l, nothing, 0)
 end
 
 """
-A probabilistic conjunction node (And node)
+A shared probabilistic multiplcation node
 """
-mutable struct SharedPlainMulNode <: SharedPlainProbInnerNode
+mutable struct SharedMulNode <: SharedProbInnerNode
     children::Vector{<:SharedProbCircuit}
     data
     counter::UInt32
-    SharedPlainMulNode(children) = new(convert(Vector{SharedProbCircuit}, children), nothing, 0)
+    SharedMulNode(children) = new(children, nothing, 0)
 end
 
 """
-A probabilistic disjunction node (Or node)
+A shared probabilistic summation node
 """
-mutable struct SharedPlainSumNode <: SharedPlainProbInnerNode
+mutable struct SharedSumNode <: SharedProbInnerNode
     children::Vector{<:SharedProbCircuit}
     log_probs::Matrix{Float64}
     data
     counter::UInt32
-    SharedPlainSumNode(children, n_mixture) = begin
-        new(convert(Vector{SharedProbCircuit}, children), init_array(Float64, length(children), n_mixture), nothing, 0)
+    SharedSumNode(children, n_mixture) = begin
+        new(children, init_array(Float64, length(children), n_mixture), nothing, 0)
     end
 end
 
@@ -58,24 +58,54 @@ end
 #####################
 
 import LogicCircuits.GateType # make available for extension
-@inline GateType(::Type{<:SharedPlainProbLiteralNode}) = LiteralGate()
-@inline GateType(::Type{<:SharedPlainMulNode}) = ⋀Gate()
-@inline GateType(::Type{<:SharedPlainSumNode}) = ⋁Gate()
+@inline GateType(::Type{<:SharedProbLiteralNode}) = LiteralGate()
+@inline GateType(::Type{<:SharedMulNode}) = ⋀Gate()
+@inline GateType(::Type{<:SharedSumNode}) = ⋁Gate()
+
+#####################
+# methods
+#####################
+
+import LogicCircuits: children # make available for extension
+@inline children(n::SharedProbInnerNode) = n.children
+
+@inline num_parameters_node(n::SharedSumNode) = length(n.log_probs)
+
+"How many components are mixed together in this shared circuit?"
+@inline num_components(n::SharedSumNode) = size(n.log_probs,2)
 
 #####################
 # constructors and conversions
 #####################
 
-function SharedProbCircuit(circuit::LogicCircuit, num_mixture::Int64)::SharedProbCircuit
+function multiply(arguments::Vector{<:SharedProbCircuit};
+    reuse=nothing)
+    @assert length(arguments) > 0
+    reuse isa SharedMulNode && children(reuse) == arguments && return reuse
+    return SharedMulNode(arguments)
+end
+
+function summate(arguments::Vector{<:SharedProbCircuit}, num_components=0;
+       reuse=nothing)
+    @assert length(arguments) > 0
+    reuse isa SharedSumNode && children(reuse) == arguments && return reuse
+    return SharedSumNode(arguments, num_components) # unknwown number of components; resize later
+end
+
+compile(::Type{<:SharedProbCircuit}, l::Lit) =
+    SharedProbLiteralNode(l)
+
+function compile(::Type{<:SharedProbCircuit}, circuit::LogicCircuit, num_components::Int)
     f_con(n) = error("Cannot construct a probabilistic circuit from constant leafs: first smooth and remove unsatisfiable branches.")
-    f_lit(n) = SharedPlainProbLiteralNode(literal(n))
-    f_a(n, cn) = SharedPlainMulNode(cn)
-    f_o(n, cn) = SharedPlainSumNode(cn, num_mixture)
+    f_lit(n) = compile(SharedProbCircuit, literal(n))
+    f_a(_, cns) = multiply(cns)
+    f_o(_, cns) = summate(cns, num_components)
     foldup_aggregate(circuit, f_con, f_lit, f_a, f_o, SharedProbCircuit)
 end
 
+import LogicCircuits: fully_factorized_circuit #extend
 
-import LogicCircuits: children # make available for extension
-
-@inline children(n::SharedPlainProbInnerNode) = n.children
-@inline num_components(n::SharedProbCircuit) = size(n.log_probs)[2]
+function fully_factorized_circuit(::Type{<:SharedProbCircuit}, n::Int)
+    ff_logic_circuit = fully_factorized_circuit(PlainLogicCircuit, n)
+    compile(SharedProbCircuit, ff_logic_circuit)
+end

From 0c7ce720bafb31f970cda3f2ac68b1ecf8f8826d Mon Sep 17 00:00:00 2001
From: Pasha Khosravi <khosravipasha@gmail.com>
Date: Sat, 12 Sep 2020 22:52:38 -0700
Subject: [PATCH 113/131] make expectation codes runnable

---
 src/queries/expectation_graph.jl | 28 ++++++++++++++++++++++++++--
 src/queries/expectation_rec.jl   | 29 +++++------------------------
 2 files changed, 31 insertions(+), 26 deletions(-)

diff --git a/src/queries/expectation_graph.jl b/src/queries/expectation_graph.jl
index aab0ae9e..48e9a182 100644
--- a/src/queries/expectation_graph.jl
+++ b/src/queries/expectation_graph.jl
@@ -1,4 +1,4 @@
-export UpExpFlow, ExpFlowCircuit, exp_pass_up
+export UpExpFlow, ExpFlowCircuit, exp_pass_up, ExpectationUpward
 
 #####################
 # Expectation Flow circuits
@@ -21,6 +21,30 @@ end
 import LogicCircuits: children
 children(x::UpExpFlow) = x.children
 
+"""
+Expected Prediction of LC w.r.t PC.
+This implementation uses the computation graph approach.
+"""
+function ExpectationUpward(pc::ProbCircuit, lc::LogisticCircuit, data)
+    # 1. Get probability of each observation
+    log_likelihoods = marginal(pc, data)
+    p_observed = exp.( log_likelihoods )
+    
+    # 2. Expectation w.r.t. P(x_m, x_o)
+    exps_flow = exp_pass_up(pc, lc, data)
+    results_unnormalized = exps_flow[end].fg
+
+    # 3. Expectation w.r.t P(x_m | x_o)
+    results = transpose(results_unnormalized) ./ p_observed
+
+    # 4. Add Bias terms
+    biases = lc.thetas
+    results .+= biases
+    
+    results, exps_flow
+end
+
+
 """
 Construct a upward expectation flow circuit from a given pair of PC and LC circuits
 Note that its assuming the two circuits share the same vtree
@@ -28,7 +52,7 @@ Note that its assuming the two circuits share the same vtree
 function ExpFlowCircuit(pc::ProbCircuit, lc::LogisticCircuit, batch_size::Int, ::Type{El}) where El
     F = Array{El, 2}
     fmem = () -> zeros(1, batch_size) #Vector{El}(undef, batch_size)  #init_array(El, batch_size) # note: fmem's return type will determine type of all UpFlows in the circuit (should be El)
-    fgmem = () -> zeros(classes(lc), batch_size)
+    fgmem = () -> zeros(num_classes(lc), batch_size)
 
     root_pc = pc
     root_lc = children(lc)[1]
diff --git a/src/queries/expectation_rec.jl b/src/queries/expectation_rec.jl
index c6164bee..2b0ae91b 100644
--- a/src/queries/expectation_rec.jl
+++ b/src/queries/expectation_rec.jl
@@ -1,4 +1,4 @@
-export Expectation, ExpectationUpward, Moment
+export Expectation, Moment
 
 
 ExpCacheDict = Dict{Pair{ProbCircuit, LogisticCircuit}, Array{Float64, 2}}
@@ -32,7 +32,7 @@ Missing values should be denoted by -1
 """
 function Expectation(pc::ProbCircuit, lc::LogisticCircuit, data)
     # 1. Get probability of each observation
-    log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
+    log_likelihoods = marginal(pc, data)
     p_observed = exp.( log_likelihoods )
     
     # 2. Expectation w.r.t. P(x_m, x_o)
@@ -51,13 +51,13 @@ end
 
 function Moment(pc::ProbCircuit, lc::LogisticCircuit, data, moment::Int)
     # 1. Get probability of each observation
-    log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
+    log_likelihoods = marginal(pc, data)
     p_observed = exp.( log_likelihoods )
     
     # 2. Moment w.r.t. P(x_m, x_o)
     cache = MomentCache()
     biases = lc.thetas
-    results_unnormalized = zeros(num_examples(data), classes(lc))
+    results_unnormalized = zeros(num_examples(data), num_classes(lc))
     
     for z = 0:moment-1  
         results_unnormalized .+= choose(moment, z) .* (biases .^ (z)) .* transpose(moment_g(pc, children(lc)[1], data, moment - z, cache))
@@ -73,25 +73,6 @@ function Moment(pc::ProbCircuit, lc::LogisticCircuit, data, moment::Int)
 end
 
 
-function ExpectationUpward(pc::ProbCircuit, lc::LogisticCircuit, data)
-    # 1. Get probability of each observation
-    log_likelihoods = marginal_log_likelihood_per_instance(pc, data)
-    p_observed = exp.( log_likelihoods )
-    
-    # 2. Expectation w.r.t. P(x_m, x_o)
-    exps_flow = exp_pass_up(pc, lc, data)
-    results_unnormalized = exps_flow[end].fg
-
-    # 3. Expectation w.r.t P(x_m | x_o)
-    results = transpose(results_unnormalized) ./ p_observed
-
-    # 4. Add Bias terms
-    biases = lc.thetas
-    results .+= biases
-    
-    results, exps_flow
-end
-
 
 # exp_f (pr-constraint) is originally from:
 #   Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
@@ -168,7 +149,7 @@ end
 
 function exp_fg(n::PlainSumNode, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
-        value = zeros(classes(m) , num_examples(data) )
+        value = zeros(num_classes(m) , num_examples(data) )
         pthetas = [exp(n.log_probs[i]) for i in 1:num_children(n)]
         @fastmath @simd for i in 1:num_children(n)
             for j in 1:num_children(m)

From 0f52126f9adc18ad942180fbb920306589998f13 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 13 Sep 2020 17:05:38 -0500
Subject: [PATCH 114/131] minor fixes

---
 src/ProbabilisticCircuits.jl | 5 -----
 src/mixtures/em.jl           | 3 ++-
 2 files changed, 2 insertions(+), 6 deletions(-)

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index f693e75a..1e0f8357 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -29,10 +29,6 @@ include("Logistic/Logistic.jl")
 @reexport using .Logistic
 
 include("mixtures/shared_prob_nodes.jl")
-
-# include("reasoning/expectation.jl")
-# include("reasoning/exp_flow_circuits.jl")
-
 # include("mixtures/em.jl")
 
 # include("structurelearner/chow_liu_tree.jl")
@@ -40,7 +36,6 @@ include("mixtures/shared_prob_nodes.jl")
 # include("structurelearner/heuristics.jl")
 # include("structurelearner/learner.jl")
 
-
 include("LoadSave/LoadSave.jl")
 @reexport using .LoadSave
 
diff --git a/src/mixtures/em.jl b/src/mixtures/em.jl
index fb0aa461..6554bda0 100644
--- a/src/mixtures/em.jl
+++ b/src/mixtures/em.jl
@@ -1,10 +1,11 @@
 export one_step_em, component_weights_per_example, initial_weights, clustering,
 log_likelihood_per_instance_per_component, estimate_parameters_cached, learn_em_model
+
 using Statistics: mean
 using LinearAlgebra: normalize!
 using Clustering: kmeans, nclusters, assignments
 
-function one_step_em(spc, train_x, component_weights;pseudocount)
+function one_step_em(spc, train_x, component_weights; pseudocount)
     # E step
     lls = log_likelihood_per_instance_per_component(spc, train_x)
     lls .+= log.(component_weights)

From ffacb1da0093ebae20fd6f8aa30d2535114a609a Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Mon, 14 Sep 2020 17:58:18 -0700
Subject: [PATCH 115/131] pc compilation helper

---
 src/abstract_prob_nodes.jl          | 13 +++++++++++++
 test/plain_prob_nodes_tests.jl      |  7 +++++++
 test/structured_prob_nodes_tests.jl | 10 ++++++++++
 3 files changed, 30 insertions(+)

diff --git a/src/abstract_prob_nodes.jl b/src/abstract_prob_nodes.jl
index 0f091a6a..f0f1bd56 100644
--- a/src/abstract_prob_nodes.jl
+++ b/src/abstract_prob_nodes.jl
@@ -61,6 +61,19 @@ import LogicCircuits: conjoin, disjoin # make available for extension
 compile(::Type{<:ProbCircuit}, ::Bool) =
     error("Probabilistic circuits do not have constant leafs.")
 
+struct WeightProbCircuit
+    tmp_weight :: Float64
+    circuit :: ProbCircuit
+end
+
+@inline Base.:*(w::Real, x::ProbCircuit) = WeightProbCircuit(w, x)
+@inline Base.:*(x::ProbCircuit, w::Real) = w * x
+@inline Base.:+(wpc1::WeightProbCircuit, wpc2::WeightProbCircuit) = begin
+    pc = wpc1.circuit + wpc2.circuit
+    pc.log_probs .= log.([wpc1.tmp_weight, wpc2.tmp_weight])
+    pc
+end
+
 #####################
 # circuit inspection
 #####################
diff --git a/test/plain_prob_nodes_tests.jl b/test/plain_prob_nodes_tests.jl
index 1ace42ce..592c52a7 100644
--- a/test/plain_prob_nodes_tests.jl
+++ b/test/plain_prob_nodes_tests.jl
@@ -39,4 +39,11 @@ include("helper/plain_logic_circuits.jl")
 
     @test length(mul_nodes(r1)) == 1
 
+    # compilation tests
+    lit1 = compile(PlainProbCircuit, Lit(1))
+    litn1 = compile(PlainProbCircuit, Lit(-1))
+    r = lit1 * 0.3 + 0.7 * litn1
+    @test r isa PlainSumNode
+    @test all(children(r) .== [lit1, litn1])
+    @test all(r.log_probs .≈ log.([0.3, 0.7]))
 end
\ No newline at end of file
diff --git a/test/structured_prob_nodes_tests.jl b/test/structured_prob_nodes_tests.jl
index 25374217..af4ebfb9 100644
--- a/test/structured_prob_nodes_tests.jl
+++ b/test/structured_prob_nodes_tests.jl
@@ -99,4 +99,14 @@ using DataFrames: DataFrame
     @test num_edges(c3) == 69
     @test num_variables(c3) == 7
 
+    # compilation tests
+    v = Vtree(Var(1))
+    lit1 = compile(StructProbCircuit, v, Lit(1))
+    litn1 = compile(StructProbCircuit, v, Lit(-1))
+    r = lit1 * 0.3 + 0.7 * litn1
+    @test r isa StructSumNode
+    @test all(children(r) .== [lit1, litn1])
+    @test vtree(r) === vtree(lit1)
+    @test all(r.log_probs .≈ log.([0.3, 0.7]))
+
 end
\ No newline at end of file

From 3509182becf66d3b11bf0d511489f179f4a3b884 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Mon, 14 Sep 2020 21:48:34 -0700
Subject: [PATCH 116/131] circuit visualizations

---
 src/LoadSave/LoadSave.jl            |  1 +
 src/LoadSave/plot.jl                | 26 ++++++++++++++++++++++++++
 test/structured_prob_nodes_tests.jl |  2 +-
 3 files changed, 28 insertions(+), 1 deletion(-)
 create mode 100644 src/LoadSave/plot.jl

diff --git a/src/LoadSave/LoadSave.jl b/src/LoadSave/LoadSave.jl
index c28a0c77..26ae08f2 100644
--- a/src/LoadSave/LoadSave.jl
+++ b/src/LoadSave/LoadSave.jl
@@ -6,5 +6,6 @@ using ...ProbabilisticCircuits
 include("circuit_line_compiler.jl")
 include("circuit_loaders.jl")
 include("circuit_savers.jl")
+include("plot.jl")
 
 end
\ No newline at end of file
diff --git a/src/LoadSave/plot.jl b/src/LoadSave/plot.jl
new file mode 100644
index 00000000..7e1525a8
--- /dev/null
+++ b/src/LoadSave/plot.jl
@@ -0,0 +1,26 @@
+using LightGraphs
+
+import LightGraphs: DiGraph
+
+function DiGraph(pc::ProbCircuit)
+    edge_labels = Dict()
+    label = label = Vector{String}(undef, num_nodes(pc))
+
+    add_label!(g, dict, n::ProbCircuit) = begin
+        label[dict[n]] = 
+        if isliteralgate(n) "$(literal(n))"
+        elseif ismul(n) "*"
+        else "+"
+        end
+    end
+
+    on_edge(g, id_dict, n, c, n_id, c_id) = noop
+    on_edge(g, id_dict, n::Union{PlainSumNode, StructSumNode}, c, n_id, c_id) = begin
+        edge_labels[(n_id, c_id)] = begin
+            i = findall(x -> x === c, children(n))[1]
+            "$(exp(n.log_probs[i]))"
+        end
+    end
+    g, _ = LogicCircuits.LoadSave.DiGraph(pc;on_edge=on_edge, on_var=add_label!)
+    g, label, edge_labels
+end
\ No newline at end of file
diff --git a/test/structured_prob_nodes_tests.jl b/test/structured_prob_nodes_tests.jl
index af4ebfb9..bf31a710 100644
--- a/test/structured_prob_nodes_tests.jl
+++ b/test/structured_prob_nodes_tests.jl
@@ -106,7 +106,7 @@ using DataFrames: DataFrame
     r = lit1 * 0.3 + 0.7 * litn1
     @test r isa StructSumNode
     @test all(children(r) .== [lit1, litn1])
-    @test vtree(r) === vtree(lit1)
+    @test r.vtree === lit1.vtree
     @test all(r.log_probs .≈ log.([0.3, 0.7]))
 
 end
\ No newline at end of file

From 76b52b60cbfccc169695c39e8a979d016f57f0b5 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Wed, 16 Sep 2020 03:47:04 -0500
Subject: [PATCH 117/131] commenting legacy code

---
 src/Logistic/parameter_circuit.jl | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index dc338e77..2c7be6c2 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -5,6 +5,13 @@ export LayeredParameterCircuit, CuLayeredParameterCircuit
 export class_likelihood, class_weights
 export one_hot, learn_parameters, update_parameters
 
+#############################################################
+############## This is the old implementation ###############
+#### Not intended to be used under the current framework ####
+#############################################################
+
+
+
 # in a parameter circuit
 # 1 is true, 2 is false
 const TRUE_ID = Int32(1)

From 806f154bbf9c85d4366b8b25d997f0d5ba6d28ed Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Wed, 16 Sep 2020 03:47:23 -0500
Subject: [PATCH 118/131] commenting legacy code

---
 src/Logistic/parameter_circuit.jl | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/Logistic/parameter_circuit.jl b/src/Logistic/parameter_circuit.jl
index 2c7be6c2..ee008dd7 100644
--- a/src/Logistic/parameter_circuit.jl
+++ b/src/Logistic/parameter_circuit.jl
@@ -11,7 +11,6 @@ export one_hot, learn_parameters, update_parameters
 #############################################################
 
 
-
 # in a parameter circuit
 # 1 is true, 2 is false
 const TRUE_ID = Int32(1)

From 8eaed70fcd6d63bd6aa5bb05cb3b3c8f1db758e6 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Wed, 16 Sep 2020 02:43:15 -0700
Subject: [PATCH 119/131] compilation helper

---
 Project.toml                   |  1 +
 src/LoadSave/plot.jl           |  8 ++++++++
 src/abstract_prob_nodes.jl     | 11 ++++++++---
 src/queries/expectation_rec.jl |  6 +++---
 src/queries/marginal_flow.jl   | 16 +++++++++++++++-
 5 files changed, 35 insertions(+), 7 deletions(-)

diff --git a/Project.toml b/Project.toml
index 7b255547..94501d5f 100644
--- a/Project.toml
+++ b/Project.toml
@@ -24,6 +24,7 @@ SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf"
 Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2"
 StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91"
 StatsFuns = "4c63d2b9-4356-54db-8cca-17b64c39e42c"
+TikzGraphs = "b4f28e30-c73f-5eaf-a395-8a9db949a742"
 
 [compat]
 BlossomV = "0.4"
diff --git a/src/LoadSave/plot.jl b/src/LoadSave/plot.jl
index 7e1525a8..84e7868c 100644
--- a/src/LoadSave/plot.jl
+++ b/src/LoadSave/plot.jl
@@ -1,4 +1,6 @@
+export DiGraph, plot
 using LightGraphs
+using TikzGraphs
 
 import LightGraphs: DiGraph
 
@@ -23,4 +25,10 @@ function DiGraph(pc::ProbCircuit)
     end
     g, _ = LogicCircuits.LoadSave.DiGraph(pc;on_edge=on_edge, on_var=add_label!)
     g, label, edge_labels
+end
+
+import TikzGraphs: plot
+plot(pc::ProbCircuit) = begin
+    g, label, edge_labels = DiGraph(pc)
+    TikzGraphs.plot(g, label, edge_labels=edge_labels)
 end
\ No newline at end of file
diff --git a/src/abstract_prob_nodes.jl b/src/abstract_prob_nodes.jl
index f0f1bd56..46ace89d 100644
--- a/src/abstract_prob_nodes.jl
+++ b/src/abstract_prob_nodes.jl
@@ -56,7 +56,9 @@ import LogicCircuits: conjoin, disjoin # make available for extension
     summate(args; reuse)
 
 @inline Base.:*(x::ProbCircuit, y::ProbCircuit) = multiply(x,y)
+@inline Base.:*(xs::ProbCircuit...) = multiply(xs...)
 @inline Base.:+(x::ProbCircuit, y::ProbCircuit) = summate(x,y)
+@inline Base.:+(xs::ProbCircuit...) = summate(xs...)
 
 compile(::Type{<:ProbCircuit}, ::Bool) =
     error("Probabilistic circuits do not have constant leafs.")
@@ -68,9 +70,12 @@ end
 
 @inline Base.:*(w::Real, x::ProbCircuit) = WeightProbCircuit(w, x)
 @inline Base.:*(x::ProbCircuit, w::Real) = w * x
-@inline Base.:+(wpc1::WeightProbCircuit, wpc2::WeightProbCircuit) = begin
-    pc = wpc1.circuit + wpc2.circuit
-    pc.log_probs .= log.([wpc1.tmp_weight, wpc2.tmp_weight])
+@inline Base.:+(x::WeightProbCircuit...) = begin
+    ch = collect(x)
+    c = map(x -> x.circuit, ch)
+    w = map(x -> x.tmp_weight, ch)
+    pc = summate(c)
+    pc.log_probs .= log.(w)
     pc
 end
 
diff --git a/src/queries/expectation_rec.jl b/src/queries/expectation_rec.jl
index 2b0ae91b..62db3cac 100644
--- a/src/queries/expectation_rec.jl
+++ b/src/queries/expectation_rec.jl
@@ -110,11 +110,11 @@ end
         if ispositive(n) && ispositive(m) 
             # value[1, X[:, var] .== -1 ] .= 1.0  # missing observation always agrees
             # value[1, X[:, var] .== 1 ] .= 1.0 # positive observations
-            value[1, X[:, var] .!= 0 ] .= 1.0 # positive or missing observations
+            value[1, .!isequal.(X[:, var], 0)] .= 1.0 # positive or missing observations
         elseif isnegative(n) && isnegative(m)
             # value[1, X[:, var] .== -1 ] .= 1.0  # missing observation always agrees
             # value[1, X[:, var] .== 0 ] .= 1.0 # negative observations
-            value[1, X[:, var] .!= 1 ] .= 1.0 # negative or missing observations
+            value[1, .!isequal.(X[:, var], 1)] .= 1.0 # negative or missing observations
         end
         return value
     end
@@ -204,7 +204,7 @@ function moment_fg(n::PlainSumNode, m::Logistic⋁Node, data, moment::Int, cache
     end
 
     get!(cache.fg, (n, m, moment)) do
-        value = zeros(classes(m) , num_examples(data) )
+        value = zeros(num_classes(m) , num_examples(data) )
         pthetas = [exp(n.log_probs[i]) for i in 1:num_children(n)]
         @fastmath @simd for i in 1:num_children(n)
             for j in 1:num_children(m)
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index 2a200a05..ec7d399c 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -5,7 +5,8 @@ using DataFrames: DataFrame
 using LoopVectorization: @avx
 using LogicCircuits: balance_threads
 
-export marginal, MAR, marginal_all, marginal_flows, marginal_flows_down
+export marginal, MAR, marginal_all, marginal_log_likelihood, 
+marginal_log_likelihood_avg, marginal_flows, marginal_flows_down
 
 #####################
 # Circuit marginal evaluation
@@ -30,8 +31,21 @@ function marginal(circuit::ParamBitCircuit, data::DataFrame)::AbstractVector
     marginal_all(circuit,data)[:,end]
 end
 
+"""
+Marginal queries
+"""
 const MAR = marginal
 
+"""
+Compute the marginal likelihood of the PC given the data
+"""
+marginal_log_likelihood(pc, data) = sum(marginal(pc, data))
+
+"""
+Compute the marginal likelihood of the PC given the data, averaged over all instances in the data
+"""
+marginal_log_likelihood_avg(pc, data) = marginal_log_likelihood(pc, data)/num_examples(data)
+
 #####################
 # Circuit evaluation of *all* nodes in circuit
 #####################

From dcf1aa888bee09ec804cdae75a340a094e0db573 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Wed, 16 Sep 2020 03:10:32 -0700
Subject: [PATCH 120/131] minor changes

---
 src/queries/expectation_rec.jl | 28 ++++++++++++++--------------
 src/queries/pr_constraint.jl   |  8 ++++----
 2 files changed, 18 insertions(+), 18 deletions(-)

diff --git a/src/queries/expectation_rec.jl b/src/queries/expectation_rec.jl
index 62db3cac..93e90e1d 100644
--- a/src/queries/expectation_rec.jl
+++ b/src/queries/expectation_rec.jl
@@ -77,7 +77,7 @@ end
 # exp_f (pr-constraint) is originally from:
 #   Arthur Choi, Guy Van den Broeck, and Adnan Darwiche. Tractable learning for structured probability spaces: A case study in learning preference distributions. In Proceedings of IJCAI, 2015.
 
-function exp_f(n::PlainSumNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::Union{PlainSumNode, StructSumNode}, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
         pthetas = [exp(n.log_probs[i]) for i in 1:num_children(n)]
@@ -90,7 +90,7 @@ function exp_f(n::PlainSumNode, m::Logistic⋁Node, data, cache::Union{Expectati
     end
 end
 
-function exp_f(n::PlainMulNode, m::Logistic⋀Node, data, cache::Union{ExpectationCache, MomentCache})
+function exp_f(n::Union{PlainMulNode, StructMulNode}, m::Logistic⋀Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = ones(1 , num_examples(data) )
         @fastmath for (i,j) in zip(children(n), children(m))
@@ -102,7 +102,7 @@ function exp_f(n::PlainMulNode, m::Logistic⋀Node, data, cache::Union{Expectati
 end
 
 
-@inline function exp_f(n::PlainProbLiteralNode, m::LogisticLiteral, data, cache::Union{ExpectationCache, MomentCache})
+@inline function exp_f(n::Union{PlainProbLiteralNode, StructProbLiteralNode}, m::LogisticLiteral, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         value = zeros(1 , num_examples(data) )
         var = lit2var(literal(m))
@@ -123,7 +123,7 @@ end
 """
 Has to be a Logistic⋁Node with only one child, which is a leaf node 
 """
-@inline function exp_f(n::PlainProbLiteralNode, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
+@inline function exp_f(n::Union{PlainProbLiteralNode, StructProbLiteralNode}, m::Logistic⋁Node, data, cache::Union{ExpectationCache, MomentCache})
     @inbounds get!(cache.f, Pair(n, m)) do
         exp_f(n, children(m)[1], data, cache)
     end
@@ -133,7 +133,7 @@ end
 ######## exp_g, exp_fg
 ########################################################################
 
-@inline function exp_g(n::PlainSumNode, m::Logistic⋁Node, data, cache::ExpectationCache)
+@inline function exp_g(n::Union{PlainSumNode, StructSumNode}, m::Logistic⋁Node, data, cache::ExpectationCache)
     exp_fg(n, m, data, cache) # exp_fg and exp_g are the same for OR nodes
 end
 
@@ -147,7 +147,7 @@ end
 # end
 
 
-function exp_fg(n::PlainSumNode, m::Logistic⋁Node, data, cache::ExpectationCache)
+function exp_fg(n::Union{PlainSumNode, StructSumNode}, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         value = zeros(num_classes(m) , num_examples(data) )
         pthetas = [exp(n.log_probs[i]) for i in 1:num_children(n)]
@@ -161,7 +161,7 @@ function exp_fg(n::PlainSumNode, m::Logistic⋁Node, data, cache::ExpectationCac
     end
 end
 
-function exp_fg(n::PlainMulNode, m::Logistic⋀Node, data, cache::ExpectationCache)
+function exp_fg(n::Union{PlainMulNode, StructMulNode}, m::Logistic⋀Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         # Assuming 2 children
         value = exp_f(children(n)[1], children(m)[1], data, cache) .* exp_fg(children(n)[2], children(m)[2], data, cache)
@@ -174,13 +174,13 @@ end
 """
 Has to be a Logistic⋁Node with only one child, which is a leaf node 
 """
-@inline function exp_fg(n::PlainProbLiteralNode, m::Logistic⋁Node, data, cache::ExpectationCache)
+@inline function exp_fg(n::Union{PlainProbLiteralNode, StructProbLiteralNode}, m::Logistic⋁Node, data, cache::ExpectationCache)
     @inbounds get!(cache.fg, Pair(n, m)) do
         m.thetas[1,:] .* exp_f(n, m, data, cache)
     end
 end
 
-@inline function exp_fg(n::PlainProbLiteralNode, m::LogisticLiteral, data, cache::ExpectationCache)
+@inline function exp_fg(n::Union{PlainProbLiteralNode, StructProbLiteralNode}, m::LogisticLiteral, data, cache::ExpectationCache)
     #dont know how many classes, boradcasting does the job
     zeros(1 , num_examples(data)) 
 end
@@ -189,7 +189,7 @@ end
 ######## moment_g, moment_fg
 ########################################################################
 
-@inline function moment_g(n::PlainSumNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
+@inline function moment_g(n::Union{PlainSumNode, StructSumNode}, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         moment_fg(n, m, data, moment, cache)
     end
@@ -198,7 +198,7 @@ end
 """
 Calculating  E[g^k * f]
 """
-function moment_fg(n::PlainSumNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
+function moment_fg(n::Union{PlainSumNode, StructSumNode}, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
@@ -217,13 +217,13 @@ function moment_fg(n::PlainSumNode, m::Logistic⋁Node, data, moment::Int, cache
     end
 end
 
-@inline function moment_fg(n::PlainProbLiteralNode, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
+@inline function moment_fg(n::Union{PlainProbLiteralNode, StructProbLiteralNode}, m::Logistic⋁Node, data, moment::Int, cache::MomentCache)
     get!(cache.fg, (n, m, moment)) do
         m.thetas[1,:].^(moment) .* exp_f(n, m, data, cache)
     end
 end
 
-@inline function moment_fg(n::PlainProbLiteralNode, m::LogisticLiteral, data, moment::Int, cache::MomentCache)
+@inline function moment_fg(n::Union{PlainProbLiteralNode, StructProbLiteralNode}, m::LogisticLiteral, data, moment::Int, cache::MomentCache)
     #dont know how many classes, boradcasting does the job
     if moment == 0
         exp_f(n, m, data, cache)
@@ -232,7 +232,7 @@ end
     end
 end
 
-function moment_fg(n::PlainMulNode, m::Logistic⋀Node, data, moment::Int, cache::MomentCache)
+function moment_fg(n::Union{PlainMulNode, StructMulNode}, m::Logistic⋀Node, data, moment::Int, cache::MomentCache)
     if moment == 0
         return exp_f(n, m, data, cache)
     end
diff --git a/src/queries/pr_constraint.jl b/src/queries/pr_constraint.jl
index c3183128..4594a5c5 100644
--- a/src/queries/pr_constraint.jl
+++ b/src/queries/pr_constraint.jl
@@ -11,14 +11,14 @@ Calculate the probability of the logic formula given by LC for the PC
 function pr_constraint(pc_node::StructProbCircuit, lc_node, cache::PRCache=PRCache())::Float64
 
     # TODO require that both circuits have an equal vtree for safety. If they don't, then first convert them to have a vtree
-    
+    @assert respects_vtree(lc_node, vtree(pc_node)) "Both circuits do not have an equal vtree"
+
     # Cache hit
     if (pc_node, lc_node) in keys(cache) 
         return cache[pc_node, lc_node]
     
     # Boundary cases
-    # TODO: make this more general-purpose, use `isliteralgate`
-    elseif pc_node isa StructProbLiteralNode
+    elseif isliteralgate(pc_node)
         # Both are literals, just check whether they agrees with each other 
         if isliteralgate(lc_node)
             if literal(pc_node) == literal(lc_node)
@@ -38,7 +38,7 @@ function pr_constraint(pc_node::StructProbCircuit, lc_node, cache::PRCache=PRCac
         end
     
     # The pc is true
-    elseif children(pc_node)[1] isa StructProbLiteralNode 
+    elseif isliteralgate(children(pc_node)[1])
         theta = exp(pc_node.log_probs[1])
         return get!(cache, (pc_node, lc_node),
             theta * pr_constraint(children(pc_node)[1], lc_node, cache) +

From 057e7aab5c1d19d9256b931fc9b27b1e978473e0 Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Wed, 16 Sep 2020 03:36:51 -0700
Subject: [PATCH 121/131] [fix] fix queries of logistic circuits

---
 src/Logistic/queries.jl  | 67 ++++++++++++++++++----------------------
 src/logistic_nodes.jl    |  2 +-
 src/param_bit_circuit.jl |  9 ++++--
 3 files changed, 37 insertions(+), 41 deletions(-)

diff --git a/src/Logistic/queries.jl b/src/Logistic/queries.jl
index 05380e54..9931d766 100644
--- a/src/Logistic/queries.jl
+++ b/src/Logistic/queries.jl
@@ -9,12 +9,13 @@ Class Conditional Probability
 """
 function class_likelihood_per_instance(lc::LogicCircuit, nc::Int, data)    
     cw = class_weights_per_instance(lc, nc, data)
-    isgpu(data) ? (@. 1.0 / (1.0 + exp(-cw))) : (@. @avx 1.0 / (1.0 + exp(-cw)))
+    one = Float32(1.0)
+    isgpu(data) ? (@. one / (one + exp(-cw))) : (@. @avx one / (one + exp(-cw)))
 end
 
 function class_likelihood_per_instance(bc, data)
     cw = class_weights_per_instance(bc, data)
-    isgpu(data) ? (@. 1.0 / (1.0 + exp(-cw))) : (@. @avx 1.0 / (1.0 + exp(-cw)))
+    isgpu(data) ? (@. one / (one + exp(-cw))) : (@. @avx one / (one + exp(-cw)))
 end
 
 function class_weights_per_instance(lc::LogisticCircuit, nc::Int, data)
@@ -33,22 +34,20 @@ end
 function class_weights_per_instance_cpu(bc, data)
     ne::Int = num_examples(data)
     nc::Int = size(bc.params, 2)
-    cw::Matrix{Float64} = zeros(Float64, ne, nc)
+    cw::Matrix{Float32} = zeros(Float32, ne, nc)
     cw_lock::Threads.ReentrantLock = Threads.ReentrantLock()
  
     @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, single_child)
-        if !single_child
-            lock(cw_lock) do # TODO: move lock to inner loop?
-                for i = 1:size(flows, 1)
-                    @inbounds edge_flow = values[i, prime] & values[i, sub] & flows[i, grandpa]
-                    first_true_bit = trailing_zeros(edge_flow) + 1
-                    last_true_bit = 64 - leading_zeros(edge_flow)
-                    @simd for j = first_true_bit:last_true_bit
-                        ex_id = ((i - 1) << 6) + j
-                        if get_bit(edge_flow, j)
-                            for class = 1:nc
-                                @inbounds cw[ex_id, class] += bc.params[element, class]
-                            end
+        lock(cw_lock) do # TODO: move lock to inner loop?
+            for i = 1:size(flows, 1)
+                @inbounds edge_flow = values[i, prime] & values[i, sub] & flows[i, grandpa]
+                first_true_bit = trailing_zeros(edge_flow) + 1
+                last_true_bit = 64 - leading_zeros(edge_flow)
+                @simd for j = first_true_bit:last_true_bit
+                    ex_id = ((i - 1) << 6) + j
+                    if get_bit(edge_flow, j)
+                        for class = 1:nc
+                            @inbounds cw[ex_id, class] += bc.params[element, class]
                         end
                     end
                 end
@@ -58,14 +57,12 @@ function class_weights_per_instance_cpu(bc, data)
     end
 
     @inline function on_edge_float(flows, values, prime, sub, element, grandpa, single_child)
-        if !single_child
-            lock(cw_lock) do # TODO: move lock to inner loop?
-                @avx for i = 1:size(flows, 1)
-                    @inbounds edge_flow = values[i, prime] * values[i, sub] / values[i, grandpa] * flows[i, grandpa]
-                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(eltype(flows)))
-                    for class = 1:nc
-                        @inbounds cw[i, class] += edge_flow * bc.params[element, class]
-                    end
+        lock(cw_lock) do # TODO: move lock to inner loop?
+            @avx for i = 1:size(flows, 1)
+                @inbounds edge_flow = values[i, prime] * values[i, sub] / values[i, grandpa] * flows[i, grandpa]
+                edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(eltype(flows)))
+                for class = 1:nc
+                    @inbounds cw[i, class] += edge_flow * bc.params[element, class]
                 end
             end
         end
@@ -84,20 +81,18 @@ end
 function class_weights_per_instance_gpu(bc, data)
     ne::Int = num_examples(data)
     nc::Int = size(bc.params, 2)
-    cw::CuMatrix{Float64} = CUDA.zeros(Float64, num_examples(data), nc)
+    cw::CuMatrix{Float32} = CUDA.zeros(Float32, num_examples(data), nc)
     cw_device = CUDA.cudaconvert(cw)
     params_device = CUDA.cudaconvert(bc.params)
 
     @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, chunk_id, edge_flow, single_child)
-        if !single_child
-            first_true_bit = 1 + trailing_zeros(edge_flow)
-            last_true_bit = 64 - leading_zeros(edge_flow)
-            for j = first_true_bit:last_true_bit
-                ex_id = ((chunk_id - 1) << 6) + j
-                if get_bit(edge_flow, j)
-                    for class = 1:nc
-                        CUDA.@atomic cw_device[ex_id, class] += params_device[element, class]
-                    end
+        first_true_bit = 1 + trailing_zeros(edge_flow)
+        last_true_bit = 64 - leading_zeros(edge_flow)
+        for j = first_true_bit:last_true_bit
+            ex_id = ((chunk_id - 1) << 6) + j
+            if get_bit(edge_flow, j)
+                for class = 1:nc
+                    CUDA.@atomic cw_device[ex_id, class] += params_device[element, class]
                 end
             end
         end
@@ -105,10 +100,8 @@ function class_weights_per_instance_gpu(bc, data)
     end
 
     @inline function on_edge_float(flows, values, prime, sub, element, grandpa, ex_id, edge_flow, single_child)
-        if !single_child
-            for class = 1:nc
-                CUDA.@atomic cw_device[ex_id, class] += edge_flow * params_device[element, class]
-            end
+        for class = 1:nc
+            CUDA.@atomic cw_device[ex_id, class] += edge_flow * params_device[element, class]
         end
         nothing
     end
diff --git a/src/logistic_nodes.jl b/src/logistic_nodes.jl
index cb7a2075..78f0d66f 100644
--- a/src/logistic_nodes.jl
+++ b/src/logistic_nodes.jl
@@ -50,7 +50,7 @@ A logistic disjunction node (Or node)
 """
 mutable struct Logistic⋁Node <: LogisticInnerNode
     children::Vector{<:LogisticCircuit}
-    thetas::Matrix{Float64}
+    thetas::Matrix{Float32}
     data
     counter::UInt32
     Logistic⋁Node(children, class::Int) = begin
diff --git a/src/param_bit_circuit.jl b/src/param_bit_circuit.jl
index 33c2d512..f200327f 100644
--- a/src/param_bit_circuit.jl
+++ b/src/param_bit_circuit.jl
@@ -22,19 +22,22 @@ function ParamBitCircuit(pc::ProbCircuit, data; reset=true)
 end
 
 function ParamBitCircuit(lc::LogisticCircuit, nc, data; reset=true)
-    thetas::Vector{Vector{Float64}} = Vector{Vector{Float64}}()
+    thetas::Vector{Vector{Float32}} = Vector{Vector{Float32}}()
     on_decision(n, cs, layer_id, decision_id, first_element, last_element) = begin
         if isnothing(n)
             # @assert first_element == last_element
-            push!(thetas, zeros(Float64, nc))
+            push!(thetas, zeros(Float32, nc))
+            println("here, some node is not part of the logistic circuit")
         else
-            # @assert last_element-first_element+1 == length(n.log_probs) "$last_element-$first_element+1 != $(length(n.log_probs))"
+            # @assert last_element - first_element + 1 == size(n.thetas, 1)
+            # @assert size(n.thetas, 2) == nc
             for theta in eachrow(n.thetas)
                 push!(thetas, theta)
             end
         end
     end
     bc = BitCircuit(lc, data; reset=reset, on_decision)
+    thetas_matrix = permutedims(hcat(thetas...), (2, 1))
     ParamBitCircuit(bc, permutedims(hcat(thetas...), (2, 1)))
 end
 

From 82fed5598c01979d685ab2e10a16b8da5b33215c Mon Sep 17 00:00:00 2001
From: YitaoLiang <yliang@fandm.edu>
Date: Wed, 16 Sep 2020 03:46:10 -0700
Subject: [PATCH 122/131] [fix] bug fix for logistic circuits param updates

---
 src/Logistic/parameters.jl | 60 +++++++++++++++++---------------------
 1 file changed, 26 insertions(+), 34 deletions(-)

diff --git a/src/Logistic/parameters.jl b/src/Logistic/parameters.jl
index 3e3d4972..fdc4e9f2 100644
--- a/src/Logistic/parameters.jl
+++ b/src/Logistic/parameters.jl
@@ -30,18 +30,16 @@ function update_parameters_cpu(bc, data, labels, cl, step_size)
     params_lock::Threads.ReentrantLock = Threads.ReentrantLock()
 
     @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, single_child)
-        if !single_child
-            lock(params_lock) do # TODO: move lock to inner loop?
-                for i = 1:size(flows, 1)
-                    @inbounds edge_flow = values[i, prime] & values[i, sub] & flows[i, grandpa]
-                    first_true_bit = trailing_zeros(edge_flow) + 1
-                    last_true_bit = 64 - leading_zeros(edge_flow)
-                    @simd for j = first_true_bit:last_true_bit
-                        ex_id = ((i - 1) << 6) + j
-                        if get_bit(edge_flow, j)
-                            for class = 1:nc
-                                @inbounds bc.params[element, class] -= (cl[ex_id, class] - labels[ex_id, class]) * step_size
-                            end
+        lock(params_lock) do # TODO: move lock to inner loop?
+            for i = 1:size(flows, 1)
+                @inbounds edge_flow = values[i, prime] & values[i, sub] & flows[i, grandpa]
+                first_true_bit = trailing_zeros(edge_flow) + 1
+                last_true_bit = 64 - leading_zeros(edge_flow)
+                @simd for j = first_true_bit:last_true_bit
+                    ex_id = ((i - 1) << 6) + j
+                    if get_bit(edge_flow, j)
+                        for class = 1:nc
+                            @inbounds bc.params[element, class] -= (cl[ex_id, class] - labels[ex_id, class]) * step_size
                         end
                     end
                 end
@@ -50,14 +48,12 @@ function update_parameters_cpu(bc, data, labels, cl, step_size)
     end
     
     @inline function on_edge_float(flows, values, prime, sub, element, grandpa, single_child)
-        if !single_child
-            lock(params_lock) do # TODO: move lock to inner loop?
-                @avx for i = 1:size(flows, 1)
-                    @inbounds edge_flow = values[i, prime] * values[i, sub] / values[i, grandpa] * flows[i, grandpa]
-                    edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(eltype(flows)))
-                    for class = 1:nc
-                        @inbounds bc.parames[element, class] -= (cl[i, class] - labels[i, class]) * edge_flow * step_size
-                    end
+        lock(params_lock) do # TODO: move lock to inner loop?
+            @avx for i = 1:size(flows, 1)
+                @inbounds edge_flow = values[i, prime] * values[i, sub] / values[i, grandpa] * flows[i, grandpa]
+                edge_flow = vifelse(isfinite(edge_flow), edge_flow, zero(eltype(flows)))
+                for class = 1:nc
+                    @inbounds bc.parames[element, class] -= (cl[i, class] - labels[i, class]) * edge_flow * step_size
                 end
             end
         end
@@ -83,15 +79,13 @@ function update_parameters_gpu(bc, data, labels, cl, step_size)
     params_device = CUDA.cudaconvert(bc.params)
 
     @inline function on_edge_binary(flows, values, prime, sub, element, grandpa, chunk_id, edge_flow, single_child)
-        if !single_child
-            first_true_bit = 1 + trailing_zeros(edge_flow)
-            last_true_bit = 64 - leading_zeros(edge_flow)
-            for j = first_true_bit:last_true_bit
-                if get_bit(edge_flow, j)
-                    ex_id = ((chunk_id - 1) << 6) + j
-                    for class = 1:nc
-                        CUDA.@atomic params_device[element, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * step_size
-                    end
+        first_true_bit = 1 + trailing_zeros(edge_flow)
+        last_true_bit = 64 - leading_zeros(edge_flow)
+        for j = first_true_bit:last_true_bit
+            if get_bit(edge_flow, j)
+                ex_id = ((chunk_id - 1) << 6) + j
+                for class = 1:nc
+                    CUDA.@atomic params_device[element, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * step_size
                 end
             end
         end
@@ -99,11 +93,9 @@ function update_parameters_gpu(bc, data, labels, cl, step_size)
     end
 
     @inline function on_edge_float(flows, values, prime, sub, element, grandpa, ex_id, edge_flow, single_child)
-        if !single_child
-            for class = 1:nc
-                CUDA.@atomic params_device[element, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * edge_flow * step_size
-            end
-        end      
+        for class = 1:nc
+            CUDA.@atomic params_device[element, class] -= (cl_device[ex_id, class] - label_device[ex_id, class]) * edge_flow * step_size
+        end
         nothing
     end
 

From 38b6b9b03a42063d2976ea21c2feb17f57e694e4 Mon Sep 17 00:00:00 2001
From: MhDang <mhdang0026@gmail.com>
Date: Wed, 16 Sep 2020 21:24:43 -0700
Subject: [PATCH 123/131] reinstate structure learn

---
 src/LoadSave/plot.jl               |  4 +--
 src/ProbabilisticCircuits.jl       |  8 +++---
 src/structurelearner/heuristics.jl | 40 ++++++++++++++++++++++++------
 src/structurelearner/init.jl       |  4 +--
 4 files changed, 41 insertions(+), 15 deletions(-)

diff --git a/src/LoadSave/plot.jl b/src/LoadSave/plot.jl
index 84e7868c..e294e835 100644
--- a/src/LoadSave/plot.jl
+++ b/src/LoadSave/plot.jl
@@ -20,7 +20,7 @@ function DiGraph(pc::ProbCircuit)
     on_edge(g, id_dict, n::Union{PlainSumNode, StructSumNode}, c, n_id, c_id) = begin
         edge_labels[(n_id, c_id)] = begin
             i = findall(x -> x === c, children(n))[1]
-            "$(exp(n.log_probs[i]))"
+            "$(round(exp(n.log_probs[i]), digits=3))"
         end
     end
     g, _ = LogicCircuits.LoadSave.DiGraph(pc;on_edge=on_edge, on_var=add_label!)
@@ -30,5 +30,5 @@ end
 import TikzGraphs: plot
 plot(pc::ProbCircuit) = begin
     g, label, edge_labels = DiGraph(pc)
-    TikzGraphs.plot(g, label, edge_labels=edge_labels)
+    TikzGraphs.plot(g, label, edge_labels=edge_labels, edge_style="font=\\tiny")
 end
\ No newline at end of file
diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index 1e0f8357..aaac58d5 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -31,10 +31,10 @@ include("Logistic/Logistic.jl")
 include("mixtures/shared_prob_nodes.jl")
 # include("mixtures/em.jl")
 
-# include("structurelearner/chow_liu_tree.jl")
-# include("structurelearner/init.jl")
-# include("structurelearner/heuristics.jl")
-# include("structurelearner/learner.jl")
+include("structurelearner/chow_liu_tree.jl")
+include("structurelearner/init.jl")
+include("structurelearner/heuristics.jl")
+include("structurelearner/learner.jl")
 
 include("LoadSave/LoadSave.jl")
 @reexport using .LoadSave
diff --git a/src/structurelearner/heuristics.jl b/src/structurelearner/heuristics.jl
index 95c00e1e..7312aa27 100644
--- a/src/structurelearner/heuristics.jl
+++ b/src/structurelearner/heuristics.jl
@@ -3,9 +3,35 @@ using LinearAlgebra: diagind
 """
 Pick the edge with maximum flow
 """
-function eFlow(candidates::Vector{Tuple{Node, Node}})
+function count_downflow(values::Matrix{UInt64}, flows::Matrix{UInt64}, n::LogicCircuit)
+    dec_id = n.data.node_id
+    sum(1:size(flows,1)) do i
+        count_ones(flows[i, dec_id]) 
+    end
+end
+
+function count_downflow(values::Matrix{UInt64}, flows::Matrix{UInt64}, n::LogicCircuit, c::LogicCircuit)
+    grandpa = n.data.node_id
+    prime = c.prime.data.node_id
+    sub = c.sub.data.node_id
+    edge_count = sum(1:size(flows,1)) do i
+        count_ones(values[i, prime] & values[i, sub] & flows[i, grandpa]) 
+    end
+end
+
+function downflow_all(values::Matrix{UInt64}, flows::Matrix{UInt64}, n::LogicCircuit, c::LogicCircuit)
+    grandpa = n.data.node_id
+    prime = c.prime.data.node_id
+    sub = c.sub.data.node_id
+    edge = map(1:size(flows,1)) do i
+        digits(Bool, values[i, prime] & values[i, sub] & flows[i, grandpa], base=2, pad=64)
+    end
+    vcat(edge...)
+end
+
+function eFlow(values, flows, candidates::Vector{Tuple{Node, Node}})
     edge2flows = map(candidates) do (or, and)
-        sum(get_downflow(or, and))
+        count_downflow(values, flows, or, and)
     end
     (max_flow, max_edge_id) = findmax(edge2flows)
     candidates[max_edge_id], max_flow
@@ -14,8 +40,8 @@ end
 """
 Pick the variable with maximum sum of mutual information
 """
-function vMI(edge, vars::Vector{Var}, train_x)
-    examples_id = get_downflow(edge...)  
+function vMI(values, flows, edge, vars::Vector{Var}, train_x)
+    examples_id = downflow_all(values, flows, edge...)[1:num_examples(train_x)]
     sub_matrix = train_x[examples_id, vars]
     (_, mi) = mutual_information(sub_matrix; α=1.0)
     mi[diagind(mi)] .= 0
@@ -43,9 +69,9 @@ end
 
 function heuristic_loss(circuit::LogicCircuit, train_x; pick_edge="eFlow", pick_var="vMI")
     candidates, scope = split_candidates(circuit)
-    compute_flows(circuit, train_x)
+    values, flows = satisfies_flows(circuit, train_x)
     if pick_edge == "eFlow"
-        edge, flow = eFlow(candidates)
+        edge, flow = eFlow(values, flows, candidates)
     elseif pick_edge == "eRand"
         edge = eRand(candidates)
     else
@@ -57,7 +83,7 @@ function heuristic_loss(circuit::LogicCircuit, train_x; pick_edge="eFlow", pick_
     vars =  Var.(intersect(filter(l -> l > 0, lits), - filter(l -> l < 0, lits)))
 
     if pick_var == "vMI"
-        var, score = vMI(edge, vars, train_x)
+        var, score = vMI(values, flows, edge, vars, train_x)
     elseif pick_var == "vRand"
         var = vRand(vars)
     else
diff --git a/src/structurelearner/init.jl b/src/structurelearner/init.jl
index a25838c5..5c9155d7 100644
--- a/src/structurelearner/init.jl
+++ b/src/structurelearner/init.jl
@@ -1,11 +1,11 @@
-export learn_struct_prob_circuit, learn_vtree_from_clt, compile_sdd_from_clt
+export learn_chow_liu_tree_circuit, learn_vtree_from_clt, compile_sdd_from_clt
 using LightGraphs: outneighbors
 using MetaGraphs: get_prop
 
 """
 Learning from data a structured-decomposable circuit with several structure learning algorithms
 """
-function learn_struct_prob_circuit(data;
+function learn_chow_liu_tree_circuit(data;
         pseudocount = 1.0, 
         algo = "chow-liu", algo_kwargs=(α=1.0, clt_root="graph_center"), 
         vtree = "chow-liu", vtree_kwargs=(vtree_mode="balanced",))    

From 341f2f43625b29ba8c0c1aeccc60d9f28494d550 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 27 Sep 2020 14:24:09 -0700
Subject: [PATCH 124/131] MAP inference on CPU

---
 src/ProbabilisticCircuits.jl |  1 +
 src/queries/map.jl           | 71 ++++++++++++++++++++++++++++++++++++
 2 files changed, 72 insertions(+)
 create mode 100644 src/queries/map.jl

diff --git a/src/ProbabilisticCircuits.jl b/src/ProbabilisticCircuits.jl
index aaac58d5..8ec65ed9 100644
--- a/src/ProbabilisticCircuits.jl
+++ b/src/ProbabilisticCircuits.jl
@@ -19,6 +19,7 @@ include("parameters.jl")
 
 include("queries/likelihood.jl")
 include("queries/marginal_flow.jl")
+include("queries/map.jl")
 include("queries/sample.jl")
 include("queries/pr_constraint.jl")
 include("queries/information.jl")
diff --git a/src/queries/map.jl b/src/queries/map.jl
new file mode 100644
index 00000000..e8c2406f
--- /dev/null
+++ b/src/queries/map.jl
@@ -0,0 +1,71 @@
+export map_state, MAP
+
+import DataFrames: DataFrame, mapcols!
+
+#####################
+# Circuit MAP/MPE evaluation
+#####################
+
+"Evaluate maximum a-posteriori state of the circuit for a given input"
+map_state(root::ProbCircuit, data::Union{Bool,Missing}...) =
+    map_state(root, collect(Union{Bool,Missing}, data))
+
+map_state(root::ProbCircuit, data::Union{Vector{Union{Bool,Missing}},CuVector{UInt8}}) =
+    map_state(root, DataFrame(reshape(data, 1, :)))[1,:]
+
+map_state(circuit::ProbCircuit, data::DataFrame) =
+    map_state(same_device(ParamBitCircuit(circuit, data), data) , data)
+
+function map_state(pbc::ParamBitCircuit, data; Float=Float32)
+    @assert isgpu(data) == isgpu(pbc) "ParamBitCircuit and data need to be on the same device"
+    values = marginal_all(pbc, data)
+    state = Matrix{Bool}(undef, num_examples(data), num_features(data))
+    logprob = zeros(Float, num_examples(data))
+    Threads.@threads for ex_id = 1:num_examples(data)
+        map_state_rec(pbc, ex_id, num_nodes(pbc), values, state, logprob)
+    end
+    df = DataFrame(state)
+    mapcols!(c -> BitVector(c), df)
+    df, logprob
+end
+
+"""
+Maximum a-posteriori queries
+"""
+const MAP = map_state
+
+function map_state_rec(pbc, ex_id, dec_id, values, state, logprob)
+    bc = pbc.bitcircuit
+    if isleafgate(bc, dec_id)
+        if isliteralgate(bc, dec_id)
+            l = literal(bc, dec_id)
+            state[ex_id, lit2var(l)] = (l > 0) 
+        end
+    else
+        # recurse
+        edge_log_pr, prime, sub = map_child(pbc, ex_id, dec_id, values)
+        logprob[ex_id] += edge_log_pr
+        map_state_rec(pbc, ex_id, prime, values, state, logprob)
+        map_state_rec(pbc, ex_id, sub, values, state, logprob)
+    end
+end
+
+
+"Find the MAP child value and node id of a given decision node"
+function map_child(pbc::ParamBitCircuit, ex_id, dec_id, values)
+    pars = pbc.params
+    bc = pbc.bitcircuit
+    els = @inbounds bc.elements
+    els_start = @inbounds bc.nodes[1,dec_id]
+    els_end = @inbounds bc.nodes[2,dec_id]
+    pr_opt = typemin(eltype(values))
+    j_opt = 0
+    for j = els_start:els_end
+        pr = values[ex_id, els[2,j]] + values[ex_id, els[3,j]] + pars[j]
+        if pr > pr_opt
+            pr_opt = pr
+            j_opt = j
+        end
+    end
+    return pars[j_opt], els[2,j_opt], els[3,j_opt]
+end

From abbd7a94a7c4c350750acb0923495eaf54eb2d0a Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 27 Sep 2020 15:00:53 -0700
Subject: [PATCH 125/131] MAP CPU tests

---
 test/queries/map_tests.jl | 41 +++++++++++++++++++++++++++++++++++++++
 1 file changed, 41 insertions(+)
 create mode 100644 test/queries/map_tests.jl

diff --git a/test/queries/map_tests.jl b/test/queries/map_tests.jl
new file mode 100644
index 00000000..27ce2ad9
--- /dev/null
+++ b/test/queries/map_tests.jl
@@ -0,0 +1,41 @@
+using Test
+using LogicCircuits
+using ProbabilisticCircuits
+using DataFrames: DataFrame
+using CUDA
+
+include("../helper/gpu.jl")
+
+@testset "MAP" begin
+    prob_circuit = zoo_psdd("little_4var.psdd");
+
+    data_full = generate_data_all(num_variables(prob_circuit))
+
+    map, mappr = MAP(prob_circuit, data_full)
+
+    @test map == data_full
+    
+    evipr = EVI(prob_circuit, data_full)
+    @test mappr ≈ evipr atol=1e-6
+
+    data_marg = DataFrame([false false false false; 
+                      false true true false; 
+                      false false true true;
+                      false false false missing; 
+                      missing true false missing; 
+                      missing missing missing missing; 
+                      false missing missing missing])
+
+    map, mappr = MAP(prob_circuit, data_marg)
+
+    @test all(zip(eachcol(map), eachcol(data_marg))) do (cf,cm) 
+        all(zip(cf, cm)) do (f,m) 
+            ismissing(m) || f == m
+        end
+    end
+
+    mar = MAR(prob_circuit, data_marg)
+
+    @test all(mar .> mappr .- 1e-6)
+
+end
\ No newline at end of file

From 2d3afb33485c692f475e08ce1c349d36ec092f8e Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Sun, 27 Sep 2020 15:28:36 -0700
Subject: [PATCH 126/131] make MAP inference code more GPU friendly

---
 src/param_bit_circuit.jl |  8 +++++++-
 src/queries/map.jl       | 35 +++++++++++++++++------------------
 2 files changed, 24 insertions(+), 19 deletions(-)

diff --git a/src/param_bit_circuit.jl b/src/param_bit_circuit.jl
index f200327f..20599b22 100644
--- a/src/param_bit_circuit.jl
+++ b/src/param_bit_circuit.jl
@@ -47,11 +47,17 @@ end
 ## Helper functions ###
 #######################
 
-import LogicCircuits: num_nodes, num_elements, num_features
+params(c::ParamBitCircuit) = c.params
+
+import LogicCircuits: num_nodes, num_elements, num_features, num_leafs, nodes, elements
 
 num_nodes(c::ParamBitCircuit) = num_nodes(c.bitcircuit)
 num_elements(c::ParamBitCircuit) = num_elements(c.bitcircuit)
 num_features(c::ParamBitCircuit) = num_features(c.bitcircuit)
+num_leafs(c::ParamBitCircuit) = num_leafs(c.bitcircuit)
+
+nodes(c::ParamBitCircuit) = nodes(c.bitcircuit)
+elements(c::ParamBitCircuit) = elements(c.bitcircuit)
 
 import LogicCircuits: to_gpu, to_cpu, isgpu #extend
 
diff --git a/src/queries/map.jl b/src/queries/map.jl
index e8c2406f..4d2578fa 100644
--- a/src/queries/map.jl
+++ b/src/queries/map.jl
@@ -22,7 +22,8 @@ function map_state(pbc::ParamBitCircuit, data; Float=Float32)
     state = Matrix{Bool}(undef, num_examples(data), num_features(data))
     logprob = zeros(Float, num_examples(data))
     Threads.@threads for ex_id = 1:num_examples(data)
-        map_state_rec(pbc, ex_id, num_nodes(pbc), values, state, logprob)
+        map_state_rec(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), 
+                        ex_id, num_nodes(pbc), values, state, logprob)
     end
     df = DataFrame(state)
     mapcols!(c -> BitVector(c), df)
@@ -34,38 +35,36 @@ Maximum a-posteriori queries
 """
 const MAP = map_state
 
-function map_state_rec(pbc, ex_id, dec_id, values, state, logprob)
-    bc = pbc.bitcircuit
-    if isleafgate(bc, dec_id)
-        if isliteralgate(bc, dec_id)
-            l = literal(bc, dec_id)
-            state[ex_id, lit2var(l)] = (l > 0) 
+function map_state_rec(nl, params, nodes, elements, ex_id, dec_id, values, state, logprob)
+    if isleafgate(nl, dec_id)
+        if isliteralgate(nl, dec_id)
+            l = literal(nl, dec_id)
+            @inbounds state[ex_id, lit2var(l)] = (l > 0) 
         end
     else
         # recurse
-        edge_log_pr, prime, sub = map_child(pbc, ex_id, dec_id, values)
+        edge_log_pr, prime, sub = map_child(params, nodes, elements, ex_id, dec_id, values)
         logprob[ex_id] += edge_log_pr
-        map_state_rec(pbc, ex_id, prime, values, state, logprob)
-        map_state_rec(pbc, ex_id, sub, values, state, logprob)
+        map_state_rec(nl, params, nodes, elements, 
+            ex_id, prime, values, state, logprob)
+        map_state_rec(nl, params, nodes, elements, 
+            ex_id, sub, values, state, logprob)
     end
 end
 
 
 "Find the MAP child value and node id of a given decision node"
-function map_child(pbc::ParamBitCircuit, ex_id, dec_id, values)
-    pars = pbc.params
-    bc = pbc.bitcircuit
-    els = @inbounds bc.elements
-    els_start = @inbounds bc.nodes[1,dec_id]
-    els_end = @inbounds bc.nodes[2,dec_id]
+function map_child(params, nodes, elements, ex_id, dec_id, values)
+    els_start = @inbounds nodes[1,dec_id]
+    els_end = @inbounds nodes[2,dec_id]
     pr_opt = typemin(eltype(values))
     j_opt = 0
     for j = els_start:els_end
-        pr = values[ex_id, els[2,j]] + values[ex_id, els[3,j]] + pars[j]
+        pr = @inbounds values[ex_id, elements[2,j]] + values[ex_id, elements[3,j]] + params[j]
         if pr > pr_opt
             pr_opt = pr
             j_opt = j
         end
     end
-    return pars[j_opt], els[2,j_opt], els[3,j_opt]
+    @inbounds return params[j_opt], elements[2,j_opt], elements[3,j_opt]
 end

From 018cefaa9605145a1cfd5ab122a3451a4498fd0a Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Tue, 29 Sep 2020 00:58:10 -0700
Subject: [PATCH 127/131] MAP inference on GPU

---
 src/queries/map.jl | 112 +++++++++++++++++++++++++++++++++++----------
 1 file changed, 87 insertions(+), 25 deletions(-)

diff --git a/src/queries/map.jl b/src/queries/map.jl
index 4d2578fa..8172856a 100644
--- a/src/queries/map.jl
+++ b/src/queries/map.jl
@@ -14,18 +14,28 @@ map_state(root::ProbCircuit, data::Union{Vector{Union{Bool,Missing}},CuVector{UI
     map_state(root, DataFrame(reshape(data, 1, :)))[1,:]
 
 map_state(circuit::ProbCircuit, data::DataFrame) =
-    map_state(same_device(ParamBitCircuit(circuit, data), data) , data)
+    map_state(same_device(ParamBitCircuit(circuit, data), data), data)
 
 function map_state(pbc::ParamBitCircuit, data; Float=Float32)
     @assert isgpu(data) == isgpu(pbc) "ParamBitCircuit and data need to be on the same device"
     values = marginal_all(pbc, data)
-    state = Matrix{Bool}(undef, num_examples(data), num_features(data))
-    logprob = zeros(Float, num_examples(data))
-    Threads.@threads for ex_id = 1:num_examples(data)
-        map_state_rec(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), 
-                        ex_id, num_nodes(pbc), values, state, logprob)
+    if !isgpu(data)
+        state = zeros(Bool, num_examples(data), num_features(data))
+        logprob = zeros(Float, num_examples(data))
+        map_state_rec_cpu(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), num_nodes(pbc), values, state, logprob)
+    else
+        state = CUDA.zeros(Bool, num_examples(data), num_features(data))
+        logprob = CUDA.zeros(Float, num_examples(data))
+        stack = CUDA.zeros(Int32, num_examples(data), num_features(data)+3)
+        stack[:,1] .= 1 # start with 1 dec_id in the stack
+        stack[:,2] .= num_nodes(pbc) # start with the root in the stack
+        num_threads = 256
+        num_blocks = ceil(Int, size(state,1)/num_threads)
+        CUDA.@sync begin
+            @cuda threads=num_threads blocks=num_blocks map_state_iter_cuda(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), values, state, logprob, stack)
+        end
     end
-    df = DataFrame(state)
+    df = DataFrame(to_cpu(state))
     mapcols!(c -> BitVector(c), df)
     df, logprob
 end
@@ -35,36 +45,88 @@ Maximum a-posteriori queries
 """
 const MAP = map_state
 
+"Find the MAP child value and node id of a given decision node"
+function map_child(params, nodes, elements, ex_id, dec_id, values)
+    els_start = nodes[1,dec_id]
+    els_end = nodes[2,dec_id]
+    pr_opt = typemin(eltype(values))
+    j_opt = 1
+    for j = els_start:els_end
+        prime = elements[2,j]
+        sub = elements[3,j]
+        pr = values[ex_id, prime] + values[ex_id, sub] + params[j]
+        if pr > pr_opt
+            pr_opt = pr
+            j_opt = j
+        end
+    end
+    return params[j_opt], elements[2,j_opt], elements[3,j_opt] 
+end
+
+# CPU code
+
+function map_state_rec_cpu(nl, params, nodes, elements, dec_id, values, state, logprob)
+    Threads.@threads for ex_id = 1:size(state,1)
+        map_state_rec(nl, params, nodes, elements, ex_id, dec_id, values, state, logprob)
+    end
+end
+
 function map_state_rec(nl, params, nodes, elements, ex_id, dec_id, values, state, logprob)
     if isleafgate(nl, dec_id)
         if isliteralgate(nl, dec_id)
             l = literal(nl, dec_id)
-            @inbounds state[ex_id, lit2var(l)] = (l > 0) 
+            state[ex_id, lit2var(l)] = (l > 0) 
         end
     else
-        # recurse
         edge_log_pr, prime, sub = map_child(params, nodes, elements, ex_id, dec_id, values)
         logprob[ex_id] += edge_log_pr
-        map_state_rec(nl, params, nodes, elements, 
-            ex_id, prime, values, state, logprob)
-        map_state_rec(nl, params, nodes, elements, 
-            ex_id, sub, values, state, logprob)
+        map_state_rec(nl, params, nodes, elements, ex_id, prime, values, state, logprob)
+        map_state_rec(nl, params, nodes, elements, ex_id, sub,   values, state, logprob)
     end
 end
 
+# GPU code
 
-"Find the MAP child value and node id of a given decision node"
-function map_child(params, nodes, elements, ex_id, dec_id, values)
-    els_start = @inbounds nodes[1,dec_id]
-    els_end = @inbounds nodes[2,dec_id]
-    pr_opt = typemin(eltype(values))
-    j_opt = 0
-    for j = els_start:els_end
-        pr = @inbounds values[ex_id, elements[2,j]] + values[ex_id, elements[3,j]] + params[j]
-        if pr > pr_opt
-            pr_opt = pr
-            j_opt = j
+function map_state_iter_cuda(nl, params, nodes, elements, values, state, logprob, stack)
+    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    stride_x = blockDim().x * gridDim().x
+    for ex_id = index_x:stride_x:size(state,1)
+        dec_id = pop_cuda!(stack, ex_id)
+        while dec_id > zero(eltype(stack))
+            if isleafgate(nl, dec_id)
+                if isliteralgate(nl, dec_id)
+                    l = literal(nl, dec_id)
+                    var = lit2var(l)
+                    state[ex_id, Int(var)] = (l > 0) 
+                end
+            else
+                edge_log_pr, prime, sub = map_child(params, nodes, elements, ex_id, dec_id, values)
+                logprob[ex_id] += edge_log_pr
+                push_cuda!(stack, ex_id, prime)
+                push_cuda!(stack, ex_id, sub)
+            end
+            dec_id = pop_cuda!(stack, ex_id)
         end
     end
-    @inbounds return params[j_opt], elements[2,j_opt], elements[3,j_opt]
+    return nothing
 end
+
+#TODO move to utils
+
+function pop_cuda!(stack, i)
+    if stack[i,1] == zero(eltype(stack))
+        return zero(eltype(stack))
+    else
+        stack[i,1] -= one(eltype(stack))
+        return stack[i,stack[i,1]+2]
+    end
+end
+
+function push_cuda!(stack, i, v)
+    stack[i,1] += one(eltype(stack))
+    CUDA.@cuassert 1+stack[i,1] <= size(stack,2) "CUDA stack overflow"
+    stack[i,1+stack[i,1]] = v
+    return nothing
+end
+
+length_cuda(stack, i) = stack[i,1]

From 8378bf587b6a60c64bee572fa7e9763094962248 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Tue, 29 Sep 2020 09:51:54 -0700
Subject: [PATCH 128/131] unit test for GPU MAP

---
 test/helper/gpu.jl                  |  4 ++++
 test/queries/likelihood_tests.jl    |  2 +-
 test/queries/map_tests.jl           | 10 ++++++++++
 test/queries/marginal_flow_tests.jl |  6 +++---
 4 files changed, 18 insertions(+), 4 deletions(-)

diff --git a/test/helper/gpu.jl b/test/helper/gpu.jl
index 2c277f95..95e03927 100644
--- a/test/helper/gpu.jl
+++ b/test/helper/gpu.jl
@@ -1,5 +1,9 @@
 using CUDA: CUDA
 
 function cpu_gpu_agree(f, data; atol=1e-7)
+    CUDA.functional() && @test f(data) == to_cpu(f(to_gpu(data)))
+end
+
+function cpu_gpu_agree_approx(f, data; atol=1e-7)
     CUDA.functional() && @test f(data) ≈ to_cpu(f(to_gpu(data))) atol=atol
 end
\ No newline at end of file
diff --git a/test/queries/likelihood_tests.jl b/test/queries/likelihood_tests.jl
index 4ef2afba..9f32e388 100644
--- a/test/queries/likelihood_tests.jl
+++ b/test/queries/likelihood_tests.jl
@@ -31,7 +31,7 @@ include("../helper/gpu.jl")
 
     @test 1 ≈ sum_prob_all atol = 1e-7;
 
-    cpu_gpu_agree(data_all) do d 
+    cpu_gpu_agree_approx(data_all) do d 
         EVI(prob_circuit, d)
     end
     
diff --git a/test/queries/map_tests.jl b/test/queries/map_tests.jl
index 27ce2ad9..bf204ab0 100644
--- a/test/queries/map_tests.jl
+++ b/test/queries/map_tests.jl
@@ -38,4 +38,14 @@ include("../helper/gpu.jl")
 
     @test all(mar .> mappr .- 1e-6)
 
+    # same MAP states on CPU and GPU
+    cpu_gpu_agree(data_marg) do d 
+        MAP(prob_circuit, d)[1]
+    end
+
+    # same MAP probabilities on CPU and GPU
+    cpu_gpu_agree_approx(data_marg) do d 
+        MAP(prob_circuit, d)[2]
+    end
+
 end
\ No newline at end of file
diff --git a/test/queries/marginal_flow_tests.jl b/test/queries/marginal_flow_tests.jl
index 4b0e6c12..235809c5 100644
--- a/test/queries/marginal_flow_tests.jl
+++ b/test/queries/marginal_flow_tests.jl
@@ -22,7 +22,7 @@ include("../helper/gpu.jl")
     calc_prob = exp.(MAR(prob_circuit, data_marg))
     @test true_prob ≈ calc_prob atol=1e-7
 
-    cpu_gpu_agree(data_marg) do d 
+    cpu_gpu_agree_approx(data_marg) do d 
         marginal_all(prob_circuit, d)
     end
 
@@ -37,7 +37,7 @@ include("../helper/gpu.jl")
     test_complete_mar(data_full)
     CUDA.functional() && test_complete_mar(to_gpu(data_full))
 
-    cpu_gpu_agree(data_full) do d 
+    cpu_gpu_agree_approx(data_full) do d 
         marginal_all(prob_circuit, d)
     end
 
@@ -69,7 +69,7 @@ end
     test_flows(data_full)
     CUDA.functional() && test_flows(to_gpu(data_full))
     
-    cpu_gpu_agree(data_full) do d 
+    cpu_gpu_agree_approx(data_full) do d 
         _, f = marginal_flows(prob_circuit, d)
         f[:,3:end] # ignore true and false leaf
     end

From 10640e4e0f0d7c2d90a7e107caec561a3778d89f Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Tue, 29 Sep 2020 11:27:54 -0700
Subject: [PATCH 129/131] MAP ccode cleanup

---
 src/Utils/misc.jl         |  26 +++++++++
 src/queries/map.jl        | 118 ++++++++++++++++++--------------------
 test/queries/map_tests.jl |  10 ++++
 3 files changed, 92 insertions(+), 62 deletions(-)

diff --git a/src/Utils/misc.jl b/src/Utils/misc.jl
index abea1c69..1237496e 100644
--- a/src/Utils/misc.jl
+++ b/src/Utils/misc.jl
@@ -1,7 +1,9 @@
 export to_long_mi,
+    pop_cuda!, push_cuda!, length_cuda,
     generate_all, generate_data_all
 
 using DataFrames
+using CUDA: CUDA
 
 ###################
 # Misc.
@@ -13,6 +15,30 @@ function to_long_mi(m::Matrix{Float64}, min_int, max_int)::Matrix{Int64}
     return @. round(Int64, m * δint / δmi + min_int)
 end
 
+
+###################
+# Rudimentary CUDA-compatible stack data structure
+####################
+
+function pop_cuda!(stack, i)
+    if @inbounds stack[i,1] == zero(eltype(stack))
+        return zero(eltype(stack))
+    else
+        @inbounds stack[i,1] -= one(eltype(stack))
+        @inbounds return stack[i,stack[i,1]+2]
+    end
+end
+
+function push_cuda!(stack, i, v)
+    @inbounds stack[i,1] += one(eltype(stack))
+    @inbounds CUDA.@cuassert 1+stack[i,1] <= size(stack,2) "CUDA stack overflow"
+    @inbounds stack[i,1+stack[i,1]] = v
+    return nothing
+end
+
+length_cuda(stack, i) = stack[i,1]
+
+
 ###################
 # One-Hot Encoding
 ####################
diff --git a/src/queries/map.jl b/src/queries/map.jl
index 8172856a..02e422fd 100644
--- a/src/queries/map.jl
+++ b/src/queries/map.jl
@@ -1,4 +1,4 @@
-export map_state, MAP
+export max_a_posteriori, MAP
 
 import DataFrames: DataFrame, mapcols!
 
@@ -7,87 +7,101 @@ import DataFrames: DataFrame, mapcols!
 #####################
 
 "Evaluate maximum a-posteriori state of the circuit for a given input"
-map_state(root::ProbCircuit, data::Union{Bool,Missing}...) =
-    map_state(root, collect(Union{Bool,Missing}, data))
+max_a_posteriori(root::ProbCircuit, data::Union{Bool,Missing}...) =
+    max_a_posteriori(root, collect(Union{Bool,Missing}, data))
 
-map_state(root::ProbCircuit, data::Union{Vector{Union{Bool,Missing}},CuVector{UInt8}}) =
-    map_state(root, DataFrame(reshape(data, 1, :)))[1,:]
+max_a_posteriori(root::ProbCircuit, data::Union{Vector{Union{Bool,Missing}},CuVector{UInt8}}) =
+    max_a_posteriori(root, DataFrame(reshape(data, 1, :)))[1,:]
 
-map_state(circuit::ProbCircuit, data::DataFrame) =
-    map_state(same_device(ParamBitCircuit(circuit, data), data), data)
+max_a_posteriori(circuit::ProbCircuit, data::DataFrame) =
+    max_a_posteriori(same_device(ParamBitCircuit(circuit, data), data), data)
 
-function map_state(pbc::ParamBitCircuit, data; Float=Float32)
+function max_a_posteriori(pbc::ParamBitCircuit, data; Float=Float32)
     @assert isgpu(data) == isgpu(pbc) "ParamBitCircuit and data need to be on the same device"
     values = marginal_all(pbc, data)
-    if !isgpu(data)
-        state = zeros(Bool, num_examples(data), num_features(data))
-        logprob = zeros(Float, num_examples(data))
-        map_state_rec_cpu(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), num_nodes(pbc), values, state, logprob)
+    state, logprob = map_down(pbc, data, values; Float)
+    if isgpu(values)
+        CUDA.unsafe_free!(values) # save the GC some effort
+        # do the conversion to a CuBitVector on the CPU...
+        df = DataFrame(to_cpu(state))
+        mapcols!(c -> to_gpu(BitVector(c)), df)
     else
-        state = CUDA.zeros(Bool, num_examples(data), num_features(data))
-        logprob = CUDA.zeros(Float, num_examples(data))
-        stack = CUDA.zeros(Int32, num_examples(data), num_features(data)+3)
-        stack[:,1] .= 1 # start with 1 dec_id in the stack
-        stack[:,2] .= num_nodes(pbc) # start with the root in the stack
-        num_threads = 256
-        num_blocks = ceil(Int, size(state,1)/num_threads)
-        CUDA.@sync begin
-            @cuda threads=num_threads blocks=num_blocks map_state_iter_cuda(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), values, state, logprob, stack)
-        end
+        df = DataFrame(state)
+        mapcols!(c -> BitVector(c), df)
     end
-    df = DataFrame(to_cpu(state))
-    mapcols!(c -> BitVector(c), df)
     df, logprob
 end
 
 """
 Maximum a-posteriori queries
 """
-const MAP = map_state
+const MAP = max_a_posteriori
+
+"""
+Mode of the distribution
+"""
+const mode = max_a_posteriori
 
 "Find the MAP child value and node id of a given decision node"
 function map_child(params, nodes, elements, ex_id, dec_id, values)
-    els_start = nodes[1,dec_id]
-    els_end = nodes[2,dec_id]
+    @inbounds els_start = nodes[1,dec_id]
+    @inbounds els_end = nodes[2,dec_id]
     pr_opt = typemin(eltype(values))
     j_opt = 1
     for j = els_start:els_end
-        prime = elements[2,j]
-        sub = elements[3,j]
-        pr = values[ex_id, prime] + values[ex_id, sub] + params[j]
+        @inbounds prime = elements[2,j]
+        @inbounds sub = elements[3,j]
+        @inbounds pr = values[ex_id, prime] + values[ex_id, sub] + params[j]
         if pr > pr_opt
             pr_opt = pr
             j_opt = j
         end
     end
-    return params[j_opt], elements[2,j_opt], elements[3,j_opt] 
+    @inbounds return params[j_opt], elements[2,j_opt], elements[3,j_opt] 
 end
 
 # CPU code
 
-function map_state_rec_cpu(nl, params, nodes, elements, dec_id, values, state, logprob)
+function map_down(pbc, data, values::Array; Float=Float32)
+    state = zeros(Bool, num_examples(data), num_features(data))
+    logprob = zeros(Float, num_examples(data))
     Threads.@threads for ex_id = 1:size(state,1)
-        map_state_rec(nl, params, nodes, elements, ex_id, dec_id, values, state, logprob)
+        map_rec(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), ex_id, num_nodes(pbc), values, state, logprob)
     end
+    return state, logprob
 end
 
-function map_state_rec(nl, params, nodes, elements, ex_id, dec_id, values, state, logprob)
+function map_rec(nl, params, nodes, elements, ex_id, dec_id, values, state, logprob)
     if isleafgate(nl, dec_id)
         if isliteralgate(nl, dec_id)
             l = literal(nl, dec_id)
-            state[ex_id, lit2var(l)] = (l > 0) 
+            @inbounds state[ex_id, lit2var(l)] = (l > 0) 
         end
     else
         edge_log_pr, prime, sub = map_child(params, nodes, elements, ex_id, dec_id, values)
-        logprob[ex_id] += edge_log_pr
-        map_state_rec(nl, params, nodes, elements, ex_id, prime, values, state, logprob)
-        map_state_rec(nl, params, nodes, elements, ex_id, sub,   values, state, logprob)
+        @inbounds logprob[ex_id] += edge_log_pr
+        map_rec(nl, params, nodes, elements, ex_id, prime, values, state, logprob)
+        map_rec(nl, params, nodes, elements, ex_id, sub,   values, state, logprob)
     end
 end
 
 # GPU code
 
-function map_state_iter_cuda(nl, params, nodes, elements, values, state, logprob, stack)
+function map_down(pbc, data, values::CuArray; Float=Float32)
+    state = CUDA.zeros(Bool, num_examples(data), num_features(data))
+    logprob = CUDA.zeros(Float, num_examples(data))
+    stack = CUDA.zeros(Int32, num_examples(data), num_features(data)+3)
+    @inbounds stack[:,1] .= 1 # start with 1 dec_id in the stack
+    @inbounds stack[:,2] .= num_nodes(pbc) # start with the root in the stack
+    num_threads = 256
+    num_blocks = ceil(Int, size(state,1)/num_threads)
+    CUDA.@sync begin
+        @cuda threads=num_threads blocks=num_blocks map_cuda_kernel(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), values, state, logprob, stack)
+    end
+    return state, logprob
+end
+
+function map_cuda_kernel(nl, params, nodes, elements, values, state, logprob, stack)
     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
     stride_x = blockDim().x * gridDim().x
     for ex_id = index_x:stride_x:size(state,1)
@@ -97,11 +111,11 @@ function map_state_iter_cuda(nl, params, nodes, elements, values, state, logprob
                 if isliteralgate(nl, dec_id)
                     l = literal(nl, dec_id)
                     var = lit2var(l)
-                    state[ex_id, Int(var)] = (l > 0) 
+                    @inbounds state[ex_id, var] = (l > 0) 
                 end
             else
                 edge_log_pr, prime, sub = map_child(params, nodes, elements, ex_id, dec_id, values)
-                logprob[ex_id] += edge_log_pr
+                @inbounds logprob[ex_id] += edge_log_pr
                 push_cuda!(stack, ex_id, prime)
                 push_cuda!(stack, ex_id, sub)
             end
@@ -109,24 +123,4 @@ function map_state_iter_cuda(nl, params, nodes, elements, values, state, logprob
         end
     end
     return nothing
-end
-
-#TODO move to utils
-
-function pop_cuda!(stack, i)
-    if stack[i,1] == zero(eltype(stack))
-        return zero(eltype(stack))
-    else
-        stack[i,1] -= one(eltype(stack))
-        return stack[i,stack[i,1]+2]
-    end
-end
-
-function push_cuda!(stack, i, v)
-    stack[i,1] += one(eltype(stack))
-    CUDA.@cuassert 1+stack[i,1] <= size(stack,2) "CUDA stack overflow"
-    stack[i,1+stack[i,1]] = v
-    return nothing
-end
-
-length_cuda(stack, i) = stack[i,1]
+end
\ No newline at end of file
diff --git a/test/queries/map_tests.jl b/test/queries/map_tests.jl
index bf204ab0..1b0b1f8c 100644
--- a/test/queries/map_tests.jl
+++ b/test/queries/map_tests.jl
@@ -38,6 +38,16 @@ include("../helper/gpu.jl")
 
     @test all(mar .> mappr .- 1e-6)
 
+    # same MAP states on CPU and GPU
+    cpu_gpu_agree(data_full) do d 
+        MAP(prob_circuit, d)[1]
+    end
+
+    # same MAP probabilities on CPU and GPU
+    cpu_gpu_agree_approx(data_full) do d 
+        MAP(prob_circuit, d)[2]
+    end
+
     # same MAP states on CPU and GPU
     cpu_gpu_agree(data_marg) do d 
         MAP(prob_circuit, d)[1]

From a2701593cc1b094248efd57d7bdc0ecf949df177 Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 30 Sep 2020 17:00:43 -0700
Subject: [PATCH 130/131] conditional sampling on CPU

---
 src/queries/map.jl          |   2 +-
 src/queries/sample.jl       | 153 ++++++++++++++++++++++++++++--------
 test/queries/sample_test.jl |  56 ++++++++++++-
 3 files changed, 172 insertions(+), 39 deletions(-)

diff --git a/src/queries/map.jl b/src/queries/map.jl
index 02e422fd..698ae483 100644
--- a/src/queries/map.jl
+++ b/src/queries/map.jl
@@ -11,7 +11,7 @@ max_a_posteriori(root::ProbCircuit, data::Union{Bool,Missing}...) =
     max_a_posteriori(root, collect(Union{Bool,Missing}, data))
 
 max_a_posteriori(root::ProbCircuit, data::Union{Vector{Union{Bool,Missing}},CuVector{UInt8}}) =
-    max_a_posteriori(root, DataFrame(reshape(data, 1, :)))[1,:]
+    example(max_a_posteriori(root, DataFrame(reshape(data, 1, :))), 1)
 
 max_a_posteriori(circuit::ProbCircuit, data::DataFrame) =
     max_a_posteriori(same_device(ParamBitCircuit(circuit, data), data), data)
diff --git a/src/queries/sample.jl b/src/queries/sample.jl
index ea0065d4..e5d9eeda 100644
--- a/src/queries/sample.jl
+++ b/src/queries/sample.jl
@@ -1,47 +1,132 @@
 export sample
 
+import DataFrames: DataFrame, mapcols!
 import Random: default_rng
 
-"""
-Sample from a PC without any evidence
-"""
-function sample(circuit::ProbCircuit; rng = default_rng())::BitVector
-    
-    inst = Dict{Var,Bool}()
-    
-    simulate(node) = simulate(node, GateType(node))
-    
-    simulate(node, ::LeafGate) = begin
-        inst[variable(node)] = ispositive(node)
+#####################
+# Circuit MAP/MPE evaluation
+#####################
+
+"Sample states from the circuit distribution"
+function sample(pc::ProbCircuit; rng = default_rng())
+    dfs, prs = sample(pc, 1, [missing for i=1:num_variables(pc)]...; rng)
+    return dfs[1], prs[1]
+end
+
+sample(pc::ProbCircuit, num_samples; rng = default_rng()) =
+    sample(pc, num_samples, [missing for i=1:num_variables(pc)]...; rng)
+
+sample(pc::ProbCircuit, num_samples, data::Union{Bool,Missing}...; rng = default_rng()) =
+    sample(pc, num_samples, collect(Union{Bool,Missing}, data); rng)
+
+function sample(pc::ProbCircuit, num_samples, data::Union{Vector{Union{Bool,Missing}},CuVector{UInt8}}; rng = default_rng())
+    dfs, prs = sample(pc, num_samples, DataFrame(reshape(data, 1, :)); rng)
+    return map(df -> example(df,1), dfs), prs[:,1]
+end
+
+sample(circuit::ProbCircuit, num_samples, data::DataFrame; rng = default_rng()) =
+    sample(same_device(ParamBitCircuit(circuit, data), data), num_samples, data; rng)
+
+function sample(pbc::ParamBitCircuit, num_samples, data; Float=Float32, rng = default_rng())
+    @assert isgpu(data) == isgpu(pbc) "ParamBitCircuit and data need to be on the same device"
+    values = marginal_all(pbc, data)
+    states, logprobs = sample_down(pbc, num_samples, data, values, rng, Float)
+    if isgpu(values)
+        # CUDA.unsafe_free!(values) # save the GC some effort
+        # # do the conversion to a CuBitVector on the CPU...
+        # df = DataFrame(to_cpu(state))
+        # mapcols!(c -> to_gpu(BitVector(c)), df)
+    else
+        dfs = mapslices(DataFrame, states, dims = [2,3])
+        map(dfs) do df
+            mapcols!(c -> BitVector(c), df)
+        end
     end
-    
-    simulate(node, ::⋁Gate) = begin
-        idx = sample_index(exp.(node.log_probs); rng)
-        simulate(children(node)[idx])
+    dfs, logprobs
+end
+
+"Sample a child node id of a given decision node"
+function sample_child(params, nodes, elements, ex_id, dec_id, values, rng)
+    @inbounds els_start = nodes[1,dec_id]
+    @inbounds els_end = nodes[2,dec_id]
+    threshold = log(rand(rng)) + values[ex_id, dec_id]
+    cumul_prob = -Inf
+    j_sampled = els_end - els_start + 1 # give all numerical error probability to the last node
+    for j = els_start:els_end
+        @inbounds prime = elements[2,j]
+        @inbounds sub = elements[3,j]
+        @inbounds pr = values[ex_id, prime] + values[ex_id, sub] + params[j]
+        Δ = ifelse(cumul_prob == pr, zero(cumul_prob), abs(cumul_prob - pr))
+        cumul_prob = max(cumul_prob, pr) + log1p(exp(-Δ))
+        if cumul_prob > threshold
+            j_sampled = j
+            break
+        end
     end
+    @inbounds return params[j_sampled], elements[2,j_sampled], elements[3,j_sampled] 
+end
 
-    simulate(node, ::⋀Gate) = 
-        foreach(simulate, children(node))
+# CPU code
 
-    simulate(circuit)
-    
-    len = length(keys(inst))
-    BitVector([inst[i] for i = 1:len])
+function sample_down(pbc, num_samples, data, values::Array, rng, Float)
+    state = zeros(Bool, num_samples, num_examples(data), num_features(data))
+    logprob = zeros(Float, num_samples, num_examples(data))
+    Threads.@threads for (s_id, ex_id) = collect(Iterators.product(1:size(state,1), 1:size(state,2)))
+        sample_rec(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), ex_id, s_id, num_nodes(pbc), values, state, logprob, rng)
+    end
+    return state, logprob
 end
 
-
-"""
-Uniformly sample based on the probability of the items and return the selected index
-"""
-function sample_index(probs::AbstractVector{<:Number}; rng = default_rng())::Int32
-    z = sum(probs)
-    q = rand(rng) * z
-    cur = 0.0
-    for i = 1:length(probs)
-        cur += probs[i]
-        if q <= cur
-            return i
+function sample_rec(nl, params, nodes, elements, ex_id, s_id, dec_id, values, state, logprob, rng)
+    if isleafgate(nl, dec_id)
+        if isliteralgate(nl, dec_id)
+            l = literal(nl, dec_id)
+            @inbounds state[s_id, ex_id, lit2var(l)] = (l > 0) 
         end
+    else
+        edge_log_pr, prime, sub = sample_child(params, nodes, elements, ex_id, dec_id, values, rng)
+        @inbounds logprob[s_id, ex_id] += edge_log_pr
+        sample_rec(nl, params, nodes, elements, ex_id, s_id, prime, values, state, logprob, rng)
+        sample_rec(nl, params, nodes, elements, ex_id, s_id, sub,   values, state, logprob, rng)
     end
-    return length(probs)
 end
+
+# GPU code
+
+# function sample_down(pbc, data, values::CuArray; Float=Float32)
+#     state = CUDA.zeros(Bool, num_examples(data), num_features(data))
+#     logprob = CUDA.zeros(Float, num_examples(data))
+#     stack = CUDA.zeros(Int32, num_examples(data), num_features(data)+3)
+#     @inbounds stack[:,1] .= 1 # start with 1 dec_id in the stack
+#     @inbounds stack[:,2] .= num_nodes(pbc) # start with the pc in the stack
+#     num_threads = 256
+#     num_blocks = ceil(Int, size(state,1)/num_threads)
+#     CUDA.@sync begin
+#         @cuda threads=num_threads blocks=num_blocks sample_cuda_kernel(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), values, state, logprob, stack)
+#     end
+#     return state, logprob
+# end
+
+# function sample_cuda_kernel(nl, params, nodes, elements, values, state, logprob, stack)
+#     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+#     stride_x = blockDim().x * gridDim().x
+#     for ex_id = index_x:stride_x:size(state,1)
+#         dec_id = pop_cuda!(stack, ex_id)
+#         while dec_id > zero(eltype(stack))
+#             if isleafgate(nl, dec_id)
+#                 if isliteralgate(nl, dec_id)
+#                     l = literal(nl, dec_id)
+#                     var = lit2var(l)
+#                     @inbounds state[ex_id, var] = (l > 0) 
+#                 end
+#             else
+#                 edge_log_pr, prime, sub = sample_child(params, nodes, elements, ex_id, dec_id, values)
+#                 @inbounds logprob[ex_id] += edge_log_pr
+#                 push_cuda!(stack, ex_id, prime)
+#                 push_cuda!(stack, ex_id, sub)
+#             end
+#             dec_id = pop_cuda!(stack, ex_id)
+#         end
+#     end
+#     return nothing
+# end
\ No newline at end of file
diff --git a/test/queries/sample_test.jl b/test/queries/sample_test.jl
index fa10c285..0638a769 100644
--- a/test/queries/sample_test.jl
+++ b/test/queries/sample_test.jl
@@ -3,7 +3,7 @@ using LogicCircuits
 using ProbabilisticCircuits
 using Random: MersenneTwister
 
-@testset "Sampling Test" begin
+@testset "Unconditional Sampling Test" begin
 
     rng = MersenneTwister(42)
 
@@ -14,10 +14,11 @@ using Random: MersenneTwister
 
     hist = Dict{BitVector,Int}()
 
-    Nsamples = 10_0000
+    Nsamples = 2_0000
+    samples, _ = sample(prob_circuit, Nsamples; rng)
+    samples = map(BitVector, samples)
     for i = 1:Nsamples
-        s = sample(prob_circuit; rng)
-        hist[s] = get(hist, s, 0) + 1
+        hist[samples[i]] = get(hist, samples[i], 0) + 1
     end
 
     for i = 1:num_examples(data_all)
@@ -26,5 +27,52 @@ using Random: MersenneTwister
         estim_prob = get(hist, ex, 0) / Nsamples
         @test exact_prob ≈ estim_prob atol=1e-2;
     end
+end
+
+@testset "Conditional Sampling Test" begin
+
+    rng = MersenneTwister(42)
+    num_samples = 10
+
+    pc = zoo_psdd("little_4var.psdd");
+    data_all = generate_data_all(num_variables(pc));
+
+    # sampling given complete data should return same data with its log likelihood 
+
+
+    loglikelihoods = MAR(pc, data_all)
+    sample_states, sample_prs = sample(pc, num_samples, data_all; rng)
+
+    for i in 1:num_samples
+        @test sample_states[i] == data_all
+        @test sample_prs[i,:] ≈ loglikelihoods atol=1e-6
+    end
+    
+    # sampling given partial data invariants
+
+    data_marg = DataFrame([false false false false; 
+                      false true true false; 
+                      false false true true;
+                      false false false missing; 
+                      missing true false missing; 
+                      missing missing missing missing; 
+                      false missing missing missing])
+
+    _, map_pr = MAP(pc, data_marg)
+
+    sample_states, sample_prs = sample(pc, num_samples, data_marg; rng)
+    
+    for i in 1:num_samples
+
+        # samples keep the partial evidence values
+        @test all(zip(eachcol(sample_states[i]), eachcol(data_marg))) do (cf,cm) 
+            all(zip(cf, cm)) do (f,m) 
+                ismissing(m) || f == m
+            end
+        end
+
+        # probability does not exceed MAP probability
+        @test all(sample_prs[i,:] .<= map_pr .+ 1e-6)
+    end
 
 end
\ No newline at end of file

From 2db0d6c09ce4e65f6e33d4d4237da6beaf7cbfba Mon Sep 17 00:00:00 2001
From: Guy Van den Broeck <guyvdb@gmail.com>
Date: Wed, 30 Sep 2020 22:31:50 -0700
Subject: [PATCH 131/131] GPU sampling

---
 src/Utils/misc.jl            |  40 +++++++-
 src/queries/map.jl           |  26 ++---
 src/queries/marginal_flow.jl |   7 +-
 src/queries/sample.jl        | 190 ++++++++++++++++++++---------------
 test/queries/sample_test.jl  |  63 ++++++++----
 5 files changed, 199 insertions(+), 127 deletions(-)

diff --git a/src/Utils/misc.jl b/src/Utils/misc.jl
index 1237496e..9de4ccea 100644
--- a/src/Utils/misc.jl
+++ b/src/Utils/misc.jl
@@ -1,5 +1,5 @@
-export to_long_mi,
-    pop_cuda!, push_cuda!, length_cuda,
+export to_long_mi, logsumexp_cuda,
+    pop_cuda!, push_cuda!, all_empty, length_cuda,
     generate_all, generate_data_all
 
 using DataFrames
@@ -15,11 +15,18 @@ function to_long_mi(m::Matrix{Float64}, min_int, max_int)::Matrix{Int64}
     return @. round(Int64, m * δint / δmi + min_int)
 end
 
+# TODO: get rid of all copies
+@inline function logsumexp_cuda(x,y) 
+    Δ = ifelse(x == y, zero(x), CUDA.abs(x - y))
+    max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
+end
 
 ###################
 # Rudimentary CUDA-compatible stack data structure
 ####################
 
+# sadly making `i` varargs doesn't work; kernel won't compile
+
 function pop_cuda!(stack, i)
     if @inbounds stack[i,1] == zero(eltype(stack))
         return zero(eltype(stack))
@@ -29,14 +36,37 @@ function pop_cuda!(stack, i)
     end
 end
 
-function push_cuda!(stack, i, v)
+function pop_cuda!(stack, i, j)
+    if @inbounds stack[i,j,1] == zero(eltype(stack))
+        return zero(eltype(stack))
+    else
+        @inbounds stack[i,j,1] -= one(eltype(stack))
+        @inbounds return stack[i,j,stack[i,j,1]+2]
+    end
+end
+
+function push_cuda!(stack, v, i)
     @inbounds stack[i,1] += one(eltype(stack))
-    @inbounds CUDA.@cuassert 1+stack[i,1] <= size(stack,2) "CUDA stack overflow"
+    @inbounds CUDA.@cuassert 1+stack[i,1] <= size(stack, ndims(stack)) "CUDA stack overflow"
     @inbounds stack[i,1+stack[i,1]] = v
     return nothing
 end
 
-length_cuda(stack, i) = stack[i,1]
+function push_cuda!(stack, v, i, j)
+    @inbounds stack[i, j,1] += one(eltype(stack))
+    @inbounds CUDA.@cuassert 1+stack[i, j,1] <= size(stack, ndims(stack)) "CUDA stack overflow"
+    @inbounds stack[i, j,1+stack[i, j,1]] = v
+    return nothing
+end
+
+all_empty(stack::AbstractArray{T,2}) where T = 
+    all(x -> iszero(x), stack[:,1])
+
+all_empty(stack::AbstractArray{T,3}) where T = 
+    all(x -> iszero(x), stack[:,:,1])
+
+
+length_cuda(stack, i...) = stack[i...,1]
 
 
 ###################
diff --git a/src/queries/map.jl b/src/queries/map.jl
index 698ae483..cda5d052 100644
--- a/src/queries/map.jl
+++ b/src/queries/map.jl
@@ -19,17 +19,7 @@ max_a_posteriori(circuit::ProbCircuit, data::DataFrame) =
 function max_a_posteriori(pbc::ParamBitCircuit, data; Float=Float32)
     @assert isgpu(data) == isgpu(pbc) "ParamBitCircuit and data need to be on the same device"
     values = marginal_all(pbc, data)
-    state, logprob = map_down(pbc, data, values; Float)
-    if isgpu(values)
-        CUDA.unsafe_free!(values) # save the GC some effort
-        # do the conversion to a CuBitVector on the CPU...
-        df = DataFrame(to_cpu(state))
-        mapcols!(c -> to_gpu(BitVector(c)), df)
-    else
-        df = DataFrame(state)
-        mapcols!(c -> BitVector(c), df)
-    end
-    df, logprob
+    return map_down(pbc, data, values; Float)
 end
 
 """
@@ -68,7 +58,9 @@ function map_down(pbc, data, values::Array; Float=Float32)
     Threads.@threads for ex_id = 1:size(state,1)
         map_rec(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), ex_id, num_nodes(pbc), values, state, logprob)
     end
-    return state, logprob
+    df = DataFrame(state)
+    mapcols!(c -> BitVector(c), df)
+    return df, logprob
 end
 
 function map_rec(nl, params, nodes, elements, ex_id, dec_id, values, state, logprob)
@@ -98,7 +90,11 @@ function map_down(pbc, data, values::CuArray; Float=Float32)
     CUDA.@sync begin
         @cuda threads=num_threads blocks=num_blocks map_cuda_kernel(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), values, state, logprob, stack)
     end
-    return state, logprob
+    CUDA.unsafe_free!(values) # save the GC some effort
+    # do the conversion to a CuBitVector on the CPU...
+    df = DataFrame(to_cpu(state))
+    mapcols!(c -> to_gpu(BitVector(c)), df)
+    return df, logprob
 end
 
 function map_cuda_kernel(nl, params, nodes, elements, values, state, logprob, stack)
@@ -116,8 +112,8 @@ function map_cuda_kernel(nl, params, nodes, elements, values, state, logprob, st
             else
                 edge_log_pr, prime, sub = map_child(params, nodes, elements, ex_id, dec_id, values)
                 @inbounds logprob[ex_id] += edge_log_pr
-                push_cuda!(stack, ex_id, prime)
-                push_cuda!(stack, ex_id, sub)
+                push_cuda!(stack, prime, ex_id)
+                push_cuda!(stack, sub, ex_id)
             end
             dec_id = pop_cuda!(stack, ex_id)
         end
diff --git a/src/queries/marginal_flow.jl b/src/queries/marginal_flow.jl
index ec7d399c..1a6b55df 100644
--- a/src/queries/marginal_flow.jl
+++ b/src/queries/marginal_flow.jl
@@ -324,7 +324,7 @@ function marginal_flows_down_layers_cuda(layer, nodes, elements, parents, params
                                 v_sub = @inbounds values[k, sub]
                                 edge_flow = compute_marg_edge_flow(v_prime, v_sub, v_gp, f_gp, θ)
                             end
-                            flow = sum_marg_flows(flow, edge_flow)
+                            flow = logsumexp_cuda(flow, edge_flow)
                             # report edge flow only once:
                             dec_id == prime && on_edge(flows, values, prime, sub, par, grandpa, k, edge_flow, single_child)
                         end
@@ -338,11 +338,6 @@ function marginal_flows_down_layers_cuda(layer, nodes, elements, parents, params
     return nothing
 end
 
-@inline function sum_marg_flows(x,y) 
-    Δ = ifelse(x == y, zero(x), CUDA.abs(x - y))
-    max(x, y) + CUDA.log1p(CUDA.exp(-Δ))
-end
-
 @inline function compute_marg_edge_flow(p_up, s_up, n_up, n_down, θ)
     x = p_up + s_up - n_up + n_down + θ
     ifelse(isnan(x), typemin(n_down), x)
diff --git a/src/queries/sample.jl b/src/queries/sample.jl
index e5d9eeda..72aa5c88 100644
--- a/src/queries/sample.jl
+++ b/src/queries/sample.jl
@@ -1,52 +1,77 @@
-export sample
+export sample, to_sampled_dataframes
 
 import DataFrames: DataFrame, mapcols!
 import Random: default_rng
 
 #####################
-# Circuit MAP/MPE evaluation
+# Circuit sampling
 #####################
 
-"Sample states from the circuit distribution"
+"Sample states from the circuit distribution."
 function sample(pc::ProbCircuit; rng = default_rng())
-    dfs, prs = sample(pc, 1, [missing for i=1:num_variables(pc)]...; rng)
-    return dfs[1], prs[1]
+    states, prs = sample(pc, 1, [missing for i=1:num_variables(pc)]...; rng)
+    return states[1,:], prs[1]
 end
 
-sample(pc::ProbCircuit, num_samples; rng = default_rng()) =
-    sample(pc, num_samples, [missing for i=1:num_variables(pc)]...; rng)
+sample(pc::ProbCircuit, num_samples; rng = default_rng(), gpu=false) =
+    sample(pc, num_samples, [missing for i=1:num_variables(pc)]...; rng, gpu)
 
-sample(pc::ProbCircuit, num_samples, data::Union{Bool,Missing}...; rng = default_rng()) =
-    sample(pc, num_samples, collect(Union{Bool,Missing}, data); rng)
+sample(pc::ProbCircuit, num_samples, inputs::Union{Bool,Missing}...; 
+        rng = default_rng(), gpu=false) =
+    sample(pc, num_samples, collect(Union{Bool,Missing}, inputs); rng, gpu)
 
-function sample(pc::ProbCircuit, num_samples, data::Union{Vector{Union{Bool,Missing}},CuVector{UInt8}}; rng = default_rng())
-    dfs, prs = sample(pc, num_samples, DataFrame(reshape(data, 1, :)); rng)
-    return map(df -> example(df,1), dfs), prs[:,1]
+function sample(pc::ProbCircuit, num_samples, inputs::AbstractVector{Union{Bool,Missing}}; 
+                rng = default_rng(), gpu=false)
+    data = DataFrame(reshape(inputs, 1, :))
+    data = gpu ? to_gpu(data) : data
+    states, prs = sample(pc, num_samples, data; rng)
+    return states[:,1,:], prs[:,1]
 end
 
 sample(circuit::ProbCircuit, num_samples, data::DataFrame; rng = default_rng()) =
     sample(same_device(ParamBitCircuit(circuit, data), data), num_samples, data; rng)
 
-function sample(pbc::ParamBitCircuit, num_samples, data; Float=Float32, rng = default_rng())
+function sample(pbc::ParamBitCircuit, num_samples, data; Float = Float32, rng = default_rng())
     @assert isgpu(data) == isgpu(pbc) "ParamBitCircuit and data need to be on the same device"
     values = marginal_all(pbc, data)
-    states, logprobs = sample_down(pbc, num_samples, data, values, rng, Float)
-    if isgpu(values)
-        # CUDA.unsafe_free!(values) # save the GC some effort
-        # # do the conversion to a CuBitVector on the CPU...
-        # df = DataFrame(to_cpu(state))
-        # mapcols!(c -> to_gpu(BitVector(c)), df)
-    else
-        dfs = mapslices(DataFrame, states, dims = [2,3])
-        map(dfs) do df
-            mapcols!(c -> BitVector(c), df)
+    return sample_down(pbc, num_samples, data, values, rng, Float)
+end
+
+"Convert an array of samples into a vector of dataframes"
+function to_sampled_dataframes(states) 
+    dfs = mapslices(DataFrame, states, dims = [2,3])
+    map(dfs) do df
+        mapcols!(c -> BitVector(c), df)
+    end
+    return dfs
+end
+
+# CPU code
+
+function sample_down(pbc, num_samples, data, values::Array, rng, ::Type{Float}) where Float
+    state = zeros(Bool, num_samples, num_examples(data), num_features(data))
+    logprob = zeros(Float, num_samples, num_examples(data))
+    Threads.@threads for (s_id, ex_id) = collect(Iterators.product(1:size(state,1), 1:size(state,2)))
+        sample_rec(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), ex_id, s_id, num_nodes(pbc), values, state, logprob, rng)
+    end
+    return state, logprob
+end
+
+function sample_rec(nl, params, nodes, elements, ex_id, s_id, dec_id, values, state, logprob, rng)
+    if isleafgate(nl, dec_id)
+        if isliteralgate(nl, dec_id)
+            l = literal(nl, dec_id)
+            @inbounds state[s_id, ex_id, lit2var(l)] = (l > 0) 
         end
+    else
+        edge_log_pr, prime, sub = sample_child_cpu(params, nodes, elements, ex_id, dec_id, values, rng)
+        @inbounds logprob[s_id, ex_id] += edge_log_pr
+        sample_rec(nl, params, nodes, elements, ex_id, s_id, prime, values, state, logprob, rng)
+        sample_rec(nl, params, nodes, elements, ex_id, s_id, sub,   values, state, logprob, rng)
     end
-    dfs, logprobs
 end
 
-"Sample a child node id of a given decision node"
-function sample_child(params, nodes, elements, ex_id, dec_id, values, rng)
+function sample_child_cpu(params, nodes, elements, ex_id, dec_id, values, rng)
     @inbounds els_start = nodes[1,dec_id]
     @inbounds els_end = nodes[2,dec_id]
     threshold = log(rand(rng)) + values[ex_id, dec_id]
@@ -66,67 +91,70 @@ function sample_child(params, nodes, elements, ex_id, dec_id, values, rng)
     @inbounds return params[j_sampled], elements[2,j_sampled], elements[3,j_sampled] 
 end
 
-# CPU code
 
-function sample_down(pbc, num_samples, data, values::Array, rng, Float)
-    state = zeros(Bool, num_samples, num_examples(data), num_features(data))
-    logprob = zeros(Float, num_samples, num_examples(data))
-    Threads.@threads for (s_id, ex_id) = collect(Iterators.product(1:size(state,1), 1:size(state,2)))
-        sample_rec(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), ex_id, s_id, num_nodes(pbc), values, state, logprob, rng)
+# GPU code
+
+function sample_down(pbc, num_samples, data, values::CuArray, rng, ::Type{Float}) where Float
+    CUDA.seed!(rand(rng, UInt))
+    state = CUDA.zeros(Bool, num_samples, num_examples(data), num_features(data))
+    logprob = CUDA.zeros(Float, num_samples, num_examples(data))
+    stack = CUDA.zeros(Int32, num_samples, num_examples(data), num_features(data)+3)
+    @inbounds stack[:,:,1] .= 1 # start with 1 dec_id in the stack
+    @inbounds stack[:,:,2] .= num_nodes(pbc) # start with the pc in the stack
+    num_threads =  balance_threads(num_samples, num_examples(data), 8)
+    num_blocks = (ceil(Int, num_samples/num_threads[1]), 
+                  ceil(Int, num_examples(data)/num_threads[2]))
+    CUDA.@sync  while true
+        r = CUDA.rand(num_samples, num_examples(data))
+        @cuda threads=num_threads blocks=num_blocks sample_cuda_kernel(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), values, state, logprob, stack, r, Float)
+        all_empty(stack) && break
     end
+    CUDA.unsafe_free!(values) # save the GC some effort
     return state, logprob
 end
 
-function sample_rec(nl, params, nodes, elements, ex_id, s_id, dec_id, values, state, logprob, rng)
-    if isleafgate(nl, dec_id)
-        if isliteralgate(nl, dec_id)
-            l = literal(nl, dec_id)
-            @inbounds state[s_id, ex_id, lit2var(l)] = (l > 0) 
+function sample_cuda_kernel(nl, params, nodes, elements, values, state, logprob, stack, r, ::Type{Float}) where Float
+    index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
+    index_y = (blockIdx().y - 1) * blockDim().y + threadIdx().y
+    stride_x = blockDim().x * gridDim().x
+    stride_y = blockDim().y * gridDim().y
+    for s_id = index_x:stride_x:size(state,1)
+        for ex_id = index_y:stride_y:size(state,2)
+            dec_id = pop_cuda!(stack, s_id, ex_id)
+            if dec_id > zero(eltype(stack))
+                if isleafgate(nl, dec_id)
+                    if isliteralgate(nl, dec_id)
+                        l = literal(nl, dec_id)
+                        var = lit2var(l)
+                        @inbounds state[s_id, ex_id, var] = (l > 0) 
+                    end
+                else
+                    edge_log_pr, prime, sub = sample_child_cuda(params, nodes, elements, s_id, ex_id, dec_id, values, r, Float)
+                    @inbounds logprob[s_id, ex_id] += edge_log_pr
+                    push_cuda!(stack, prime, s_id, ex_id)
+                    push_cuda!(stack, sub, s_id, ex_id)
+                end
+            end
         end
-    else
-        edge_log_pr, prime, sub = sample_child(params, nodes, elements, ex_id, dec_id, values, rng)
-        @inbounds logprob[s_id, ex_id] += edge_log_pr
-        sample_rec(nl, params, nodes, elements, ex_id, s_id, prime, values, state, logprob, rng)
-        sample_rec(nl, params, nodes, elements, ex_id, s_id, sub,   values, state, logprob, rng)
     end
+    return nothing
 end
 
-# GPU code
-
-# function sample_down(pbc, data, values::CuArray; Float=Float32)
-#     state = CUDA.zeros(Bool, num_examples(data), num_features(data))
-#     logprob = CUDA.zeros(Float, num_examples(data))
-#     stack = CUDA.zeros(Int32, num_examples(data), num_features(data)+3)
-#     @inbounds stack[:,1] .= 1 # start with 1 dec_id in the stack
-#     @inbounds stack[:,2] .= num_nodes(pbc) # start with the pc in the stack
-#     num_threads = 256
-#     num_blocks = ceil(Int, size(state,1)/num_threads)
-#     CUDA.@sync begin
-#         @cuda threads=num_threads blocks=num_blocks sample_cuda_kernel(num_leafs(pbc), params(pbc), nodes(pbc), elements(pbc), values, state, logprob, stack)
-#     end
-#     return state, logprob
-# end
-
-# function sample_cuda_kernel(nl, params, nodes, elements, values, state, logprob, stack)
-#     index_x = (blockIdx().x - 1) * blockDim().x + threadIdx().x
-#     stride_x = blockDim().x * gridDim().x
-#     for ex_id = index_x:stride_x:size(state,1)
-#         dec_id = pop_cuda!(stack, ex_id)
-#         while dec_id > zero(eltype(stack))
-#             if isleafgate(nl, dec_id)
-#                 if isliteralgate(nl, dec_id)
-#                     l = literal(nl, dec_id)
-#                     var = lit2var(l)
-#                     @inbounds state[ex_id, var] = (l > 0) 
-#                 end
-#             else
-#                 edge_log_pr, prime, sub = sample_child(params, nodes, elements, ex_id, dec_id, values)
-#                 @inbounds logprob[ex_id] += edge_log_pr
-#                 push_cuda!(stack, ex_id, prime)
-#                 push_cuda!(stack, ex_id, sub)
-#             end
-#             dec_id = pop_cuda!(stack, ex_id)
-#         end
-#     end
-#     return nothing
-# end
\ No newline at end of file
+function sample_child_cuda(params, nodes, elements, s_id, ex_id, dec_id, values, r, ::Type{Float}) where Float
+    @inbounds els_start = nodes[1,dec_id]
+    @inbounds els_end = nodes[2,dec_id]
+    @inbounds threshold = CUDA.log(r[s_id, ex_id]) + values[ex_id, dec_id]
+    cumul_prob::Float = -Inf
+    j_sampled = els_end - els_start + 1 # give all numerical error probability to the last node
+    for j = els_start:els_end
+        @inbounds prime = elements[2,j]
+        @inbounds sub = elements[3,j]
+        @inbounds pr::Float = values[ex_id, prime] + values[ex_id, sub] + params[j]
+        cumul_prob = logsumexp_cuda(cumul_prob, pr)
+        if cumul_prob > threshold
+            j_sampled = j
+            break
+        end
+    end
+    @inbounds return params[j_sampled], elements[2,j_sampled], elements[3,j_sampled] 
+end
\ No newline at end of file
diff --git a/test/queries/sample_test.jl b/test/queries/sample_test.jl
index 0638a769..46143add 100644
--- a/test/queries/sample_test.jl
+++ b/test/queries/sample_test.jl
@@ -2,31 +2,43 @@ using Test
 using LogicCircuits
 using ProbabilisticCircuits
 using Random: MersenneTwister
+using CUDA: functional
+
+function histogram_matches_likelihood(samples::Matrix{Bool}, worlds, loglikelihoods)
+    hist = Dict{BitVector,Int}()
+    for i = 1:size(samples,1)
+        sample = BitVector(samples[i,:]) 
+        hist[sample] = get(hist, sample, 0) + 1
+    end
+    for i = 1:size(worlds,1)
+        exact_prob = exp(loglikelihoods[i])
+        ex = BitVector(example(worlds,i))
+        estim_prob = get(hist, ex, 0) / size(samples,1)
+        @test exact_prob ≈ estim_prob atol=1e-2;
+    end
+
+end
 
 @testset "Unconditional Sampling Test" begin
 
     rng = MersenneTwister(42)
 
-    prob_circuit = zoo_psdd("little_4var.psdd");
-    data_all = generate_data_all(num_variables(prob_circuit));
-
-    calc_prob_all = EVI(prob_circuit, data_all)
+    pc = zoo_psdd("little_4var.psdd");
+    worlds = generate_data_all(num_variables(pc));
 
-    hist = Dict{BitVector,Int}()
+    loglikelihoods = EVI(pc, worlds)
 
     Nsamples = 2_0000
-    samples, _ = sample(prob_circuit, Nsamples; rng)
-    samples = map(BitVector, samples)
-    for i = 1:Nsamples
-        hist[samples[i]] = get(hist, samples[i], 0) + 1
-    end
 
-    for i = 1:num_examples(data_all)
-        exact_prob = exp(calc_prob_all[i])
-        ex = BitVector(example(data_all,i))
-        estim_prob = get(hist, ex, 0) / Nsamples
-        @test exact_prob ≈ estim_prob atol=1e-2;
+    samples, _ = sample(pc, Nsamples; rng)
+    histogram_matches_likelihood(samples, worlds, loglikelihoods)
+
+    if CUDA.functional()
+        samples, _ = sample(pc, Nsamples; rng, gpu = true)
+        samples_cpu = to_cpu(samples)
+        histogram_matches_likelihood(samples_cpu, worlds, loglikelihoods)    
     end
+
 end
 
 @testset "Conditional Sampling Test" begin
@@ -44,10 +56,21 @@ end
     sample_states, sample_prs = sample(pc, num_samples, data_all; rng)
 
     for i in 1:num_samples
-        @test sample_states[i] == data_all
+        @test sample_states[i,:,:] == convert(Matrix,data_all)
         @test sample_prs[i,:] ≈ loglikelihoods atol=1e-6
     end
     
+    # same states on CPU and GPU
+    cpu_gpu_agree(data_all) do d 
+        sample(pc, num_samples, d)[1]
+    end
+
+    # same probabilities on CPU and GPU
+    cpu_gpu_agree_approx(data_all) do d 
+        sample(pc, num_samples, d)[2]
+    end
+
+
     # sampling given partial data invariants
 
     data_marg = DataFrame([false false false false; 
@@ -65,14 +88,14 @@ end
     for i in 1:num_samples
 
         # samples keep the partial evidence values
-        @test all(zip(eachcol(sample_states[i]), eachcol(data_marg))) do (cf,cm) 
-            all(zip(cf, cm)) do (f,m) 
-                ismissing(m) || f == m
-            end
+        pairs = collect(zip(sample_states[i,:,:], convert(Matrix,data_marg)))
+        @test all(pairs) do (f,m)
+            ismissing(m) || f == m
         end
 
         # probability does not exceed MAP probability
         @test all(sample_prs[i,:] .<= map_pr .+ 1e-6)
     end
 
+
 end
\ No newline at end of file