A Projection Process

In [291]:
using LinearAlgebra, Combinatorics

In [303]:
N,n = 8,5
Y,_ = qr(randn(N,n))
Y = Matrix(Y)
K = Y*Y'

8×8 Array{Float64,2}:
  0.883617   -0.136266   -0.115083    …  -0.143913   -0.131843   -0.141605 
 -0.136266    0.670147    0.0724459      -0.129255   -0.232152   -0.141875 
 -0.115083    0.0724459   0.142911        0.0395701   0.0242015  -0.277216 
  0.111046    0.186961   -0.158035        0.217009    0.176035    0.0834222
 -0.0234192   0.267486   -0.00444622     -0.273366    0.0621028   0.013141 
 -0.143913   -0.129255    0.0395701   …   0.705667   -0.173125   -0.130091 
 -0.131843   -0.232152    0.0242015      -0.173125    0.807802   -0.136301 
 -0.141605   -0.141875   -0.277216       -0.130091   -0.136301    0.800561 

In [304]:
# All combinations of p subsets of 1:n
[𝓘 for 𝓘 ∈ combinations(1:N,n)]

56-element Array{Array{Int64,1},1}:
 [1, 2, 3, 4, 5]
 [1, 2, 3, 4, 6]
 [1, 2, 3, 4, 7]
 [1, 2, 3, 4, 8]
 [1, 2, 3, 5, 6]
 [1, 2, 3, 5, 7]
 [1, 2, 3, 5, 8]
 [1, 2, 3, 6, 7]
 [1, 2, 3, 6, 8]
 [1, 2, 3, 7, 8]
 [1, 2, 4, 5, 6]
 [1, 2, 4, 5, 7]
 [1, 2, 4, 5, 8]
 ⋮              
 [2, 3, 6, 7, 8]
 [2, 4, 5, 6, 7]
 [2, 4, 5, 6, 8]
 [2, 4, 5, 7, 8]
 [2, 4, 6, 7, 8]
 [2, 5, 6, 7, 8]
 [3, 4, 5, 6, 7]
 [3, 4, 5, 6, 8]
 [3, 4, 5, 7, 8]
 [3, 4, 6, 7, 8]
 [3, 5, 6, 7, 8]
 [4, 5, 6, 7, 8]

## This is a probability space

specifically P(𝓘) = det(K[𝓘,𝓘]) is thought of as the probability of 𝓘 

This is an n-DPP because all the points are size n

In [305]:
sum(det(K[𝓘,𝓘]) for 𝓘 ∈ combinations(1:N,n) )

0.9999999999999992

## if you take sizes k smaller than p you need to correct with binomial(p,j)

In [306]:
[[sum(det(K[𝒬,𝒬]) for 𝒬 ∈ combinations(1:N,k) ) for k=0:n] [binomial(n,k) for k=0:n]]

6×2 Array{Float64,2}:
  1.0   1.0
  5.0   5.0
 10.0  10.0
 10.0  10.0
  5.0   5.0
  1.0   1.0

## a really nice property of projection processes

In [307]:
## associate 𝓘  with its probability
## then associate all j subsets of 𝓘 with that probability over binomial(p,j)
## now add up the probabilities for all j subsets ... that will be the j subset probabilty

In [308]:
k = 3
d = Dict{Array{Int64,1},Float64}()
 for 𝓘 ∈ combinations(1:N, n)
    prob = det(K[𝓘,𝓘]) / binomial(N,n)
    for 𝒬 ∈ combinations(𝓘)
        if haskey(d,𝒬)
            d[𝒬] += prob
        else
            d[𝒬] = prob
        end
    end
end

In [309]:
# the answer that I expect is
for 𝒬 ∈ combinations(1:N)    
      println(𝒬," ",det(K[𝒬,𝒬])/binomial(N,n) ," ", d[𝒬]  ) 
end

[1] 0.01577888340359449 0.01577888340359447
[2] 0.011966914338520826 0.011966914338520818
[3] 0.002551981405124698 0.0025519814051246973
[4] 0.014191837037997567 0.014191837037997554
[5] 0.0034741232145313466 0.00347412321453135
[6] 0.012601195813984953 0.012601195813984946
[7] 0.01442504007150522 0.01442504007150521
[8] 0.014295739000455165 0.014295739000455145
[1, 2] 0.010242597399505993 0.010242597399505986
[1, 3] 0.0020184749851330187 0.0020184749851330165
[1, 4] 0.012319955057341339 0.012319955057341323
[1, 5] 0.0030600020611192278 0.003060002061119229
[1, 6] 0.01076479667409666 0.010764796674096652
[1, 7] 0.012435816061352164 0.012435816061352151
[1, 8] 0.01227389137582954 0.012273891375829522
[2, 3] 0.0016164816221998929 0.0016164816221998918
[2, 4] 0.00888643256837728 0.008886432568377275
[2, 5] 0.0010505200287650768 0.0010505200287650792
[2, 6] 0.008146320077530921 0.00814632007753092
[2, 7] 0.008704495367852743 0.008704495367852741
[2, 8] 0.009220810289851389 0.00922081028985

[1, 3, 4, 7, 8] 2.3309541114188805e-6 2.3309541114188805e-6
[1, 3, 5, 6, 7] 8.089554047506081e-5 8.089554047506081e-5
[1, 3, 5, 6, 8] 5.2093959728141476e-6 5.2093959728141476e-6
[1, 3, 5, 7, 8] 2.080118381740943e-5 2.080118381740943e-5
[1, 3, 6, 7, 8] 3.8161616913923133e-5 3.8161616913923133e-5
[1, 4, 5, 6, 7] 0.00012567548160379228 0.00012567548160379228
[1, 4, 5, 6, 8] 0.00013850796404832826 0.00013850796404832826
[1, 4, 5, 7, 8] 0.0012066502623286541 0.0012066502623286541
[1, 4, 6, 7, 8] 0.0028986793181537767 0.0028986793181537767
[1, 5, 6, 7, 8] 0.0004113477149473649 0.0004113477149473649
[2, 3, 4, 5, 6] 1.2081442567714053e-6 1.2081442567714053e-6
[2, 3, 4, 5, 7] 2.3542566790919752e-6 2.3542566790919752e-6
[2, 3, 4, 5, 8] 1.0149872387314817e-5 1.0149872387314817e-5
[2, 3, 4, 6, 7] 4.156829139528629e-5 4.156829139528629e-5
[2, 3, 4, 6, 8] 5.496755338322145e-5 5.496755338322145e-5
[2, 3, 4, 7, 8] 6.952226655239533e-5 6.952226655239533e-5
[2, 3, 5, 6, 7] 4.9027452139112103e-8 4.902745

KeyError: KeyError: key [1, 2, 3, 4, 5, 6] not found

In [310]:
## It seems people prefer to look at this the other way around
## but it amounts to the same thing

## specifically I can generate the n set according to the determinant
## and then the i set uniformly among subsets
## or I can start with the i set and find all the A sets that are supersets

for i = combinations(1:N)
# Generate all subsets Y of length n that contain i
 
 print( sum( det(K[Y,Y]) for Y ∈ combinations(1:N, n) if i ⊆ Y) )
 println( " ",det(K[i,i]) )
end

0.8836174706012904 0.8836174706012915
0.6701472029571661 0.6701472029571662
0.14291095868698298 0.1429109586869831
0.7947428741278632 0.7947428741278638
0.19455090001375555 0.1945509000137554
0.7056669655831573 0.7056669655831573
0.8078022440042921 0.8078022440042923
0.8005613840254884 0.8005613840254893
0.5735854543723353 0.5735854543723357
0.1130345991674489 0.11303459916744905
0.689917483211114 0.689917483211115
0.17136011542267676 0.17136011542267676
0.6028286137494127 0.602828613749413
0.6964056994357206 0.6964056994357212
0.6873379170464533 0.6873379170464542
0.09052297084319397 0.090522970843194
0.4976402238291274 0.4976402238291277
0.058829121610844415 0.058829121610844304
0.45619392434173156 0.4561939243417316
0.4874517405997535 0.4874517405997536
0.5163653762316773 0.5163653762316778
0.08860246298187006 0.08860246298187009
0.027783686783160514 0.027783686783160497
0.09928175339677132 0.09928175339677134
0.11485807880122889 0.11485807880122895
0.037560282774258234 0.0375602827

ArgumentError: ArgumentError: reducing over an empty collection is not allowed

## Another identity

In [311]:
det( K[ [1, 2, 3],[1, 2,3]])


0.07073078443908119

In [312]:
sum( det( Y[ [1,2,3],𝒬])^2 for 𝒬 ∈ combinations(1:5,3))

0.0707307844390812

## Now General Λ -- L Ensemble

In [283]:
N,n = 3,3
Y,_ = qr(randn(N,n))
Y = Matrix(Y)
Λ = Diagonal(rand(n))
L = Y*Λ*Y';

In [284]:
(1 + sum( det(L[𝒬,𝒬]) for 𝒬 ∈ combinations(1:N)))/det(I+L)

0.9999999999999997

## The simple thing:
   Take 𝒬 in the power set of 1:N with probabilty det(L[𝒬;𝒬])/det(I+L)

## Slightly more complicated:
   If A is the power set of 1:N, the probability that A ⊆ 𝒬 is det(K[A;A])

what does this mean?
   This means that if we add up all the disjoint situations of the probability of 𝒬 as above but only when A ⊆ 𝒬, we will get det(K[A;A])
   
   
   Let's take an example : A ={1}
   What we are going to do is take a random subset of 1:N, and we are wondering what is the probablity that we will see a {1} in this subset.  This probablity is K[1,1].
   This is the sum of P[1] +P[1,2] +P[1,3] + P[1,2,4,5] + lots of other things
   
  what is the probabilty of 𝒬 = [1] itself?
Answer: it's the probability that [1] shows up , but without any friends.
    it's not K[1;1]. Remember K[1,1] is the probablity that 1 shows up in 𝒬, usually with friends.  




In [285]:
println("True Probabilities L form")
println("[]"," ",1/det(I+L))
for 𝒬 ∈ combinations(1:N)
    println(𝒬," ",det(L[𝒬,𝒬])/det(I+L))
end

println()
K = L/(L+I) # L * inv(L+I)
# L = K/(I-K)

println("Cumulatives Probabilities K form")
  println("[] ",1)
for A = combinations(1:N)
# Generate all subsets Y
  
 println(A, " ",sum( det(L[Y,Y]) for Y ∈ combinations(1:N) if A ⊆ Y) / det(I+L))
 #println(" ",det(K[A,A]) )
end
                

True Probabilities L form
[] 0.32873468671520195
[1] 0.14354457045611285
[2] 0.14524090207685675
[3] 0.1541770679572946
[1, 2] 0.06334278470344586
[1, 3] 0.0671934295226372
[2, 3] 0.06811680194943265
[1, 2, 3] 0.02964975661901781

Cumulatives Probabilities K form
[] 1
[1] 0.30373054130121374
[2] 0.30635024534875305
[3] 0.3191370560483823
[1, 2] 0.09299254132246366
[1, 3] 0.096843186141655
[2, 3] 0.09776655856845047
[1, 2, 3] 0.02964975661901781


In [286]:
0.46008329904121614 -  0.13173534981704144

0.3283479492241747

In [287]:
0.30373054130121374 - (0.09299254132246366 + 0.096843186141655) + 0.02964975661901781


0.14354457045611288