In [1]:
%matplotlib inline
import matplotlib.pyplot as plt
import numpy as np
import tensorflow as tf
import pandas as pd
import random as rn
import os
import cne
import maxent

In [2]:
triples = [('Eve', 'type', 'Lecturer'),
           #('Eve', 'type', 'Person'), 
           ('Lecturer', 'subClassOf', 'Person'), 
           #('David', 'type', 'Person'),
           ('David', 'type', 'Researcher'),
           ('Researcher', 'subClassOf', 'Person'),
           ('Flora', 'hasSpouse', 'Gaston'),
           ('Gaston', 'type', 'Person'),
           #('Flora', 'type', 'Person')
          ]

train = np.array(triples)

entities = list(set(np.concatenate((train[:,0], train[:,2]), axis=0)))
relations = list(set(train[:,1]))

num_entities = len(entities)
num_relations = len(relations)

ent2idx = dict(zip(entities, range(num_entities)))
rel2idx = dict(zip(relations, range(num_relations)))

idx2ent = {idx:ent for ent,idx in ent2idx.items()}
idx2rel = {idx:rel for rel,idx in rel2idx.items()}

In [3]:
#A = np.zeros(shape=(num_entities,num_entities,num_relations))
A = np.zeros(shape=(num_entities,num_entities))

for h,r,t in train:
    
    h_idx = entities.index(h)
    r_idx = relations.index(r)
    t_idx = entities.index(t)
    
    #A[h_idx,t_idx,r_idx] = 1
    A[h_idx, t_idx] = 1

def score(h,r,t):
    return tf.reduce_sum(tf.square(h + r - t))

In [4]:
train2idx = []

for head, rel, tail in train:
    
    head_idx = ent2idx[head]
    tail_idx = ent2idx[tail]
    rel_idx = rel2idx[rel]

    train2idx.append([head_idx, rel_idx, tail_idx])
    
train2idx = np.array(train2idx)

In [5]:
from scipy import sparse
A_sparse = sparse.csr_matrix(A)  

In [6]:
prior = maxent.BGDistr(A_sparse) 
prior.fit() 

In [7]:
CNE = cne.ConditionalNetworkEmbedding(
    A=A_sparse,
    d=10,
    s1=1,
    s2=1.5,
    prior_dist=prior
    )
CNE.fit(lr=.001, max_iter=100)

Epoch: 0, grad norm: 7.3295, obj: 162.8532, obj smoothness: 162.8532
Epoch: 1, grad norm: 7.3317, obj: 162.8327, obj smoothness: 0.0205
Epoch: 2, grad norm: 7.3339, obj: 162.8121, obj smoothness: 0.0206
Epoch: 3, grad norm: 7.3361, obj: 162.7915, obj smoothness: 0.0206
Epoch: 4, grad norm: 7.3383, obj: 162.7708, obj smoothness: 0.0207
Epoch: 5, grad norm: 7.3406, obj: 162.7500, obj smoothness: 0.0207
Epoch: 6, grad norm: 7.3429, obj: 162.7293, obj smoothness: 0.0208
Epoch: 7, grad norm: 7.3452, obj: 162.7084, obj smoothness: 0.0208
Epoch: 8, grad norm: 7.3475, obj: 162.6875, obj smoothness: 0.0209
Epoch: 9, grad norm: 7.3498, obj: 162.6666, obj smoothness: 0.0210
Epoch: 10, grad norm: 7.3521, obj: 162.6456, obj smoothness: 0.0210
Epoch: 11, grad norm: 7.3545, obj: 162.6245, obj smoothness: 0.0211
Epoch: 12, grad norm: 7.3568, obj: 162.6034, obj smoothness: 0.0211
Epoch: 13, grad norm: 7.3592, obj: 162.5822, obj smoothness: 0.0212
Epoch: 14, grad norm: 7.3616, obj: 162.5609, obj smoothn

In [8]:
X = CNE._ConditionalNetworkEmbedding__emb

In [9]:
from scipy.stats import halfnorm

def get_pij(i,j,s1,s2,prior, X):
    
    p_prior = prior.get_row_probability([i], [j])
    
    normal_s1 = halfnorm.rvs(loc=0,scale=s1,size=1)
    normal_s2 = halfnorm.rvs(loc=0,scale=s2,size=1)
    
    numerator = p_prior * normal_s1
    denom = numerator + (1-p_prior)*normal_s2
    
    return numerator/denom

In [10]:
# x_i = np.array([1,2,3,4,5,6,7,8,9])
# x_j = np.array([0,1,0,0,0,0,0,0,0])
# np.outer(x_i, x_j)
#def get_hessian(i,j,k,P,A):
# P = np.array([[1,2,3],[4,5,6],[7,8,9]])
# A = np.array([[0,1,1],[1,0,0],[1,0,0]])
# print(P)
# print(A)
# print(P-A)

In [11]:
#np.diag((P-A)[~np.eye(A.shape[0], dtype=bool)])
i=0
#identity=[]
s1 = 1
s2 = 1.5
gamma = (1/(s1**2)) - (1/(s2**2))

def get_hessian(i,s1,s2,gamma,X,A):
    
    hessian = np.zeros(shape=(10,10))

    for j in range(A.shape[0]):

        if i != j:

            x_i = X[i,:]
            x_j = X[j,:]

            x_diff = (x_i - x_j).reshape(-1,1)  
            
            prob = get_pij(i,j,1,1.5,prior, X)

            h = (gamma**2) * np.dot(x_diff,x_diff.T) * (prob * (1-prob))

            a = A[i,j]

            p_diff = gamma * (prob - a)[0]

            p_diff_mat = p_diff * np.identity(h.shape[0])

            hessian += p_diff_mat - h
            
    return hessian

In [12]:
i=0
j=1
k=2

hessian = get_hessian(i,s1,s2,gamma,X,A)
pij = get_pij(i=i,j=j,s1=s1,s2=s2,prior=prior, X=X)

invert = (-hessian) / (gamma**2 * (pij) * (1-pij))

hess_inv = np.linalg.inv(-hessian)

x_i = X[i,:]
x_j = X[j,:]
x_k = X[k,:]

xij_diff = (x_i - x_j).reshape(1,-1)

xik_diff = (x_i - x_k)

np.dot(np.dot(xij_diff, hess_inv), xik_diff)

array([-6904.60463691])

In [None]:
#np.dot(np.dot(np.ones(shape=(3,1)), np.ones(shape=(1,3))), np.dot(P, 1-P))
# a = np.dot(P, 1-P)
# np.fill_diagonal(a, 0)
# a

In [None]:
# with tf.GradientTape(persistent=True) as g:
    
#     A = tf.convert_to_tensor(A)

#     head = tf.argmax(A[:,tail_idx, rel_idx])
#     tail = tf.argmax(A[head_idx,:, rel_idx])
#     rel = tf.argmax(A[head_idx,tail_idx,:])
    
#     other_head = tf.argmax(A[:,tail_idx, rel_idx])
#     other_tail = tf.argmax(A[head_idx,:, rel_idx])
#     other_rel = tf.argmax(A[head_idx,tail_idx,:])
    
#     head_e,_,tail_e,_,rel_e= model([head,head,tail,tail,rel])

#     get_score = score(head_e,rel_e,tail_e)
    
# g.gradient(get_score,tail_e)