In [None]:
from companykg import CompanyKG

## Initialize CompanyKG

In [None]:
# Folder handed to CompanyKG as its data_root_folder.
DATA_ROOT_FOLDER = "./data"

# This may take a long time if the data files have not been downloaded yet.
comkg = CompanyKG(
    nodes_feature_type="msbert",
    load_edges_weights=True,
    data_root_folder=DATA_ROOT_FOLDER,
)

In [None]:
# Count the nodes: comkg.nodes_id holds the node IDs, so its length is the number of nodes
len(comkg.nodes_id)

## Inspect CompanyKG

In [None]:
# Show the important information about the data loaded into comkg
comkg.describe()

In [None]:
# Node features, ordered the same way as comkg.nodes_id
comkg.nodes_feature

In [None]:
# Edges of the loaded graph
comkg.edges

In [None]:
# Edge weights (load_edges_weights=True was passed when comkg was created)
comkg.edges_weight

## Inspect Evaluation Data

In [None]:
# SP evaluation samples: item [1] of the "sp" entry in comkg.eval_tasks
comkg.eval_tasks["sp"][1]

In [None]:
# SR evaluation samples: item [1] of the "sr" entry in comkg.eval_tasks
comkg.eval_tasks["sr"][1]

In [None]:
# CR evaluation samples: item [1] of the "cr" entry in comkg.eval_tasks
comkg.eval_tasks["cr"][1]

## Evaluate Node Feature

In [None]:
# Run all evaluation tasks on the node feature loaded in comkg;
# the results are kept in eval_results and inspected in the cells below
eval_results = comkg.evaluate()

In [None]:
# Show AUC score for SP task (evaluation of the loaded node feature)
eval_results["sp_auc"]

In [None]:
# Show test accuracy for SR task (evaluation of the loaded node feature)
eval_results["sr_test_acc"]

In [None]:
# Show validation accuracy for SR task (evaluation of the loaded node feature)
eval_results["sr_validation_acc"]

In [None]:
# Show Top-K Hit Rate for CR task (evaluation of the loaded node feature)
eval_results["cr_topk_hit_rate"]

## Evaluate Saved Embedding

In [None]:
# Run all evaluation tasks on the specified embeddings saved in torch.Tensor format.
# The path is derived from DATA_ROOT_FOLDER so it stays in sync with the folder given
# to CompanyKG; with DATA_ROOT_FOLDER = "./data" it is "./data/nodes_feature_msbert.pt".

EMBEDDINGS_FILE = f"{DATA_ROOT_FOLDER}/nodes_feature_msbert.pt"

# Note: this replaces the eval_results produced by the earlier comkg.evaluate() call.
eval_results = comkg.evaluate(embeddings_file=EMBEDDINGS_FILE)

In [None]:
# Show AUC score for SP task (evaluation of the embeddings in EMBEDDINGS_FILE)
eval_results["sp_auc"]

In [None]:
# Show test accuracy for SR task (evaluation of the embeddings in EMBEDDINGS_FILE)
eval_results["sr_test_acc"]

In [None]:
# Show validation accuracy for SR task (evaluation of the embeddings in EMBEDDINGS_FILE)
eval_results["sr_validation_acc"]

In [None]:
# Show Top-K Hit Rate for CR task (evaluation of the embeddings in EMBEDDINGS_FILE)
eval_results["cr_topk_hit_rate"]

## Create DGL Graph

In [None]:
# Build the DGL graph. This takes about 15 mins; the graph will be saved to work_folder
g = comkg.get_dgl_graph(work_folder="./experiments")
g

In [None]:
# Calling the same function again loads the graph directly from the saved file
g = comkg.get_dgl_graph(work_folder="./experiments")
g

## Create iGraph

In [None]:
# Create the iGraph representation of the loaded data.
# Note: this rebinds `g`, replacing the DGL graph assigned in the previous cells.
g = comkg.to_igraph()
g