In [1]:
import torch
import numpy as np
import os
from torch_geometric.data import Data

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
# Dataset selection: every input file is read from ../data/<data_name>/.
data_name = 'cora'
attributes_file_name, labels_file_name, valid_file_name = (
    os.path.join('../data', data_name, file_stem)
    for file_stem in ('attributes', 'labels', 'valid_nodes')
)

# Attribute table, parsed with np.loadtxt's default (float) dtype.
features = np.loadtxt(attributes_file_name)
# Only column 1 of the labels file is kept as the label vector.
# NOTE(review): column 0 is presumably the node id -- confirm against the data files.
labels = np.loadtxt(labels_file_name, dtype=np.int64)[:, 1]
# Integer entries of the 'valid_nodes' file, loaded as int64.
valid_all_nodes_list = np.loadtxt(valid_file_name, dtype=np.int64)

# Test

In [3]:
from data_handler import update_viewed_training_nodes_and_edges, generate_graph

In [4]:
stream_edges_dir_name = os.path.join('../data', data_name, 'stream_edges')
# Number of stream files replayed below; they are opened by name '0' .. '13'.
NUM_TIMESTEPS = 14

# Running state: starts as None and is replaced by the helper's return value
# on every timestep.
viewed_training_nodes, viewed_training_edges = None, None
for t in range(NUM_TIMESTEPS):
    # ndmin=2 keeps the edge array two-dimensional (one row per edge) even when
    # a stream file contains a single line; np.int64 matches the dtype used for
    # the labels and valid-node arrays loaded earlier.
    coming_edges = np.loadtxt(
        os.path.join(stream_edges_dir_name, str(t)), dtype=np.int64, ndmin=2)
    viewed_training_nodes, viewed_training_edges = update_viewed_training_nodes_and_edges(
            coming_edges, viewed_training_nodes, viewed_training_edges, valid_all_nodes_list)
    graph = generate_graph(viewed_training_nodes, viewed_training_edges, features, labels)
    print(f"At timestep {t}, graph structure is: {graph}\n")
    print(f"Number of total viewed training nodes is {len(viewed_training_nodes)}.\n")
    # Rows of viewed_training_edges are counted as edges.
    print(f"Number of total viewed training edges is {viewed_training_edges.shape[0]}.\n")
    # Separator line of 30 dashes between timesteps.
    print('-' * 30)

At timestep 0, graph structure is: Data(x=[522, 1433], edge_index=[2, 1056], y=[522], num_nodes=522)

Number of total viewed training nodes is 522.

Number of total viewed training edges is 528.

------------------------------
At timestep 1, graph structure is: Data(x=[772, 1433], edge_index=[2, 1584], y=[772], num_nodes=772)

Number of total viewed training nodes is 772.

Number of total viewed training edges is 792.

------------------------------
At timestep 2, graph structure is: Data(x=[901, 1433], edge_index=[2, 1924], y=[901], num_nodes=901)

Number of total viewed training nodes is 901.

Number of total viewed training edges is 962.

------------------------------
At timestep 3, graph structure is: Data(x=[933, 1433], edge_index=[2, 2022], y=[933], num_nodes=933)

Number of total viewed training nodes is 933.

Number of total viewed training edges is 1011.

------------------------------
At timestep 4, graph structure is: Data(x=[1083, 1433], edge_index=[2, 2478], y=[1083], num

# Valid set included

In [5]:
from data_handler import update_viewed_all_nodes_and_edges, generate_whole_graph

In [6]:
stream_edges_dir_name = os.path.join('../data', data_name, 'stream_edges')
# Number of stream files replayed below; they are opened by name '0' .. '13'.
NUM_TIMESTEPS = 14

# Running state: starts as None and is replaced by the helper's return value
# on every timestep.
viewed_all_nodes, viewed_all_edges = None, None
for t in range(NUM_TIMESTEPS):
    # ndmin=2 keeps the edge array two-dimensional (one row per edge) even when
    # a stream file contains a single line; np.int64 matches the dtype used for
    # the labels and valid-node arrays loaded earlier.
    coming_edges = np.loadtxt(
        os.path.join(stream_edges_dir_name, str(t)), dtype=np.int64, ndmin=2)
    viewed_all_nodes, viewed_all_edges = update_viewed_all_nodes_and_edges(
            coming_edges, viewed_all_nodes, viewed_all_edges)
    # generate_whole_graph also returns the valid nodes reported below.
    graph, valid_nodes = generate_whole_graph(
        viewed_all_nodes, viewed_all_edges, valid_all_nodes_list, features, labels)
    print(f"At timestep {t}, graph structure is: {graph}\n")
    print(f"Number of all viewed nodes / edges is {len(viewed_all_nodes)} / {viewed_all_edges.shape[0]}.\n")
    print(f"Number of viewed valid nodes is {len(valid_nodes)}.\n")
    # Separator line of 30 dashes between timesteps.
    print('-' * 30)

At timestep 0, graph structure is: Data(x=[735, 1433], edge_index=[2, 2168], y=[735], num_nodes=735)

Number of all viewed nodes / edges is 735 / 1084.

Number of viewed valid nodes is 213.

------------------------------
At timestep 1, graph structure is: Data(x=[1097, 1433], edge_index=[2, 3326], y=[1097], num_nodes=1097)

Number of all viewed nodes / edges is 1097 / 1663.

Number of viewed valid nodes is 325.

------------------------------
At timestep 2, graph structure is: Data(x=[1270, 1433], edge_index=[2, 3900], y=[1270], num_nodes=1270)

Number of all viewed nodes / edges is 1270 / 1950.

Number of viewed valid nodes is 369.

------------------------------
At timestep 3, graph structure is: Data(x=[1319, 1433], edge_index=[2, 4104], y=[1319], num_nodes=1319)

Number of all viewed nodes / edges is 1319 / 2052.

Number of viewed valid nodes is 386.

------------------------------
At timestep 4, graph structure is: Data(x=[1533, 1433], edge_index=[2, 4966], y=[1533], num_nodes=15