In [1]:
from models import GCN
from dgl.data import CoraGraphDataset, CiteseerGraphDataset, PubmedGraphDataset
import torch.nn as nn
import torch
import torch.nn.functional as F
import dgl
from time import perf_counter

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
# Run configuration: hyperparameters and shared objects that later cells read as globals.
device = 'cpu'  # target handed to g.to(device) when the graph is loaded
activation = nn.ReLU()  # activation module passed to the GCN constructor
epochs = 50  # number of iterations of the loop inside train()
batch_size = 10000  # NOTE(review): not referenced in the visible cells — confirm it is still needed
lr = 0.02  # learning rate given to the Adam optimizer
loss_fn = nn.CrossEntropyLoss()  # loss applied to the training-mask logits in train()
weight_decay = 5e-4  # weight_decay argument given to the Adam optimizer

In [3]:
# Load the Pubmed dataset and take the graph stored at index 0.
data = PubmedGraphDataset()
g = data[0]
g = g.to(device)

# Node-level tensors stored on the graph: input features, class labels and
# the boolean masks selecting the train / validation / test nodes.
features = g.ndata['feat']
labels = g.ndata['label']
train_mask = g.ndata['train_mask']
val_mask = g.ndata['val_mask']
test_mask = g.ndata['test_mask']

# Model dimensions derived from the data.
in_feats = features.shape[-1]
# `num_classes` is the documented attribute; `num_labels` is its deprecated alias.
n_classes = data.num_classes
# Edge count is taken here, i.e. before the self-loop rewrite below.
n_edges = g.number_of_edges()

# Remove any existing self-loops before adding them back, so a node that
# already had one does not end up with a duplicate.
g = dgl.remove_self_loop(g)
g = dgl.add_self_loop(g)

  NumNodes: 19717
  NumEdges: 88651
  NumFeats: 500
  NumClasses: 3
  NumTrainingSamples: 60
  NumValidationSamples: 500
  NumTestSamples: 1000
Done loading data from cached files.




In [4]:
# Build the GCN and place it on the same device as the graph (the graph is
# moved with g.to(device) when it is loaded); without this, switching `device`
# away from 'cpu' would leave model and inputs on different devices.
# NOTE(review): 16 and 2 are presumably the hidden size and layer count —
# confirm against models.GCN.
model = GCN(in_feats, 16, n_classes, 2, activation, dropout=0.2).to(device)
# The optimizer is created after the move so it tracks the parameters on `device`.
optimizer = torch.optim.Adam(model.parameters(), lr=lr, weight_decay=weight_decay)

In [5]:
def _masked_accuracy(logits, labels, mask):
    """Return the fraction of nodes selected by ``mask`` whose argmax prediction equals the label."""
    correct = torch.sum(logits[mask].argmax(1) == labels[mask]).item()
    return correct / mask.sum().item()


def train(model, g, features, labels, train_mask, val_mask, test_mask):
    """Train ``model`` on the whole graph and print metrics after every epoch.

    The loop runs for the module-level ``epochs`` and uses the module-level
    ``loss_fn`` and ``optimizer``. Each epoch performs one optimisation step
    on the nodes selected by ``train_mask``, then re-evaluates the model in
    eval mode and prints the training loss together with the train /
    validation / test accuracy. The elapsed wall-clock time of the whole loop
    (evaluation and printing included) is printed at the end.

    Args:
        model: callable as ``model(g, features)`` returning per-node logits.
        g: graph passed through to the model.
        features: node feature tensor passed through to the model.
        labels: per-node class labels.
        train_mask: mask selecting the nodes used for the loss.
        val_mask: mask selecting the validation nodes.
        test_mask: mask selecting the test nodes.

    Returns:
        None. Results are reported via ``print`` only.
    """
    t = perf_counter()
    for epoch in range(epochs):
        # Optimisation step on the training nodes only.
        model.train()
        logits = model(g, features)
        loss = loss_fn(logits[train_mask], labels[train_mask])
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # Evaluation does not need gradients; disabling autograd avoids
        # building a computation graph that is never back-propagated.
        model.eval()
        with torch.no_grad():
            logits = model(g, features)
            train_acc = _masked_accuracy(logits, labels, train_mask)
            val_acc = _masked_accuracy(logits, labels, val_mask)
            test_acc = _masked_accuracy(logits, labels, test_mask)
        # The reported loss is the one computed before this epoch's optimizer step.
        print(f'Epoch {epoch + 1:02d}, Loss: {loss.item():.4f}, Train: {train_acc:.4f}, Val: {val_acc:.4f}, Test: {test_acc:.4f}')

    training_time = perf_counter()-t
    print(f'Training time: {training_time:.4f}s')

In [6]:
# Kick off training on the prepared graph, tensors and split masks.
train(
    model=model,
    g=g,
    features=features,
    labels=labels,
    train_mask=train_mask,
    val_mask=val_mask,
    test_mask=test_mask,
)

Epoch 01, Loss: 1.1006, Train: 0.4000, Val: 0.4280, Test: 0.4280
Epoch 02, Loss: 1.0948, Train: 0.6333, Val: 0.4880, Test: 0.4730
Epoch 03, Loss: 1.0880, Train: 0.6833, Val: 0.4880, Test: 0.4700
Epoch 04, Loss: 1.0773, Train: 0.6000, Val: 0.4300, Test: 0.4020
Epoch 05, Loss: 1.0663, Train: 0.6333, Val: 0.4740, Test: 0.4490
Epoch 06, Loss: 1.0530, Train: 0.7000, Val: 0.5780, Test: 0.5770
Epoch 07, Loss: 1.0391, Train: 0.8000, Val: 0.6460, Test: 0.6270
Epoch 08, Loss: 1.0251, Train: 0.8000, Val: 0.6640, Test: 0.6510
Epoch 09, Loss: 1.0073, Train: 0.8333, Val: 0.6840, Test: 0.6610
Epoch 10, Loss: 0.9921, Train: 0.8333, Val: 0.6940, Test: 0.6670
Epoch 11, Loss: 0.9719, Train: 0.8333, Val: 0.6940, Test: 0.6690
Epoch 12, Loss: 0.9593, Train: 0.8500, Val: 0.7020, Test: 0.6680
Epoch 13, Loss: 0.9308, Train: 0.8667, Val: 0.7060, Test: 0.6740
Epoch 14, Loss: 0.9193, Train: 0.8833, Val: 0.7140, Test: 0.6770
Epoch 15, Loss: 0.9046, Train: 0.8833, Val: 0.7060, Test: 0.6810
Epoch 16, Loss: 0.8678, T