Commit

Code release for camera-ready

lgalke committed Apr 24, 2019
0 parents commit 6a1ddf0
Showing 15 changed files with 1,068 additions and 0 deletions.
1 change: 1 addition & 0 deletions .gitignore
@@ -0,0 +1 @@
__pycache__/
71 changes: 71 additions & 0 deletions README.md
@@ -0,0 +1,71 @@
# Code for evaluating graph neural nets with unseen nodes after pretraining

**Paper:** L Galke, I Vagliano, A Scherp: *Can Graph Neural Networks Go "Online"? An Analysis of Pretraining and Inference*, RLGM@ICLR2019.

A link to the paper will follow soon.

## Requirements

- For the evaluation script (`evaluate.py`): python3, torch, dgl, pandas
- For the visualization script (`visualize.py`): matplotlib, seaborn


```sh
pip install -r requirements.txt
```
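
The `requirements.txt` file itself is not shown in this commit view; judging from the packages listed above, it presumably contains entries along these lines (version pins, if any, are unknown):

```
torch
dgl
pandas
matplotlib
seaborn
```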

## Reproducing our experiments

We provide a convenience script for re-generating all the results from the paper.

```sh
./trigger.bash
```

## Running your own experiments

The pretraining/inference experiments can be conducted with the `evaluate.py` script:

```sh
usage: evaluate.py [-h] [--dataset DATASET] [--model MODEL] [--runs RUNS]
                   [--inference INFERENCE] [--invert] [--outfile OUTFILE]
                   [--epochs EPOCHS] [--no-cuda] [--info]

optional arguments:
  -h, --help            show this help message and exit
  --dataset DATASET     The input dataset.
  --model MODEL         Specify model
  --runs RUNS           Number of random reruns
  --inference INFERENCE
                        Number of inference epochs
  --invert              Invert train and test set
  --outfile OUTFILE     Dump Results to outfile
  --epochs EPOCHS       Number of training epochs
  --no-cuda             Force no cuda
```
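
For example, a single run could be launched as follows (the flag values here are illustrative, not prescribed by the paper):

```sh
python3 evaluate.py --dataset cora --model GCN --runs 10 --epochs 200 --inference 32 --outfile results.csv
```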

For running batches of experiments, see the example in `trigger.bash`.

## Visualizing results

We provide a script to visualize the results generated by `evaluate.py`.
The script should be called on the results file specified by `--outfile`:

```sh
python3 visualize.py results.txt
```

## Adding new models

New models should be implemented as subclasses of `nn.Module` and implement
`forward` as `forward(features)`, where `features` are the node features. They
additionally need to provide a method `set_graph(g)`, where `g` is a
`DGLGraph` instance; this method is called between the pretraining and the
inference epochs. Finally, new models need to be registered along with their
hyperparameters and optimizers in `factory.py`.
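
As an illustration, a minimal sketch of a conforming model is shown below. The class name `MyModel` and its internals are hypothetical; only the `forward(features)` and `set_graph(g)` contract is fixed by the evaluation code:

```python
import torch.nn as nn
import torch.nn.functional as F


class MyModel(nn.Module):
    """Hypothetical example model satisfying the required interface."""

    def __init__(self, g, in_feats, n_hidden, n_classes):
        super().__init__()
        self.g = g  # train graph at pretraining time; replaced via set_graph
        self.layer1 = nn.Linear(in_feats, n_hidden)
        self.layer2 = nn.Linear(n_hidden, n_classes)

    def set_graph(self, g):
        # Called between pretraining and inference to swap in the full graph
        self.g = g

    def forward(self, features):
        h = F.relu(self.layer1(features))
        return self.layer2(h)
```

Such a model would then get its own branch in `build_model` (and, if needed, `build_optimizer`) in `factory.py`, analogous to the existing models.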
13 changes: 13 additions & 0 deletions check.py
@@ -0,0 +1,13 @@
#!/usr/bin/env python3
""" This tiny script checks how many rows are there per dataset/setting/model/pretraining config in full results file """
import pandas as pd
import sys
ROWS_PER_RUN = 33
data = pd.read_csv(sys.argv[1])
for key, group in data.groupby(["dataset", "setting", "model","pretraining"]):
print("Runs for", key, ":", (group.count()/ROWS_PER_RUN).mean())

# sns.relplot(x="epoch", y="accuracy", kind='line', col='dataset', row='setting', data=data, hue="model", style="pretraining", markers=False, ci="sd")
# plt.savefig(sys.argv[1] + '.png')


222 changes: 222 additions & 0 deletions evaluate.py
@@ -0,0 +1,222 @@
import argparse
import math
import time
import dgl
import dgl.function as fn
import torch
import torch.nn as nn
import torch.nn.functional as F
import numpy as np
import pandas as pd
from dgl import DGLGraph
from dgl.data import register_data_args, load_data


from factory import build_model, build_optimizer
from gcn import gcn_norm


def calc_accuracy(logits, true_labels):
    __max_vals, max_indices = torch.max(logits, 1)
    acc = (max_indices == true_labels).sum().float() / true_labels.size(0)
    return acc.item()


def eval_inference(epoch, net, features, labels, mask):
    """
    Evaluates the net on the (full) graph and calculates the
    loss and accuracy for `mask`, which is usually the test set mask
    """
    with torch.no_grad():
        net.eval()
        dev_logits = net(features)
        dev_logp = F.log_softmax(dev_logits, 1)
        dev_loss = F.nll_loss(dev_logp[mask], labels[mask])
        accuracy_score = calc_accuracy(dev_logp[mask], labels[mask])
    print("Epoch {:05d} | Test Loss {:.4f} | Test Accuracy {:.4f}"
          .format(epoch, dev_loss.detach().item(), accuracy_score))
    return accuracy_score


def train_epoch(epoch,
                net,
                optimizer,
                features,
                labels,
                train_mask=None):
    net.train()
    logits = net(features)

    if train_mask is not None:
        # If mask is given, only optimize on the respective labels
        task_loss = F.cross_entropy(logits[train_mask], labels[train_mask])
    else:
        # No mask is given, optimize on all
        task_loss = F.cross_entropy(logits, labels)

    optimizer.zero_grad()
    task_loss.backward()
    optimizer.step()
    print("Epoch {:05d} | Task Loss: {:.4f}".format(epoch, task_loss.detach().item()))


def appendDFToCSV_void(df, csvFilePath, sep=","):
    """ Safe appending of a pandas df to csv file
    Source: https://stackoverflow.com/questions/17134942/pandas-dataframe-output-end-of-csv
    """
    import os
    if not os.path.isfile(csvFilePath):
        df.to_csv(csvFilePath, mode='a', index=False, sep=sep)
    elif len(df.columns) != len(pd.read_csv(csvFilePath, nrows=1, sep=sep).columns):
        raise Exception("Columns do not match!! Dataframe has " + str(len(df.columns)) + " columns. CSV file has " + str(len(pd.read_csv(csvFilePath, nrows=1, sep=sep).columns)) + " columns.")
    elif not (df.columns == pd.read_csv(csvFilePath, nrows=1, sep=sep).columns).all():
        raise Exception("Columns and column order of dataframe and csv file do not match!!")
    else:
        df.to_csv(csvFilePath, mode='a', index=False, sep=sep, header=False)

def main(args):
    column_headers = ["dataset",
                      "setting",
                      "model",
                      "pretraining",
                      "epoch",
                      "accuracy"]
    use_cuda = args.use_cuda and torch.cuda.is_available()
    print("Using CUDA:", use_cuda)

    results_df = pd.DataFrame(columns=column_headers)

    data = load_data(args)
    features = torch.FloatTensor(data.features)
    labels = torch.LongTensor(data.labels)
    train_mask = torch.ByteTensor(data.train_mask)
    val_mask = torch.ByteTensor(data.val_mask)
    test_mask = torch.ByteTensor(data.test_mask)
    in_feats = features.shape[1]
    n_classes = data.num_labels

    # We don't use a validation set
    train_mask = train_mask | val_mask

    if args.invert:
        # This is different from swapping train and test mask,
        # because train | test does not cover the whole dataset
        train_mask, test_mask = ~train_mask, train_mask
        setting = 'B'
    else:
        setting = 'A'

    g = dgl.DGLGraph(data.graph)
    # Suppress warning
    g.set_n_initializer(dgl.init.zero_initializer)
    # Add self loops
    g.add_edges(g.nodes(), g.nodes())

    # g_train, g = split_graph(g, train_mask)
    # Select train nodes ..
    train_nodes = torch.arange(g.number_of_nodes())[train_mask]
    if use_cuda:
        features, labels = features.cuda(), labels.cuda()
        train_mask, test_mask = train_mask.cuda(), test_mask.cuda()
        train_nodes = train_nodes.cuda()

    # .. to induce the train subgraph
    g_train = g.subgraph(train_nodes)
    g_train.set_n_initializer(dgl.init.zero_initializer)
    features_train = features[train_mask]
    labels_train = labels[train_mask]

    # Verify sizes of the train set
    assert int(train_mask.sum().item()) == features_train.size(0)\
        == labels_train.size(0) == g_train.number_of_nodes()

    # Random Restarts
    for __ in range(args.runs):
        # Init net
        net = build_model(args.model, args.dataset, g_train, in_feats, n_classes)
        if use_cuda:
            net = net.cuda()
        print(net)

        # Init optimizer
        # optimizer = torch.optim.Adam(net.parameters(),
        #                              **training_optimizer_params)
        optimizer = build_optimizer(net.parameters(),
                                    args.model,
                                    args.dataset,
                                    inference=False)
        print("Optimizer", optimizer)

        # Pre-training
        for epoch in range(args.epochs):
            train_epoch(epoch + 1, net, optimizer,
                        features_train, labels_train,
                        train_mask=None  # Use all labels of the *train* subgraph
                        )

        print("=== INFERENCE ===")
        net.set_graph(g)
        # Eval without inference epochs
        accuracy_score = eval_inference(0, net, features, labels, test_mask)
        results_df = results_df.append(
            pd.DataFrame([[args.dataset, setting, args.model, args.epochs, 0, accuracy_score]],
                         columns=column_headers), ignore_index=True
        )

        # Fresh optimizer for up-training at inference time
        # optimizer = torch.optim.Adam(net.parameters(),
        #                              **inference_optimizer_params)
        del optimizer
        optimizer = build_optimizer(net.parameters(),
                                    args.model,
                                    args.dataset,
                                    inference=True)

        print("Fresh inference optimizer", optimizer)
        for i in range(args.inference):
            train_epoch(i + 1, net, optimizer,
                        features, labels,
                        train_mask=train_mask)

            accuracy_score = eval_inference(i + 1, net, features, labels, test_mask)
            results_df = results_df.append(
                pd.DataFrame([[args.dataset, setting, args.model, args.epochs, i + 1, accuracy_score]],
                             columns=column_headers), ignore_index=True
            )
        del net
        del optimizer
        torch.cuda.empty_cache()  # don't leak here

    print(args)
    for i in range(args.inference + 1):
        # Print results to the command line
        rbi = results_df[results_df['epoch'] == i]['accuracy']
        print("Avg accuracy over {} runs after {} inference epochs: {:.4f} ({:.4f})".format(args.runs, i, rbi.mean(), rbi.std()))

    if args.outfile is not None:
        # And store them to a csv file
        appendDFToCSV_void(results_df, args.outfile, sep=",")


if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    register_data_args(parser)
    parser.add_argument('--model', type=str, help="Specify model")
    parser.add_argument('--runs', default=1, type=int,
                        help="Number of random reruns")
    parser.add_argument('--inference', default=0, type=int,
                        help="Number of inference epochs")
    parser.add_argument('--invert', default=False, action='store_true',
                        help="Invert train and test set")
    parser.add_argument('--outfile', default=None, type=str,
                        help="Dump Results to outfile")
    parser.add_argument('--epochs', default=200, type=int,
                        help="Number of training epochs")
    parser.add_argument('--no-cuda', dest='use_cuda', default=True,
                        action='store_false',
                        help="Force no cuda")
    args = parser.parse_args()
    print(args)
    main(args)
61 changes: 61 additions & 0 deletions factory.py
@@ -0,0 +1,61 @@
import torch
import torch.nn.functional as F

from gat import GAT
from gcn import GCN
from mlp import MLP
from graphsage import GraphSAGE

def build_model(model_key, dataset, g, in_feats, n_classes):
    """
    Returns a model instance based on --model command-line arg and dataset
    """
    if model_key == 'MLP':
        return MLP(in_feats, 64, n_classes, 1, F.relu, 0.5)
    elif model_key == 'GCN':
        return GCN(g, in_feats, 16, n_classes, 1, F.relu, 0.5)
    elif model_key == 'GCN-64':
        return GCN(g, in_feats, 64, n_classes, 1, F.relu, 0.5)
    elif model_key == 'GAT':
        # Default args from paper
        num_heads = 8
        num_out_heads = 8 if dataset == 'pubmed' else 1
        num_layers = 1  # one *hidden* layer
        heads = ([num_heads] * num_layers) + [num_out_heads]
        return GAT(g,
                   num_layers,
                   in_feats,
                   8,  # hidden units per layer
                   n_classes,
                   heads,
                   F.elu,  # activation fun
                   0.6,  # feat dropout
                   0.6,  # attn dropout
                   0.2,  # negative slope for leakyrelu
                   False  # Use residual connections
                   )
    elif model_key == 'GraphSAGE':
        return GraphSAGE(g, in_feats, 16, n_classes, 1, F.relu, 0.5, "mean")

    # Add more models here
    raise ValueError("Invalid model key")

def build_optimizer(parameters, model_key, dataset, inference=False):
    """
    Returns an optimizer instance based on --model command-line arg and dataset
    """
    # The inference flag is currently unused, as we use the same optimizer
    # params for inference as we do for training
    if model_key == 'GAT':
        lr = 0.01 if dataset == 'pubmed' else 0.005
        weight_decay = 0.001 if dataset == 'pubmed' else 0.0005
        return torch.optim.Adam(parameters, lr=lr, weight_decay=weight_decay)
    elif model_key == 'GraphSAGE':
        lr = 1e-2
        wd = 5e-4
        return torch.optim.Adam(parameters, lr=lr, weight_decay=wd)

    # Default optimizer (used for GCNs and MLPs)
    lr = 0.005
    weight_decay = 5e-4
    return torch.optim.Adam(parameters, lr=lr, weight_decay=weight_decay)
