pyg-team · rusty1s · Aug 23, 2022 · Aug 23, 2022 · Aug 29, 2022 · Aug 29, 2022
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -5,6 +5,7 @@ The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/).
 
 ## [2.2.0] - 2022-MM-DD
 ### Added
+- Added a benchmark for heterogeneous GNN execution ([#5265](https://github.com/pyg-team/pytorch_geometric/pull/5265))
 - Added `SparseTensor` support to inference benchmark suite ([#5242](https://github.com/pyg-team/pytorch_geometric/pull/5242), [#5258](https://github.com/pyg-team/pytorch_geometric/pull/5258))
 - Added experimental mode in inference benchmarks ([#5254](https://github.com/pyg-team/pytorch_geometric/pull/5254))
 - Added node classification example instrumented with [Weights and Biases (W&B) logging](https://wandb.com) and [W&B Sweeps](https://wandb.com/sweeps) ([#5192](https://github.com/pyg-team/pytorch_geometric/pull/5192))

@@ -0,0 +1,203 @@
+import argparse
+import time
+from collections import defaultdict
+
+import dgl
+import pyg_lib
+import torch
+
+from torch_geometric import seed_everything
+from torch_geometric.datasets import FakeHeteroDataset
+from torch_geometric.nn import MessagePassing
+
+# Seed shared by the data generation and by every benchmarked layer.
+SEED = 12345
+
+# Command-line options controlling the synthetic graph and the timing loop.
+parser = argparse.ArgumentParser()
+parser.add_argument('--num_node_types', type=int, default=30)
+parser.add_argument('--num_edge_types', type=int, default=60)
+parser.add_argument('--avg_num_nodes', type=int, default=400)
+parser.add_argument('--avg_degree', type=int, default=10)
+parser.add_argument('--channels', type=int, default=64)
+parser.add_argument('--device', type=str, default='cpu')
+# `--warmup` is added to `--iterations` to form a loop bound, so it has to be
+# parsed as an integer; a string value would raise a `TypeError` there.
+parser.add_argument('--warmup', type=int, default=10)
+parser.add_argument('--iterations', type=int, default=100)
+
+
+class SequentialRGCN(MessagePassing):
+    """Relational convolution that processes one edge type at a time.
+
+    Each edge type gets its own sum-aggregating propagation, followed by a
+    matrix product with that edge type's `(channels, channels)` weight.
+    Results that land on the same destination node type are added together.
+    """
+    def __init__(self, num_edge_types, channels):
+        super().__init__(aggr='sum')
+        # Re-seed right before sampling so the weights depend only on `SEED`
+        # and the requested shape.
+        torch.manual_seed(SEED)
+        self.register_buffer(
+            'weight',
+            torch.randn(num_edge_types, channels, channels),
+        )
+
+    def forward(self, x_dict, edge_index_dict):
+        """Return a dict mapping destination node types to their outputs.
+
+        The i-th entry of `edge_index_dict` (in iteration order) is paired
+        with `self.weight[i]`. Node types that never occur as a destination
+        are absent from the returned dict.
+        """
+        per_dst = defaultdict(list)
+        typed_edges = edge_index_dict.items()
+        for rel, ((src, _, dst), edge_index) in enumerate(typed_edges):
+            feats = (x_dict[src], x_dict[dst])
+            aggregated = self.propagate(edge_index, x=feats)
+            per_dst[dst].append(aggregated @ self.weight[rel])
+
+        # Add up the contributions of all edge types per destination type.
+        return {
+            dst: torch.stack(parts, dim=0).sum(dim=0)
+            for dst, parts in per_dst.items()
+        }
+
+
+class VerticalRGCN(MessagePassing):
+    """Relational convolution that stacks edge types along the target axis.
+
+    Destination indices are shifted by `num_nodes * edge_type`, so a single
+    propagation call produces a separate block of aggregated features for
+    every edge type. The blocks are multiplied with their weights in one
+    batched product and then summed over edge types.
+
+    Reference: https://arxiv.org/pdf/2107.10015.pdf
+    """
+    def __init__(self, num_edge_types, channels):
+        super().__init__(aggr='sum')
+        # Re-seed right before sampling so the weights depend only on `SEED`
+        # and the requested shape.
+        torch.manual_seed(SEED)
+        self.register_buffer(
+            'weight',
+            torch.randn(num_edge_types, channels, channels),
+        )
+
+    def forward(self, x, edge_index, edge_type):
+        """Return one output row per input row of `x`.
+
+        `x` is indexed as `(num_nodes, num_features)`, `edge_index` has a
+        source row and a destination row, and `edge_type` is combined
+        element-wise with the destination row.
+        """
+        num_nodes, num_feats = x.size(0), x.size(1)
+        num_rels = self.weight.size(0)
+
+        # Shift a copy so the caller's `edge_index` stays untouched.
+        shifted = edge_index.clone()
+        shifted[1] += num_nodes * edge_type
+
+        stacked = self.propagate(
+            shifted,
+            x=x,
+            size=(num_nodes, num_rels * num_nodes),
+        )
+
+        # (num_rels * num_nodes, F) -> (num_rels, num_nodes, F), then apply
+        # every edge type's weight at once and reduce over edge types.
+        stacked = stacked.view(num_rels, num_nodes, num_feats)
+        return (stacked @ self.weight).sum(dim=0)
+
+
+class HorizontalRGCN(MessagePassing):
+    """Relational convolution that stacks edge types along the source axis.
+
+    The input is first multiplied with every edge type's weight, giving one
+    transformed copy of the features per edge type. Source indices are
+    shifted by `num_nodes * edge_type` so that each edge reads from the copy
+    belonging to its type, and one sum-aggregating propagation finishes the
+    computation.
+
+    Reference: https://arxiv.org/pdf/2107.10015.pdf
+    """
+    def __init__(self, num_edge_types, channels):
+        super().__init__(aggr='sum')
+        # Re-seed right before sampling so the weights depend only on `SEED`
+        # and the requested shape.
+        torch.manual_seed(SEED)
+        self.register_buffer(
+            'weight',
+            torch.randn(num_edge_types, channels, channels),
+        )
+
+    def forward(self, x, edge_index, edge_type):
+        """Return the aggregated features for the `x.size(0)` target nodes.
+
+        `x` is indexed as `(num_nodes, num_features)`, `edge_index` has a
+        source row and a destination row, and `edge_type` is combined
+        element-wise with the source row.
+        """
+        num_nodes, num_feats = x.size(0), x.size(1)
+        num_rels = self.weight.size(0)
+
+        # Shift a copy so the caller's `edge_index` stays untouched.
+        shifted = edge_index.clone()
+        shifted[0] += num_nodes * edge_type
+
+        # Broadcasting against the weight stack yields (num_rels, N, F),
+        # which is flattened to (num_rels * N, F) to serve as source features.
+        transformed = x.view(1, num_nodes, num_feats) @ self.weight
+        transformed = transformed.view(num_rels * num_nodes, num_feats)
+
+        return self.propagate(
+            shifted,
+            x=transformed,
+            size=(num_rels * num_nodes, num_nodes),
+        )
+
+
+class DGLTypedRGCN(MessagePassing):
+    """Relational convolution whose per-edge transform is delegated to
+    `dgl.ops.segment_mm`, followed by sum aggregation."""
+    def __init__(self, num_edge_types, channels):
+        super().__init__(aggr='sum')
+        # Re-seed right before sampling so the weights depend only on `SEED`
+        # and the requested shape.
+        torch.manual_seed(SEED)
+        self.register_buffer(
+            'weight',
+            torch.randn(num_edge_types, channels, channels),
+        )
+
+    def forward(self, x, edge_index, edge_sizes):
+        """Propagate `x` along `edge_index`, handing `edge_sizes` through to
+        `message`."""
+        out = self.propagate(edge_index, x=x, edge_sizes=edge_sizes)
+        return out
+
+    def message(self, x_j, edge_sizes):
+        """Transform the gathered source features with the typed weights.
+
+        NOTE(review): presumably the rows of `x_j` must be grouped by edge
+        type, with `edge_sizes` giving the length of each group -- confirm
+        against the DGL documentation.
+        """
+        transformed = dgl.ops.segment_mm(x_j, self.weight, edge_sizes)
+        return transformed
+
+
+class CutlassTypedRGCN(MessagePassing):
+    """Relational convolution whose per-edge transform is delegated to
+    `pyg_lib.ops.segment_matmul`, followed by sum aggregation."""
+    def __init__(self, num_edge_types, channels):
+        super().__init__(aggr='sum')
+        # Re-seed right before sampling so the weights depend only on `SEED`
+        # and the requested shape.
+        torch.manual_seed(SEED)
+        self.register_buffer(
+            'weight',
+            torch.randn(num_edge_types, channels, channels),
+        )
+
+    def forward(self, x, edge_index, edge_type_ptr):
+        """Propagate `x` along `edge_index`, handing `edge_type_ptr` through
+        to `message`."""
+        out = self.propagate(edge_index, x=x, edge_type_ptr=edge_type_ptr)
+        return out
+
+    def message(self, x_j, edge_type_ptr):
+        """Transform the gathered source features with the typed weights.
+
+        NOTE(review): presumably `edge_type_ptr` marks the boundaries of
+        contiguous per-edge-type row groups in `x_j` -- confirm against the
+        pyg-lib documentation.
+        """
+        transformed = pyg_lib.ops.segment_matmul(
+            x_j,
+            edge_type_ptr,
+            self.weight,
+        )
+        return transformed
+
+
+def _synchronize(device):
+    """Wait for pending CUDA work, but only if `device` is a CUDA device."""
+    if torch.device(device).type == 'cuda':
+        torch.cuda.synchronize()
+
+
+def _benchmark(conv, inputs, warmup, iterations, device):
+    """Time `iterations` forward passes of `conv` after `warmup` untimed ones.
+
+    Prints `"{conv}: {seconds}"` and returns the output of the last forward
+    pass (`None` if no pass was executed at all).
+    """
+    out = None
+    for _ in range(warmup):
+        out = conv(*inputs)
+
+    # Synchronize on both sides of the timed region so that asynchronously
+    # launched kernels are attributed to the right interval.
+    _synchronize(device)
+    start = time.perf_counter()
+    for _ in range(iterations):
+        out = conv(*inputs)
+    _synchronize(device)
+    elapsed = time.perf_counter() - start
+
+    print(f'{conv}: {elapsed}')
+    return out
+
+
+if __name__ == '__main__':
+    args = parser.parse_args()
+    print(args)
+
+    # Coerce defensively so that a string-valued option cannot break the
+    # loop bounds below.
+    timing = dict(
+        warmup=int(args.warmup),
+        iterations=int(args.iterations),
+        device=args.device,
+    )
+
+    seed_everything(SEED)
+    dataset = FakeHeteroDataset(
+        num_graphs=1,
+        num_node_types=args.num_node_types,
+        num_edge_types=args.num_edge_types,
+        avg_num_nodes=args.avg_num_nodes,
+        avg_degree=args.avg_degree,
+    )
+    hetero_data = dataset[0].to(args.device)
+    # Replace the generated features so every node type has `channels` dims.
+    for node_type in hetero_data.node_types:
+        store = hetero_data[node_type]
+        x = torch.randn(store.num_nodes, args.channels, device=args.device)
+        store.x = x
+    homo_data = hetero_data.to_homogeneous()
+    # `minlength` keeps one entry per edge type even when trailing edge types
+    # happen to have no edges.
+    edge_sizes = homo_data.edge_type.bincount(
+        minlength=args.num_edge_types).cpu()
+    edge_type_ptr = torch.ops.torch_sparse.ind2ptr(
+        homo_data.edge_type,
+        args.num_edge_types,
+    )
+
+    conv = SequentialRGCN(args.num_edge_types, args.channels).to(args.device)
+    out_dict = _benchmark(
+        conv,
+        (hetero_data.x_dict, hetero_data.edge_index_dict),
+        **timing,
+    )
+    # Concatenate in node-type order and fill node types that received no
+    # messages with zeros, so that the rows can be compared one-to-one with
+    # the homogeneous outputs below.
+    # NOTE(review): assumes `to_homogeneous()` stacks nodes in
+    # `hetero_data.node_types` order -- confirm.
+    out1 = torch.cat([
+        out_dict[node_type] if node_type in out_dict else
+        hetero_data[node_type].x.new_zeros(
+            hetero_data[node_type].num_nodes, args.channels)
+        for node_type in hetero_data.node_types
+    ])
+
+    homo_inputs = (homo_data.x, homo_data.edge_index)
+
+    conv = VerticalRGCN(args.num_edge_types, args.channels).to(args.device)
+    out2 = _benchmark(conv, homo_inputs + (homo_data.edge_type, ), **timing)
+
+    conv = HorizontalRGCN(args.num_edge_types, args.channels).to(args.device)
+    out3 = _benchmark(conv, homo_inputs + (homo_data.edge_type, ), **timing)
+
+    conv = DGLTypedRGCN(args.num_edge_types, args.channels).to(args.device)
+    out4 = _benchmark(conv, homo_inputs + (edge_sizes, ), **timing)
+
+    conv = CutlassTypedRGCN(args.num_edge_types, args.channels).to(args.device)
+    out5 = _benchmark(conv, homo_inputs + (edge_type_ptr, ), **timing)
+
+    # All variants share the same weights and must agree numerically.
+    assert torch.allclose(out1, out2, atol=1e-4)
+    assert torch.allclose(out2, out3, atol=1e-4)
+    assert torch.allclose(out3, out4, atol=1e-4)
+    assert torch.allclose(out4, out5, atol=1e-4)
@@ -189,6 +189,7 @@ def generate_data(self) -> HeteroData:
 
         iterator = zip(self.node_types, self.num_channels)
         for i, (node_type, num_channels) in enumerate(iterator):
+            # TODO: Generate num_nodes // len(node_types)
             num_nodes = get_num_nodes(self.avg_num_nodes, self.avg_degree)
 
             store = data[node_type]
@@ -204,6 +205,7 @@ def generate_data(self) -> HeteroData:
         for (src, rel, dst) in self.edge_types:
             store = data[(src, rel, dst)]
 
+            # TODO: Generate avg_degree // len(edge_types)
             store.edge_index = get_edge_index(
                 data[src].num_nodes,
                 data[dst].num_nodes,