<a href="https://colab.research.google.com/github/dlf1/hello-world/blob/master/Untitled2.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [49]:

!pip install -q torch-scatter -f https://pytorch-geometric.com/whl/torch-1.8.0+cu101.html
!pip install -q torch-sparse -f https://pytorch-geometric.com/whl/torch-1.8.0+cu101.html
!pip install -q torch-geometric


%matplotlib inline
import matplotlib.pyplot as plt
from sklearn.manifold import TSNE

def visualize(h, color, epoch=None, loss=None):
    """Draw a graph with a fixed spring layout, colouring nodes by ``color``.

    Args:
        h: The graph to draw. When ``h`` is a ``networkx.Graph`` it is drawn
            directly; otherwise the function falls back to a notebook-level
            variable ``G`` (the behaviour of the earlier version, which
            ignored ``h`` entirely).
        color: Per-node colours, forwarded as ``node_color`` and mapped
            through the "Set2" colormap.
        epoch: Currently unused; kept so existing calls keep working.
        loss: Currently unused; kept so existing calls keep working.

    Raises:
        NameError: If ``h`` is not a ``networkx.Graph`` and no global ``G``
            has been defined.
    """
    # Imported here because the notebook never imports networkx at the top
    # level, which made every call fail with NameError on `nx`.
    import networkx as nx

    # Prefer the graph that was actually passed in; only rely on the global
    # `G` when the argument is not a graph (backward-compatible fallback).
    graph = h if isinstance(h, nx.Graph) else G

    plt.figure(figsize=(7, 7))
    plt.xticks([])
    plt.yticks([])

    # seed=42 keeps the layout identical across re-runs.
    layout = nx.spring_layout(graph, seed=42)
    nx.draw_networkx(graph, pos=layout, with_labels=False,
                     node_color=color, cmap="Set2")
    plt.show()

In [32]:
import torch
from torch_geometric.datasets import TUDataset

# Load the MUTAG collection; files are stored under data/TUDataset.
dataset = TUDataset(root='data/TUDataset', name='MUTAG')

# --- Dataset-level summary -------------------------------------------------
print()
print(f'Dataset: {dataset}:')
print('====================')
graph_count = len(dataset)
print(f'Number of graphs: {graph_count}')
print(f'Number of features: {dataset.num_features}')
print(f'Number of classes: {dataset.num_classes}')

# --- First graph in the collection -----------------------------------------
data = dataset[0]

print()
print(data)
print('=============================================================')

# Basic structural statistics of that first graph.
node_count = data.num_nodes
edge_count = data.num_edges
print(f'Number of nodes: {node_count}')
print(f'Number of edges: {edge_count}')
print(f'Average node degree: {edge_count / node_count:.2f}')
print(f'Contains isolated nodes: {data.contains_isolated_nodes()}')
print(f'Contains self-loops: {data.contains_self_loops()}')
print(f'Is undirected: {data.is_undirected()}')

Downloading https://www.chrsmrrs.com/graphkerneldatasets/MUTAG.zip
Extracting data/TUDataset/MUTAG/MUTAG.zip
Processing...
Done!

Dataset: MUTAG(188):
Number of graphs: 188
Number of features: 7
Number of classes: 2

Data(edge_attr=[38, 4], edge_index=[2, 38], x=[17, 7], y=[1])
Number of nodes: 17
Number of edges: 38
Average node degree: 2.24
Contains isolated nodes: False
Contains self-loops: False
Is undirected: True


In [34]:
from torch_geometric.data import DataLoader

# Train/test split. `train_dataset` / `test_dataset` were previously used here
# without being defined in any cell, so a fresh "Restart & Run All" failed.
# The sizes reproduce the split recorded in this notebook's saved output
# (150 training graphs, 38 test graphs).
NUM_TRAIN_GRAPHS = 150

torch.manual_seed(12345)  # fixed seed so the shuffle (and thus the split) is repeatable
shuffled_dataset = dataset.shuffle()  # new name: keeps this cell idempotent on re-run
train_dataset = shuffled_dataset[:NUM_TRAIN_GRAPHS]
test_dataset = shuffled_dataset[NUM_TRAIN_GRAPHS:]

print(f'Number of training graphs: {len(train_dataset)}')
print(f'Number of test graphs: {len(test_dataset)}')

# Mini-batch loaders: training batches are reshuffled, test order is fixed.
train_loader = DataLoader(train_dataset, batch_size=64, shuffle=True)
test_loader = DataLoader(test_dataset, batch_size=64, shuffle=False)

# Peek at every training batch to see how graphs are collated together.
for step, data in enumerate(train_loader):
    print(f'Step {step + 1}:')
    print('=======')
    print(f'Number of graphs in the current batch: {data.num_graphs}')
    print(data)
    print()

Step 1:
Number of graphs in the current batch: 64
Batch(batch=[1185], edge_attr=[2624, 4], edge_index=[2, 2624], ptr=[65], x=[1185, 7], y=[64])

Step 2:
Number of graphs in the current batch: 64
Batch(batch=[1146], edge_attr=[2538, 4], edge_index=[2, 2538], ptr=[65], x=[1146, 7], y=[64])

Step 3:
Number of graphs in the current batch: 22
Batch(batch=[383], edge_attr=[832, 4], edge_index=[2, 832], ptr=[23], x=[383, 7], y=[22])



In [41]:
from torch.nn import Linear
import torch.nn.functional as F
from torch_geometric.nn import GCNConv
from torch_geometric.nn import global_mean_pool


class GCN(torch.nn.Module):
    """Graph-level classifier: three GCNConv layers, mean pooling, linear head.

    Args:
        hidden_channels: Output width of each of the three GCNConv layers.
        in_channels: Size of the input node features. Defaults to
            ``dataset.num_node_features`` of the notebook-level ``dataset``.
        out_channels: Number of output logits. Defaults to
            ``dataset.num_classes`` of the notebook-level ``dataset``.
    """

    def __init__(self, hidden_channels, in_channels=None, out_channels=None):
        super().__init__()
        # Seed the global torch RNG before any layer is constructed.
        torch.manual_seed(12345)

        # Fall back to the notebook-global dataset only when sizes are not
        # given explicitly, so the model can be built for other datasets
        # without rebinding `dataset`.
        if in_channels is None:
            in_channels = dataset.num_node_features
        if out_channels is None:
            out_channels = dataset.num_classes

        self.conv1 = GCNConv(in_channels, hidden_channels)
        self.conv2 = GCNConv(hidden_channels, hidden_channels)
        self.conv3 = GCNConv(hidden_channels, hidden_channels)
        self.lin = Linear(hidden_channels, out_channels)

    def forward(self, x, edge_index, batch):
        """Compute one row of class logits per graph.

        Args:
            x: Node features fed to the first convolution.
            edge_index: Graph connectivity, passed to every convolution.
            batch: Passed to ``global_mean_pool`` to group node embeddings
                into per-graph embeddings.

        Returns:
            The output of the final linear layer applied to the pooled
            (and, in training mode, dropout-regularised) embeddings.
        """
        # 1. Node embeddings: ReLU after the first two convolutions only;
        #    the third convolution's output is pooled without an activation.
        x = self.conv1(x, edge_index)
        x = x.relu()
        x = self.conv2(x, edge_index)
        x = x.relu()
        x = self.conv3(x, edge_index)

        # 2. Readout: average node embeddings per graph.
        x = global_mean_pool(x, batch)

        # 3. Classifier head; dropout is only active while self.training is True.
        x = F.dropout(x, p=0.5, training=self.training)
        x = self.lin(x)

        return x

# Build the classifier with 64 hidden channels and print its layer summary.
model = GCN(hidden_channels=64)
print(model)

GCN(
  (conv1): GCNConv(7, 64)
  (conv2): GCNConv(64, 64)
  (conv3): GCNConv(64, 64)
  (lin): Linear(in_features=64, out_features=2, bias=True)
)


In [42]:
from IPython.display import Javascript
# Colab-specific JavaScript call; NOTE(review): appears to limit this cell's
# output frame to a maximum height of 300 so the long epoch log scrolls — confirm.
display(Javascript("google.colab.output.setIframeHeight(0, true, {maxHeight: 300})"))

# Re-create the network so that re-running this cell restarts training from
# freshly initialised weights, then set up the loss and the optimiser.
model = GCN(hidden_channels=64)
criterion = torch.nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(params=model.parameters(), lr=0.01)

def train():
    """Run one pass over ``train_loader``, updating the global ``model``.

    Uses the notebook-level ``model``, ``criterion`` and ``optimizer``.
    Returns nothing.
    """
    model.train()  # training mode: the dropout in the model's forward pass is active

    for batch in train_loader:
        logits = model(batch.x, batch.edge_index, batch.batch)  # forward pass
        batch_loss = criterion(logits, batch.y)                 # loss against the graph labels
        batch_loss.backward()                                   # accumulate gradients
        optimizer.step()                                        # apply the parameter update
        optimizer.zero_grad()                                   # reset gradients for the next batch

def test(loader):
    """Return the accuracy of the global ``model`` over every batch in ``loader``.

    Args:
        loader: Iterable of batches exposing ``x``, ``edge_index``, ``batch``
            and ``y``; must also expose ``loader.dataset`` whose length is the
            total number of examples.

    Returns:
        Fraction of examples whose arg-max prediction equals the label.
    """
    model.eval()  # evaluation mode: dropout is disabled

    correct = 0
    # Gradients are never used during evaluation; disabling autograd avoids
    # building a computation graph for every batch.
    with torch.no_grad():
        for data in loader:
            out = model(data.x, data.edge_index, data.batch)
            pred = out.argmax(dim=1)  # index of the highest logit per row
            correct += int((pred == data.y).sum())  # count matches with the labels
    return correct / len(loader.dataset)


# Train for 200 epochs; after each one, report accuracy on both splits.
for epoch in range(1, 201):
    train()
    # Evaluated left to right: training split first, then the held-out split.
    train_acc, test_acc = test(train_loader), test(test_loader)
    print(f'Epoch: {epoch:03d}, Train Acc: {train_acc:.4f}, Test Acc: {test_acc:.4f}')

<IPython.core.display.Javascript object>

Epoch: 001, Train Acc: 0.6467, Test Acc: 0.7368
Epoch: 002, Train Acc: 0.6467, Test Acc: 0.7368
Epoch: 003, Train Acc: 0.6467, Test Acc: 0.7368
Epoch: 004, Train Acc: 0.6467, Test Acc: 0.7368
Epoch: 005, Train Acc: 0.6600, Test Acc: 0.7368
Epoch: 006, Train Acc: 0.7467, Test Acc: 0.7632
Epoch: 007, Train Acc: 0.7200, Test Acc: 0.7632
Epoch: 008, Train Acc: 0.7267, Test Acc: 0.7895
Epoch: 009, Train Acc: 0.7333, Test Acc: 0.7632
Epoch: 010, Train Acc: 0.7267, Test Acc: 0.7895
Epoch: 011, Train Acc: 0.7333, Test Acc: 0.7895
Epoch: 012, Train Acc: 0.7333, Test Acc: 0.7895
Epoch: 013, Train Acc: 0.7467, Test Acc: 0.7895
Epoch: 014, Train Acc: 0.7467, Test Acc: 0.8158
Epoch: 015, Train Acc: 0.7533, Test Acc: 0.7895
Epoch: 016, Train Acc: 0.7533, Test Acc: 0.7368
Epoch: 017, Train Acc: 0.7533, Test Acc: 0.8158
Epoch: 018, Train Acc: 0.7400, Test Acc: 0.7632
Epoch: 019, Train Acc: 0.7533, Test Acc: 0.7632
Epoch: 020, Train Acc: 0.7600, Test Acc: 0.8158
Epoch: 021, Train Acc: 0.7600, Test Acc:

NameError: ignored

Number of training graphs: 150
Number of test graphs: 38


Step 1:
Number of graphs in the current batch: 1
Batch(batch=[19793], edge_index=[2, 126842], ptr=[2], x=[19793, 8710], y=[19793])



GCN(
  (conv1): GCNConv(8710, 64)
  (conv2): GCNConv(64, 64)
  (conv3): GCNConv(64, 64)
  (lin): Linear(in_features=64, out_features=70, bias=True)
)


<IPython.core.display.Javascript object>

ValueError: ignored