# Diffusion

This notebook illustrates the classification of the nodes of a graph by [diffusion](https://en.wikipedia.org/wiki/Heat_equation), based on the labels of a few nodes.

In [None]:
from IPython.display import SVG

In [None]:
import numpy as np

In [None]:
from sknetwork.data import karate_club, painters, movie_actor
from sknetwork.classification import DiffusionClassifier, get_accuracy_score
from sknetwork.visualization import svg_graph, visualize_bigraph

## Graphs

In [None]:
# Load the karate club dataset with its metadata, then pull out the pieces
# used below: adjacency matrix, node positions and ground-truth labels.
graph = karate_club(metadata=True)
adjacency, position, labels_true = graph.adjacency, graph.position, graph.labels

In [None]:
# Only two nodes (0 and 33) keep their true label; they act as the known labels.
labels = {node: labels_true[node] for node in (0, 33)}

In [None]:
# Create the diffusion classifier with its default settings.
diffusion = DiffusionClassifier()
# Fit on the adjacency matrix using the known labels, and get the predicted labels.
labels_pred = diffusion.fit_predict(adjacency, labels)

In [None]:
# Compare the predictions with the ground truth and show the score
# rounded to two decimals.
accuracy = get_accuracy_score(labels_true, labels_pred)
np.round(accuracy, decimals=2)

In [None]:
# Draw the graph with the predicted labels; the nodes whose label was
# given are passed as seeds.
image = svg_graph(
    adjacency,
    position,
    labels=labels_pred,
    seeds=labels,
)
SVG(image)

In [None]:
# Probability distribution over labels, as estimated by the classifier fitted above.
# NOTE(review): presumably one row per node and one column per label — confirm
# against the library documentation.
probs = diffusion.predict_proba()

In [None]:
# Show the probabilities as the output of this notebook cell.
probs

In [None]:
# Keep column 1 of the probabilities, i.e. the scores associated with label 1.
scores = probs[:, 1]

In [None]:
# Draw the graph again, this time with the label-1 scores instead of the
# predicted labels; the nodes whose label was given are passed as seeds.
image = svg_graph(
    adjacency,
    position,
    scores=scores,
    seeds=labels,
)
SVG(image)

## Directed graphs

In [None]:
# Load the painters dataset with its metadata, then pull out the adjacency
# matrix, the node positions and the node names.
graph = painters(metadata=True)
adjacency, position, names = graph.adjacency, graph.position, graph.names

In [None]:
# Node indices of the two painters whose label is given.
rembrandt, cezanne = 5, 11

# Known labels: Cezanne gets label 0, Rembrandt gets label 1.
labels = {
    cezanne: 0,
    rembrandt: 1,
}

In [None]:
# Create a fresh diffusion classifier with its default settings.
diffusion = DiffusionClassifier()
# Fit on the painters adjacency matrix using the two known labels, and get the predicted labels.
labels_pred = diffusion.fit_predict(adjacency, labels)

In [None]:
# Draw the painters graph with node names and predicted labels; the two
# painters whose label was given are passed as seeds.
image = svg_graph(
    adjacency,
    position,
    names=names,
    labels=labels_pred,
    seeds=labels,
)
SVG(image)

In [None]:
# Probability distribution over labels, as estimated by the classifier fitted
# on the painters graph.
# NOTE(review): presumably one row per node and one column per label — confirm
# against the library documentation.
probs = diffusion.predict_proba()

In [None]:
# Keep column 0 of the probabilities, i.e. the scores associated with label 0
# (the label assigned to Cezanne in the known labels).
scores = probs[:, 0]

In [None]:
# Draw the painters graph with the label-0 scores; Cezanne, the node that
# was given label 0, is the only seed passed to the drawing.
image = svg_graph(
    adjacency,
    position,
    names=names,
    scores=scores,
    seeds=[cezanne],
)
SVG(image)

## Bipartite graphs

In [None]:
# Load the movie-actor dataset with its metadata, then pull out the
# biadjacency matrix and the names of its rows and columns.
graph = movie_actor(metadata=True)
biadjacency = graph.biadjacency
names_row, names_col = graph.names_row, graph.names_col

In [None]:
# Row indices of the two entries whose label is given.
inception, drive = 0, 3

In [None]:
# Known labels for two rows of the biadjacency matrix.
labels_row = {
    inception: 0,
    drive: 1,
}

In [None]:
# Fit a fresh classifier on the bipartite graph using the known row labels.
diffusion = DiffusionClassifier()
diffusion.fit(biadjacency, labels_row)

# Read the labels stored on the fitted classifier for rows and for columns.
labels_row_pred, labels_col_pred = diffusion.labels_row_, diffusion.labels_col_

In [None]:
# Draw the bipartite graph with the labels read from the classifier on both
# sides; the rows whose label was given are passed as seeds.
image = visualize_bigraph(
    biadjacency,
    names_row,
    names_col,
    labels_row_pred,
    labels_col_pred,
    seeds_row=labels_row,
)
SVG(image)

In [None]:
# Probability distributions over labels from the classifier fitted on the
# bipartite graph: the default call is used for the rows, columns=True for
# the columns.
probs_row = diffusion.predict_proba()
probs_col = diffusion.predict_proba(columns=True)

In [None]:
# Column 1 of each distribution: the probability of label 1,
# for the rows and for the columns respectively.
scores_row, scores_col = probs_row[:, 1], probs_col[:, 1]

In [None]:
# Draw the bipartite graph again, this time with the label-1 scores of rows
# and columns; the rows whose label was given are passed as seeds.
image = visualize_bigraph(
    biadjacency,
    names_row,
    names_col,
    scores_row=scores_row,
    scores_col=scores_col,
    seeds_row=labels_row,
)
SVG(image)
