# Propagation

This notebook illustrates the clustering of a graph by [label propagation](https://en.wikipedia.org/wiki/Label_propagation_algorithm).

In [None]:
from IPython.display import SVG

In [None]:
import numpy as np

In [None]:
from sknetwork.data import karate_club, painters, movie_actor
from sknetwork.clustering import PropagationClustering, get_modularity
from sknetwork.linalg import normalize
from sknetwork.utils import get_membership
from sknetwork.visualization import visualize_graph, visualize_bigraph

## Graphs

In [None]:
# Load the karate club dataset with its metadata and keep the two fields
# used below: the adjacency matrix and the node positions for plotting.
graph = karate_club(metadata=True)
adjacency, position = graph.adjacency, graph.position

In [None]:
# Cluster the graph by label propagation (default parameters):
# fit the algorithm on the adjacency matrix and keep the labels it returns.
propagation = PropagationClustering()
labels = propagation.fit_predict(adjacency)

In [None]:
# distinct labels and the number of occurrences of each one in `labels`
labels_unique, counts = np.unique(labels, return_counts=True)
print(labels_unique, counts)

In [None]:
# Draw the graph at the stored node positions, passing the cluster labels
# to the visualization, and display the resulting SVG in the notebook.
image = visualize_graph(adjacency, position, labels=labels)
SVG(image)

In [None]:
# quality metric: modularity of the clustering given by `labels`
get_modularity(adjacency, labels)

In [None]:
# aggregate graph, read from the fitted model
# NOTE(review): presumably one node per cluster — confirm against the sknetwork docs
adjacency_aggregate = propagation.aggregate_

In [None]:
# Positions of the aggregate nodes, derived from the positions of the original nodes.
# NOTE(review): get_membership(labels) presumably returns a node-by-cluster indicator
# matrix and normalize presumably rescales each row to sum to 1, so that `average`
# maps node positions to per-cluster mean positions — confirm against the sknetwork docs.
average = normalize(get_membership(labels).T)
position_aggregate = average.dot(position)
# distinct labels and the number of occurrences of each one in `labels`
labels_unique, counts = np.unique(labels, return_counts=True)

In [None]:
# Draw the aggregate graph. The label counts are passed twice on purpose:
# as node names (so each count is written next to its node) and as node weights.
image = visualize_graph(
    adjacency_aggregate,
    position_aggregate,
    names=counts,
    labels=labels_unique,
    display_node_weight=True,
    node_weights=counts,
)
SVG(image)

In [None]:
# probability distribution over clusters, obtained from the fitted model
# (indexed below as a 2-D array whose columns are clusters)
probs = propagation.predict_proba()

In [None]:
# scores for cluster 1: column 1 of the probability matrix
scores = probs[:, 1]

In [None]:
# Draw the graph again, this time passing the cluster-1 scores instead of labels.
image = visualize_graph(adjacency, position, scores=scores)
SVG(image)

## Directed graphs

In [None]:
# Load the painters dataset with its metadata and keep the fields used below:
# the adjacency matrix, the node positions for plotting and the node names.
graph = painters(metadata=True)
adjacency, position = graph.adjacency, graph.position
names = graph.names

In [None]:
# Same procedure as for the first graph: fit label propagation (default
# parameters) on the adjacency matrix and keep the labels it returns.
propagation = PropagationClustering()
labels = propagation.fit_predict(adjacency)

In [None]:
# distinct labels and the number of occurrences of each one in `labels`
labels_unique, counts = np.unique(labels, return_counts=True)
print(labels_unique, counts)

In [None]:
# Draw the graph with node names, passing the cluster labels to the
# visualization, and display the resulting SVG in the notebook.
image = visualize_graph(adjacency, position, names=names, labels=labels)
SVG(image)

In [None]:
# quality metric: modularity of the clustering given by `labels`
get_modularity(adjacency, labels)

In [None]:
# aggregate graph, read from the fitted model
# NOTE(review): presumably one node per cluster — confirm against the sknetwork docs
adjacency_aggregate = propagation.aggregate_

In [None]:
# Positions of the aggregate nodes, derived from the positions of the original nodes.
# NOTE(review): get_membership(labels) presumably returns a node-by-cluster indicator
# matrix and normalize presumably rescales each row to sum to 1, so that `average`
# maps node positions to per-cluster mean positions — confirm against the sknetwork docs.
average = normalize(get_membership(labels).T)
position_aggregate = average.dot(position)
# distinct labels and the number of occurrences of each one in `labels`
labels_unique, counts = np.unique(labels, return_counts=True)

In [None]:
# Draw the aggregate graph. The label counts are passed twice on purpose:
# as node names (so each count is written next to its node) and as node weights.
image = visualize_graph(
    adjacency_aggregate,
    position_aggregate,
    names=counts,
    labels=labels_unique,
    display_node_weight=True,
    node_weights=counts,
)
SVG(image)

In [None]:
# probability distribution over clusters, obtained from the fitted model
# (indexed below as a 2-D array whose columns are clusters)
probs = propagation.predict_proba()

In [None]:
# scores for cluster 1: column 1 of the probability matrix
scores = probs[:, 1]

In [None]:
# Draw the graph with the cluster-1 scores. The node names are passed as well,
# as in the label view of this graph, so that individual nodes stay
# identifiable when reading the scores.
image = visualize_graph(adjacency, position, names=names, scores=scores)
SVG(image)

## Bipartite graphs

In [None]:
# Load the movie-actor dataset with its metadata and keep the fields used
# below: the biadjacency matrix and the names of its rows and columns.
graph = movie_actor(metadata=True)
biadjacency = graph.biadjacency
names_row, names_col = graph.names_row, graph.names_col

In [None]:
# Fit label propagation (default parameters) on the biadjacency matrix, then
# read the labels of rows and columns from the fitted model's attributes.
propagation = PropagationClustering()
propagation.fit(biadjacency)
labels_row = propagation.labels_row_
labels_col = propagation.labels_col_

In [None]:
# Draw the bipartite graph with the names and cluster labels of both
# rows and columns, and display the resulting SVG in the notebook.
image = visualize_bigraph(
    biadjacency,
    names_row=names_row,
    names_col=names_col,
    labels_row=labels_row,
    labels_col=labels_col,
)
SVG(image)

In [None]:
# quality metric: modularity of the clustering, given the row and column labels
get_modularity(biadjacency, labels_row, labels_col)

In [None]:
# aggregate graph, read from the fitted model
# NOTE(review): presumably an aggregate biadjacency matrix between clusters — confirm against the sknetwork docs
biadjacency_aggregate = propagation.aggregate_

In [None]:
# distinct labels and the number of occurrences of each one, for rows and for columns
labels_unique_row, counts_row = np.unique(labels_row, return_counts=True)
labels_unique_col, counts_col = np.unique(labels_col, return_counts=True)

In [None]:
# Draw the aggregate bipartite graph. The label counts are passed twice on
# purpose: as node names (so each count is written next to its node) and as
# node weights, for rows and columns alike.
image = visualize_bigraph(
    biadjacency_aggregate,
    names_row=counts_row,
    names_col=counts_col,
    labels_row=labels_unique_row,
    labels_col=labels_unique_col,
    display_node_weight=True,
    node_weights_row=counts_row,
    node_weights_col=counts_col,
)
SVG(image)

In [None]:
# probability distribution over clusters, obtained from the fitted model:
# the default call is stored for the rows, the call with columns=True for the columns
probs_row = propagation.predict_proba()
probs_col = propagation.predict_proba(columns=True)