In [1]:
import networkx as nx
import numpy as np
import matplotlib.cm as cm
import matplotlib.pyplot as plt


class Node:
    """A single vertex of a graph, together with the IDs of the vertices
    it shares an edge with."""

    def __init__(self, ID, neighbors, descriptor, truth=None, file_path=None):
        """Record the identity, adjacency and metadata of one node.

        Parameters
        ----------
        ID : int
            Unique identifier of the node. With N nodes in total it should
            be a value in [0, N-1].

        neighbors : Sequence[int]
            Node-IDs of every node adjacent to this one.

        descriptor : numpy.ndarray
            The shape-(512,) descriptor vector of the face this node stands for.

        truth : Optional[str]
            Optional ground-truth label (for instance "Ryan" for a picture
            of Ryan), kept so the clusters can be checked afterwards.

        file_path : Optional[str]
            Optional path of the image behind this node, kept so the photos
            can be sorted once clustering has run.
        """
        # `id` is the permanent identity of the node and should never change.
        # `label` starts out equal to the ID and is the value that gets
        # updated during the whispers algorithm.
        self.id = self.label = ID

        # Neighbor IDs stored as a tuple: (n1_ID, n2_ID, ...).
        # An empty tuple means the node has no neighbors.
        self.neighbors = tuple(neighbors)
        self.descriptor = descriptor

        # Optional bookkeeping, both default to None.
        self.truth = truth
        self.file_path = file_path


def plot_graph(graph, adj):
    """Draw the graph with networkx, coloring every node by its current label.

    The `tab20b` color map used here only offers 20 distinct colors, so two
    different labels may end up with the same color by coincidence.

    Parameters
    ----------
    graph : Tuple[Node, ...]
        The nodes of the graph; each element should be a `Node` instance.

    adj : numpy.ndarray, shape=(N, N)
        Adjacency matrix of the graph. A positive entry at `adj[i, j]` in the
        upper triangle is drawn as an edge between node i and node j.

    Returns
    -------
    Tuple[matplotlib.figure.Figure, matplotlib.axes.Axes]
        The figure and axes holding the plot.
    """
    num_nodes = len(graph)

    # One networkx node per position in `graph`.
    nx_graph = nx.Graph()
    nx_graph.add_nodes_from(range(num_nodes))

    # The edges are undirected, so the adjacency matrix is expected to be
    # symmetric; reading only its upper triangle adds each edge exactly once.
    rows, cols = np.where(np.triu(adj) > 0)
    nx_graph.add_edges_from(zip(rows, cols))

    # Spring layout: nodes are treated as points in 2D and edges as springs that
    # are allowed to relax, which yields a reasonable (x, y) position per node.
    layout = nx.spring_layout(nx_graph)

    # Map every distinct label to one color, then look up the color of each
    # node in graph order.
    distinct_labels = {member.label for member in graph}
    palette = cm.tab20b(np.linspace(0, 1, len(distinct_labels)))
    label_to_color = dict(zip(sorted(distinct_labels), palette))
    node_colors = [label_to_color[member.label] for member in graph]

    # Render nodes (colored by label) and edges onto a fresh figure.
    fig, ax = plt.subplots()
    nx.draw_networkx_nodes(
        nx_graph,
        pos=layout,
        ax=ax,
        nodelist=range(num_nodes),
        node_color=node_colors,
    )
    nx.draw_networkx_edges(nx_graph, layout, ax=ax, edgelist=nx_graph.edges())
    return fig, ax

In [2]:
import numpy as np
from typing import List

def whispers_algorithm(adj_matrix: np.ndarray, nodes: List["Node"]):
    """Run one pass of the whispers label-propagation update over the graph.

    Every node is visited exactly once, in a uniformly random order. When a
    node is visited, the edge weights to its neighbors are summed per neighbor
    label, and the node adopts the label with the largest total weight. Ties
    are broken uniformly at random. A node without neighbors keeps its label.

    Labels are updated in place, so a node visited later in the pass sees the
    labels already changed earlier in the same pass.

    Parameters
    ----------
    adj_matrix : numpy.ndarray, shape=(N, N)
        Weighted adjacency matrix. ``adj_matrix[i][j]`` is read as the weight
        of the edge between the nodes whose IDs are ``i`` and ``j``.

    nodes : List[Node]
        The nodes of the graph. Each node must expose ``id``, ``label`` and
        ``neighbors`` (an iterable of neighbor IDs); ``label`` is overwritten.

    Returns
    -------
    None
        The result is the mutated ``label`` attribute of the nodes.

    Raises
    ------
    KeyError
        If a node lists a neighbor ID that does not belong to any node in
        ``nodes``.
    """
    # Neighbors are stored as IDs, so an ID -> node lookup is needed to read
    # the neighbor's current label.
    nodes_by_id = {node.id: node for node in nodes}

    # A random permutation visits every node exactly once in random order,
    # without repeatedly re-drawing nodes that were already visited.
    for position in np.random.permutation(len(nodes)):
        node = nodes[position]

        # Total edge weight contributed by each label among the neighbors.
        weight_per_label = {}
        for neighbor_id in node.neighbors:
            neighbor_label = nodes_by_id[neighbor_id].label
            weight_per_label[neighbor_label] = (
                weight_per_label.get(neighbor_label, 0)
                + adj_matrix[node.id][neighbor_id]
            )

        if not weight_per_label:
            continue  # isolated node: nothing to adopt

        # Compare weights against the best *weight* (not the best label), and
        # keep every label that reaches it so ties can be broken at random.
        best_weight = max(weight_per_label.values())
        candidates = [
            label
            for label, weight in weight_per_label.items()
            if weight == best_weight
        ]
        node.label = candidates[np.random.randint(len(candidates))]

In [3]:
def assess_success(clusters, truth):
    """Compute pairwise precision and recall from two aligned node sequences.

    ``clusters[i]`` and ``truth[i]`` are compared element by element on two
    attributes, ``label`` (the assigned cluster) and ``truth`` (the ground
    truth):

    * same ``label`` and same ``truth``      -> correct match (true positive)
    * same ``label``, different ``truth``    -> label-only match (false positive)
    * different ``label``, same ``truth``    -> truth-only match (false negative)

    Pairs that agree on neither attribute do not enter either metric.

    Parameters
    ----------
    clusters : Sequence
        Objects exposing ``label`` and ``truth`` attributes.

    truth : Sequence
        Objects exposing ``label`` and ``truth`` attributes; must be at least
        as long as ``clusters`` (extra elements are ignored).

    Returns
    -------
    Tuple[float, float]
        ``(pairwise_precision, pairwise_recall)`` where precision is
        ``TP / (TP + FP)`` and recall is ``TP / (TP + FN)``. A metric whose
        denominator is zero (e.g. for empty input) is reported as ``0.0``.

    Raises
    ------
    IndexError
        If ``truth`` is shorter than ``clusters``.
    """
    correct_match = 0
    label_match_only = 0
    truth_match_only = 0

    for index, cluster_node in enumerate(clusters):
        truth_node = truth[index]
        same_label = cluster_node.label == truth_node.label
        same_truth = cluster_node.truth == truth_node.truth

        if same_label and same_truth:
            correct_match += 1
        elif same_truth:
            truth_match_only += 1
        elif same_label:
            label_match_only += 1

    # Precision is penalized by false positives (grouped together although the
    # truth differs); recall by false negatives (same truth, split apart).
    predicted_positive = correct_match + label_match_only
    actual_positive = correct_match + truth_match_only

    pairwise_precision = correct_match / predicted_positive if predicted_positive else 0.0
    pairwise_recall = correct_match / actual_positive if actual_positive else 0.0
    return pairwise_precision, pairwise_recall

In [5]:
from networkx.generators.random_graphs import erdos_renyi_graph

# Build a small random graph to experiment with.
# Per the networkx documentation, erdos_renyi_graph(n, p) returns a G(n, p)
# graph: `n` nodes, with each possible edge included independently with
# probability `p`.
n = 6
p = 0.5

# NOTE(review): no `seed` argument is passed, so a different graph is produced
# on every run; pass one if reproducible output is wanted.
g = erdos_renyi_graph(n, p)

In [None]:
from networkx.linalg.