In [1]:
import time
import numpy as np
import math
import random
from random import randrange
from copy import copy, deepcopy

The file contains the adjacency list representation of a simple undirected graph. There are 200 vertices labeled 1 to 200. The first column in the file represents the vertex label, and the particular row (other entries except the first column) tells all the vertices that the vertex is adjacent to. So for example, the 6th row looks like : "6	155	56	52	120	......". This just means that the vertex with label 6 is adjacent to (i.e., shares an edge with) the vertices with labels 155,56,52,120,......,etc

Your task is to code up and run the randomized contraction algorithm for the min cut problem and use it on the above graph to compute the min cut. (HINT: Note that you'll have to figure out an implementation of edge contractions. Initially, you might want to do this naively, creating a new graph from the old every time there's an edge contraction. But you should also think about more efficient implementations.) (WARNING: As per the video lectures, please make sure to run the algorithm many times with different random seeds, and remember the smallest cut that you ever find.) Write your numeric answer in the space provided. So e.g., if your answer is 5, just type 5 in the space provided.


<img src="week4_file/week4_ilustration.png" style="width: 750px">
The process corresponding to the diagram is as follows:

First picture: 

G = {1 : [(1,2),(1,3)], 2 : [(2,1),(2,3),(2,4)], 3 : [(3,1),(3,2),(3,4)], 4:[(4,2),(4,3)]} 

edges = [(1,2),(1,3),(2,1),(2,3),(2,4),(3,1),(3,2),(3,4),(4,2),(4,3)]

Pick edge (1,3) to contract.

Second picture:

G = {1 : [(1,2),(1,3),(3,2),(3,4)], 2 : [(2,1),(2,3),(2,4)], 4:[(4,2),(4,3)]} 

(3,1) is not included because it is a self-loop (1 and 3 are now connected); this is checked by the line `if not cuts.connected(w,j): G[w].append((i,j))`.

edges choice = [(1,2),(2,1),(2,3),(2,4),(3,2),(3,4),(4,2),(4,3)]

(1,3) and (3,1) can no longer be chosen because vertices 1 and 3 are now connected, so both edges are self-loops.

Third picture:

G = {1 : [(1,2),(1,3),(3,2),(3,4),(2,4)], 4:[(4,2),(4,3)]} 

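(2,1) and (2,3) are excluded because their endpoints 1 and 3 are already connected to the merged vertex 1, i.e. `cuts.connected(1,1)` and `cuts.connected(1,3)` are both true.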

edges choice = [(2,4),(3,4),(4,2),(4,3)]
 

In [2]:
class UnionFind:
    """Weighted quick-union with path compression.

    Elements are the integers ``0 .. n-1``.  ``_id[k]`` is the parent of
    ``k`` (a root is its own parent) and ``_sz[r]`` is the number of
    elements in the tree rooted at ``r``.

    The original Java implementation is introduced at
    https://www.cs.princeton.edu/~rs/AlgsDS07/01UnionFind.pdf

    >>> uf = UnionFind(10)
    >>> for (p, q) in [(3, 4), (4, 9), (8, 0), (2, 3), (5, 6), (5, 9),
    ...                (7, 3), (4, 8), (6, 1)]:
    ...     uf.union(p, q)
    >>> uf._id
    [8, 3, 3, 3, 3, 3, 3, 3, 3, 3]
    >>> uf.connected(0, 1)
    True
    >>> uf._id
    [3, 3, 3, 3, 3, 3, 3, 3, 3, 3]
    """

    def __init__(self, n):
        """Create ``n`` singleton sets, one per integer in ``0 .. n-1``."""
        self._id = list(range(n))
        self._sz = [1] * n

    def find(self, i):
        """Return the root of the set containing ``i``.

        While walking up, each visited node is re-pointed at its
        grandparent, which shortens the path for later lookups.
        """
        j = i
        while j != self._id[j]:
            self._id[j] = self._id[self._id[j]]
            j = self._id[j]
        return j

    def connected(self, p, q):
        """Return True when ``p`` and ``q`` belong to the same set."""
        return self.find(p) == self.find(q)

    def union(self, p, q):
        """Merge the sets containing ``p`` and ``q`` (no-op if already merged).

        The root of the smaller tree is attached below the root of the
        larger one; on a tie the root of ``p`` becomes the new root.
        """
        i = self.find(p)
        j = self.find(q)
        if i == j:
            return
        if self._sz[i] < self._sz[j]:
            self._id[i] = j
            self._sz[j] += self._sz[i]
        else:
            self._id[j] = i
            self._sz[i] += self._sz[j]

In [3]:
def read_input(filename):
    """Load an adjacency-list file from the ``week4_file/`` directory.

    Each non-blank line holds whitespace-separated integers: a vertex
    label followed by the labels of its neighbours.

    Returns a pair ``(G, edges)`` where ``G`` maps each vertex ``v`` to a
    list of ``(v, u)`` tuples, and ``edges`` is the flat list of all such
    tuples in file order.
    """
    G = {}
    edges = []
    with open('week4_file/'+filename) as f:
        for raw in f:
            fields = raw.split()
            if not fields:
                # blank line: nothing to record
                continue
            v, *neighbours = map(int, fields)
            G[v] = [(v, u) for u in neighbours]
            edges.extend(G[v])
    return G,edges

In [4]:
def contract(G,edges,cuts,edge_index):
    """Contract the next usable edge of ``edges`` and update ``G`` in place.

    Starting at ``edge_index``, edges are consumed until one is found whose
    endpoints lie in different components of ``cuts``; those components are
    then merged.  The adjacency list of the absorbed root is appended to the
    surviving root's list (dropping entries whose far endpoint is already in
    the merged component) and the absorbed key is deleted from ``G``.

    Returns the index of the first edge not yet examined.
    """
    merged = False
    while not merged:
        a, b = edges[edge_index]
        edge_index += 1
        u = cuts.find(a)
        v = cuts.find(b)
        # an edge inside one component is a self-loop: skip it
        if not cuts.connected(u, v):
            cuts.union(u, v)
            merged = True

    # root of the freshly merged component
    w = cuts.find(u)

    # fold every old root that did not survive into w (v is checked first)
    for absorbed in (v, u):
        if absorbed != w:
            for edge in G[absorbed]:
                if not cuts.connected(w, edge[1]):
                    G[w].append(edge)
            del G[absorbed]

    return edge_index

In [5]:
def karger_min_cut(G,edges):
    """Run one trial of the random contraction algorithm.

    ``G`` maps each vertex label to a list of ``(i, j)`` edge tuples and is
    modified in place (pass a copy to keep the original).  ``edges`` is the
    list of edge tuples in the order they should be tried; the caller is
    expected to have shuffled it.

    Returns ``(cut_edges, len(cut_edges))`` for the cut separating the two
    super-vertices that remain after contraction.

    Raises ValueError if ``G`` has fewer than two vertices.
    """
    if len(G) < 2:
        raise ValueError("karger_min_cut needs a graph with at least two vertices")

    # The union-find is indexed directly by vertex label, so it has to span
    # 0 .. max label even when label 0 (or any other label) is unused.
    cuts = UnionFind(max(G.keys()) + 1)
    edge_index = 0

    # Contract until two super-vertices are left.  The number of rounds is
    # based on the actual vertex count, not on the largest label, so graphs
    # with gaps in their labelling are not over-contracted.
    for _ in range(len(G) - 2):
        edge_index = contract(G,edges,cuts,edge_index)

    u, v = G.keys()

    # Either remaining adjacency list can be filtered for crossing edges;
    # use the shorter one so fewer entries are examined.
    # NOTE(review): this assumes the input lists every edge in both
    # directions, so both sides yield the same number of crossing edges.
    edge_min = G[u] if len(G[u]) <= len(G[v]) else G[v]

    # Entries whose endpoints ended up in the same component are self-loops
    # left over from contraction; the rest cross the cut.
    mc = [(i,j) for (i,j) in edge_min if not cuts.connected(i,j)]

    return mc, len(mc)
        

In [22]:
def monte_carlo_karger(G,edges,N=0):
    '''Compute a cut with fewest number of crossing edges: a min cut.

    Repeats the random contraction trial and keeps the smallest cut seen.

    G     -- dict mapping each vertex to its list of (i, j) edge tuples;
             left unmodified (each trial works on a copy).
    edges -- list of all edge tuples; it is shuffled IN PLACE before every
             trial, so the caller's list order changes.
    N     -- maximum number of trials; 0 means ceil(n^2 * ln n) with n the
             number of vertices.

    Every 100 trials the current best cut is printed.  The search stops
    early once 10 such checkpoints have passed since the last improvement.

    Returns (min_cut, min_cut_len); if no trial runs this is
    ([], float("inf")).
    '''
    if N == 0:
        n = len(G)
        N = math.ceil(n**2*(math.log(n)))

    # Defined up front so the function cannot hit an unbound local when the
    # loop body never executes.
    min_cut = []
    min_cut_len = float("inf")
    counter = 0

    for k in range(N):
        # The trial appends to the adjacency lists and deletes keys, but the
        # edge tuples themselves are immutable, so copying each list is enough.
        G_temp = {vertex: list(adjacent) for vertex, adjacent in G.items()}
        random.shuffle(edges)
        min_cut_temp, min_cut_len_temp = karger_min_cut(G_temp,edges)
        if min_cut_len_temp < min_cut_len:
            # improvement: restart the "no progress" checkpoint count
            counter = 0
            min_cut_len = min_cut_len_temp
            min_cut = min_cut_temp
        if k % 100 == 0 and k != 0:
            counter +=1
            print(min_cut,min_cut_len)
            if counter == 10:
                return min_cut,min_cut_len
    return min_cut,min_cut_len

In [23]:
# Time loading the graph plus a hand-written in-place shuffle of the edge list.
start_time = time.time()
G, edges = read_input('week4_test1.txt')
m = len(edges)
for i in range(m):
    j =  randrange(i,m) # random index in i .. m-1 (randrange excludes m)
    edges[i], edges[j] = edges[j] , edges[i]
print("--- %s seconds ---" % (time.time() - start_time))
#print(edges)

--- 0.009731054306030273 seconds ---


In [24]:
# Same measurement as the manual shuffle, but using random.shuffle,
# then show the shuffled edge list.
start_time = time.time()
G, edges = read_input('week4_test1.txt')
random.shuffle(edges)
print("--- %s seconds ---" % (time.time() - start_time))
print(edges)

--- 0.0020079612731933594 seconds ---
[(1, 4), (4, 5), (2, 4), (5, 8), (5, 4), (3, 1), (8, 7), (2, 3), (6, 5), (7, 1), (1, 7), (4, 1), (3, 2), (4, 3), (1, 2), (7, 6), (4, 2), (1, 3), (6, 8), (8, 6), (2, 1), (7, 5), (3, 4), (6, 7), (5, 6), (8, 5), (7, 8), (5, 7)]


In [25]:
# Inspect the edge list stored for vertex 1 of the most recently loaded graph.
G[1]

[(1, 2), (1, 3), (1, 4), (1, 7)]

In [26]:
# Scratch experiment: concatenate the edge lists of vertices 1 and 2.
# This overwrites G[1] in the notebook-global G; the next cell re-reads G
# from file before using it.
# NOTE(review): `lis` is not used anywhere in the visible cells.
lis = []
print(G[1])
print(G[2])
G[1] = [(i,j) for (i,j) in (*G[1],*G[2])]
print(G[1])

[(1, 2), (1, 3), (1, 4), (1, 7)]
[(2, 1), (2, 3), (2, 4)]
[(1, 2), (1, 3), (1, 4), (1, 7), (2, 1), (2, 3), (2, 4)]


In [27]:
# Run the repeated-contraction search on week4_test1.txt and time it
# (file load included in the measurement).
start_time = time.time()
G, edges = read_input('week4_test1.txt') 
print(monte_carlo_karger(G,edges)) # author's expected min-cut size: 2
print("--- %s seconds ---" % (time.time() - start_time))

[(1, 7), (4, 5)] 2
([(1, 7), (4, 5)], 2)
--- 0.04281306266784668 seconds ---


In [28]:
# Run the repeated-contraction search on week4_test2.txt and time it
# (file load included in the measurement).
start_time = time.time()
G, edges = read_input('week4_test2.txt')
print(monte_carlo_karger(G,edges)) # author's expected min-cut size: 2
print("--- %s seconds ---" % (time.time() - start_time))

[(1, 7), (4, 5)] 2
([(1, 7), (4, 5)], 2)
--- 0.06282973289489746 seconds ---


In [29]:
# Run the repeated-contraction search on week4_test3.txt and time it
# (file load included in the measurement).
start_time = time.time()
G, edges = read_input('week4_test3.txt')
print(monte_carlo_karger(G,edges)) # author's expected min-cut size: 1
print("--- %s seconds ---" % (time.time() - start_time))

[(4, 5)] 1
([(4, 5)], 1)
--- 0.04439592361450195 seconds ---


In [30]:
# Run the repeated-contraction search on week4_test4.txt and time it
# (file load included in the measurement).
start_time = time.time()
G, edges = read_input('week4_test4.txt')
print(monte_carlo_karger(G,edges)) # author's expected min-cut size: 1
print("--- %s seconds ---" % (time.time() - start_time))

[(4, 5)] 1
([(4, 5)], 1)
--- 0.06719017028808594 seconds ---


In [31]:
# Run the repeated-contraction search on week4_test5.txt and time it
# (file load included in the measurement).
start_time = time.time()
G, edges = read_input('week4_test5.txt')
print(monte_carlo_karger(G,edges)) # author's expected min-cut size: 3
print("--- %s seconds ---" % (time.time() - start_time))

[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
[(17, 9), (30, 37), (11, 26)] 3
([(17, 9), (30, 37), (11, 26)], 3)
--- 1.624953031539917 seconds ---


In [32]:
# Run the repeated-contraction search on week4_test6.txt and time it
# (file load included in the measurement).
start_time = time.time()
G, edges = read_input('week4_test6.txt')
print(monte_carlo_karger(G,edges)) # author's expected min-cut size: 2
print("--- %s seconds ---" % (time.time() - start_time))

[(1, 5), (4, 8)] 2
([(1, 5), (4, 8)], 2)
--- 0.07304501533508301 seconds ---


In [34]:
# Run the repeated-contraction search on the assignment graph (week4.txt)
# and time it (file load included in the measurement).
start_time = time.time()
G, edges = read_input('week4.txt')
print(monte_carlo_karger(G,edges)) # author's expected min-cut size: 17
print("--- %s seconds ---" % (time.time() - start_time))

[(24, 53), (109, 86), (134, 80), (161, 149), (116, 164), (41, 108), (163, 79), (36, 122), (141, 178), (169, 27), (188, 58), (184, 171), (186, 37), (48, 193), (10, 185), (165, 91), (123, 156)] 17
[(24, 53), (109, 86), (134, 80), (161, 149), (116, 164), (41, 108), (163, 79), (36, 122), (141, 178), (169, 27), (188, 58), (184, 171), (186, 37), (48, 193), (10, 185), (165, 91), (123, 156)] 17
[(24, 53), (109, 86), (134, 80), (161, 149), (116, 164), (41, 108), (163, 79), (36, 122), (141, 178), (169, 27), (188, 58), (184, 171), (186, 37), (48, 193), (10, 185), (165, 91), (123, 156)] 17
[(24, 53), (109, 86), (134, 80), (161, 149), (116, 164), (41, 108), (163, 79), (36, 122), (141, 178), (169, 27), (188, 58), (184, 171), (186, 37), (48, 193), (10, 185), (165, 91), (123, 156)] 17
[(24, 53), (109, 86), (134, 80), (161, 149), (116, 164), (41, 108), (163, 79), (36, 122), (141, 178), (169, 27), (188, 58), (184, 171), (186, 37), (48, 193), (10, 185), (165, 91), (123, 156)] 17
[(24, 53), (109, 86), (13