In [10]:
import time
from heapdict import heapdict

In this programming problem you'll code up Dijkstra's shortest-path algorithm.

The file contains an adjacency list representation of an undirected weighted graph with 200 vertices labeled 1 to 200. Each row consists of the node tuples that are adjacent to that particular vertex along with the length of that edge. For example, the 6th row has 6 as the first entry indicating that this row corresponds to the vertex labeled 6. The next entry of this row "141,8200" indicates that there is an edge between vertex 6 and vertex 141 that has length 8200. The rest of the pairs of this row indicate the other vertices adjacent to vertex 6 and the lengths of the corresponding edges.

Your task is to run Dijkstra's shortest-path algorithm on this graph, using 1 (the first vertex) as the source vertex, and to compute the shortest-path distances between 1 and every other vertex of the graph. If there is no path between a vertex v and vertex 1, we'll define the shortest-path distance between 1 and v to be 1000000.

You should report the shortest-path distances to the following ten vertices, in order: 7,37,59,82,99,115,133,165,188,197. You should encode the distances as a comma-separated string of integers. So if you find that all ten of these vertices except 115 are at distance 1000 away from vertex 1 and 115 is 2000 distance away, then your answer should be 1000,1000,1000,1000,1000,2000,1000,1000,1000,1000. Remember the order of reporting DOES MATTER, and the string should be in the same order in which the above ten vertices are given. The string should not contain any spaces. Please type your answer in the space provided.

IMPLEMENTATION NOTES: This graph is small enough that the straightforward O(mn) time implementation of Dijkstra's algorithm should work fine. OPTIONAL: For those of you seeking an additional challenge, try implementing the heap-based version. Note this requires a heap that supports deletions, and you'll probably need to maintain some kind of mapping between vertices and their positions in the heap

In [14]:
def read_input_slow(filename):
    with open('week6_file/'+filename) as f: 
        edges = []
        for line in f:
            line = line.split() # to deal with blank 
            if line:            # lines (ie skip them)
                v = int(line[0])
                for paired in line[1:]:
                    w,weight = paired.split(',')
                    w = int(w)
                    weight = int(weight)
                    edges.append([v,w,weight])
                    
            n = v
    return edges,n

In [15]:
def dijkstra_algorithm_slow(filename):
    edges,n = read_input_slow(filename)
    A = [1000000]*(n+1)  #n size of Graph G
    B = [[]]*(n+1)
    X_ = [0]*(n+1)
    X = [1]
    A[1] = 0
    
    while len(X) != n:
        min_dist = 1000000
        for v,w,weight_vw in edges:
            if v in X and w not in X:
                if min_dist > A[v] + weight_vw:
                    min_dist = A[v] + weight_vw
                    w_star = w
                    v_star = v
                    weight_star = weight_vw
        X.append(w_star)
        A[w_star] = A[v_star] + weight_star
        B[w_star] = [*B[v_star]] + [w_star]
        
    return A,B

In [16]:
def read_input(filename):
    with open('week6_file/'+filename) as f:
        G = {}
        for line in f:
            line = line.split() # to deal with blank 
            if line:            # lines (ie skip them)
                v = int(line[0])
                for paired in line[1:]:
                    w,weight = paired.split(',')
                    w = int(w)
                    weight = int(weight)
                    if G.get(v) == None:
                        G[v] = [(v,w,weight)]
                    else:
                        G[v].append((v,w,weight))
                    
    return G

In [17]:
def dijkstra_algorithm(filename):
    G = read_input(filename)
    n = len(G.keys())
    A = [1000000]*(n+1)  #n size of Graph G
    B = [[]]*(n+1)
    X_ = [0]*(n+1)
    X = [1]
    A[1] = 0
    
    while len(X) != n:
        min_dist = 1000000
        for vertices in X: #Faster than loop through edges
            for (v,w,weight_vw) in G[vertices]:
                if w not in X:
                    if min_dist > A[v] + weight_vw:
                        min_dist = A[v] + weight_vw
                        w_star = w
                        v_star = v
                        weight_star = weight_vw
        X.append(w_star)
        A[w_star] = A[v_star] + weight_star
        B[w_star] = [*B[v_star]] + [w_star]
        
    return A,B

In [18]:
def dijkstra_algorithm_heap(filename):
    G = read_input(filename)
    n = len(G.keys())
    X = []
    A = [1000000]*(n+1)  #n size of Graph G
    A[1] = 0
    hd = heapdict()
    hd[1] = 0
    for i in list(G.keys())[1:]:
        hd[i] = 1000000

    while any(hd):
        w,distance = hd.popitem()
        X.append(w)
        A[w] = distance
        for (w,v,weight_wv) in G[w]: 
            if hd.get(v) != None:
                hd[v] = min(hd[v],A[w]+weight_wv)
        
    return A

In [19]:
start_time = time.time()
A,B = dijkstra_algorithm_slow('week6_test1.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
start_time = time.time()
A,B = dijkstra_algorithm('week6_test1.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
start_time = time.time()
A = dijkstra_algorithm_heap('week6_test1.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
print(A,B)

--- 0.004079103469848633 seconds ---
--- 0.0008368492126464844 seconds ---
--- 0.0018088817596435547 seconds ---
[1000000, 0, 1, 2, 3, 4, 4, 3, 2] [[], [], [2], [2, 3], [2, 3, 4], [2, 3, 4, 5], [8, 7, 6], [8, 7], [8]]


In [23]:
start_time = time.time()
A,B = dijkstra_algorithm_slow('week6_test2.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
start_time = time.time()
A,B = dijkstra_algorithm('week6_test2.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
start_time = time.time()
A = dijkstra_algorithm_heap('week6_test2.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
print(A,B)

--- 0.0009808540344238281 seconds ---
--- 0.0014100074768066406 seconds ---
--- 0.0010662078857421875 seconds ---
[1000000, 0, 3, 5, 8, 5, 7, 11, 4, 6, 10, 10] [[], [], [2], [2, 3], [2, 3, 4], [5], [2, 3, 6], [2, 3, 7], [8], [8, 9], [2, 3, 6, 10], [2, 3, 4, 11]]


In [21]:
start_time = time.time()
A,B = dijkstra_algorithm_slow('week6.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
start_time = time.time()
A,B = dijkstra_algorithm('week6.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
start_time = time.time()
A = dijkstra_algorithm_heap('week6.txt') 
print("--- %s seconds ---" % (time.time() - start_time))
print(A[7],A[37],A[59],A[82],A[99],A[115],A[133],A[165],A[188],A[197]) #2599 2610 2947 2052 2367 2399 2029 2442 2505 3068

--- 1.4893732070922852 seconds ---
--- 0.6011641025543213 seconds ---
--- 0.1737370491027832 seconds ---
2599 2610 2947 2052 2367 2399 2029 2442 2505 3068
