imports

In [None]:
# imports
import pandas as pd
import numpy as np
import json

loading data

In [None]:
# location dataframe
location_df = pd.read_csv('SaO_Optilandia_resub_locations.csv')

# links dataframe
links_df = pd.read_csv('SaO_Optilandia_resub_links.csv')

# extract lorry data from json; the with-block closes the file handle as soon
# as parsing finishes instead of leaving it open until garbage collection
with open('SaO_Optilandia_resub_depot_lorries.json', 'r') as lorry_file:
    lorry_data = json.load(lorry_file)

# one single-row frame per lorry, indexed 0..n-1 in the order the lorries
# appear in the JSON (outer keys first, then each key's list of lorries)
lorry = [
    pd.DataFrame(lorry_record, index=[k])
    for k, lorry_record in enumerate(
        record
        for depot_lorries in lorry_data.values()
        for record in depot_lorries
    )
]

# lorry dataframe
lorry_df = pd.concat(lorry)

In [None]:
# show first 5 rows of lorry_df
lorry_df.head()

In [None]:
# NumPy array of positional row indices of location_df where is_depot is truthy
# NOTE(review): later cells use these values both as node ids and as indices into
# the distance matrix — this assumes location_df['id'] equals the row position; confirm
depot_locations = np.where(location_df.is_depot)[0]

# NumPy array of positional row indices of location_df where is_customer is truthy
customer_locations = np.where(location_df.is_customer)[0]

imports + visualising the map

In [None]:
# imports
import networkx as nx
from scipy.spatial.distance import pdist, squareform
import matplotlib.pyplot as plt

# symmetric matrix of straight-line distances between every pair of rows in location_df
euclidean = squareform(pdist(location_df[['x', 'y']]))

# one (node, node, distance) triple per row of links_df
edges = [(i, j, euclidean[i, j]) for _, (i, j) in links_df.iterrows()]

# drawing position of every node: row label -> array([x, y])
pos = {k: v.values for k, v in location_df[['x', 'y']].iterrows()}

# depots and customers are each labelled with their own index
depot_labels = {d: d for d in depot_locations}
customer_labels = {c: c for c in customer_locations}

# graph with every location id as a node and every link as a weighted edge
G = nx.Graph()
G.add_nodes_from(location_df['id'].to_numpy())
G.add_weighted_edges_from(edges)

# resize figure, then draw the base map
plt.figure(figsize=(16, 8))
nx.draw(G, pos=pos, node_size=40)

# label depot and customer nodes
nx.draw_networkx_labels(G, pos, depot_labels)
nx.draw_networkx_labels(G, pos, customer_labels)

# mark depot nodes (large, red)
nx.draw_networkx_nodes(G, pos=pos, nodelist=depot_locations, node_color='r', node_size=400, alpha=0.9)

# mark customer nodes (smaller, translucent green)
nx.draw_networkx_nodes(G, pos=pos, nodelist=customer_locations, node_color='g', node_size=200, alpha=0.3)

clustering nodes (customer_locations) by assigning each customer to its nearest depot

In [None]:
# initialise cluster dict: depot node -> customers allocated to that depot
# NOTE(review): the depot ids are hard-coded; the dispatch loop later indexes
# cluster with the values of depot_locations, so the two must stay in step
cluster = {124: [], 127: [], 167: [], 523: []}

# allocate every customer to the depot with the smallest straight-line distance
for node in customer_locations:
    # Compare the depot columns only. Looking the minimum distance up again in
    # the whole euclidean row (as was done before) could land on a non-depot
    # node at the same distance, or on several nodes at once.
    nearestDepot = min(cluster, key=lambda depot: euclidean[node, depot])
    cluster[nearestDepot].append(node)

# print allocated nodes to relative cluster points (depot locations)
print(cluster)

states and constraints

In [None]:
# add a 'required' column: capacity minus current level for every location
# (route() later uses this value as the amount deposited at a customer)
location_df['required'] = location_df['capacity']-location_df['level']

# displaying the first 5 rows where is_customer is True
location_df[location_df['is_customer']==True].head()

greedy search (breadth-first-search used for path finding)

In [None]:
# function: finding next nearest customer node
def nearest_customer(currentState, customerList):
    """Return the customer in ``customerList`` closest to ``currentState``.

    Distances are read from the module-level ``euclidean`` matrix. The current
    node itself is never returned, even when it appears in ``customerList``.

    Parameters
    ----------
    currentState : int
        Node the search starts from.
    customerList : iterable of int
        Candidate customer nodes.

    Returns
    -------
    tuple
        ``(node, distance)`` with ``node`` as a plain ``int``. On a tie the
        candidate that appears first in ``customerList`` wins.

    Raises
    ------
    ValueError
        If ``customerList`` holds no node other than ``currentState``.
    """
    candidates = [customer for customer in customerList if customer != currentState]
    if not candidates:
        raise ValueError('customerList contains no customer other than currentState')

    # Pick the winner among the candidates themselves. Searching the whole
    # euclidean row for the minimum distance could match a node that is not a
    # candidate, or several nodes at once.
    nearest = min(candidates, key=lambda customer: euclidean[customer, currentState])

    # return next index with relative weight
    return int(nearest), euclidean[nearest, currentState]

In [None]:
# test nearest_customer()
nearest_customer(1, [2, 3, 1, 5])

In [None]:
# function: finding the nearest depot
def nearest_depot(currentState, depotList=None):
    """Return the depot closest to ``currentState``.

    Distances are read from the module-level ``euclidean`` matrix.

    Parameters
    ----------
    currentState : int
        Node the search starts from.
    depotList : iterable of int, optional
        Candidate depot nodes. Defaults to the module-level
        ``depot_locations`` so the function can be called with the current
        node only.

    Returns
    -------
    tuple
        ``(node, distance)`` with ``node`` as a plain ``int``. On a tie the
        depot that appears first in ``depotList`` wins. If ``currentState`` is
        itself in ``depotList`` it is returned with its own distance.

    Raises
    ------
    ValueError
        If there are no depots to choose from.
    """
    # `is None` rather than truthiness: depotList is usually a NumPy array
    if depotList is None:
        depotList = depot_locations

    depots = list(depotList)
    if not depots:
        raise ValueError('depotList is empty')

    # Pick the winner among the depots themselves. Searching the whole
    # euclidean row for the minimum distance could match a non-depot node, or
    # several nodes at once.
    nearest = min(depots, key=lambda depot: euclidean[currentState, depot])

    # return next depot index with relative weight
    return int(nearest), euclidean[currentState, nearest]

In [None]:
# test nearest_depot(): closest depot to node 1 among depot_locations
nearest_depot(1, depot_locations)

In [None]:
# add a 'depot' column holding the text before the first '-' of each lorry_id (kept as a string)
lorry_df['depot'] = [lorryId.split('-')[0] for lorryId in lorry_df.lorry_id]
lorry_df.head()

In [None]:
# routes dict: lorry_id -> list of [node, amount] stops, seeded with a single
# stop made of the lorry's depot and its full capacity
routes = {
    lorryId: [[int(depot), int(capacity)]]
    for lorryId, depot, capacity in zip(
        lorry_df['lorry_id'], lorry_df['depot'], lorry_df['capacity']
    )
}

In [None]:
# display routes so far
routes

In [None]:
# Routing from A to B with a breadth-first search over the link list, followed by a parent-pointer back trace
def routing(currState, toState, edges):
    """Find a route with the fewest links from ``currState`` to ``toState``.

    The search is breadth-first, so the route minimises the number of links
    travelled, not the summed distance. Neighbours are explored in the order
    their links appear in ``edges``.

    Parameters
    ----------
    currState : int
        Start node.
    toState : int
        Destination node.
    edges : sequence of (node, node, weight)
        Undirected links; a link's position in the sequence is its edge index.

    Returns
    -------
    tuple of three lists
        ``nodeOrder`` — nodes visited from the start node up to, but not
        including, ``toState``;
        ``edgeTraversed`` — edge indices in travel order;
        ``routeWeight`` — the weight of each traversed edge, same order.
        All three are empty when ``currState == toState``.

    Raises
    ------
    ValueError
        If ``toState`` cannot be reached from ``currState``.
    """
    from collections import deque

    if currState == toState:
        return [], [], []

    # adjacency built once from `edges`: node -> [(edge index, neighbour), ...]
    adjacency = {}
    for edgeIndex, (nodeA, nodeB, _weight) in enumerate(edges):
        adjacency.setdefault(nodeA, []).append((edgeIndex, nodeB))
        adjacency.setdefault(nodeB, []).append((edgeIndex, nodeA))

    # parent[node] = (node it was discovered from, edge index used); the start has none
    parent = {currState: None}
    queue = deque([currState])

    while queue and toState not in parent:
        node = queue.popleft()
        for edgeIndex, neighbour in adjacency.get(node, ()):
            if neighbour not in parent:
                parent[neighbour] = (node, edgeIndex)
                if neighbour == toState:
                    break
                queue.append(neighbour)

    if toState not in parent:
        raise ValueError(f'no route from {currState} to {toState}')

    # Walk the parent pointers back from the destination. Following the node
    # each one was first discovered from is what keeps the route at the
    # minimum number of links.
    nodeOrder = []
    edgeTraversed = []
    node = toState
    while parent[node] is not None:
        previous, edgeIndex = parent[node]
        nodeOrder.append(previous)
        edgeTraversed.append(edgeIndex)
        node = previous

    # re-ordering from start to end
    nodeOrder.reverse()
    edgeTraversed.reverse()

    # route weight (distance between nodes) of each traversal made
    routeWeight = [edges[edgeIndex][2] for edgeIndex in edgeTraversed]

    return nodeOrder, edgeTraversed, routeWeight

In [None]:
# test: run the search once (it was previously repeated for each line) and print its three outputs
checkNodes, checkEdges, checkWeights = routing(124, 10, edges)
# node order in routing
print(f'node order: {checkNodes}')
# traversed edges in routing
print(f'edge order: {checkEdges}')
# weights of the traversed edges
print(f'weights: {checkWeights}')

In [None]:
# initialise routeTotalCost list; route() and the depot dispatch loop append one cost per journey made
routeTotalCost = []

In [None]:
# route() function: send one lorry to its nearest allocated customers until its load runs short
def route(lorryId, allocatedCustomers):
    """Serve the customers in ``allocatedCustomers`` greedily with one lorry.

    Starting from the lorry's last stop recorded in ``routes``, the lorry goes
    to the nearest remaining customer, deposits that customer's ``required``
    amount (nothing when ``required`` is zero or negative), and repeats while
    its remaining load covers the next nearest customer's requirement.

    Side effects: appends ``[node, -amount]`` stops to ``routes[lorryId]``,
    appends one cost per journey to ``routeTotalCost``, removes each visited
    customer from ``allocatedCustomers`` **in place**, may rebind
    ``cluster[<lorry depot>]`` to the remaining customers, and prints the node
    the lorry stopped at.

    Parameters
    ----------
    lorryId : str
        Value of the ``lorry_id`` column identifying the lorry.
    allocatedCustomers : list of int
        Customers still to serve; mutated by this call.

    Raises
    ------
    ValueError
        If ``lorryId`` is not present in ``lorry_df``.
    """
    currentId = lorryId

    # single lookup of the lorry's row; .iloc[0] replaces the deprecated
    # float(Series) / int(Series) conversions
    lorryRows = lorry_df[lorry_df['lorry_id'] == currentId]
    if lorryRows.empty:
        raise ValueError(f'unknown lorry id: {currentId}')
    lorryRow = lorryRows.iloc[0]

    currentCapacity = float(lorryRow['capacity'])
    # presumably cost per mile and cost per tonne-mile — confirm against the data spec
    currentCpm = float(lorryRow['cpm'])
    currentCptm = float(lorryRow['cptm'])
    currentDepot = int(lorryRow['depot'])

    # Resume from the last stop recorded for this lorry. On a first call that
    # is its own depot; after a refill it is the depot where it refilled, so
    # the next journey is costed from where the lorry actually is.
    currentState = routes[currentId][-1][0] if routes.get(currentId) else currentDepot

    # requirement of the customer the lorry would visit next (0 until known)
    nextCustomerCapacity = 0

    def required_at(customerId):
        # 'required' value of the location_df row whose id matches the customer
        return location_df[location_df['id'] == customerId]['required'].iloc[0]

    # iterate while the load covers the next customer and customers remain
    while (currentCapacity >= nextCustomerCapacity) and (len(allocatedCustomers) > 0):
        # nearest customer from the lorry's current state
        nextCustomer = nearest_customer(currentState, allocatedCustomers)[0]
        required = required_at(nextCustomer)

        # Deposit the requirement when there is one, otherwise nothing. A
        # requirement of exactly zero used to match neither branch, leaving
        # the customer in the list for ever.
        fillAmount = required if required > 0 else float(0)

        # record the stop and the (negative) amount deposited
        routes[currentId].append([int(nextCustomer), -fillAmount])
        # journey cost: summed link distance x (cpm + load carried x cptm), rounded to 2 d.p.
        routeCost = round(sum(routing(currentState, nextCustomer, edges)[2])*(currentCpm+(currentCapacity*currentCptm)), 2)
        routeTotalCost.append(routeCost)

        # update load, remaining customers and position
        currentCapacity = currentCapacity - fillAmount
        allocatedCustomers.remove(nextCustomer)
        currentState = nextCustomer

        # requirement of the customer that would be visited next
        if len(allocatedCustomers) != 0:
            nextCustomerCapacity = required_at(nearest_customer(currentState, allocatedCustomers)[0])

    # load too small for the next customer: hand the remainder back to the cluster
    if currentCapacity < nextCustomerCapacity:
        cluster[currentDepot] = allocatedCustomers

    # the loop only ends when the load runs short or no customers remain;
    # both cases report the lorry's final position
    print(f'{currentId} finished operating at {currentState}')

In [None]:
# dispatch every depot's lorries over that depot's cluster of customers
for i in depot_locations:
    # lorries based at this depot (the 'depot' column holds the id as a string)
    depotLorries = lorry_df[lorry_df['depot']==f'{i}']

    # position counts the lorries dispatched so far, to spot the last one
    for position, j in enumerate(depotLorries.index, start=1):
        # print start of lorry's route
        print(f'{depotLorries.loc[j].lorry_id} started operating')
        # call route() for each lorry in the relative depot
        route(depotLorries.loc[j].lorry_id, cluster[i])

        # last lorry of the depot and customers still unserved: keep sending
        # it to refill and back out until the cluster is empty
        if len(cluster[i])!=0 and position==len(depotLorries.index):
            # the length of the list is compared with 0 (previously the
            # comparison sat inside len(), which raises TypeError)
            while len(cluster[i]) != 0:
                # set currentId to relative lorry's ID
                currentId = lorry_df.loc[j]['lorry_id']
                # last recorded stop of the lorry
                currentState = routes[currentId][-1][0]
                # nearest depot from the lorry's current state (the depot
                # list is now passed explicitly)
                nearDepot = nearest_depot(currentState, depot_locations)
                # print refill statement
                print(f'{currentId} is refilling tank at {nearDepot[0]}')
                # cost of the journey to the refill depot, rounded to 2 d.p.
                # NOTE(review): this is priced with the lorry's full capacity as load
                # although it travels to the depot after deliveries — confirm intent
                routeCost = round(sum(routing(currentState, nearDepot[0], edges)[2])*((lorry_df.loc[j]['cpm'])+(lorry_df.loc[j]['capacity']*lorry_df.loc[j]['cptm'])), 2)
                # append routeCost to routeTotalCost list for post-route cost eval.
                routeTotalCost.append(routeCost)
                # record the refill stop and the refilled amount
                routes[currentId].append([int(nearDepot[0]),int(lorry_df.loc[j]['capacity'])])
                # send the same lorry out again over the remaining customers
                route(currentId, cluster[i])
        # no customers left for this depot: remaining lorries stay idle
        elif len(cluster[i])==0:
            break

In [None]:
# print routes
print(routes)

In [None]:
# print cost of each traversal made and the sum of the costs rounded to 2 d.p.
print(f'PATH COST: {routeTotalCost} \n\nTOTAL COST: {round(sum(routeTotalCost), 2)}')

In [None]:
# results list: one {'lorry_id', 'traversal'} record per entry of routes, in insertion order
results = [
    {'lorry_id': lorryId, 'traversal': traversal}
    for lorryId, traversal in routes.items()
]

In [None]:
# an encoder class which helps to make the results list json serializable
class NpEncoder(json.JSONEncoder):
    """JSON encoder that converts NumPy values to their built-in equivalents.

    Handles NumPy booleans, integers, floating-point scalars and arrays;
    anything else is passed to ``json.JSONEncoder.default``, which raises
    ``TypeError``.
    """

    def default(self, obj):
        """Return a JSON-serialisable stand-in for ``obj``."""
        # np.bool_ is not a subclass of np.integer, so it needs its own branch
        if isinstance(obj, np.bool_):
            return bool(obj)
        if isinstance(obj, np.integer):
            return int(obj)
        if isinstance(obj, np.floating):
            return float(obj)
        if isinstance(obj, np.ndarray):
            return obj.tolist()
        return super().default(obj)

In [None]:
# write results to 'task1_solution.json'; the with-block closes the file once the dump completes
with open('task1_solution.json', 'w') as file:
    # NpEncoder converts the NumPy scalars/arrays inside results that the stock encoder rejects
    json.dump(results, file, cls=NpEncoder)