# LN - Data PP - Stability and efficiency calculations

## Import libraries and data

In [119]:
import sqlite3
import numpy as np
import pandas as pd
import networkx as nx
import itertools
#import matplotlib.pyplot as plt
import time
import pickle

import os
import re
import sys
import io
from itertools import islice

from tqdm.notebook import trange, tqdm
from time import sleep

from dask_cloudprovider import FargateCluster
from dask.distributed import Client
import dask.array as da
import dask
dask.config.set({'distributed.scheduler.allowed-failures': 50}) 

import s3fs

import boto3


In [69]:


# Load Data

# Initiate s3 resource

session = boto3.session.Session()
s3 = session.resource('s3')


# Dataframe

decisions_load = s3.Object(bucket_name='ln-strategy-data', key='LN_channels.csv').get()
decisions_df=pd.read_csv(io.BytesIO(decisions_load['Body'].read()))

# Channel closures
closure_file = s3.Object(bucket_name='ln-strategy-data', key='channel_closures.p').get()
channel_closures = pickle.loads(closure_file['Body'].read())
    
    
# Channel openings 
opens_file = s3.Object(bucket_name='ln-strategy-data', key='channel_opens.p').get()
channel_opens = pickle.loads(opens_file['Body'].read())

    

# Create list with graph keys

#TODO: Save graphs as numpy array in single H5 file to reduce. Test if creating graphs takes longer than reading from S3

# graph_dir='./data/graph_snapshots' - For local tests
extraction_id=1585344554
graph_keys = [obj.key 
        for obj in s3.Bucket(name='ln-strategy-data').objects.all()
        if re.match(".*"+str(extraction_id)+"_connected/.*\.gpickle",obj.key)]





In [148]:
# Test: extracted formats
print("Number of graph keys:{}".format(len(graph_keys)))
print("---Sample graph keys---")
print(graph_keys[0])
print("---Sample channel opens---")
print(channel_opens[513675])
print("---Sample channel closures---")
print(channel_closures[592638])
print("----Sample blocks----")
print(blocks[1])


Number of graph keys:3996
---Sample graph keys---
graph_snapshots/1585344554_connected/505149.gpickle
---Sample channel opens---
[(5474, 7365, {'capacity': 50000, 'open_fee': 306, 'dec_id': 1, 'channel_id': '513675x2245x0'})]
---Sample channel closures---
[(3098, 1492, {'close_type': 'mutual', 'dec_id': 0, 'channel_id': '505149x622x0'}), (2104, 3098, {'close_type': 'force', 'dec_id': 26620, 'channel_id': '570913x720x1'})]
----Sample blocks----
525952


In [191]:
decisions_df.sort_values(by=['close_block'],inplace=True,ascending=True)
decisions_df.head(10)

Unnamed: 0,short_channel_id,open_block,open_transaction,address,close_block,close_transaction,node0,node1,satoshis,last_seen,...,last_update,close_type,close_htlc_count,close_balance_a,close_balance_b,dec_id,node0_id,node1_id,bet_mar_node0,bet_mar_node1
1027,535029x2012x1,535029,d01928d350e1ba04d7335a91e6dd54f5dbf94859e0c59b...,bc1qszamn0la3yqrqhjj8yepdxkl9qlr84zfwgg9zrkccl...,535029.0,d01928d350e1ba04d7335a91e6dd54f5dbf94859e0c59b...,022a7809052db05fde648391a53aba82286e4a517cff1d...,031b71cbad0cb4e22141e45f16c83c332f755e1ba68195...,462124,2019-07-18 02:48:37,...,,unused,0.0,275630.0,0.0,1027,3160,263,,
1045,535177x446x1,535177,7376d5bc0c18bbff8f644d0827e759a1518b38e1e95a08...,bc1qauzljedtlva73ngg7suqketlvn5gnnuemxpeuevcqt...,535177.0,7376d5bc0c18bbff8f644d0827e759a1518b38e1e95a08...,02272bd12e59324d0f2b231fb88f134b57eb26dd100d2c...,031b71cbad0cb4e22141e45f16c83c332f755e1ba68195...,257307,2019-07-18 02:48:40,...,,unused,0.0,218405.0,0.0,1045,2096,263,,
2745,549037x2738x0,549037,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,bc1q95fytjzs8f7fma2nf66gcva7c3w7hnkdwrkef9pu33...,549037.0,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,028b892b15f5cabcea5165b236db0e36dc06553c323c84...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,1547494000.0,unused,0.0,400000.0,0.0,2745,908,3654,-0.010145,0.001177
2744,549037x2737x0,549037,0825da5e96cd45fced3233ebe615721b687285839d3036...,bc1q5mqzhw5e42rfqh250zalwu47ru8gvz4g4k968me0mg...,549037.0,0825da5e96cd45fced3233ebe615721b687285839d3036...,02b95713bbe4609a337f3ca5aab3a75674083ddf5331a4...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,1547503000.0,unused,0.0,400000.0,0.0,2744,6052,3654,0.018342,0.014761
40227,549489x1194x1,549489,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,bc1q25j5l6crv4mrjkjjjw4rzyv890cwwnyyw9dezcqs5x...,549489.0,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,02574ffa55d394b9326f6e5c15992cc0516b0d6e6a79a1...,03a5927b64b1ea8657d5b770d61a3e2d0554fdb5d56877...,2500000,2019-06-13 01:12:27,...,,unused,0.0,8974.0,0.0,40227,5247,696,-0.019278,-0.006038
37095,562592x1695x1,562592,06b4d9b3cfa10bd2cd33131d034a6b38c1651eee49018a...,bc1q9jnkm78y45kyasnu43p52gc8sqazwy4yfjtqzkwqx5...,562592.0,06b4d9b3cfa10bd2cd33131d034a6b38c1651eee49018a...,029b71b8186914267ea59cb081c43ad1aeb874b5a185a4...,03864ef025fde8fb587d989186ce6a4a186895ee44a926...,5000000,2019-06-13 02:13:01,...,,unused,0.0,4995006.0,0.0,37095,4405,6802,,
37213,564495x455x1,564495,8a5764e1f0cb659b687a0675cd88983526bd9213665986...,bc1qqgcvu4nl3vjm4vvr9r5l2f4ufppph5fn070fzscq4r...,564510.0,655c3d44c09055e9af9f8d13d55c99979e0b0b306230b9...,024655b768ef40951b20053a5c4b951606d4d86085d512...,0375a154b8f94eb0556566d60d96acc47f99f2f0d74ef9...,400000,2019-06-03 04:39:32,...,,unused,0.0,395111.0,0.0,37213,4528,4646,,
37209,564476x2292x0,564476,0e00d6dc5cf2232d15750bd3177c57521cdff678a5666a...,bc1qec377ms3a79e3v3pe8gfjrzp6syfqykeqkw2lsh86f...,564511.0,58fea309da14892858be78c8c45a7d06fa6796e77e51d8...,028303182c9885da93b3b25c9621d22cf34475e63c1239...,03820e3b7bdbf7ccafe67791088de15df162b352f3b7ba...,20000,2019-06-03 04:39:12,...,,unused,0.0,17111.0,0.0,37209,6190,6834,,
37256,564948x2100x0,564948,e1b4de87949168dafae980bc1f467b2bee878c2667383a...,bc1ql47jp0hprvcq4dz8y5dpape60vhf532uea2rv9v20q...,565057.0,af2a36eb0782958a3f2e7aacb89dfdb92defeaed44df3c...,02529db69fd2ebd3126fb66fafa234fc3544477a23d509...,02e63d3e5a2351cc8de6c63b0d0784d1940406c5addce4...,47882,2019-06-03 04:43:42,...,,force,0.0,44239.0,0.0,37256,7699,4242,,
37255,564948x2082x0,564948,eb12d66c34e8009c408fa56d948bf87baec4888caddd2d...,bc1q4ksyf7c7jphsmwdj8n944y0mypy7n28mts5tt9zrph...,565057.0,af557d74c148c434156edc034b0a94d97afcda20e8c2b6...,02e63d3e5a2351cc8de6c63b0d0784d1940406c5addce4...,039edc94987c8f3adc28dab455efc00dea876089a120f5...,47882,2019-06-03 04:43:40,...,,force,0.0,44239.0,0.0,37255,4242,6403,,


In [None]:
sys.getsizeof(decisions_df)

## Connection to AWS - Fargate Clusters

In [250]:
cluster = FargateCluster(n_workers=20,scheduler_timeout='60 minutes',image='dsrincon/dask-graph:nx-scipy-v1')

  next(self.gen)


In [251]:
cluster

VBox(children=(HTML(value='<h2>FargateCluster</h2>'), HBox(children=(HTML(value='\n<div>\n  <style scoped>\n  …

In [253]:
client = Client(cluster)


python
+---------------------------+---------------+
|                           | version       |
+---------------------------+---------------+
| client                    | 3.7.3.final.0 |
| scheduler                 | 3.7.4.final.0 |
| tcp://172.31.0.253:38335  | 3.7.4.final.0 |
| tcp://172.31.15.181:36571 | 3.7.4.final.0 |
| tcp://172.31.17.129:33915 | 3.7.4.final.0 |
| tcp://172.31.17.149:33709 | 3.7.4.final.0 |
| tcp://172.31.22.101:42231 | 3.7.4.final.0 |
| tcp://172.31.3.220:46565  | 3.7.4.final.0 |
| tcp://172.31.34.23:35353  | 3.7.4.final.0 |
| tcp://172.31.35.18:37609  | 3.7.4.final.0 |
| tcp://172.31.37.140:39817 | 3.7.4.final.0 |
| tcp://172.31.42.71:35675  | 3.7.4.final.0 |
| tcp://172.31.48.218:42075 | 3.7.4.final.0 |
| tcp://172.31.55.135:37159 | 3.7.4.final.0 |
| tcp://172.31.59.113:46209 | 3.7.4.final.0 |
| tcp://172.31.6.118:33597  | 3.7.4.final.0 |
| tcp://172.31.65.139:39809 | 3.7.4.final.0 |
| tcp://172.31.69.199:39365 | 3.7.4.final.0 |
| tcp://172.31.74.198:4501

## Extract Graphs for Analysis

In [254]:
# Lazy extract Graphs

# Function for lazy S3 extraction
def load_snapshots(key):
    session = boto3.session.Session()
    s3 = session.resource('s3')
    response = s3.Object(bucket_name='ln-strategy-data', key=key).get()
    G=pickle.loads(response['Body'].read())
    
    return G
    
# Script to create delayed array
graph_snapshots=[]
blocks=[]

for key in graph_keys[2800:3000]: # Remove index for full range
    # Create block list from file_names
    block_i=int(key.split(".")[0].split("/")[-1]) 
    blocks.append(block_i)
    
    # Extract graphs
    G=dask.delayed(load_snapshots)(key)
    graph_snapshots.append(G)
   

In [None]:
# Test Lazy Graph extract
graph_i=dask.compute(graph_snapshots[0])[0]
block=graph_i.graph['block']
print(type(block))

#graph_snapshots=dask.compute(*graph_snapshots)
#block=graph_snapshots[0].graph['block']
    
#print(len(graph_snapshots[5]))
#print(graph_snapshots[3].graph['block'])

# Delayed testing
#results = dask.compute(*futures)
#graphs=dask.compute(*graph_snapshots)

## Stability/Efficiency analysis by utility definition

In order to understand the potential motivations behind each decision we analyze each decission (opening or closure of a channel) independently from the perspective of each of the participants in the decission, which we'll call the node under analysis. For each decission we extract or compute the following information: 



## Betweeness


Betweenness centrality measures how central is a network to the flow of information in a network. In the case of the Lightning Network the higher the betweenness centrality of a node, the more transactions (messages) that are routed through it. In particular, we will use a measure of betweenness centrality defined in (Brandes and Fleischer 2005 - https://link.springer.com/chapter/10.1007/978-3-540-31856-9_44) that models infomation through a network, as electric current, efficiently and not only considering shortest path. This allows us to account for the fact that not all transactions travel through shortes path given that there are fee and capacity considerations.  

### Baseline betweeness

In [268]:
# Distributed betweeness function

snapshot_bet_list_fut=[]

def bet_cent(g):
   
    #Uncomment depending on approx or full
    g_bet=nx.algorithms.centrality.approximate_current_flow_betweenness_centrality(g,weight='capacity',kmax=10000)
    #g_bet=nx.algorithms.centrality.current_flow_betweenness_centrality(g,weight='capacity')
    block=g.graph['block']
    #else:
    #g_bet={}
    return (block,g_bet)
    

for g in graph_snapshots:
    block_bet_tuple=dask.delayed(bet_cent)(g)
    snapshot_bet_list_fut.append(block_bet_tuple)

futures_bet = dask.persist(*snapshot_bet_list_fut)

In [269]:
start=time.time()
snapshot_bet_list = dask.compute(*futures_bet)
end=time.time()
print('Compute in seconds: {}'.format(end-start))

Compute in seconds: 38.58454084396362


In [270]:
# Define dictionary 
snapshot_bet={record[0]:record[1] for record in snapshot_bet_list}

In [154]:
# Test results and size of betweeness in memory
# Create list with graph keys
print(sys.getsizeof(snapshot_bet))
#n_items = take(10, snapshot_bet.items())
#print(n_items)

9320


### Pairwise stability 

- **Marginal betweenness (bet_mar_nodei)**: The % change between the betweenness centrality, for the node under analysis, given the graph from the previous block and the betweenness centrality of the resulting graph after enacting the decission (adding or removing a channel). Weighted current betweenness centrality is used for this measure.

> **Marginal betweenness for opens** 

In [277]:
#------STABILITY FOR OPENS----

# Function to calculate marginal betweenness centrality for all channel openings in snapshot

def bet_mar_open(input_tuple):
    
    block=input_tuple[0]
    G=input_tuple[1]
    block_opens=input_tuple[2]
    G_bets=input_tuple[3]
  

    # For each open calculate marginal betweenness for each node in channel
    
    
    bet_mar_node0_dic_i={} #Dictionary to store marginal betweeness centrality for node0
    bet_mar_node1_dic_i={} #Dictionary to store marginal betweeness centrality for node0
    for open_edge in block_opens:
        
        # Extract info about channel
        channel_id=open_edge[2]['channel_id']
        node0=open_edge[0]
        node1=open_edge[1]
        edge_list=[open_edge]
        
        
        
        # Copy original graph
        g_mar=G.copy()   
        old_nodes=False
        
        
        
        # Retrieve betweenness before channel if nodes existed, else define betweeness as 0
        if (g_mar.has_node(node0)):
            node0_bet=G_bets[node0]
            old_nodes=True
        else:
            node0_bet=0
            
        if (g_mar.has_node(node1)):
            node1_bet=G_bets[node1]
            old_nodes=True
        else:
            node1_bet=0
        
            
        if old_nodes:    
            # Add edges and calculate betweeness if at least one of the nodes is in graph 
            g_mar.add_edges_from(edge_list)
            g_mar_bet=nx.algorithms.centrality.approximate_current_flow_betweenness_centrality(g_mar,weight='capacity',kmax=10000)
            node0_mar_bet=(g_mar_bet[node0]-node0_bet)
            node1_mar_bet=(g_mar_bet[node1]-node1_bet)
        else:
            node0_mar_bet=0
            node1_mar_bet=0

        
        # Update dictionary - new betweenness
        bet_mar_node0_dic_i[channel_id]=node0_mar_bet
        bet_mar_node1_dic_i[channel_id]=node1_mar_bet
        
    
    return (bet_mar_node0_dic_i,bet_mar_node1_dic_i)
    

# Script to parallelize bet_mar_open

bet_mar_dicfut=[]
for i in range(1,len(graph_snapshots)):
    
    block=blocks[i]
    block_prev=blocks[i-1]
    block_opens=channel_opens[block]
    #print((block_opens))
    g=graph_snapshots[i-1] # Pass previous graph
    g_bet=snapshot_bet[block_prev]
    input_tuple=(block,g,block_opens,g_bet)
    output_tuple=dask.delayed(bet_mar_open)(input_tuple)
    bet_mar_dicfut.append(output_tuple)

futures_bet_mar = dask.persist(*bet_mar_dicfut)


In [278]:
# Run computation
start=time.time()
bet_mar_diclist = dask.compute(*futures_bet_mar)
end=time.time()
print('Compute in seconds: {}'.format(end-start))
print('Size in memory: {}'.format(sys.getsizeof(bet_mar_diclist)))


Compute in seconds: 102.84716725349426
Size in memory: 1640


In [244]:
# Test output
print(bet_mar_diclist[10])

({'548617x1301x0': -6.0334583966724907e-05}, {'548617x1301x0': 0.0013275461061590472})


In [245]:
# Create single dictionaries for node0 and node1

bet_mar_node0_list=[t[0] for t in bet_mar_diclist]
bet_mar_node1_list=[t[1] for t in bet_mar_diclist]

bet_mar_node0_dic={}
for d in bet_mar_node0_list:
    bet_mar_node0_dic.update(d)
    
bet_mar_node1_dic={}
for d in bet_mar_node1_list:
    bet_mar_node1_dic.update(d)

# Test output
# print(bet_mar_node1_dic)

In [246]:
# Add to DataFrame

# Create empty columns
decisions_df['bet_mar_node0']=np.nan
decisions_df['bet_mar_node1']=np.nan

# Populate df with values
decisions_df['bet_mar_node0']=decisions_df['short_channel_id'].map(bet_mar_node0_dic)
decisions_df['bet_mar_node1']=decisions_df['short_channel_id'].map(bet_mar_node1_dic)

decisions_df_filter=decisions_df[decisions_df['bet_mar_node0'].notnull()]
print(len(decisions_df_filter))


396


In [247]:
decisions_df_filter.sort_values(by=['close_block'],inplace=True,ascending=True)
decisions_df_filter.head(10)

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  """Entry point for launching an IPython kernel.


Unnamed: 0,short_channel_id,open_block,open_transaction,address,close_block,close_transaction,node0,node1,satoshis,last_seen,...,close_htlc_count,close_balance_a,close_balance_b,dec_id,node0_id,node1_id,bet_mar_node0,bet_mar_node1,bet_marclose_node0,bet_marclose_node1
2745,549037x2738x0,549037,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,bc1q95fytjzs8f7fma2nf66gcva7c3w7hnkdwrkef9pu33...,549037.0,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,028b892b15f5cabcea5165b236db0e36dc06553c323c84...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,0.0,400000.0,0.0,2745,908,3654,-0.010145,0.001176619,-0.008922,0.000211
2744,549037x2737x0,549037,0825da5e96cd45fced3233ebe615721b687285839d3036...,bc1q5mqzhw5e42rfqh250zalwu47ru8gvz4g4k968me0mg...,549037.0,0825da5e96cd45fced3233ebe615721b687285839d3036...,02b95713bbe4609a337f3ca5aab3a75674083ddf5331a4...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,0.0,400000.0,0.0,2744,6052,3654,0.018342,0.01476137,0.000272,-0.000155
40227,549489x1194x1,549489,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,bc1q25j5l6crv4mrjkjjjw4rzyv890cwwnyyw9dezcqs5x...,549489.0,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,02574ffa55d394b9326f6e5c15992cc0516b0d6e6a79a1...,03a5927b64b1ea8657d5b770d61a3e2d0554fdb5d56877...,2500000,2019-06-13 01:12:27,...,0.0,8974.0,0.0,40227,5247,696,-0.019278,-0.006038171,-0.019414,-0.005255
2991,549668x215x0,549668,9db0314ed243141d152057bdb16b6a1fee650cf68c3565...,bc1qjhwn44uyurz7mrc7dwtehzd7rqefzjp9q4zcmhl064...,578710.0,1350e1c9001ec23ca2f58e02da10a3dec69690b031a858...,0217890e3aad8d35bc054f43acc00084b25229ecff0ab6...,02f9eaf9949ca9da663fc24494abae4153ee4f0aee480d...,100000,2019-06-17 04:06:28,...,0.0,79845.0,0.0,2991,7058,3139,0.11505,0.0002157941,,
2940,549563x2304x0,549563,580895adf54d61e2b0cddc040256be11d865661c866c50...,bc1q42tyxyzw2t8tquk0dm4ffvyrlq776dn336y70s8sa9...,578751.0,df1a986f5315dbe75769b7efba017620f07e659e3e2900...,0223390bea8aa598442d056ace37c07e7364da1341b368...,032d4baebebfdeab7a2ecef2fbe109cbef10de95f05aa5...,20420,2019-06-17 04:06:05,...,0.0,17128.0,0.0,2940,2090,540,-0.000775,0.03494538,,
2730,548951x2816x1,548951,9a461d65a7ec250583ae08dc90036670f7038b74d8a2ec...,bc1q6a79t3f606xs3u635z7mge3dkzaxg894p8308qtv0g...,578754.0,09556ea391ed1ad33b9dbb2fafa5c16ce097d69578ba4b...,030c3f19d742ca294a55c00376b3b355c3c90d61c6b6b3...,037eb17d0fee2d20bacea3d78940b40f4ac61a5a7040a2...,1000000,2019-06-17 04:04:38,...,0.0,35060.0,35060.0,2730,218,1070,0.00435,0.0001835569,,
2915,549558x1279x0,549558,2484708911606f16497a85742460c46e5d77f944d0f6f4...,bc1qsm6crya8ve4pghxf37yhwcwgsp8zke4xv3s25tecvq...,578767.0,0c51829b63ba853ebf0e6e7ba69196c1f5a1a63e0e0dec...,02705407cde2e485542ac068c449d8b2966d46c5506ecb...,032d4baebebfdeab7a2ecef2fbe109cbef10de95f05aa5...,20420,2019-06-17 04:05:56,...,0.0,18865.0,0.0,2915,488,540,-0.000499,0.0004019322,,
2764,549087x1404x0,549087,d59b04f38f7f9d7b3e520150ec09274301278cffa39378...,bc1q6k4v7xx3w7c7qq65w2xm485qcmfk9sva8u5sh902q0...,578850.0,eaf1ad7a71b21db6c6f9ba66d4e7ff780b29cacb7fcec2...,029a06f84c9bfddcf4dca173a4d1a540e6ce7f75cc7d1d...,03166d4154c205b9eb9a5f6c0b38925c8b2f6fb0dfa088...,200000,2019-06-17 04:04:52,...,0.0,197853.0,0.0,2764,2661,558,-0.000702,-1.123397e-15,,
36592,549070x2528x1,549070,58f8d8f8681072ed4f7426f9a299b962cb955967bcb181...,bc1qmc39hhgyt7wwr5ykhy00r845razf6c5aqpeunv8jan...,578909.0,ea322bbf924e8e191e5d7b20204d7af1c240c8618b4172...,03864ef025fde8fb587d989186ce6a4a186895ee44a926...,039195c0969d69f9a25839cb44bd5e858bd9e397163895...,10000000,2019-06-03 03:25:27,...,0.0,9996402.0,0.0,36592,6802,5142,0.100518,1.872334e-14,,
2947,549568x580x0,549568,f7c6532e0fd71fcd7937c1d2e1c5d892b8d40d6581f8e9...,bc1q087x35h5c7875j648h8mg8tuq862fxyattzqa5n4v9...,578929.0,bcc30f9c9a0621c03e346bd95465cf6053f6b694e343d4...,032d4baebebfdeab7a2ecef2fbe109cbef10de95f05aa5...,033ec518c6ad5b565a89215d9f59c9d6dd2ca3d757b4c8...,20420,2019-06-17 04:06:08,...,0.0,19751.0,0.0,2947,540,4799,0.000265,-0.03410426,,


**TODO**: Why is length of Dataframe longer than the number of snapshots extracted? Could it be that some channels appear more than once in dataframe?

> **Marginal betweenness for closures** 

In [298]:
#------STABILITY FOR CLOSURES----

# Function to calculate marginal betweenness centrality for all channel closures in snapshot

def bet_mar_close(input_tuple):
    
    block=input_tuple[0]
    G=input_tuple[1]
    block_closes=input_tuple[2]
    G_bets=input_tuple[3]
   

    # For each open calculate marginal betweenness for each node in channel
    
    
    bet_mar_node0_dic_i={} #Dictionary to store marginal betweeness centrality for node0
    bet_mar_node1_dic_i={} #Dictionary to store marginal betweeness centrality for node0
    for close_edge in block_closes:
        
        # Extract info about channel
        channel_id=close_edge[2]['channel_id']
        node0=close_edge[0]
        node1=close_edge[1]
        edge_list=[(node0,node1)]
        
        
        
        # Copy original graph
        g_mar=G.copy() 
        old_nodes=False #If there is at least one old node change to True, to run nx betweeness algo
        
        
        # Retrieve betweenness for nodes in snapshot. Check for node in previous graph
        
        if (g_mar.has_node(node0)):
            node0_bet=G_bets[node0]
            old_nodes=True
        else:
            node0_bet=0
        
        if (g_mar.has_node(node1)):
            node1_bet=G_bets[node1]
            old_nodes=True
        else:
            node1_bet=0
        
        # Define marginal graph by removing edges and extracting connected component
        
        
        if old_nodes:
            g_mar.remove_edges_from(edge_list)   
            connected_components=[c for c in nx.algorithms.components.connected_components(g_mar)]
            g_mar=g_mar.subgraph(connected_components[0]).copy() 
            # Uncomment for aprox
            #g_mar_bet=nx.algorithms.centrality.approximate_current_flow_betweenness_centrality(g_mar,weight='capacity',kmax=10000)
            g_mar_bet=nx.algorithms.centrality.current_flow_betweenness_centrality(g_mar,weight='capacity')
        
            # Update marginal values for node0 and node1
        
            if (g_mar.has_node(node0)): #If connected component of marginal graph contains node0 find betweeness
                node0_bet_pos=g_mar_bet[node0]
            else: # else update with fixed value
                node0_bet_pos=0
            
            
            
            if (g_mar.has_node(node1)): #If connected component of marginal graph contains node1 find betweeness
                node1_bet_pos=g_mar_bet[node1]
            else: # else update with fixed value
                node1_bet_pos=0
            
            
        else:
            node0_bet_pos=0
            node1_bet_pos=0
        
        # Calculate final betweeness
        node0_mar_bet=node0_bet_pos-node0_bet
        node1_mar_bet=node1_bet_pos-node1_bet
        
        # Update dictionary - new betweenness
        bet_mar_node0_dic_i[channel_id]=node0_mar_bet
        bet_mar_node1_dic_i[channel_id]=node1_mar_bet
        
    
    return (bet_mar_node0_dic_i,bet_mar_node1_dic_i)
    

# Script to parallelize bet_mar_open

bet_mar_dicfut=[]
for i in range(1,len(graph_snapshots)):
    
    block=blocks[i]
    block_prev=blocks[i-1]
    block_closes=channel_closures[block]
   
    g=graph_snapshots[i-1]
    g_bet=snapshot_bet[block_prev]
    input_tuple=(block,g,block_closes,g_bet)
    output_tuple=dask.delayed(bet_mar_close)(input_tuple)
    bet_mar_dicfut.append(output_tuple)

futures_bet_mar_close = dask.persist(*bet_mar_dicfut)


In [299]:
# Run computation
start=time.time()
bet_mar_diclist_close = dask.compute(*futures_bet_mar_close)
end=time.time()
print('Compute in seconds: {}'.format(end-start))
print('Size in memory: {}'.format(sys.getsizeof(bet_mar_diclist_close)))


Compute in seconds: 64.99275374412537
Size in memory: 1640


In [300]:
# Test output
print(bet_mar_diclist_close)

(({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({'549037x2737x0': 0.002313189991499001, '549037x2738x0': 0.0006411690078780455}, {'549037x2737x0': 0, '549037x2738x0': 0}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({}, {}), ({},

In [312]:
# Create single dictionaries for node0 and node1 closures

bet_marclose_node0_list=[t[0] for t in bet_mar_diclist_close]
bet_marclose_node1_list=[t[1] for t in bet_mar_diclist_close]

bet_marclose_node0_dic={}
for d in bet_marclose_node0_list:
    bet_marclose_node0_dic.update(d)
    
bet_marclose_node1_dic={}
for d in bet_marclose_node1_list:
    bet_marclose_node1_dic.update(d)

# Test output
print(bet_marclose_node0_dic)

{'549037x2737x0': 0.002313189991499001, '549037x2738x0': 0.0006411690078780455, '549489x1194x1': 0.0008884777262015605}


In [313]:
# Add to DataFrame

# Create empty columns
decisions_df['bet_marclose_node0']=np.nan
decisions_df['bet_marclose_node1']=np.nan

# Populate df with values
decisions_df['bet_marclose_node0']=decisions_df['short_channel_id'].map(bet_marclose_node0_dic)
decisions_df['bet_marclose_node1']=decisions_df['short_channel_id'].map(bet_marclose_node1_dic)

decisions_df_marclose=decisions_df[decisions_df['bet_marclose_node1'].notnull()]
#print(len(decisions_df_filter))
decisions_df_marclose

Unnamed: 0,short_channel_id,open_block,open_transaction,address,close_block,close_transaction,node0,node1,satoshis,last_seen,...,node0_id,node1_id,bet_mar_node0,bet_mar_node1,bet_marclose_node0,bet_marclose_node1,bet_actopen_node0,bet_actopen_node1,bet_actclose_node0,bet_actclose_node1
2745,549037x2738x0,549037,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,bc1q95fytjzs8f7fma2nf66gcva7c3w7hnkdwrkef9pu33...,549037.0,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,028b892b15f5cabcea5165b236db0e36dc06553c323c84...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,908,3654,-0.010145,0.001177,0.000641,0.0,-0.000331,0.001376,-0.000331,0.001376
2744,549037x2737x0,549037,0825da5e96cd45fced3233ebe615721b687285839d3036...,bc1q5mqzhw5e42rfqh250zalwu47ru8gvz4g4k968me0mg...,549037.0,0825da5e96cd45fced3233ebe615721b687285839d3036...,02b95713bbe4609a337f3ca5aab3a75674083ddf5331a4...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,6052,3654,0.018342,0.014761,0.002313,0.0,0.000581,0.001376,0.000581,0.001376
40227,549489x1194x1,549489,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,bc1q25j5l6crv4mrjkjjjw4rzyv890cwwnyyw9dezcqs5x...,549489.0,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,02574ffa55d394b9326f6e5c15992cc0516b0d6e6a79a1...,03a5927b64b1ea8657d5b770d61a3e2d0554fdb5d56877...,2500000,2019-06-13 01:12:27,...,5247,696,-0.019278,-0.006038,0.000888,0.00122,-3e-06,0.006659,-3e-06,0.006659


distributed.client - ERROR - Failed to reconnect to scheduler after 10.00 seconds, closing client
_GatheringFuture exception was never retrieved
future: <_GatheringFuture finished exception=CancelledError()>
concurrent.futures._base.CancelledError


- **Actual change in betweenness (bet_act_nodei)**: The % change between the betweenness centrality, for the node under analysis, given the graph from the previous block and the betweenness centrality of the resulting graph after enacting **all** the decissions (adding or removing a channels) in the current block. Weighted current betweenness centrality is used for this measure.

In [309]:
# Calculate actual difference in betweeness

bet_actopen_node0_dic={}
bet_actopen_node1_dic={}
bet_actclose_node0_dic={}
bet_actclose_node1_dic={}

# List to store tuples of block and node with exceptions
node0_block_ex=[]
node1_block_ex=[]
node0_plus_ex=[]
node1_plus_ex=[]

node0_block_ex_close=[]
node1_block_ex_close=[]
node0_plus_ex_close=[]
node1_plus_ex_close=[]



for i in range(1,len(graph_snapshots)):
    block=blocks[i-1]
    block_plus=blocks[i]
    
    # OPENS: Calculate difference in betweeness for each one
    for open_edge in channel_opens[block_plus]:
        
        # Extract info about open
        channel_id=open_edge[2]['channel_id']
        node0=open_edge[0]
        node1=open_edge[1]
        
        # Define base betweeness. If new node, define as 0
        
        try:
            node0_bet=snapshot_bet[block][node0]
            
        except KeyError:
            node0_bet=0
            node0_block_ex.append((block,node0))
            
            
        try:
            node1_bet=snapshot_bet[block][node1]
            
        except KeyError:
            node1_bet=0
            node1_block_ex.append((block,node1))
        
        
        # Get betweeness after open. If node is not existend, define as 0
        
        try:
            node0_act_bet=snapshot_bet[block_plus][node0]
            
        except KeyError:
            node0_act_bet=0
            node0_plus_ex.append((block_plus,node0))
            
        try:
            node1_act_bet=snapshot_bet[block_plus][node1]
            
        except KeyError:
            node1_act_bet=0
            node1_plus_ex.append((block_plus,node1))
      
        # Calculate difference
        
        node0_act_bet_delta=node0_act_bet-node0_bet
        node1_act_bet_delta=node1_act_bet-node1_bet
        
        #Update dictionary
        bet_actopen_node0_dic[channel_id]=node0_act_bet_delta
        bet_actopen_node1_dic[channel_id]=node1_act_bet_delta
        
  
    
    
    # CLOSURES: Calculate difference in betweeness for each one
    

    for close_edge in channel_closures[block_plus]:
        
        # Extract info about open
        channel_id=close_edge[2]['channel_id']
        node0=close_edge[0]
        node1=close_edge[1]
        
        # Define base betweeness. If new node, define as 0
        
        try:
            node0_bet=snapshot_bet[block][node0]
            
        except KeyError:
            node0_bet=0
            node0_block_ex_close.append((block,node0))
            
            
        try:
            node1_bet=snapshot_bet[block][node1]
            
        except KeyError:
            node1_bet=0
            node1_block_ex_close.append((block,node1))
        
        
        # Get betweeness after close. If node is not existend, define as 0
        
        try:
            node0_act_bet=snapshot_bet[block_plus][node0]
            
        except KeyError:
            node0_act_bet=0
            node0_plus_ex_close.append((block_plus,node0))
            
        try:
            node1_act_bet=snapshot_bet[block_plus][node1]
            
        except KeyError:
            node1_act_bet=0
            node1_plus_ex_close.append((block_plus,node1))
      
        # Calculate difference
        
        node0_act_bet_delta=node0_act_bet-node0_bet
        node1_act_bet_delta=node1_act_bet-node1_bet
        
        #Update dictionary
        bet_actclose_node0_dic[channel_id]=node0_act_bet_delta
        bet_actclose_node1_dic[channel_id]=node1_act_bet_delta      
        
    

In [235]:
# OPEN Print blocks and nodes (block,node) that raised exceptions
print("----EXCEPTIONS RAISED----")
print("Node 0 not present in initial block:")
print(node0_block_ex)
print("Node 1 not present in initial block:")
print(node1_block_ex)
print("Node 0 not present in next block:")
print(node0_plus_ex)
print("Node 1 not present in next block:")
print(node1_plus_ex)

----EXCEPTIONS RAISED----
Node 0 not present in initial block:
[(548588, 5400), (548618, 3350), (548618, 4479), (548628, 2750), (548628, 2750), (548677, 2661), (548728, 3139), (548759, 3111), (548839, 1572), (548872, 2434), (548879, 2034), (548898, 1675), (548898, 1675), (548905, 1020), (548943, 7340), (549028, 1511), (549070, 2), (549092, 4000), (549094, 4735), (549096, 5714), (549202, 2325), (549204, 717), (549209, 6916), (549210, 7341), (549277, 4198), (549381, 2382), (549383, 7126), (549403, 3748), (549403, 3748), (549403, 3748), (549403, 3748), (549403, 3748), (549403, 3748), (549513, 816), (549590, 193), (549617, 757), (549622, 757), (549671, 943)]
Node 1 not present in initial block:
[(548568, 6619), (548744, 4828), (548800, 2250), (548898, 1675), (548898, 1675), (548898, 1675), (548898, 1675), (548898, 1675), (548899, 2604), (548905, 5966), (548943, 4185), (549025, 1329), (549028, 1511), (549036, 3654), (549036, 3654), (549036, 3654), (549036, 3654), (549036, 3654), (549036, 36

In [310]:
# CLOSE Print blocks and nodes (block,node) that raised exceptions
print("----EXCEPTIONS RAISED----")
print("Node 0 not present in initial block:")
print(node0_block_ex_close)
print("Node 1 not present in initial block:")
print(node1_block_ex_close)
print("Node 0 not present in next block:")
print(node0_plus_ex_close)
print("Node 1 not present in next block:")
print(node1_plus_ex_close)

----EXCEPTIONS RAISED----
Node 0 not present in initial block:
[]
Node 1 not present in initial block:
[(549036, 3654), (549036, 3654)]
Node 0 not present in next block:
[]
Node 1 not present in next block:
[]


In [302]:
# Test output
#bet_actclose_node0_dic

In [311]:
# Add to DataFrame - OPENS

# Create empty columns
decisions_df['bet_actclose_node0']=np.nan
decisions_df['bet_actclose_node1']=np.nan

# Populate df with values
decisions_df['bet_actclose_node0']=decisions_df['short_channel_id'].map(bet_actclose_node0_dic)
decisions_df['bet_actclose_node1']=decisions_df['short_channel_id'].map(bet_actclose_node1_dic)

decisions_df_actclose=decisions_df[decisions_df['bet_actclose_node0'].notnull()]
#print(len(decisions_df_actopen))
decisions_df_actclose.head(10)

Unnamed: 0,short_channel_id,open_block,open_transaction,address,close_block,close_transaction,node0,node1,satoshis,last_seen,...,node0_id,node1_id,bet_mar_node0,bet_mar_node1,bet_marclose_node0,bet_marclose_node1,bet_actopen_node0,bet_actopen_node1,bet_actclose_node0,bet_actclose_node1
2745,549037x2738x0,549037,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,bc1q95fytjzs8f7fma2nf66gcva7c3w7hnkdwrkef9pu33...,549037.0,b7128bbbe422b4f18fad71b091eed1f9e4b0d231be8117...,028b892b15f5cabcea5165b236db0e36dc06553c323c84...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,908,3654,-0.010145,0.001177,-0.008922,0.001376,-0.000331,0.001376,-0.000331,0.001376
2744,549037x2737x0,549037,0825da5e96cd45fced3233ebe615721b687285839d3036...,bc1q5mqzhw5e42rfqh250zalwu47ru8gvz4g4k968me0mg...,549037.0,0825da5e96cd45fced3233ebe615721b687285839d3036...,02b95713bbe4609a337f3ca5aab3a75674083ddf5331a4...,038b36a43c38f75cd15bb25394f1cd162f717df0055852...,400000,2019-08-22 02:59:19,...,6052,3654,0.018342,0.014761,0.000272,0.001376,0.000581,0.001376,0.000581,0.001376
40227,549489x1194x1,549489,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,bc1q25j5l6crv4mrjkjjjw4rzyv890cwwnyyw9dezcqs5x...,549489.0,58dafe493648fbdd69143c26e0cf8a66ae11a272c2739d...,02574ffa55d394b9326f6e5c15992cc0516b0d6e6a79a1...,03a5927b64b1ea8657d5b770d61a3e2d0554fdb5d56877...,2500000,2019-06-13 01:12:27,...,5247,696,-0.019278,-0.006038,-0.019414,0.006659,-3e-06,0.006659,-3e-06,0.006659






- **Marginal betweeness pairwise stability (bet_mar_pairstab)**: Evaluates if given the marginal graph that results from just enacting this decission is consistent with pairwise stability, from a betweenness perspective.

- **Actual betweeness pairwise stability (bet_act_pairstab)**: Evaluates if given the marginal graph that results from all the decisions in the block is consitend with pairwise stability, from a betweenness perspective. 




### Nash stability 

- **% Change with respect to not making decision (bet_binstat_deltai)**: The % change in betwewnness centrality, for the node under analysis, given the resulting graph after all of the decissions have been executed. 
- **Nash compatible - binary strategy (bet_binstat_nash)**: Returns true if given the other decissions enacted in the block not making decision would have NOT have resulted in higher betweenness centrality. This tells me if my strategy helped me be better off (took into account what others were doing)

(Optional approaches - Check for tracktability)
- **Nash compatible - close only strategy (bet_closestat_nash)**: Returns true if given the other decissions enacted in the block, closing any other channels would NOT have not resulted in higher betwneenness centrality. (NOTE: Check if there are combinatorial considerations, if so just look at closings up to x) 
- **Nash compatible - close/open (bet_allstat_nash)**: Returns true if given the other decissions enacted in the block, closing any other channels (with any node) or opening a channel with one of the round participants would NOT have not resulted in lower betwneenness centrality. (NOTE: To make it reasonable and constraint the strategy space only consider 'similar nodes' or with relationships in the past?).



### Efficiency
- **Average betweeness per block (bet_effic)**: Average betweenness centrality for all the nodes. 



## Connectivity

### Pairwise stability 

- **Marginal % change in connectivity (con_mar_deltai)**: The % change between the shortest path average, for the node under analysis, given the graph from the previous block and the shortest path average of the resulting graph after enacting the decission (adding or removing a channel). Weighted shortest path (_single_source_dijkstra_path_) is used for this measure.

- **Actual % change in connectivity (con_act_deltai)**: The % change between the shortest path average, for the node under analysis, given the graph from the previous block and the shortest path average of the resulting graph after enacting **all** the decissions (adding or removing a channels) in the current block. Weighted shortest path (_single_source_dijkstra_path_) is used for this measure.

- **Marginal connectivity pairwise stability (con_mar_pairstab)**: Evaluates if given the marginal graph that results from just enacting this decission is consistent with pairwise stability, from a connectivity perspective.

- **Actual connectivity pairwise stability (con_act_pairstab)**: Evaluates if given the marginal graph that results from all the decisions in the block is consitend with pairwise stability, from a connectivity perspective.  



### Nash stability 

- **% Change with respect to not making decision (con_binstat_deltai)**: The % change in shortest path average, for the node under analysis, given the resulting graph after all of the decissions have been executed. 
- **Nash compatible - binary strategy (con_binstat_nash)**: Returns true if given the other decissions enacted in the block not making decision would have NOT have resulted in higher shortest path average. NOTE: This indicates if the strategy selected made the node better off (took into account what others were doing)

(Optional approaches - Check for tracktability)
- **Nash compatible - close only strategy (con_closestat_nash)**: Returns true if given the other decissions enacted in the block, closing any other channels would NOT have not resulted in higher shortest path average. (NOTE: Check if there are combinatorial considerations, if so just look at closings up to x) 
- **Nash compatible - close/open (con_allstat_nash)**: Returns true if given the other decissions enacted in the block, closing any other channels (with any node) or opening a channel with one of the round participants would NOT have not resulted in lower shortest path average. (NOTE: To make it reasonable and constraint the strategy space only consider 'similar nodes' or with relationships in the past?).



### Efficiency
- **Average betweeness per block (bet_effic)**: Average shortest path average for all the nodes. 





## Utility Functions

In [93]:
def take(n, iterable):
    "Return first n items of the iterable as a list"
    return list(islice(iterable, n))