## Summary Data for GraphML Files

In [1]:
import graph_tool.all as gt
import os
import numpy as np
import graph_tool
from tqdm import tqdm_notebook

from lib.analysis import clustering
from lib.analysis import dist
from lib.analysis import model
from lib.analysis import power
from lib.analysis import stats

## Part 1: Summary Statistics

Basic statistics for each country's government

In [2]:
# Registry of loaded graphs; starts out empty.
graphs = dict()
# Directory-entry names to leave out when walking the data directory.
ignore = ['.DS_Store', 'us']
# Data directory, given relative to the current working directory.
data = 'data'

In [3]:
# Load every GraphML file that sits directly inside a sub-directory of `data`.
# `graphs` is keyed by the file name with the ".graphml" suffix removed, so two
# files with the same name in different sub-directories overwrite each other;
# iterating in sorted order makes the surviving entry (and the dict order)
# reproducible, since os.listdir() returns entries in arbitrary order.
graphml_ext = '.graphml'
for country in sorted(os.listdir(data)):
    path = os.path.join(data, country)
    # Skip ignored names and stray plain files: os.listdir() raises
    # NotADirectoryError when handed something that is not a directory.
    if country in ignore or not os.path.isdir(path):
        continue
    for fname in sorted(os.listdir(path)):
        if fname in ignore or not fname.endswith(graphml_ext):
            continue
        key = fname[:-len(graphml_ext)]
        graphs[key] = gt.load_graph(os.path.join(path, fname))

In [None]:
# Write summary.csv: one row per entry in `graphs`, made of the graph's name
# followed by the text of stats.summary(g).
# The header starts with a 'Name' column because every data row starts with
# the graph name; without it the header is shifted one column to the left.
# NOTE(review): assumes str(stats.summary(g)) is already a comma-separated
# list of the eight statistics in header order -- confirm against
# lib.analysis.stats.
summary_header = ['Name',
                  'Number of Edges', 'Number of Vertices',
                  'Clustering Coefficient', 'Average Degree',
                  'Average Excess Degree', 'Average Distance',
                  'Size of LCC', 'Number of CC']
# The file is only written, never read back, so plain "w" is sufficient.
with open("summary.csv", "w") as f:
    f.write(','.join(summary_header) + '\n')
    for name, g in graphs.items():
        print(name)  # progress output: shows which graph is being summarised
        f.write(f'{name},{str(stats.summary(g))}\n')

net_se


## Part 2: Assortativity

Computes assortativity on a specified attribute for every country across years

In [4]:
# Maps GraphML file name (extension included) -> loaded graph.
# NOTE(review): keys are bare file names, so identically named files in
# different directories overwrite each other -- confirm names are unique.
individual_graphs = {}

# NOTE(review): absolute, machine-specific path; it has to be edited before
# this cell can run on another machine.
root = '/Users/benjaminlai/Desktop/CSE-416-Final-Project/data/'
countries = os.listdir(root)
# "country/net/" for every sub-directory of every country directory.
# The isdir() checks skip plain files (e.g. macOS '.DS_Store'), on which
# os.listdir() would raise NotADirectoryError.
nets = [country + "/" + net + "/" for country in countries
                            if os.path.isdir(root + country)
                            for net in os.listdir(root + country)
                            if not net.endswith('.graphml')
                            and os.path.isdir(root + country + "/" + net)]

for net in nets:
    for x in os.listdir(root + net):
        if x.endswith('.graphml'):
            individual_graphs[x] = gt.load_graph(root + net + x)

In [9]:
# Write assortivity_summary.csv: one row per graph in `individual_graphs`,
# made of the graph's name followed by the text of
# stats.assortativity_summary(g, attribute).
# The header starts with a 'Name' column because every data row starts with
# the graph name; without it the header has one column fewer than the rows.
attribute = "g"  # same attribute for every graph, so set once outside the loop
# The file is only written, never read back, so plain "w" is sufficient.
with open("assortivity_summary.csv", "w") as f:
    f.write(','.join(['Name', 'Assortivity Measure']) + '\n')
    for name, g in individual_graphs.items():
        # Graphs without any vertex property map are skipped.
        # NOTE: most graphs have no vertex property maps; the reason is unknown.
        # NOTE(review): this only checks that *some* vertex property exists,
        # not that `attribute` is one of them -- confirm what
        # stats.assortativity_summary expects.
        if not g.vertex_properties.keys():
            continue
        f.write(f'{name},{str(stats.assortativity_summary(g, attribute))}\n')