In [2]:
import networkx as nx
import graph_tool.all as gt
import pandas as pd

## Preprocessing of datasets
All datasets are converted from csv/edgelists to graphml format.

### Mouse visual cortex

`data/mouse_vc.graphml`

*Source*: <https://s3.amazonaws.com/connectome-graphs/mouse/mouse_visual.cortex_2.graphml>

### Yeast gene regulatory network

From `data/YRN.txt` to `data/yeast8k.graphml`

*Source*: <http://archive.gersteinlab.org/proj/Hierarchy_Rewiring/PNAS_hier/YRN.txt>

In [None]:
# Build a directed graph from the tab-separated yeast regulatory network file.
# read_adjlist takes the first token of each line as the source node and every
# following token as one of its targets; node labels are kept as strings.
G = nx.read_adjlist(
    "data/YRN.txt",
    delimiter="\t",
    nodetype=str,
    create_using=nx.DiGraph,
)

# Export the graph in GraphML format.
nx.write_graphml(G, "data/yeast8k.graphml")

### E. Coli gene regulatory network

From `data/ERN.txt` to `data/ecoli2k.graphml`

*Source*: <http://archive.gersteinlab.org/proj/Hierarchy_Rewiring/PNAS_hier/ERN.txt>

In [None]:
# Build a directed graph from the tab-separated E. coli regulatory network file.
# read_adjlist takes the first token of each line as the source node and every
# following token as one of its targets; node labels are kept as strings.
G = nx.read_adjlist(
    "data/ERN.txt",
    delimiter="\t",
    nodetype=str,
    create_using=nx.DiGraph,
)

# Export the graph in GraphML format.
nx.write_graphml(G, "data/ecoli2k.graphml")

### Facebook Ego Network

From `data/facebook_combined.txt` to `data/fbego.graphml`

*Source*: <http://snap.stanford.edu/data/facebook.tar.gz>


In [None]:
# Convert the Facebook ego-network edge list to GraphML.
#
# The input holds one "<node> <node>" pair per line. SNAP ships this file with
# the two ids separated by a space (NOTE(review): confirm against the downloaded
# file). Splitting on "\t" therefore never splits a line: each whole line would
# be read as a single node label and the graph would end up with no edges.
# delimiter=None splits on any run of whitespace, so both space- and
# tab-separated files parse correctly.
#
# NOTE(review): the SNAP ego-Facebook network is described as undirected; a
# DiGraph is kept here to match the other datasets, so every pair is stored in
# file order only (u -> v). Confirm this is what downstream analysis expects.
G = nx.read_edgelist(
    "data/facebook_combined.txt",
    delimiter=None,
    nodetype=str,
    create_using=nx.DiGraph,
    data=False,  # lines carry no edge attributes, only the two endpoints
)
nx.write_graphml(G, path="data/fbego.graphml")

### Bitcoin Alpha trust Network

From `data/soc-sign-bitcoinalpha.csv.gz` to `data/bc.graphml`

*Source*: <https://snap.stanford.edu/data/soc-sign-bitcoinalpha.csv.gz>


In [3]:
# Convert the Bitcoin Alpha trust network to GraphML.
#
# Per the SNAP dataset description each CSV line is SOURCE,TARGET,RATING,TIME
# (NOTE(review): confirm against the downloaded file). The file is an edge list
# with two trailing data columns, not an adjacency list: read_adjlist would
# treat *every* field after the first as a neighbour and turn ratings and
# timestamps into bogus nodes and edges. read_edgelist takes only the first two
# fields as endpoints and stores the remaining ones as edge attributes.
G = nx.read_edgelist(
    "data/soc-sign-bitcoinalpha.csv.gz",  # .gz paths are decompressed by networkx
    delimiter=",",
    nodetype=str,
    create_using=nx.DiGraph,
    # float for the timestamp accepts both integer and fractional epoch values
    data=(("rating", int), ("time", float)),
)
nx.write_graphml(G, path="data/bc.graphml")

### Python Dependency Network

From `data/requirements.csv` to `data/pydep.graphml`

*Source*: <http://kgullikson88.github.io/blog/Downloads/PypiDependencies/requirements.csv>


In [4]:
# Convert the PyPI requirements table into a directed dependency graph.
with open("data/requirements.csv") as f:
    requirements_raw = pd.read_csv(f, delimiter=",")

# Drop the columns that are not used for the edges and discard incomplete rows.
# Built as a chain (no inplace mutation) so re-running the cell is idempotent.
df = (
    requirements_raw
    .drop(columns=["package", "package_version"])
    .dropna(axis=0)
    .reset_index(drop=True)
)

# One directed edge per remaining row, pointing from the value in column 1 to
# the value in column 0 (positional access on the remaining columns).
# NOTE(review): presumably this is requirement -> dependent package; confirm the
# column order of the CSV.
# Rows whose two values are equal are skipped, so the graph has no self-loops
# and no separate self-loop removal pass is needed.
elist = [(row[1], row[0]) for row in df.values if row[1] != row[0]]

G = nx.DiGraph(elist)

# NOTE(review): the section text above names the output data/pydep.graphml while
# this cell writes data/pydep2.graphml; confirm which filename is intended.
nx.write_graphml(G, path="data/pydep2.graphml")