In [None]:
import os

import networkx as nx

import create_datasets.create_nx_datasets
import networks.randomize_network as rn

### Random networks
Create 100 random networks for each randomization method ("Shuffled" and "Rewired") and for each gene set (AD and NDD).

#### AD gene set

In [None]:
# Generate 100 "shuffled" and 100 "rewired" random counterparts of the AD PPI network.
indir = 'data'
outdir = 'data/random_networks'

disease = 'AD'
network = 'PPI'

infile = f'{indir}/{disease}_STRING_PPI_edgelist_biggest.txt'
original = rn.load_graph(infile)

# nx.write_edgelist does not create missing directories, so make them up front.
for method in ('shuffled', 'rewired'):
    os.makedirs(f'{outdir}/{method}', exist_ok=True)

for i in range(1, 101):
    shuffled = rn.shuffle_nodes(original)
    nx.write_edgelist(shuffled, f'{outdir}/shuffled/{disease}_{network}_rand{i}_edgelist.txt')

    # generate_RDPN is given the edge-list path rather than the loaded graph.
    # NOTE(review): assumes it returns a networkx graph -- confirm.
    rewired = rn.generate_RDPN(infile)
    # Write the rewired graph; the shuffled graph must not end up in rewired/.
    nx.write_edgelist(rewired, f'{outdir}/rewired/{disease}_{network}_rand{i}_edgelist.txt')


#### NDD gene set

In [None]:
# Generate 100 "shuffled" and 100 "rewired" random counterparts of the ND PPI network.
# Paths are set here explicitly: later cells rebind `outdir`, so relying on
# the value left by an earlier cell breaks when cells are re-run out of order.
indir = 'data'
outdir = 'data/random_networks'

disease = 'ND'
network = 'PPI'

infile = f'{indir}/{disease}_STRING_PPI_edgelist_biggest.txt'
original = rn.load_graph(infile)

# nx.write_edgelist does not create missing directories, so make them up front.
for method in ('shuffled', 'rewired'):
    os.makedirs(f'{outdir}/{method}', exist_ok=True)

for i in range(1, 101):
    shuffled = rn.shuffle_nodes(original)
    nx.write_edgelist(shuffled, f'{outdir}/shuffled/{disease}_{network}_rand{i}_edgelist.txt')

    # generate_RDPN is given the edge-list path rather than the loaded graph.
    # NOTE(review): assumes it returns a networkx graph -- confirm.
    rewired = rn.generate_RDPN(infile)
    # Write the rewired graph; the shuffled graph must not end up in rewired/.
    nx.write_edgelist(rewired, f'{outdir}/rewired/{disease}_{network}_rand{i}_edgelist.txt')

### Random graph datasets
Create corresponding graph-datasets for each random network. This takes time because 800 different graph-datasets (2 methods x 2 gene sets x 100 random networks x 2 different targets) are built.

#### PET target - Shuffled datasets - AD gene set

In [None]:
import os, sys, datetime, pickle

In [None]:
# Build and pickle one graph dataset per shuffled AD network (PET target).
dataset = 'ADNI'
target = 'PET'
disease = 'AD'
network = 'shuffled'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')

#### PET target - Shuffled datasets - NDD gene set

In [None]:
# Build and pickle one graph dataset per shuffled ND network (PET target).
dataset = 'ADNI'
target = 'PET'
disease = 'ND'
network = 'shuffled'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')

#### PET&DX target - Shuffled datasets - AD gene set

In [None]:
# Build and pickle one graph dataset per shuffled AD network (PET&DX target).
dataset = 'ADNI'
target = 'PETandDX'
disease = 'AD'
network = 'shuffled'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')

#### PET&DX target - Shuffled datasets - NDD gene set

In [None]:
# Build and pickle one graph dataset per shuffled ND network (PET&DX target).
dataset = 'ADNI'
target = 'PETandDX'
disease = 'ND'
network = 'shuffled'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')

#### PET target - Rewired datasets - AD gene set

In [None]:
# Build and pickle one graph dataset per rewired AD network (PET target).
dataset = 'ADNI'
target = 'PET'
disease = 'AD'
network = 'rewired'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')

#### PET target - Rewired datasets - NDD gene set

In [None]:
# Build and pickle one graph dataset per rewired ND network (PET target).
dataset = 'ADNI'
target = 'PET'
disease = 'ND'
network = 'rewired'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')

#### PET&DX target - Rewired datasets - AD gene set

In [None]:
# Build and pickle one graph dataset per rewired AD network (PET&DX target).
dataset = 'ADNI'
target = 'PETandDX'
disease = 'AD'
network = 'rewired'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')

#### PET&DX target - Rewired datasets - NDD gene set

In [None]:
# Build and pickle one graph dataset per rewired ND network (PET&DX target).
dataset = 'ADNI'
target = 'PETandDX'
disease = 'ND'
network = 'rewired'

indir = 'data'
outdir = f'data/graph_datasets/{target}/{network}'
# Make sure the destination exists before the first pickle is written.
os.makedirs(outdir, exist_ok=True)
print('Input directory:', indir)
print('Output directory:', outdir)
print()

for i in range(1, 101):

    start_time = datetime.datetime.now()
    print()

    # Call through the package path: the notebook's
    # `import create_datasets.create_nx_datasets` binds only `create_datasets`.
    # `i` is passed as the last argument; presumably it selects random network
    # number i -- confirm against create_nx_datasets.main.
    result_nodes = create_datasets.create_nx_datasets.main(
        indir, dataset, target, disease, network, 'missense', i)
    print('Coding: number of missense variants per node')

    outfile = f'{outdir}/{disease}_PPI_rand{i}_missense.pkl'
    # Save first, report afterwards, so the message is only shown on success.
    with open(outfile, 'wb') as f:
        pickle.dump(result_nodes, f)
    print('Resulting dataset saved at:', outfile)
    print()

    result_nodes_time = datetime.datetime.now()
    print('Processing time:', result_nodes_time - start_time)
    print('\n\n')