# Network Analysis for BeveL Betaseries 

Inputs: betaseries files for BeveL participants (n=85) drawn from 4 conditions: choice, reward taste, punishment taste, neutral rinse

Analysis workflow is mapped off this paper: https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5429248/


### Input Data
- One timeseries txt file per participant. Conditions must be separated in unique folder
- Need a txt file of the labels for each ROI

### Outputs
- Circle graph showing thresholded connectivity of each ROI. ROI color denotes modules. 
- Circle graph of module edge weights. 
- CSV file with module assignment & nodal metrics for each ROI

### Running the notebook
The following parts of the code should be changed
1. Filepath to timeseries 
2. Name of circle graph figure
3. Module dict to assign to module graph
4. Name of module graph figure
5. Name of csv file

## Note: 
### Print Statements are commented out to save time, remove comments if desired. 

In [1]:
# Imports 
import glob
import os
import networkx as nx
import numpy as np
import pandas as pd
import bz2
import pickle
import community
import statistics
import pdb
from scipy import stats
import scipy
import matplotlib
matplotlib.use("Qt5Agg")
import matplotlib.pyplot as plt

from visbrain.objects import ConnectObj, SceneObj, SourceObj, BrainObj, ColorbarObj
from visbrain.io import download_file




In [2]:
basepath = '/Users/jennygilbert/Documents/'

## Load in the data

### Find the path to the data

In [24]:
#Find the path to data
file_list = glob.glob(os.path.join(basepath,'betaseries_bevel/4_combine_timeseries/punishment/*.txt'))

In [25]:
#Check the files found
print(file_list)

['/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-001_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-002_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-003_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-004_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-005_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-006_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-007_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-009_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-010_punish.txt', '/Users/jennygilbert/Documents/betaseries_bevel/4_combine_timeseries/punishment/sub-011_pu

In [26]:
#Check to see how many participants 
#len(file_list)

### Make a dictionary to read in the files to pandas

In [27]:
#Setting the ditionary
my_dict={}
for item in file_list:
    name=item.split('/')[7].split('.')[0]
    print(name)
    my_dict.setdefault(name, []).append(item)

sub-001_punish
sub-002_punish
sub-003_punish
sub-004_punish
sub-005_punish
sub-006_punish
sub-007_punish
sub-009_punish
sub-010_punish
sub-011_punish
sub-012_punish
sub-013_punish
sub-014_punish
sub-015_punish
sub-016_punish
sub-017_punish
sub-018_punish
sub-019_punish
sub-020_punish
sub-021_punish
sub-022_punish
sub-024_punish
sub-025_punish
sub-026_punish
sub-027_punish
sub-028_punish
sub-029_punish
sub-030_punish
sub-031_punish
sub-032_punish
sub-033_punish
sub-034_punish
sub-035_punish
sub-036_punish
sub-037_punish
sub-038_punish
sub-039_punish
sub-040_punish
sub-041_punish
sub-042_punish
sub-043_punish
sub-044_punish
sub-045_punish
sub-046_punish
sub-047_punish
sub-048_punish
sub-050_punish
sub-052_punish
sub-053_punish
sub-054_punish
sub-055_punish
sub-056_punish
sub-057_punish
sub-058_punish
sub-059_punish
sub-060_punish
sub-061_punish
sub-062_punish
sub-063_punish
sub-064_punish
sub-066_punish
sub-067_punish
sub-068_punish
sub-069_punish
sub-070_punish
sub-071_punish
sub-072_pu

In [28]:
# Checking to make sure its populated
#my_dict['sub-024_reward']

### Read the data from the dictionary into pandas

In [29]:
#Setting the data dictionary
data_dict={}
for key, value in my_dict.items():
    for i in value:
        data_dict.setdefault(key, []).append(pd.read_csv(i, sep='\t' ,header=None,index_col=False))

In [30]:
#Check the dictionary
data_dict.keys()

dict_keys(['sub-001_punish', 'sub-002_punish', 'sub-003_punish', 'sub-004_punish', 'sub-005_punish', 'sub-006_punish', 'sub-007_punish', 'sub-009_punish', 'sub-010_punish', 'sub-011_punish', 'sub-012_punish', 'sub-013_punish', 'sub-014_punish', 'sub-015_punish', 'sub-016_punish', 'sub-017_punish', 'sub-018_punish', 'sub-019_punish', 'sub-020_punish', 'sub-021_punish', 'sub-022_punish', 'sub-024_punish', 'sub-025_punish', 'sub-026_punish', 'sub-027_punish', 'sub-028_punish', 'sub-029_punish', 'sub-030_punish', 'sub-031_punish', 'sub-032_punish', 'sub-033_punish', 'sub-034_punish', 'sub-035_punish', 'sub-036_punish', 'sub-037_punish', 'sub-038_punish', 'sub-039_punish', 'sub-040_punish', 'sub-041_punish', 'sub-042_punish', 'sub-043_punish', 'sub-044_punish', 'sub-045_punish', 'sub-046_punish', 'sub-047_punish', 'sub-048_punish', 'sub-050_punish', 'sub-052_punish', 'sub-053_punish', 'sub-054_punish', 'sub-055_punish', 'sub-056_punish', 'sub-057_punish', 'sub-058_punish', 'sub-059_punish',

In [31]:
#Check for the dataframe
#data_dict['sub-058_reward']

### Create a new dictionary with correlation matrix

In [32]:
#Setting up the correlation dictionary
cor_dict={}

for key, value in data_dict.items():
    value[0]
    #pdb.set_trace()
    cor_matrix = value[0].corr()
    cor_dict[key] = cor_matrix
    

In [33]:
#check the dictionary
#list(cor_dict.values())[3]

### Make a dictionary of labels for the nodes

In [34]:
#This points to a txt file with the ROI names in a list separated by commas
path = os.path.join(basepath,'betaseries_bevel/5_analysis/labels.txt')
df_label = pd.read_csv(path, sep=',')

#df_label.head()

In [35]:
labels_dict = {}
n=0
for item in df_label:
    labels_dict[n]=item
    n=n+1

In [36]:
print(labels_dict)

{0: 'Amygdala_L', 1: 'Amygdala_R', 2: 'Dorsal_striatum_L', 3: 'Dorsal_striatum_R', 4: 'Fusiform_gyrus_L', 5: 'Fusiform_gyrus_R', 6: 'Hippocampus_L', 7: 'Hippocampus_R', 8: 'Insula_L', 9: 'Insula_R', 10: 'Intracalcarine_cortex_L', 11: 'Intracalcarine_cortex_R', 12: 'lOFC_L', 13: 'lOFC_R', 14: 'mOFC_L', 15: 'mOFC_R', 16: 'Oral_somatosensory_cortex_R', 17: 'Oral_somatosensory_cortex_L', 18: 'Precuneus_L', 19: 'Precuneus_R', 20: 'Ventral_striatum_L', 21: 'Ventral_striatum_R', 22: 'vlPFC_L', 23: 'vlPFC_R', 24: 'vlThalamus_L', 25: 'vlThalamus_R', 26: 'vmPFC_L', 27: 'vmPFC_R'}


### Function to create a graph with positive or negative values and minimum correlation value

In [37]:
def create_corr_network_5(G, corr_direction, min_correlation):

    ##Creates a copy of the graph
    H = G.copy()
    
    ##Checks all the edges and removes some based on corr_direction
    for stock1, stock2, weight in list(G.edges(data=True)):
        ##if we only want to see the positive correlations we then delete the edges with weight smaller than 0        
        if corr_direction == "positive":
            ####it adds a minimum value for correlation. 
            ####If correlation weaker than the min, then it deletes the edge
            if weight["weight"] <0 or weight["weight"] < min_correlation:
                H.remove_edge(stock1, stock2)
        ##this part runs if the corr_direction is negative and removes edges with weights equal or largen than 0
        else:
            ####it adds a minimum value for correlation. 
            ####If correlation weaker than the min, then it deletes the edge
            if weight["weight"] >=0 or weight["weight"] > min_correlation:
                H.remove_edge(stock1, stock2)
    return(H)

### Function to make a graph object BY SUBJECT
This will return:
- The edges (noramlized R correlation matrix, in pandas dataframe)
- The correlations (absolute value of the edges in a numpy dataframe)
- The mean_FC (the mean functional connectivity per subject/run)
- The graphs (this will contain the raw graph object G as well as the the partion values from the modularity calculation)
- The modules (communitites in the network at the participant level

## Changes from the First Iteration

1. Test for mean,sd, and module assignment distribution among participant's graphs

In [38]:
def make_graphs(list_o_data, direction, min_cor):
    edge_dict={}
    cor_dict={}
    FC_dict={}
    sd_dict={}
    graph_dict={}
    partition_dict={}
    for key, values in list_o_data.items():
            #i=i.set_index(labels.ID)
            #i.rename(columns=labels.ID, inplace=True)
            ########################################
            edge_dict.setdefault(key, []).append(values)
            ########################################
            cor_matrix = np.asmatrix(values)
            x=abs(cor_matrix)
            mu=x.mean()
            sd=x.std()
            ########################################
            cor_dict.setdefault(key, []).append(x)
            ########################################
            FC_dict.setdefault(key, []).append(mu)
            sd_dict.setdefault(key, []).append(sd)
            ########################################
            G = nx.from_numpy_matrix(cor_matrix)
            #for i, nlrow in labels.iterrows():
                #G.node[i].update(nlrow[0:].to_dict())
            ########################################
            graph_dict.setdefault(key, []).append(G)
            ########################################
            partition = community.best_partition(create_corr_network_5(G, direction,min_cor))
            ########################################
            partition_dict.setdefault(key, []).append(partition)
            ########################################
    return({'edges':edge_dict, 'correlations':cor_dict, 'mean_FC':FC_dict, 'stdev':sd_dict, 'graphs':graph_dict,'modules':partition_dict})

### Apply the function to correlations & check output

In [39]:
# Apply function
GRAPHS = make_graphs(cor_dict, "positive", 0)

In [40]:
# Check the keys for the dictionary
GRAPHS.keys()

dict_keys(['edges', 'correlations', 'mean_FC', 'stdev', 'graphs', 'modules'])

In [41]:
# Check modules for one subject
GRAPHS['stdev']['sub-001_punish']

[0.2085705198242629]

In [42]:
#Check to make sure graphs are filled
#Test = GRAPHS['graphs']['sub-001_reward'][0]
#Test.edges(data=True)

In [43]:
GRAPHS['mean_FC']

{'sub-001_punish': [0.2984725547965786],
 'sub-002_punish': [0.36187669892176433],
 'sub-003_punish': [0.23179400836690212],
 'sub-004_punish': [0.2218585345684793],
 'sub-005_punish': [0.3264160988593797],
 'sub-006_punish': [0.2378711677620616],
 'sub-007_punish': [0.24981460869514568],
 'sub-009_punish': [0.29231269564476253],
 'sub-010_punish': [0.2739706441707339],
 'sub-011_punish': [0.39826603868875093],
 'sub-012_punish': [0.36764007982188884],
 'sub-013_punish': [0.3312139442024204],
 'sub-014_punish': [0.2345046910925483],
 'sub-015_punish': [0.281123567143881],
 'sub-016_punish': [0.284660470914947],
 'sub-017_punish': [0.2921770618617725],
 'sub-018_punish': [0.2624712527541421],
 'sub-019_punish': [0.2580907630786738],
 'sub-020_punish': [0.25383758934187167],
 'sub-021_punish': [0.24124403459043567],
 'sub-022_punish': [0.25799381409298494],
 'sub-024_punish': [0.22938628671486858],
 'sub-025_punish': [0.2619255208732469],
 'sub-026_punish': [0.23971396055766653],
 'sub-0

### Get the standard deviation of the mean correlation

In [44]:
#statistics.stdev(GRAPHS['mean_FC'])
m=[]

for key,value in GRAPHS['mean_FC'].items():
    m.append(value[0])

In [45]:
#describe the mean correlation of participant's graphs
stats.describe(m)

DescribeResult(nobs=85, minmax=(0.18767806940114912, 0.5022611328907918), mean=0.3047133910764402, variance=0.004022407263029967, skewness=1.0784310430684483, kurtosis=1.356752359594437)

In [46]:
statistics.mean(m)

0.3047133910764402

In [47]:
m

[0.2984725547965786,
 0.36187669892176433,
 0.23179400836690212,
 0.2218585345684793,
 0.3264160988593797,
 0.2378711677620616,
 0.24981460869514568,
 0.29231269564476253,
 0.2739706441707339,
 0.39826603868875093,
 0.36764007982188884,
 0.3312139442024204,
 0.2345046910925483,
 0.281123567143881,
 0.284660470914947,
 0.2921770618617725,
 0.2624712527541421,
 0.2580907630786738,
 0.25383758934187167,
 0.24124403459043567,
 0.25799381409298494,
 0.22938628671486858,
 0.2619255208732469,
 0.23971396055766653,
 0.37580986347479456,
 0.18767806940114912,
 0.29876429803169013,
 0.30005010762663054,
 0.320850250380847,
 0.24475327027101418,
 0.26955165238007023,
 0.29312364086772486,
 0.2590993390541854,
 0.27383836824751107,
 0.2972464165348981,
 0.3120679489940092,
 0.24010980251075523,
 0.27244953706393354,
 0.22338350560138376,
 0.27643285502296244,
 0.31040499664209675,
 0.40136519373802243,
 0.4689283375153202,
 0.36735333682708726,
 0.29965406453514365,
 0.22485625378889973,
 0.298942

In [48]:
#Show the histogram of average correlation across participant's graphs

hist, bin_edges = scipy.histogram(m, bins = 10) 
  
# Checking the results 
print ("No. of points in each bin : ", hist) 
print ("Size of the bins          : ", bin_edges) 
  
# plotting the histogram 
plt.bar(bin_edges[:-1], hist, width = .1) 
plt.xlim(min(bin_edges), max(bin_edges)) 
plt.show() 



No. of points in each bin :  [ 2 14 16 26 11  5  5  2  1  3]
Size of the bins          :  [0.18767807 0.21913638 0.25059468 0.28205299 0.31351129 0.3449696
 0.37642791 0.40788621 0.43934452 0.47080283 0.50226113]


### Get the mean SD of participant's corrleation matricies

In [49]:
sd=[]
for key,value in GRAPHS['stdev'].items():
    sd.append(value[0])

In [50]:
#describe the mean correlation of participant's graphs
stats.describe(sd)

DescribeResult(nobs=85, minmax=(0.19323841162830502, 0.32177245475495625), mean=0.22357595815321907, variance=0.0004967810822295364, skewness=2.04173520399252, kurtosis=5.631693320540235)

In [51]:
sd

[0.2085705198242629,
 0.26346129505427124,
 0.2017936509693653,
 0.20591675572034066,
 0.22059427136403997,
 0.22072735554828213,
 0.2073908159291184,
 0.20423214727274902,
 0.19955359666273914,
 0.27651841388216514,
 0.21144016323745204,
 0.23079005923048498,
 0.22803843213001243,
 0.2188618298640308,
 0.22182734673052362,
 0.20501163942456718,
 0.208024618736703,
 0.21473404466257118,
 0.21274501442391625,
 0.21185686366210024,
 0.21881018906867558,
 0.2162012851597408,
 0.21101202867293384,
 0.21461359172990702,
 0.2651190594645822,
 0.19323841162830502,
 0.2112463733671291,
 0.22241170711413014,
 0.23434626809917028,
 0.2044668082553281,
 0.20441124287998028,
 0.2281362975291849,
 0.20879159231862926,
 0.2118468374343377,
 0.2020023398033139,
 0.23423728866479462,
 0.21877246752099105,
 0.22628911700296123,
 0.2054076992409443,
 0.2012631746946747,
 0.21126518520907625,
 0.22127795114914695,
 0.2552612901467353,
 0.2579575875972968,
 0.22090406839668236,
 0.20747912322726164,
 0.22

In [52]:
hist, bin_edges = scipy.histogram(sd, bins = 10) 
  
# Checking the results 
print ("No. of points in each bin : ", hist) 
print ("Size of the bins          : ", bin_edges) 
  
# plotting the histogram 
plt.bar(bin_edges[:-1], hist, width = .05) 
plt.xlim(min(bin_edges), max(bin_edges)) 
plt.show() 



No. of points in each bin :  [16 25 26  9  2  3  2  0  0  2]
Size of the bins          :  [0.19323841 0.20609182 0.21894522 0.23179862 0.24465203 0.25750543
 0.27035884 0.28321224 0.29606565 0.30891905 0.32177245]


If this value is low (<0.1) then you don't need to threshold the graph? 

### Test Modularity

Goal: use modularity function from communities to identify module structure that emerge during reward within the sample

In [53]:
#this is pulling out the module structure for each participant
modules=[]

for key,value in GRAPHS['modules'].items():
    modules.append(value[0])

In [54]:
#print it to make sure it works
modules

[{0: 0,
  1: 1,
  2: 0,
  3: 0,
  4: 2,
  5: 3,
  6: 0,
  7: 0,
  8: 1,
  9: 1,
  10: 3,
  11: 3,
  12: 2,
  13: 4,
  14: 2,
  15: 3,
  16: 5,
  17: 5,
  18: 4,
  19: 4,
  20: 6,
  21: 5,
  22: 1,
  23: 1,
  24: 3,
  25: 1,
  26: 6,
  27: 0},
 {0: 0,
  1: 0,
  2: 1,
  3: 1,
  4: 2,
  5: 2,
  6: 0,
  7: 0,
  8: 1,
  9: 1,
  10: 2,
  11: 2,
  12: 3,
  13: 3,
  14: 2,
  15: 2,
  16: 1,
  17: 1,
  18: 4,
  19: 1,
  20: 1,
  21: 1,
  22: 4,
  23: 4,
  24: 2,
  25: 2,
  26: 1,
  27: 1},
 {0: 0,
  1: 0,
  2: 1,
  3: 1,
  4: 2,
  5: 2,
  6: 0,
  7: 0,
  8: 3,
  9: 3,
  10: 3,
  11: 3,
  12: 1,
  13: 4,
  14: 5,
  15: 1,
  16: 1,
  17: 1,
  18: 2,
  19: 5,
  20: 0,
  21: 0,
  22: 5,
  23: 5,
  24: 4,
  25: 4,
  26: 2,
  27: 1},
 {0: 0,
  1: 0,
  2: 1,
  3: 1,
  4: 2,
  5: 2,
  6: 0,
  7: 0,
  8: 3,
  9: 3,
  10: 2,
  11: 2,
  12: 3,
  13: 3,
  14: 2,
  15: 2,
  16: 1,
  17: 1,
  18: 0,
  19: 4,
  20: 1,
  21: 1,
  22: 5,
  23: 5,
  24: 3,
  25: 3,
  26: 1,
  27: 1},
 {0: 0,
  1: 0,
  2: 1,
  3:

In [55]:
#made a df of the modules
df = pd.DataFrame.from_dict(modules)

In [56]:
df

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,18,19,20,21,22,23,24,25,26,27
0,0,1,0,0,2,3,0,0,1,1,...,4,4,6,5,1,1,3,1,6,0
1,0,0,1,1,2,2,0,0,1,1,...,4,1,1,1,4,4,2,2,1,1
2,0,0,1,1,2,2,0,0,3,3,...,2,5,0,0,5,5,4,4,2,1
3,0,0,1,1,2,2,0,0,3,3,...,0,4,1,1,5,5,3,3,1,1
4,0,0,1,1,0,2,0,0,1,3,...,0,4,4,4,5,5,3,3,1,5
5,0,1,2,2,3,4,3,3,0,2,...,4,4,0,0,1,1,0,0,3,3
6,0,0,1,1,2,3,0,0,4,4,...,3,1,0,0,5,5,4,0,2,5
7,0,0,1,1,2,3,0,0,4,4,...,2,2,5,5,6,6,4,4,5,5
8,0,1,2,2,1,0,1,1,3,4,...,5,1,0,0,5,5,3,3,5,0
9,0,0,1,1,0,1,0,0,1,1,...,0,1,2,0,3,0,0,0,0,1


In [57]:
#label the modules
df.rename(columns={0:"Amygdala_L",1:"Amygdala_R", 2:"Dorsal_striatum_L", 3:"Dorsal_striatum_R", 4:"Fusiform_gyrus_L", 5:"Fusiform_gyrus_R", 6:"Hippocampus_L", 7:"Hippocampus_R", 8:"Insula_L",
          9:"Insula_R", 10:"Intracalcarine_cortex_L", 11:"Intracalcarine_cortex_R", 12:"lOFC_L", 13: "lOFC_R", 14: "mOFC_L", 15:"mOFC_R", 16:"Oral_somatosensory_cortex_R", 17:"Oral_somatosensory_cortex_L", 18:"Precuneus_L", 
          19:"Precuneus_R", 20:"Ventral_striatum_L", 21:"Ventral_striatum_R", 22:"vlPFC_L", 23:"vlPFC_R", 24:"vlThalamus_L" , 25:"vlThalamus_R", 26: "vmPFC_L", 27: "vmPFC_R"})

Unnamed: 0,Amygdala_L,Amygdala_R,Dorsal_striatum_L,Dorsal_striatum_R,Fusiform_gyrus_L,Fusiform_gyrus_R,Hippocampus_L,Hippocampus_R,Insula_L,Insula_R,...,Precuneus_L,Precuneus_R,Ventral_striatum_L,Ventral_striatum_R,vlPFC_L,vlPFC_R,vlThalamus_L,vlThalamus_R,vmPFC_L,vmPFC_R
0,0,1,0,0,2,3,0,0,1,1,...,4,4,6,5,1,1,3,1,6,0
1,0,0,1,1,2,2,0,0,1,1,...,4,1,1,1,4,4,2,2,1,1
2,0,0,1,1,2,2,0,0,3,3,...,2,5,0,0,5,5,4,4,2,1
3,0,0,1,1,2,2,0,0,3,3,...,0,4,1,1,5,5,3,3,1,1
4,0,0,1,1,0,2,0,0,1,3,...,0,4,4,4,5,5,3,3,1,5
5,0,1,2,2,3,4,3,3,0,2,...,4,4,0,0,1,1,0,0,3,3
6,0,0,1,1,2,3,0,0,4,4,...,3,1,0,0,5,5,4,0,2,5
7,0,0,1,1,2,3,0,0,4,4,...,2,2,5,5,6,6,4,4,5,5
8,0,1,2,2,1,0,1,1,3,4,...,5,1,0,0,5,5,3,3,5,0
9,0,0,1,1,0,1,0,0,1,1,...,0,1,2,0,3,0,0,0,0,1


# Plot the distibution of module assignments for the ROIs

In [58]:
df.hist()

array([[<matplotlib.axes._subplots.AxesSubplot object at 0x1c218254a8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c21d440f0>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e6b8748>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e6dbdd8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e70b4a8>],
       [<matplotlib.axes._subplots.AxesSubplot object at 0x1c1e70b4e0>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e763208>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e78a898>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e7b3f28>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e7e35f8>],
       [<matplotlib.axes._subplots.AxesSubplot object at 0x1c1e80cc88>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e83e358>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1e8669e8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x1c1

### Only a couple ROI have stable module assignment -- modules 0, 1, and 2 
- 0:"Amygdala_L"
- 1:"Amygdala_R"
- 2:"Dorsal_striatum_L"

In [59]:
#find the mean over the columns
df.mean(axis = 0)

0     0.000000
1     0.411765
2     1.152941
3     1.270588
4     1.341176
5     2.164706
6     1.035294
7     0.952941
8     2.623529
9     2.482353
10    2.411765
11    2.505882
12    2.435294
13    2.682353
14    2.388235
15    2.388235
16    1.964706
17    1.952941
18    2.352941
19    2.352941
20    2.329412
21    2.047059
22    2.952941
23    3.176471
24    2.741176
25    2.635294
26    2.870588
27    2.741176
dtype: float64

In [60]:
# Check the standard deviation over the columns
df.std(axis = 0)

0     0.000000
1     0.495074
2     0.645606
3     0.730105
4     1.180728
5     1.193704
6     1.383982
7     1.387923
8     1.447300
9     1.385398
10    1.275167
11    1.350692
12    1.569403
13    1.424378
14    1.581847
15    1.559106
16    1.523210
17    1.587945
18    1.810721
19    1.716210
20    1.898547
21    1.844592
22    1.812036
23    1.878300
24    1.662993
25    1.653618
26    1.804678
27    1.826739
dtype: float64



## The standard deviation of module assignments is high (>1) for the majority of the modules. 

### This suggests the module assignment is not stable across participants 

### Using the median module assignment across participants makes more sense than the mean

In [None]:
#find the mean over the columns
partition_median = df.median()
df_median = pd.DataFrame(partition_median)

In [None]:
# View the median module for each node
df_median

### Make a Dicitionary with the modules

In [None]:
#Convert modules to dictionary
#mod_dict={}
#for index, row in df_median.iterrows():
    #mod_dict[index]= row[0]

#mod_dict

### Combine participant correlation matrices into one mean OR MEDIAN correlation matrix

In [61]:
#make the function to combine
def make_total_graphs(dict_o_data):
    mylist=[]
    for key, val_list in dict_o_data.items():
        for i in val_list:
            cor_matrix = np.asarray(i)
            mylist.append(cor_matrix)
    x=np.stack(mylist, axis=2)
    mu=np.median(x, axis=(2))
    #mu=np.mean(x, axis=(2))
    return(mu)

In [62]:
#Make the mean graph with correlations
mean_graph = make_total_graphs(GRAPHS['correlations'])

In [63]:
#Check to make sure this worked 
print(mean_graph.shape)

#Convert the graph to a numpy matrix so it can be recognized by networkX
mean_graph_mat = np.matrix(mean_graph)

#Check the mean correlation to use to threshold later
mean_graph_mat.mean()

(28, 28)


0.285967988775244

In [64]:
meanG = nx.from_numpy_matrix(mean_graph_mat)

# Check Modularity in the Mean Graph

### This is the way Cohen's group usually calculates modularity, because its more stable

In [65]:
partition = community.best_partition(meanG)

In [66]:
#Add the modules and ROI labels to the graph
nx.set_node_attributes(meanG, partition, 'modules')
nx.set_node_attributes(meanG, labels_dict, 'ROIs')

In [67]:
# Check to make sure this worked
ROIs=nx.get_node_attributes(meanG,'ROIs')
ROIs

{0: 'Amygdala_L',
 1: 'Amygdala_R',
 2: 'Dorsal_striatum_L',
 3: 'Dorsal_striatum_R',
 4: 'Fusiform_gyrus_L',
 5: 'Fusiform_gyrus_R',
 6: 'Hippocampus_L',
 7: 'Hippocampus_R',
 8: 'Insula_L',
 9: 'Insula_R',
 10: 'Intracalcarine_cortex_L',
 11: 'Intracalcarine_cortex_R',
 12: 'lOFC_L',
 13: 'lOFC_R',
 14: 'mOFC_L',
 15: 'mOFC_R',
 16: 'Oral_somatosensory_cortex_R',
 17: 'Oral_somatosensory_cortex_L',
 18: 'Precuneus_L',
 19: 'Precuneus_R',
 20: 'Ventral_striatum_L',
 21: 'Ventral_striatum_R',
 22: 'vlPFC_L',
 23: 'vlPFC_R',
 24: 'vlThalamus_L',
 25: 'vlThalamus_R',
 26: 'vmPFC_L',
 27: 'vmPFC_R'}

In [68]:
#Check if this worked
partitions=nx.get_node_attributes(meanG,'modules')
partitions

{0: 0,
 1: 0,
 2: 1,
 3: 1,
 4: 2,
 5: 3,
 6: 0,
 7: 0,
 8: 4,
 9: 4,
 10: 3,
 11: 3,
 12: 3,
 13: 3,
 14: 2,
 15: 2,
 16: 1,
 17: 1,
 18: 5,
 19: 5,
 20: 6,
 21: 6,
 22: 1,
 23: 1,
 24: 4,
 25: 4,
 26: 1,
 27: 1}

# NOW: Check if mean partitioned graph is more stable than individually partitioned median modules 








In [69]:
#Apply the partition to participant's data

modg = community.induced_graph(partitions, meanG) 

### Function to make a thresholded graph

In [70]:
def threshold(G, corr_direction, min_correlation):

    ##Creates a copy of the graph
    H = G.copy()
    
    ##Checks all the edges and removes some based on corr_direction
    for stock1, stock2, weight in list(G.edges(data=True)):
        ##if we only want to see the positive correlations we then delete the edges with weight smaller than 0        
        if corr_direction == "positive":
            ####it adds a minimum value for correlation. 
            ####If correlation weaker than the min, then it deletes the edge
            if weight["weight"] <0 or weight["weight"] < min_correlation:
                H.remove_edge(stock1, stock2)
        ##this part runs if the corr_direction is negative and removes edges with weights equal or largen than 0
        else:
            ####it adds a minimum value for correlation. 
            ####If correlation weaker than the min, then it deletes the edge
            if weight["weight"] >=0 or weight["weight"] > min_correlation:
                H.remove_edge(stock1, stock2)
    return(H)

In [71]:
threshG = threshold(meanG, 'positive', 0.3)

In [72]:
meanG.nodes(data=True)

NodeDataView({0: {'modules': 0, 'ROIs': 'Amygdala_L'}, 1: {'modules': 0, 'ROIs': 'Amygdala_R'}, 2: {'modules': 1, 'ROIs': 'Dorsal_striatum_L'}, 3: {'modules': 1, 'ROIs': 'Dorsal_striatum_R'}, 4: {'modules': 2, 'ROIs': 'Fusiform_gyrus_L'}, 5: {'modules': 3, 'ROIs': 'Fusiform_gyrus_R'}, 6: {'modules': 0, 'ROIs': 'Hippocampus_L'}, 7: {'modules': 0, 'ROIs': 'Hippocampus_R'}, 8: {'modules': 4, 'ROIs': 'Insula_L'}, 9: {'modules': 4, 'ROIs': 'Insula_R'}, 10: {'modules': 3, 'ROIs': 'Intracalcarine_cortex_L'}, 11: {'modules': 3, 'ROIs': 'Intracalcarine_cortex_R'}, 12: {'modules': 3, 'ROIs': 'lOFC_L'}, 13: {'modules': 3, 'ROIs': 'lOFC_R'}, 14: {'modules': 2, 'ROIs': 'mOFC_L'}, 15: {'modules': 2, 'ROIs': 'mOFC_R'}, 16: {'modules': 1, 'ROIs': 'Oral_somatosensory_cortex_R'}, 17: {'modules': 1, 'ROIs': 'Oral_somatosensory_cortex_L'}, 18: {'modules': 5, 'ROIs': 'Precuneus_L'}, 19: {'modules': 5, 'ROIs': 'Precuneus_R'}, 20: {'modules': 6, 'ROIs': 'Ventral_striatum_L'}, 21: {'modules': 6, 'ROIs': 'Vent

### Function to visualize thresholded graph with modules in colors

In [73]:
def jenny_graph(graph):
    edges,weights = zip(*nx.get_edge_attributes(graph, 'weight').items())
    nodes, color = zip(*nx.get_node_attributes(graph,'modules').items()) #if your modules are named different change here
    nodes, positions = zip(*nx.get_node_attributes(graph,'ROIs').items())
    #positions
    positions=nx.circular_layout(graph) #this is defining a circluar graph, if you want a different one you change the circular part of this line
    
    #Figure size
    plt.figure(figsize=(40,25))
    
    
    #draws nodes
    color = np.array(color)
    nColormap=plt.cm.Spectral #check here if you want different colors https://matplotlib.org/3.1.1/gallery/color/colormap_reference.html
    cM=color.max()
    cm=color.min()
    y=nx.draw_networkx_nodes(graph,positions, 
                           node_color=color,
                           node_size=4000,
                           alpha=0.8, 
                           cmap= nColormap,
                           vmin=cm ,vmax=cM)

    #Styling for labels
    nx.draw_networkx_labels(graph, positions, labels = ROIs, font_size=10, 
                            font_family='sans-serif', fontweight = 'bold')
    
    
    #draw edges
    weights=np.array(weights)
    eColormap=plt.cm.bwr #check here if you want different colors https://matplotlib.org/3.1.1/gallery/color/colormap_reference.html
    wt=weights*5
    M=wt.max()
    m=wt.min()
    x=nx.draw_networkx_edges(graph, positions, edge_list=edges, style='solid', width = wt, edge_color = wt,
                           cmap=eColormap,
                           edge_vmin=m,
                           edge_vmax=M)
    
    #format the colorbar
    node_bar=plt.colorbar(y)
    edge_bar=plt.colorbar(x)

    node_bar.set_label('Modularity',fontsize = 25)
    edge_bar.set_label('Strength of edge weight',fontsize = 25)

    plt.axis('off')
    plt.title("Modularity and Edge Weights of Average Graph", fontsize = 30)
    #plt.savefig(os.path.join(basepath,"betaseries_bevel/5_analysis/modularity_circle_reward.png", format="PNG")
    plt.show()

In [74]:
jenny_graph(threshG)



# USE BCTPY FOR PARTICIPATION COEFFICIENT

In [93]:
import bct

In [None]:
#Participation coefficient usage
#bct.participation_coef(W, ci, degree='undirected')¶

In [107]:
a = np.array(list(partition.keys()))

In [121]:
b = np.reshape(a, (28,1))

In [122]:
b

array([[ 0],
       [ 1],
       [ 2],
       [ 3],
       [ 4],
       [ 5],
       [ 6],
       [ 7],
       [ 8],
       [ 9],
       [10],
       [11],
       [12],
       [13],
       [14],
       [15],
       [16],
       [17],
       [18],
       [19],
       [20],
       [21],
       [22],
       [23],
       [24],
       [25],
       [26],
       [27]])

In [123]:
b.shape

(28, 1)

In [129]:
b.dtype

dtype('int64')

In [130]:
b.astype('float64')

array([[ 0.],
       [ 1.],
       [ 2.],
       [ 3.],
       [ 4.],
       [ 5.],
       [ 6.],
       [ 7.],
       [ 8.],
       [ 9.],
       [10.],
       [11.],
       [12.],
       [13.],
       [14.],
       [15.],
       [16.],
       [17.],
       [18.],
       [19.],
       [20.],
       [21.],
       [22.],
       [23.],
       [24.],
       [25.],
       [26.],
       [27.]])

In [132]:
mean_graph_mat.shape

(28, 28)

In [133]:
mean_graph_mat.dtype

dtype('float64')

In [136]:
participation_coeff = bct.participation_coef(mean_graph_mat, b)

ValueError: non-broadcastable output operand with shape (28,) doesn't match the broadcast shape (28,28)

### Error Message: 
---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
<ipython-input-134-8b30ab33fac5> in <module>()
----> 1 bct.participation_coef(mean_graph_mat, b)

/anaconda3/lib/python3.6/site-packages/bct/algorithms/centrality.py in participation_coef(W, ci, degree)
    734 
    735     for i in range(1, int(np.max(ci)) + 1):
--> 736         Kc2 += np.square(np.sum(W * (Gc == i), axis=1))
    737 
    738     P = np.ones((n,)) - Kc2 / np.square(Ko)

ValueError: non-broadcastable output operand with shape (28,) doesn't match the broadcast shape (28,28)

### Make Module Graph with Nodes Weighted by Clustering Coefficient

Make a new graph with modules from whole group analysis 

In [75]:
#modg = community.induced_graph(partitions, meanG)

In [None]:
#Clustering coeff multiplied by 2000 -- so the size works with networkx node sizing
#reward_clust_dict = {
    #0.0: 1200,
    #1.0: 1320,
    #2.0: 1360,
    #3.0: 1160,
#}

#punish_clust_dict = {
    #0.0: 1200,
    #1.0: 1280,
    #2.0: 1240,
    #3.0: 1300
#}

In [None]:
#Set module attributes**** Need to change this depending on the condition

#REWARD
#nx.set_node_attributes(modg, reward_clust_dict, 'clustering')

#PUNISHMENT
#nx.set_node_attributes(modg, punish_clust_dict, 'clustering')

In [None]:
#list(modg.nodes)

### Function to make module structure graph

In [None]:
def module_fig(G):
    edges,weights = zip(*nx.get_edge_attributes(G,'weight').items())
    #nodes, size = zip(*nx.get_node_attributes(G,'clustering').items())
    
    
    positions=nx.circular_layout(G)
    plt.figure(figsize=(25,20))
    
    color = np.array(list(G.nodes))
    nColormap=plt.cm.Spectral #check here if you want different colors https://matplotlib.org/3.1.1/gallery/color/colormap_reference.html
    cM=color.max()
    cm=color.min()
    nx.draw_networkx_nodes(G,positions, 
                           node_color=color, 
                           #node_size=size,
                           alpha=1.0, 
                           cmap= 'Spectral',
                           vmin=cm,vmax=cM )
   
    #Styling for labels
    nx.draw_networkx_labels(G, positions, font_size=8, font_family='sans-serif')
    
    x=nx.draw_networkx_edges(G, positions, edge_list=edges,style='solid', width = weights, edge_color = weights)
   
    edge_bar=plt.colorbar(x)
    edge_bar.set_label('Strength of edge weight',fontsize = 25)
    
    plt.title("Module Connectivity Weights", fontsize = 30)
    #plt.savefig(os.path.join(basepath,"betaseries_bevel/5_analysis/results/modularity_edges_reward_weighted.png"), format="PNG")
    plt.axis('off')
    plt.show()

In [None]:
#module_fig(modg)

### Calculate Nodal Metrics by Participant
- Clustering Coefficient
- Betweenness centrality

Function to pull the nodal parameters by subject

In [76]:
def make_node_stats(list_o_data, direction, min_cor):
    clustering_dict ={}
    centrality_dict ={}
    
    
    for key, values in list_o_data.items():
            ########################################
            cor_matrix = np.asmatrix(values)
            x=abs(cor_matrix)
            mu=x.mean()
            ########################################
            G = nx.from_numpy_matrix(cor_matrix)
            tG = create_corr_network_5(G, direction,min_cor)
            ########################################
            clustering = nx.clustering(tG, weight=True)
            ########################################
            clustering_dict.setdefault(key, []).append(clustering)
            ########################################
            centrality = nx.betweenness_centrality(tG, weight=True)
            ########################################
            centrality_dict.setdefault(key, []).append(centrality)
            ########################################
    return({'clustering_coeff':clustering_dict, 'btn_centrality':centrality_dict})

In [77]:
#Metrics computed on an UNTHRESHOLDED GRAPH
nodes = make_node_stats(cor_dict, "positive", 0)

In [78]:
nodes.keys()

dict_keys(['clustering_coeff', 'btn_centrality'])

In [79]:
#nodes['btn_centrality']['sub-001_reward']

In [80]:
clustering_coeff=[]

for key,value in nodes['clustering_coeff'].items():
    clustering_coeff.append(value[0])

In [81]:
#bring into pandas
df_clust = pd.DataFrame.from_dict(clustering_coeff)

In [82]:
#Calculate average module centrality *** THIS IS THE MEAN ASSIGNMENT
#df_clust['module0_mean'] = df_clust[[0,1,6,7]].mean(axis=1)
#df_clust['module1_mean'] = df_clust[[2,3,16,17]].mean(axis=1)
#df_clust['module2_mean'] = df_clust[[4,14,15]].mean(axis=1)
#df_clust['module3_mean'] = df_clust[[5,10,11]].mean(axis=1)
#df_clust['module4_mean'] = df_clust[[8,9,24,25]].mean(axis=1)
#df_clust['module5_mean'] = df_clust[[12,13]].mean(axis=1)
#df_clust['module6_mean'] = df_clust[[18,19]].mean(axis=1)
#df_clust['module7_mean'] = df_clust[[20,21]].mean(axis=1)
#df_clust['module8_mean'] = df_clust[[22,23,26,27]].mean(axis=1)

In [83]:
#Calculate average module centrality *** THIS IS THE MEAN ASSIGNMENT
df_clust['module0_mean'] = df_clust[[0,1,6,7]].mean(axis=1)
df_clust['module1_mean'] = df_clust[[2,3,16,17,22,23,26,27]].mean(axis=1)
df_clust['module2_mean'] = df_clust[[4,14,15]].mean(axis=1)
df_clust['module3_mean'] = df_clust[[5,10,11,12,13]].mean(axis=1)
df_clust['module4_mean'] = df_clust[[8,9,24,25]].mean(axis=1)
df_clust['module5_mean'] = df_clust[[18,19]].mean(axis=1)
df_clust['module6_mean'] = df_clust[[20,21]].mean(axis=1)

In [84]:

df_clust.rename(columns={0:"Amygdala_L",1:"Amygdala_R", 2:"Dorsal_striatum_L", 3:"Dorsal_striatum_R", 4:"Fusiform_gyrus_L", 5:"Fusiform_gyrus_R", 6:"Hippocampus_L", 7:"Hippocampus_R", 8:"Insula_L",
          9:"Insula_R", 10:"Intracalcarine_cortex_L", 11:"Intracalcarine_cortex_R", 12:"lOFC_L", 13: "lOFC_R", 14: "mOFC_L", 15:"mOFC_R", 16:"Oral_somatosensory_cortex_L", 17:"Oral_somatosensory_cortex_R", 18:"Precuneus_L", 
          19:"Precuneus_R", 20:"Ventral_striatum_L", 21:"Ventral_striatum_R", 22:"vlPFC_L", 23:"vlPFC_R", 24:"vlThalamus_L" , 25:"vlThalamus_R", 26: "vmPFC_L", 27: "vmPFC_R"})

Unnamed: 0,Amygdala_L,Amygdala_R,Dorsal_striatum_L,Dorsal_striatum_R,Fusiform_gyrus_L,Fusiform_gyrus_R,Hippocampus_L,Hippocampus_R,Insula_L,Insula_R,...,vlThalamus_R,vmPFC_L,vmPFC_R,module0_mean,module1_mean,module2_mean,module3_mean,module4_mean,module5_mean,module6_mean
0,0.964912,0.952569,0.926154,0.926154,0.886667,0.940000,0.936842,0.926154,0.960145,0.949275,...,0.943333,0.877493,0.934783,0.945119,0.931397,0.883947,0.914011,0.954295,0.936923,0.899671
1,0.897436,0.897436,0.981884,0.923077,0.952569,0.983333,0.897436,0.897436,0.946667,0.923077,...,0.920000,0.923077,0.981884,0.897436,0.947952,0.944019,0.971889,0.921795,0.911795,0.915769
2,0.907692,0.905797,0.910000,0.907692,0.894928,0.909524,0.948052,0.926667,0.943723,0.884058,...,0.923913,0.886154,0.931159,0.922052,0.895301,0.898132,0.907032,0.914373,0.877800,0.907179
3,0.810277,0.844156,0.852814,0.842105,0.746667,0.786765,0.766667,0.786765,0.786667,0.878947,...,0.786667,0.845850,0.807971,0.801966,0.839368,0.780686,0.768020,0.820213,0.857800,0.810845
4,0.952899,0.930736,0.946667,0.946667,0.923077,0.945652,0.891738,0.923077,0.891738,0.934066,...,0.898462,0.891738,0.978947,0.924612,0.922668,0.907265,0.941994,0.909400,0.947840,0.909930
5,0.835498,0.786561,0.775362,0.819048,0.847953,0.779412,0.806324,0.842105,0.795238,0.790514,...,0.804762,0.742857,0.785714,0.817622,0.798608,0.736782,0.753312,0.815465,0.672386,0.878947
6,0.903333,0.928105,0.876667,0.930736,0.851852,0.851852,0.883333,0.884058,0.876667,0.903333,...,0.948529,0.898551,0.898551,0.899707,0.907106,0.879506,0.878495,0.900594,0.887446,0.907444
7,0.988304,0.926154,0.914530,0.914530,0.914530,0.963333,0.926154,0.944615,0.944615,0.914530,...,0.946667,0.960000,0.980952,0.946307,0.939932,0.934587,0.938830,0.932991,0.961999,0.961667
8,0.928105,0.924901,0.903333,0.903333,0.886667,0.846154,0.826667,0.938095,0.952381,0.870769,...,0.861660,0.863333,0.870769,0.904442,0.890871,0.900858,0.879654,0.897811,0.808810,0.884001
9,0.981818,0.939394,1.000000,1.000000,0.750000,0.950000,0.752381,0.689474,0.904412,0.869281,...,0.666667,0.871795,1.000000,0.840767,0.916193,0.769298,0.822569,0.812471,0.868554,0.656470


In [85]:
central=[]

for key,value in nodes['btn_centrality'].items():
    central.append(value[0])

In [86]:
df_cent = pd.DataFrame.from_dict(central)

In [87]:
df_cent['module0_mean'] = df_cent[[0,1,6,7]].mean(axis=1)
df_cent['module1_mean'] = df_cent[[2,3,16,17,22,23,26,27]].mean(axis=1)
df_cent['module2_mean'] = df_cent[[4,14,15]].mean(axis=1)
df_cent['module3_mean'] = df_cent[[5,10,11,12,13]].mean(axis=1)
df_cent['module4_mean'] = df_cent[[8,9,24,25]].mean(axis=1)
df_cent['module5_mean'] = df_cent[[18,19]].mean(axis=1)
df_cent['module6_mean'] = df_cent[[20,21]].mean(axis=1)

In [88]:
#Calculate average module centrality
#df_cent['module0_mean'] = df_cent[[0,1,6,7]].mean(axis=1)
#df_cent['module1_mean'] = df_cent[[2,3,16,17]].mean(axis=1)
#df_cent['module2_mean'] = df_cent[[4,14,15]].mean(axis=1)
#df_cent['module3_mean'] = df_cent[[5,10,11]].mean(axis=1)
#df_cent['module4_mean'] = df_cent[[8,9,24,25]].mean(axis=1)
#df_cent['module5_mean'] = df_cent[[12,13]].mean(axis=1)
#df_cent['module6_mean'] = df_cent[[18,19]].mean(axis=1)
#df_cent['module7_mean'] = df_cent[[20,21]].mean(axis=1)
#df_cent['module8_mean'] = df_cent[[22,23,26,27]].mean(axis=1)

In [89]:
#rename_columns
df_cent.rename(columns={0:"Amygdala_L",1:"Amygdala_R", 2:"Dorsal_striatum_L", 3:"Dorsal_striatum_R", 4:"Fusiform_gyrus_L", 5:"Fusiform_gyrus_R", 6:"Hippocampus_L", 7:"Hippocampus_R", 8:"Insula_L",
          9:"Insula_R", 10:"Intracalcarine_cortex_L", 11:"Intracalcarine_cortex_R", 12:"lOFC_L", 13: "lOFC_R", 14: "mOFC_L", 15:"mOFC_R", 16:"Oral_somatosensory_cortex_L", 17:"Oral_somatosensory_cortex_R", 18:"Precuneus_L", 
          19:"Precuneus_R", 20:"Ventral_striatum_L", 21:"Ventral_striatum_R", 22:"vlPFC_L", 23:"vlPFC_R", 24:"vlThalamus_L" , 25:"vlThalamus_R", 26: "vmPFC_L", 27: "vmPFC_R"})

Unnamed: 0,Amygdala_L,Amygdala_R,Dorsal_striatum_L,Dorsal_striatum_R,Fusiform_gyrus_L,Fusiform_gyrus_R,Hippocampus_L,Hippocampus_R,Insula_L,Insula_R,...,vlThalamus_R,vmPFC_L,vmPFC_R,module0_mean,module1_mean,module2_mean,module3_mean,module4_mean,module5_mean,module6_mean
0,0.000789,0.001690,0.003480,0.003480,0.008783,0.002576,0.001665,0.003480,0.001429,0.001925,...,0.002332,0.010789,0.002592,0.001906,0.003618,0.009220,0.005757,0.001714,0.005134,0.006183
1,0.006720,0.006720,0.000642,0.004504,0.002035,0.000248,0.006720,0.006720,0.002874,0.004504,...,0.004830,0.004504,0.000642,0.006720,0.002869,0.002830,0.000930,0.004732,0.005446,0.004885
2,0.004455,0.003935,0.004052,0.004455,0.005795,0.004233,0.001656,0.003073,0.001836,0.006385,...,0.003084,0.007126,0.002670,0.003280,0.005396,0.005080,0.004992,0.003807,0.003913,0.004331
3,0.009967,0.007100,0.006419,0.005458,0.023450,0.009876,0.016475,0.010092,0.013988,0.004185,...,0.013771,0.007410,0.010879,0.010909,0.007226,0.015997,0.007574,0.009895,0.004459,0.011727
4,0.001819,0.002568,0.002249,0.002249,0.003869,0.002266,0.006722,0.003869,0.006722,0.000896,...,0.005913,0.006722,0.000519,0.003744,0.004269,0.005116,0.002623,0.004539,0.001567,0.004689
5,0.008603,0.013332,0.016173,0.009286,0.006328,0.010547,0.011801,0.006998,0.014492,0.013329,...,0.011116,0.020162,0.013581,0.010184,0.011966,0.006592,0.015619,0.010987,0.009980,0.004725
6,0.004657,0.001739,0.006972,0.002808,0.010102,0.010102,0.006223,0.005761,0.006923,0.004657,...,0.001079,0.005125,0.005125,0.004595,0.004533,0.006994,0.007023,0.005089,0.004703,0.003824
7,0.000271,0.004267,0.005198,0.005198,0.005198,0.001572,0.004163,0.002688,0.002688,0.005198,...,0.002762,0.001757,0.000600,0.002847,0.003311,0.003524,0.003264,0.003702,0.001282,0.001664
8,0.002327,0.003178,0.004931,0.004931,0.006437,0.004765,0.014503,0.002133,0.001659,0.008036,...,0.010225,0.011944,0.008036,0.005535,0.007158,0.006188,0.006136,0.006417,0.003220,0.006519
9,0.000237,0.001367,0.000000,0.000000,0.014676,0.001897,0.011905,0.028131,0.004211,0.006607,...,0.030073,0.003804,0.000000,0.010410,0.009520,0.016471,0.015891,0.012274,0.007414,0.051259


Save out to CSV files

In [90]:
df_clust.to_csv(os.path.join(basepath,'betaseries_bevel/5_analysis/node_clustering_punishment_weighted_median.csv'), header = True, index = None)

In [91]:
df_cent.to_csv(os.path.join(basepath,'betaseries_bevel/5_analysis/node_centrality_punishment_weighted_median.csv'), header = True, index = None)

# Brain graphs  
http://visbrain.org/index.html

In [None]:
positions = pd.read_csv(os.path.join(basepath,'betaseries_bevel/3_pull_timeseries/betaseries_rois.txt'), sep='\t')

In [None]:
positions=positions.drop('Region', axis=1)


In [None]:
positions_dict=positions.to_dict('index')

In [None]:
nx.set_node_attributes(meanG, positions_dict, 'pos')

In [None]:
def brain_graph(G, strength, radius, colormap):
    mods=[node[1]['modules'] for node in G.nodes(data=True)]
    ccol=[]
    for m in mods:
        if m == 0.0:
            ccol.append('mediumvioletred')
        if m == 1.0:
            ccol.append('orange')
        if m == 2.0:
            ccol.append('yellowgreen')
        if m == 3.0:
            ccol.append('slateblue')
            
    # Colorbar default arguments. See `visbrain.objects.ColorbarObj`
    CBAR_STATE = dict(cbtxtsz=12, txtsz=10., width=.1, cbtxtsh=3., ndigits=1,
                  rect=(-.3, -2., 1., 4.))
        
    nodes, edges = np.asarray([list(node[1]['pos'].values()) for node in meanG.nodes(data=True)]), nx.to_numpy_array(G)

    #Change backgrounnd color here
    sc = SceneObj(size=(500, 600), bgcolor = 'grey')
    
    # Coloring method
    color_by = 'strength'
    # Because we don't want to plot every connections, we only keep connections
    select = edges > strength
    
    # Define the connectivity object
    c_default = ConnectObj('default', nodes, edges, select=select, line_width=3., cmap=colormap, color_by=color_by)
    
    # Then, we define the sources
    s_obj = SourceObj('sources', nodes, color=ccol, radius_min=radius)
    sc.add_to_subplot(c_default, title='Node Connectivity Grouped by Module')
    
    # And add connect, source and brain objects to the scene
    sc.add_to_subplot(s_obj)
    sc.add_to_subplot(BrainObj('B3'), use_this_cam=True)
    
    #Add colorbar
    cb_parr = ColorbarObj(c_default, cblabel='Connectivity strength', **CBAR_STATE, cmap=colormap)
    sc.add_to_subplot(cb_parr, row=0, col=1, width_max=200)
    
    # Coloring method
    color_by = 'count'
    
    # Define the connectivity and source object
    c_count = ConnectObj('default', nodes, edges, select=select, line_width=4.,
                         color_by=color_by, antialias=True,  cmap=colormap)

    s_obj_c = SourceObj('sources', nodes, color=ccol, radius_min=radius,
                        symbol='square')

    # And add connect, source and brain objects to the scene
    sc.add_to_subplot(c_count, row=1, col=0,
                      title='Node Grouped by Number of Connections per node')

    sc.add_to_subplot(s_obj_c, use_this_cam=True, row=1, col=0)
    sc.add_to_subplot(BrainObj('B3'), use_this_cam=True, row=1, col=0)
    
    
    #Add colorbar
    cb_parr_c = ColorbarObj(c_count, cblabel='Number of connections per node', **CBAR_STATE, cmap=colormap)
    sc.add_to_subplot(cb_parr_c, row=1, col=1, width_max=200)

    sc.preview()

    #sc.screenshot(os.path.join(basepath,'betaseries_bevel/5_analysis/example_brain_obj.png'), transparent=True)

In [None]:
brain_graph(meanG, .4, 15., 'Blues')

## Save GRAPHS dictionary in a pickle file in case of crash

In [None]:
pickle.dump(GRAPHS, open(os.path.join(basepath, 'betaseries_bevel/tmp/Graphs'), 'wb'), protocol=4)

In [None]:
with open(os.path.join(basepath, 'betaseries_bevel/tmp/Graphs'), 'rb') as pickle_file:
    try:
        while True:
            GRAPHS = pickle.load(pickle_file)
#             print (GRAPHS)
    except EOFError:
        pass

# Testing Participation Coefficient

#This is the function from Jess Cohen via 

In [None]:
import numpy as np
from random import choice
import networkx as nx

def within_community_degree(weighted_partition, nan = 0.0, catch_edgeless_node=True):
    ''' Computes "within-module degree" (z-score) for each node (Guimera 2007, J Stat Mech)

    ------
    Parameters
    ------
    weighted_partition: Louvain Weighted Partition
        louvain = weighted_modularity.LouvainCommunityDetection(graph)
        weighted_partitions = louvain.run()
        weighted_partition = weighted_partition[0], where index is the partition level
    nan : int
        number to replace unexpected values (e.g., -infinity) with
        default = 0.0
    catch_edgeless_node: Boolean
        raise ValueError if node degree is zero
        default = True

    ------
    Returns
    ------
    within_community_degree: dict
        Dictionary of the within community degree of each node.

    '''
    wc_dict = {}
    for c, community in enumerate(weighted_partition.communities):
        community_degrees = []
        for node in community: #get average within-community-degree
            node_degree = weighted_partition.node_degree(node)
            if node_degree == 0.0: #catch edgeless nodes
                if catch_edgeless_node:
                    raise ValueError("Node {} is edgeless".format(node))
                wc_dict[node] = 0.0
                continue
            community_degrees.append(weighted_partition.node_degree_by_community(node)[c])
        for node in community: #get node's within_community-degree z-score
            within_community_degree = weighted_partition.node_degree_by_community(node)[c]
            std = np.std(community_degrees) # std of community's degrees
            mean = np.mean(community_degrees) # mean of community's degrees
            if std == 0.0: #so we don't divide by 0
                wc_dict[node] = (within_community_degree - mean) #z_score
                continue
            wc_dict[node] = (within_community_degree - mean / std) #z_score
    return wc_dict

def participation_coefficient(weighted_partition, catch_edgeless_node=True):
    '''
    Computes the participation coefficient for each node (Guimera 2007, J Stat Mech)

    ------
    Parameters
    ------
    weighted_partition: Louvain Weighted Partition
        louvain = weighted_modularity.LouvainCommunityDetection(graph)
        weighted_partitions = louvain.run()
        weighted_partition = weighted_partition[0], where index is the partition level
    catch_edgeless_node: Boolean
        raise ValueError if node degree is zero
        default = True

    ------
    Returns
    ------
    participation_coefficient: dict
        Dictionary of the participation coefficient of each node.
    '''
    pc_dict = {}
    graph = weighted_partition.graph
    for node in graph:
        node_degree = weighted_partition.node_degree(node)
        if node_degree == 0.0: 
            if catch_edgeless_node:
                raise ValueError("Node {} is edgeless".format(node))
            pc_dict[node] = 0.0
            continue    
        deg_per_comm = weighted_partition.node_degree_by_community(node)
        deg_per_comm.pop(weighted_partition.get_node_community(node))
        bc_degree = sum(deg_per_comm) #between community degree
        if bc_degree == 0.0:
            pc_dict[node] = 0.0
            continue
        pc = 1 - ((float(bc_degree) / float(node_degree))**2)
        pc_dict[node] = pc
    return pc_dict