<a href="https://colab.research.google.com/github/marlapinkert/final_project_compcognition/blob/main/download_and_correlation_df.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# Test - Download script

In [175]:
import os
from glob import glob
from itertools import combinations

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd

In [None]:
# Run the download script as a shell command; it is referenced by a relative
# path, so download_abide_preproc.py must be in the current working directory.
# NOTE(review): judging by the script name this fetches ABIDE preprocessed
# data, and the flags presumably mean -d derivative, -p pipeline, -s strategy,
# -o output directory -- confirm against the script's help text. The flag
# values match the folder that is globbed afterwards:
# /content/Outputs/cpac/filt_global/rois_cc200
!python download_abide_preproc.py -d rois_cc200 -p cpac -s filt_global -o /content

In [185]:
# Collect the path of every subject's ROI time-series file (*.1D) and put
# the resulting list into ascending (lexicographic) order
subj_paths = glob("/content/Outputs/cpac/filt_global/rois_cc200/*.1D")
subj_paths.sort()

In [189]:
# Define function which gets the unique pairwise correlations for one subject
def get_corr_list(path):
    """Return every unique pairwise ROI correlation for one subject file.

    The file at ``path`` is read as a tab-separated table (first row is the
    header) whose columns are treated as ROI time series. The column-by-column
    correlation matrix is computed with ``DataFrame.corr`` and every pair of
    distinct columns is reported exactly once.

    Parameters
    ----------
    path : str
        Path to the tab-separated time-series file of one subject.

    Returns
    -------
    dict
        Maps ``"{i}x{j}"`` (0-based column positions with ``i < j``, e.g.
        ``"1x4"`` for the correlation of column 1 and column 4) to the
        correlation value, in row-major order (``0x1, 0x2, ..., 1x2, ...``),
        followed by an ``"ID"`` entry holding the file name without its
        directory. Pairs for which pandas yields NaN (for instance when a
        column is constant) are kept as NaN.
    """
    # read the file into a DataFrame
    timeseries = pd.read_csv(path, sep="\t")

    # calculate corr matrix for DataFrame (all rois)
    corrs = timeseries.corr()

    # The matrix is symmetric with a trivial diagonal, so only the strict
    # upper triangle (row < column) carries unique information. Extracting it
    # with one fancy-indexing call avoids a scalar .iloc lookup per ROI pair.
    row_idx, col_idx = np.triu_indices(len(corrs), k=1)
    pair_values = corrs.to_numpy()[row_idx, col_idx]

    # key each value by the positions of the two regions it relates
    unique_corrs = {
        f"{row}x{col}": value
        for row, col, value in zip(row_idx, col_idx, pair_values)
    }

    # We add the name of the file as "ID" to the dictionary.
    # This allows us to later identify the subjects when we create our
    # DataFrame with all our subjects
    unique_corrs["ID"] = os.path.basename(path)

    return unique_corrs

In [192]:
# Build one record (correlation dict plus "ID") per subject file, then turn
# the list of records into a single DataFrame with one row per subject
list_unique_corrs = [get_corr_list(subj_path) for subj_path in subj_paths]

complete_df = pd.DataFrame(list_unique_corrs)

In [196]:
# Persist the subject-by-correlation table to the working directory
# (pandas writes the row index as the first CSV column by default)
complete_df.to_csv(path_or_buf="complete_df.csv")

In [197]:
# Display the assembled table as the cell output: one row per subject file,
# one column per "{i}x{j}" correlation key plus the "ID" column
complete_df

Unnamed: 0,0x1,0x2,0x3,0x4,0x5,0x6,0x7,0x8,0x9,0x10,...,195x197,195x198,195x199,196x197,196x198,196x199,197x198,197x199,198x199,ID
0,-0.023153,-0.202225,-0.118862,-0.150774,-0.151980,-0.044154,-0.119716,-0.073078,-0.166378,0.117244,...,-0.176420,0.038425,0.287099,-0.243898,0.019874,0.005184,0.286736,0.058742,-0.054218,CMU_a_0050649_rois_cc200.1D
1,0.103007,0.063233,-0.132441,0.021815,-0.223033,-0.093503,0.065371,0.086376,-0.184331,0.284540,...,,0.129328,-0.055361,,0.001252,-0.052512,,,0.300453,CMU_a_0050653_rois_cc200.1D
2,-0.108143,0.180122,-0.094069,-0.301107,0.065537,-0.541221,0.249262,-0.313523,,-0.001450,...,,0.163772,-0.134280,,0.159858,0.221677,,,-0.258332,CMU_b_0050651_rois_cc200.1D
3,-0.326598,-0.034746,-0.143261,-0.442049,0.057040,-0.383205,0.330628,-0.156431,-0.267438,-0.364511,...,-0.091295,-0.271951,0.175467,-0.238492,-0.060148,-0.025812,0.178454,-0.030119,-0.289735,CMU_b_0050657_rois_cc200.1D
4,-0.272753,-0.228588,-0.062366,-0.142554,0.279675,-0.036850,0.177369,0.149434,0.004807,-0.075403,...,-0.053606,0.043377,0.295762,-0.067350,-0.216341,-0.143870,-0.025863,0.076545,0.059318,CMU_b_0050669_rois_cc200.1D
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
879,-0.094873,-0.165853,0.063408,-0.082486,0.037484,-0.037947,0.243281,0.014499,-0.060678,-0.154020,...,-0.076239,0.152765,0.193868,-0.191272,-0.107559,0.142799,0.241740,0.026914,0.185163,Yale_0050624_rois_cc200.1D
880,-0.111606,0.074133,-0.150416,-0.361879,0.190066,-0.530953,0.462906,0.090152,-0.016788,-0.168453,...,0.030378,-0.127839,0.081401,-0.069043,-0.009438,0.351551,0.108695,0.354649,-0.053610,Yale_0050625_rois_cc200.1D
881,-0.113827,-0.256892,-0.125796,-0.119745,0.051036,0.137680,0.223421,0.026294,0.024161,0.115746,...,-0.103226,-0.196867,0.020505,-0.047386,-0.274118,-0.200910,0.261185,0.208521,0.162905,Yale_0050626_rois_cc200.1D
882,-0.220996,0.312383,-0.224964,-0.055642,-0.014701,-0.124708,0.038391,0.212432,-0.140073,-0.213447,...,-0.132730,0.328198,0.009550,-0.067159,-0.039316,0.139553,0.116997,-0.076892,0.020700,Yale_0050627_rois_cc200.1D
