## Import packages

In [None]:
import pandas as pd
import os

import sys
sys.path.append(r'C:\Users\Valentino\Documents\MATLAB\PNN_wholeBrain\analysis_CTR')
from geneTool import GeneManager, print_correlation_summary, check_markers
from AbaTool import Atlas, AnatomyDataFrameManager
from StatTools import correlation_with_abagenes
import dataIO



# Location of the structure-tree JSON handed to the Atlas constructor.
nodes_path = r'C:\Users\Valentino\Documents\MATLAB\PNN_wholeBrain\analysis_CTR\structures.json'

# Shared helper objects reused by every cell below:
#   A   - atlas built from the structures file
#   GM  - gene manager passed to the correlation routine
#   DFM - dataframe manager bound to the atlas
A = Atlas(nodes=nodes_path)
GM = GeneManager()
DFM = AnatomyDataFrameManager(A)

# Genes correlated with PNNs
---

#### Load datasets and define the saving path

In [None]:
# --------------------------------------------------------------------
ish_path = r"D:\proj_PNN-Atlas\ABAgeneData"
# --------------------------------------------------------------------

# Read the gene-expression data once per metric from the same folder.
# The calls run in the order energy -> density -> intensity.
ish_en, ish_dens, ish_int = (
    dataIO.loadGeneExpressionFromFile(ish_path, metric=metric)
    for metric in ('energy', 'density', 'intensity')
)


In [None]:
# --------------------------------------------------------------------
searchPath = r'D:\proj_PNN-Atlas\RESULTS\allData_CTR'
channelName = 'wfa'     # 'wfa' or 'pv'
# --------------------------------------------------------------------

# Build the regional table for the selected channel, then pass it through
# the two DFM conversions that the averaging step below relies on.
wfa = dataIO.allMiceRegions(
    searchPath=searchPath,
    channelName=channelName,
    normCellIntens=True,
)
wfa = DFM.multiIndexDf_from_fineDf(wfa, verbose=True)
wfa = DFM.regionsDf_to_mid(wfa, verbose=False, normalize=True)

# One average vector per measurement column ('energy' first, then
# 'diffuseFluo'), both computed with the same exclude_last setting.
avg_en, avg_diff = (
    DFM.midDf_to_avgVector(wfa, column, exclude_last=5)
    for column in ('energy', 'diffuseFluo')
)



In [None]:
# --------------------------------------------------------------------
savingdir = r'D:\proj_PNN-Atlas\RESULTS\genecorrelationISH\correlations'
# --------------------------------------------------------------------

# Every section below writes a CSV into this folder. Create it up front
# (including missing parents) so the first to_csv call does not fail with
# an OSError on a fresh machine; exist_ok makes re-running the cell safe.
os.makedirs(savingdir, exist_ok=True)

## PNN energy

### Gene expression energy

In [None]:
# PNN energy (avg_en) vs. ISH expression energy (ish_en).
corr_stat1 = correlation_with_abagenes(
    avgseries=avg_en,
    genes_df=ish_en,
    gene_manager=GM,
)
                                    

In [None]:
# Show the correlation results as this cell's output.
corr_stat1

In [None]:
# Save the PNN-energy / ISH-energy results to CSV, omitting the index column.
filepath = os.path.join(
    savingdir,
    'pnnEn_ishEn_corrdata.csv',
)
corr_stat1.to_csv(filepath, index=False)

In [None]:
# Run geneTool's check_markers on these results with the 'wfa' argument.
check_markers(
    corr_stat1,
    'wfa',
)

In [None]:
# Summarize the results at the two significance thresholds below.
# to_file=False: presumably nothing is written to disk - confirm in geneTool.
print_correlation_summary(
    corr_stat1,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="pnnEn-ISHen",
)

### Gene expression intensity

In [None]:
# PNN energy (avg_en) vs. ISH expression intensity (ish_int).
corr_stat2 = correlation_with_abagenes(
    avgseries=avg_en,
    genes_df=ish_int,
    gene_manager=GM,
)

In [None]:
# Save the PNN-energy / ISH-intensity results to CSV, omitting the index column.
filepath = os.path.join(
    savingdir,
    'pnnEn_ishInt_corrdata.csv',
)
corr_stat2.to_csv(filepath, index=False)

In [None]:
# Run geneTool's check_markers on these results with the 'wfa' argument.
check_markers(
    corr_stat2,
    'wfa',
)

In [None]:
# Summarize the results at the two significance thresholds below.
# to_file=False: presumably nothing is written to disk - confirm in geneTool.
print_correlation_summary(
    corr_stat2,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="pnnEn-ISHint",
)

### Gene expression density

In [None]:
# PNN energy (avg_en) vs. ISH expression density (ish_dens).
corr_stat3 = correlation_with_abagenes(
    avgseries=avg_en,
    genes_df=ish_dens,
    gene_manager=GM,
)

In [None]:
# Save the PNN-energy / ISH-density results to CSV, omitting the index column.
filepath = os.path.join(
    savingdir,
    'pnnEn_ishDens_corrdata.csv',
)
corr_stat3.to_csv(filepath, index=False)

In [None]:
# Run geneTool's check_markers on these results with the 'wfa' argument.
check_markers(
    corr_stat3,
    'wfa',
)

In [None]:
# Summarize the results at the two significance thresholds below.
# to_file=False: presumably nothing is written to disk - confirm in geneTool.
print_correlation_summary(
    corr_stat3,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="pnnEn-ISHdens",
)

## WFA diffuse fluorescence

### Gene expression density

In [None]:
# WFA diffuse fluorescence (avg_diff) vs. ISH expression density (ish_dens).
corr_stat4 = correlation_with_abagenes(
    avgseries=avg_diff,
    genes_df=ish_dens,
    gene_manager=GM,
)

In [None]:
# Save the WFA-diffuse / ISH-density results to CSV, omitting the index column.
filepath = os.path.join(
    savingdir,
    'wfaDiff_ishDens_corrdata.csv',
)
corr_stat4.to_csv(filepath, index=False)

In [None]:
# Run geneTool's check_markers on these results with the 'wfa' argument.
check_markers(
    corr_stat4,
    'wfa',
)

In [None]:
# Summarize the results at the two significance thresholds below.
# to_file=False: presumably nothing is written to disk - confirm in geneTool.
print_correlation_summary(
    corr_stat4,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="wfaDiff-ISHdens",
)

### Gene expression energy

In [None]:
# WFA diffuse fluorescence (avg_diff) vs. ISH expression energy (ish_en).
corr_stat5 = correlation_with_abagenes(
    avgseries=avg_diff,
    genes_df=ish_en,
    gene_manager=GM,
)

In [None]:
# Save the WFA-diffuse / ISH-energy results to CSV, omitting the index column.
filepath = os.path.join(
    savingdir,
    'wfaDiff_ishEn_corrdata.csv',
)
corr_stat5.to_csv(filepath, index=False)

In [None]:
# Run geneTool's check_markers on these results with the 'wfa' argument.
check_markers(
    corr_stat5,
    'wfa',
)

In [None]:
# Summarize the results at the two significance thresholds below.
# to_file=False: presumably nothing is written to disk - confirm in geneTool.
print_correlation_summary(
    corr_stat5,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="wfaDiff-ISHen",
)

### Gene expression intensity

In [None]:
# WFA diffuse fluorescence (avg_diff) vs. ISH expression intensity (ish_int).
corr_stat6 = correlation_with_abagenes(
    avgseries=avg_diff,
    genes_df=ish_int,
    gene_manager=GM,
)

In [None]:
# Save the WFA-diffuse / ISH-intensity results to CSV, omitting the index column.
filepath = os.path.join(
    savingdir,
    'wfaDiff_ishInt_corrdata.csv',
)
corr_stat6.to_csv(filepath, index=False)

In [None]:
# Run geneTool's check_markers on these results with the 'wfa' argument.
check_markers(
    corr_stat6,
    'wfa',
)

In [None]:
# Summarize the results at the two significance thresholds below.
# The prefix is spelled "wfaDiff" (not "wfaDIff") so it matches the other
# WFA-diffuse sections and any output keyed on the prefix stays consistent.
# to_file=False: presumably nothing is written to disk - confirm in geneTool.
print_correlation_summary(
    corr_stat6,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="wfaDiff-ISHint",
)