## Import packages

In [1]:
import os
import sys

import pandas as pd

# Add the parent of the current working directory to the import path so the
# local `wholebrain_tools` package can be imported from this notebook.
# os.path.abspath already returns a str, so no extra string formatting is needed.
sys.path.append(os.path.abspath(os.pardir))

from wholebrain_tools import aba, genes, dataIO
import wholebrain_tools.stats as st
import wholebrain_tools.graphics as gt

# Project path configuration; its attributes are read throughout the notebook.
paths = dataIO.pathParser()

# Shared helpers reused by the cells below:
#   A   - atlas object built from the structures file at `nodes_path`
#   GM  - gene manager handed to the correlation routine
#   DFM - dataframe manager bound to the atlas `A`
nodes_path = paths.structures
A = aba.Atlas(nodes=nodes_path)
GM = genes.GeneManager()
DFM = aba.AnatomyDataFrameManager(A)

# Genes correlated with PV cells
---

#### Load datasets and define saving path

In [2]:
# --------------------------------------------------------------------
ish_path = paths.abaIsh_datasets
# --------------------------------------------------------------------

# Load the gene-expression data found at `ish_path` once per metric:
# energy, density and intensity.
ish_en = dataIO.loadGeneExpressionFromFile(ish_path, metric='energy')
ish_dens = dataIO.loadGeneExpressionFromFile(ish_path, metric='density')
ish_int = dataIO.loadGeneExpressionFromFile(ish_path, metric='intensity')


In [None]:
# --------------------------------------------------------------------
searchPath = paths.alldata
channelName = 'pv'  # channel to analyse: 'wfa' or 'pv'
# --------------------------------------------------------------------

# Gather the region-level data for the selected channel from `searchPath`.
pv = dataIO.allMiceRegions(
    searchPath=searchPath,
    channelName=channelName,
    normCellIntens=True,
)

# Reshape the table in two steps with the dataframe manager; `pv` is rebound
# at each step, so only the final (mid-level, normalized) table is kept.
pv = DFM.multiIndexDf_from_fineDf(pv, verbose=True)
pv = DFM.regionsDf_to_mid(pv, verbose=False, normalize=True)

# Average 'energy' vector used by all correlation cells below.
# NOTE(review): exclude_last=5 presumably drops the last five entries before
# averaging -- confirm against DFM.midDf_to_avgVector.
avg_en = DFM.midDf_to_avgVector(pv, 'energy', exclude_last=5)




In [None]:
# --------------------------------------------------------------------
savingdir = paths.corrdata_genes
# --------------------------------------------------------------------

# The cells below write CSV files into `savingdir` with DataFrame.to_csv,
# which does not create missing parent directories. Create the folder up
# front so a fresh checkout does not fail at the first save.
os.makedirs(savingdir, exist_ok=True)

## PV Energy

### Gene expression energy

In [None]:
# Correlation of the average PV energy vector (`avg_en`) with the ISH
# expression-energy data (`ish_en`).
corr_stat1 = st.correlation_with_abagenes(
    avgseries=avg_en,
    genes_df=ish_en,
    gene_manager=GM,
)

In [None]:
# Write the PV-energy vs ISH-energy correlation table to CSV in `savingdir`,
# leaving out the index column.
filepath = os.path.join(savingdir, 'pvEn_ishEn_corrdata.csv')
corr_stat1.to_csv(filepath, index=False)

In [None]:
# Run the marker check for 'pv' on the PV-energy vs ISH-energy correlation
# table. NOTE(review): presumably reports how known PV marker genes score in
# this table -- confirm in genes.check_markers.
genes.check_markers(corr_stat1, 'pv')

In [None]:
# Summarise the PV-energy vs ISH-energy correlations using a 0.05 Bonferroni
# and a 0.01 FDR alpha. NOTE(review): to_file=False presumably prints the
# summary instead of saving it under `prefix` -- confirm.
genes.print_correlation_summary(
    corr_stat1,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="pvEn-ISHen",
)

### Gene expression intensity

In [None]:
# Correlation of the average PV energy vector (`avg_en`) with the ISH
# expression-intensity data (`ish_int`).
corr_stat2 = st.correlation_with_abagenes(
    avgseries=avg_en,
    genes_df=ish_int,
    gene_manager=GM,
)

In [None]:
# Write the PV-energy vs ISH-intensity correlation table to CSV in
# `savingdir`, leaving out the index column.
filepath = os.path.join(savingdir, 'pvEn_ishInt_corrdata.csv')
corr_stat2.to_csv(filepath, index=False)

In [None]:
# Run the marker check for 'pv' on the PV-energy vs ISH-intensity correlation
# table. NOTE(review): presumably reports how known PV marker genes score in
# this table -- confirm in genes.check_markers.
genes.check_markers(corr_stat2, 'pv')

In [None]:
# Summarise the PV-energy vs ISH-intensity correlations using a 0.05
# Bonferroni and a 0.01 FDR alpha. NOTE(review): to_file=False presumably
# prints the summary instead of saving it under `prefix` -- confirm.
genes.print_correlation_summary(
    corr_stat2,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="pvEn-ISHint",
)

### Gene expression density

In [None]:
# Correlation of the average PV energy vector (`avg_en`) with the ISH
# expression-density data (`ish_dens`).
corr_stat3 = st.correlation_with_abagenes(
    avgseries=avg_en,
    genes_df=ish_dens,
    gene_manager=GM,
)

In [None]:
# Write the PV-energy vs ISH-density correlation table to CSV in `savingdir`,
# leaving out the index column.
filepath = os.path.join(savingdir, 'pvEn_ishDens_corrdata.csv')
corr_stat3.to_csv(filepath, index=False)

In [None]:
# Run the marker check for 'pv' on the PV-energy vs ISH-density correlation
# table. NOTE(review): presumably reports how known PV marker genes score in
# this table -- confirm in genes.check_markers.
genes.check_markers(corr_stat3, 'pv')

In [None]:
# Summarise the PV-energy vs ISH-density correlations using a 0.05 Bonferroni
# and a 0.01 FDR alpha. NOTE(review): to_file=False presumably prints the
# summary instead of saving it under `prefix` -- confirm.
genes.print_correlation_summary(
    corr_stat3,
    alpha_bonf=0.05,
    alpha_fdr=0.01,
    to_file=False,
    prefix="pvEn-ISHdens",
)