**Cell Types Project Notebook**


In [None]:
import pandas as pd
from scipy import stats
import matplotlib as mpl
import matplotlib.pyplot as plt
import numpy as np

In [None]:
from allensdk.core.cell_types_cache import CellTypesCache
from allensdk.api.queries.cell_types_api import CellTypesApi
# Cache handle for Allen Cell Types data, backed by the given manifest file.
ctc = CellTypesCache(manifest_file='cell_types/manifest.json')

# Metadata for human cells only, as a table indexed by the 'id' column.
human_cells = ctc.get_cells(species=[CellTypesApi.HUMAN])
human_df = pd.DataFrame(human_cells).set_index('id')
human_df.head()

# Electrophysiology features indexed by 'specimen_id', joined onto the cell
# metadata by index (DataFrame.join keeps every row of human_df by default).
# NOTE(review): this relies on cell 'id' and 'specimen_id' sharing the same
# identifier space -- confirm against the AllenSDK documentation.
ephys_features = pd.DataFrame(ctc.get_ephys_features())
ephys_features = ephys_features.set_index('specimen_id')
human_ephys_df = human_df.join(ephys_features)
human_ephys_df.head()

In [None]:
# Load the tab-separated expression table and index its rows by gene symbol.
gene_df = pd.read_csv(
    'brainarea_vs_genes_exp_w_reannotations.tsv',
    sep='\t',
).set_index('gene_symbol')
gene_df.head()

# Plain-list copies of the column labels (brain areas, going by the file
# name) and of the row labels (gene symbols).
brain_regions = list(gene_df.columns)
genes = list(gene_df.index)

In [None]:
# Collect GABA receptor genes: every symbol containing "GABR" or "GABBR".
# Reference list: https://www.genenames.org/data/genegroup/#!/group/562
GABA_genes = [
    symbol
    for symbol in genes
    if "GABR" in symbol or "GABBR" in symbol
]
print(GABA_genes)

In [None]:
# Rank brain regions by total GABA receptor gene expression.
# Start by restricting the expression table to the GABA receptor genes.
gaba_gene_df = gene_df.loc[GABA_genes]

# Per-column total over those genes, ordered from highest to lowest.
gaba_region_expression = (
    gaba_gene_df
    .sum(axis=0)
    .sort_values(ascending=False)
)

# Show the ten highest-ranked brain areas.
print("Top Brain Regions with Highest GABA Receptor Gene Expression:")
print(gaba_region_expression.head(10))

In [None]:
# Find glutamate receptor genes.
# Reference list: https://www.genenames.org/data/genegroup/#!/group/282
import re

# Receptor symbols are a family prefix followed directly by a digit:
# GRM<n> (metabotropic) and GRIA/GRID/GRIK/GRIN<n> (ionotropic).  A bare
# substring test for "GRM"/"GRI" also accepts unrelated symbols such as
# GRIP1, GRINA or GRIFIN, which would inflate the per-region sums computed
# from this list.
_GLUTAMATE_RECEPTOR_SYMBOL = re.compile(r"(?:GRM|GRI[ADKN])\d")

glutamate_genes = [
    symbol for symbol in genes if _GLUTAMATE_RECEPTOR_SYMBOL.match(symbol)
]
print(glutamate_genes)

In [None]:
# Rank brain regions by total glutamate receptor gene expression.
# Start by restricting the expression table to the glutamate receptor genes.
glutamate_gene_df = gene_df.loc[glutamate_genes]

# Per-column total over those genes, ordered from highest to lowest.
glutamate_region_expression = (
    glutamate_gene_df
    .sum(axis=0)
    .sort_values(ascending=False)
)

# Show the ten highest-ranked brain areas.
print("Top Brain Regions with Highest Glutamate Receptor Gene Expression:")
print(glutamate_region_expression.head(10))