# Expressed Gene List of Mimic

Brian asked Sharvani and Max to intersect the Mimic list with all the commonly expressed genes on the X and 4th chromosomes. I need to dump out these gene lists for them to do the merge.

In [1]:
import os
import sys
from pathlib import Path

from IPython.display import display, HTML, Markdown
import numpy as np
import pandas as pd
from scipy.stats import chi2_contingency

import matplotlib as mpl
import matplotlib.pyplot as plt
import seaborn as sns

# Project level imports
sys.path.insert(0, '../lib')
from larval_gonad.notebook import Nb
from larval_gonad.x_to_a import (CHROMS_CHR, MAJOR_ARMS_CHR, idx_stats_by_cluster, commonly_expressed)
from larval_gonad.plotting import make_figs
from larval_gonad.io import memory

# Configure this notebook through the project's Nb helper; the first argument
# is the notebook name and outputs are rooted at the given subproject directory.
nbconfig = Nb.setup_notebook(
    '2018-02-08_expressed_gene_list_for_mimic',
    subproject_dir='../output/testis_scRNAseq_pilot',
)

last updated: 2018-02-08 
Git hash: be8ef9727c59afa8d3497e24ff289ad4e61e8c95


In [2]:
# Import data from testes: normalized read counts as exposed by the
# notebook config's Seurat accessor.
norm = nbconfig.seurat.get_normalized_read_counts()

# Get the list of commonly expressed genes.
# NOTE(review): the expression criterion lives in larval_gonad.x_to_a.commonly_expressed
# and is not visible here — confirm the threshold before sharing the list.
expressed = commonly_expressed(norm)

In [8]:
# Select the rows of nbconfig.fbgn2chrom labelled by the commonly expressed genes.
# NOTE(review): assuming `expressed` is a list-like of labels, recent pandas raises
# KeyError from .loc if any label is missing — confirm every gene is in fbgn2chrom.
expressed2Chrom = nbconfig.fbgn2chrom.loc[expressed]

In [25]:
# Keep only the commonly expressed genes whose chromosome is chrX or chr4.
# The copy makes `interest` independent of expressed2Chrom before adding a column.
interest = expressed2Chrom[expressed2Chrom.chrom.isin(['chrX', 'chr4'])].copy()

# Look up each index label in nbconfig.fbgn2symbol, store the result in a
# 'gene' column, then append that column as an extra index level.
interest['gene'] = [nbconfig.fbgn2symbol[fbgn] for fbgn in interest.index]
interest = interest.set_index('gene', append=True)

In [26]:
# Sanity check: number of selected genes per chromosome.
interest.groupby('chrom').size()

chrom
chr4     44
chrX    466
dtype: int64

In [27]:
# Display the path that the notebook config builds for a table named 'target'.
nbconfig.table_name('target')

'./tables/2018-02-08_expressed_gene_list_for_mimic_target'

In [28]:
# Write the chrX/chr4 gene table (including its index levels) as a tab-separated file.
# NOTE(review): this path is hard-coded rather than built from
# nbconfig.table_name('target') — confirm this is the intended output location.
fname = '../output/2018-02-08_expressed_gene_list_for_mimic_target.tsv'
interest.to_csv(fname, sep='\t')