# Summary analysis in Hippocampus

In [1]:
import numpy as np
import pandas as pd
from venn import venn
from matplotlib import pyplot as plt

from plotnine import *
from warnings import filterwarnings
# `matplotlib.cbook.mplDeprecation` was deprecated in Matplotlib 3.6 and later
# removed; the same warning class is available as
# `matplotlib.MatplotlibDeprecationWarning`. It is imported under the old alias
# so any later reference to `mplDeprecation` keeps working.
from matplotlib import MatplotlibDeprecationWarning as mplDeprecation
# Silence Matplotlib deprecation warnings for the rest of the notebook.
filterwarnings("ignore",category=mplDeprecation)

## Summary plots

### Genes

In [2]:
# Load the gene-level interaction results.
# index_col=0 makes the first column the index, matching the transcript, exon
# and junction cells. Without it, a file whose header names the first column
# yields a positional RangeIndex, and `Feature` below would hold row numbers
# instead of feature IDs.
genes = pd.read_csv('../../_m/genes/diffExpr_interaction_full.txt',
                    sep='\t', index_col=0)
# Keep rows with adjusted p-value below 0.20, most significant first.
genes = genes[(genes['adj.P.Val'] < 0.20)].sort_values('adj.P.Val')
# Expose the index as an explicit `Feature` column.
genes['Feature'] = genes.index
genes = genes[['Feature', 'Symbol', 'ensemblID', 'logFC', 'adj.P.Val']]
# Tag the rows with their feature type.
genes['Type'] = 'gene'
genes.head()

Unnamed: 0,Feature,Symbol,ensemblID,logFC,adj.P.Val,Type


### Transcripts

In [20]:
# Load the transcript-level interaction results; the first column is the index.
trans = pd.read_csv('../../_m/transcripts/diffExpr_interaction_full.txt',
                    sep='\t', index_col=0)
# Keep rows with adjusted p-value below 0.20, most significant first.
trans = trans[(trans['adj.P.Val'] < 0.20)].sort_values('adj.P.Val')
# Expose the index as an explicit `Feature` column.
trans['Feature'] = trans.index
# Remove every ".<digits>" run from gene_id (e.g. a trailing version suffix).
# regex=True is required: since pandas 2.0 `str.replace` treats the pattern as
# a literal string by default, which would leave the IDs unchanged. The raw
# string avoids the invalid "\d" escape of the previous non-raw literal.
trans['ensemblID'] = trans.gene_id.str.replace(r'\.\d+', '', regex=True)
# Unlike the other feature tables in this notebook, P.Value is kept here.
trans = trans[['Feature', 'Symbol', 'ensemblID', 'logFC', 'P.Value', 'adj.P.Val']]
# Tag the rows with their feature type.
trans['Type'] = 'transcript'
trans.head()

Unnamed: 0,Feature,Symbol,ensemblID,logFC,P.Value,adj.P.Val,Type
ENST00000478214.1,ENST00000478214.1,HMGA1,ENSG00000137309,2.625696,1e-06,0.097925,transcript


### Exons

In [9]:
# Exon-level interaction results: read the table (first column as index),
# keep rows with adjusted p-value below 0.20 sorted by that value, expose the
# index as `Feature`, select the summary columns, and tag the feature type.
exons = (
    pd.read_csv('../../_m/exons/diffExpr_interaction_full.txt',
                sep='\t', index_col=0)
    .loc[lambda tbl: tbl['adj.P.Val'] < 0.20]
    .sort_values('adj.P.Val')
    .assign(Feature=lambda tbl: tbl.index)
    .loc[:, ['Feature', 'Symbol', 'ensemblID', 'logFC', 'adj.P.Val']]
    .assign(Type='exon')
)
exons.head()

Unnamed: 0,Feature,Symbol,ensemblID,logFC,adj.P.Val,Type


### Junctions

In [12]:
# Junction-level interaction results; the first column is the index.
juncs = pd.read_csv(
    '../../_m/junctions/diffExpr_interaction_full.txt',
    sep='\t',
    index_col=0,
)
# NOTE(review): the cutoff here is 0.05, whereas the gene, transcript and exon
# cells use 0.20 -- confirm this difference is intended.
significant = juncs['adj.P.Val'] < 0.05
juncs = juncs.loc[significant].sort_values('adj.P.Val')
# Expose the index as `Feature`, then keep only the summary columns.
juncs.insert(len(juncs.columns), 'Feature', juncs.index, allow_duplicates=False) \
    if 'Feature' not in juncs.columns else juncs.__setitem__('Feature', juncs.index)
juncs = juncs.loc[:, ['Feature', 'Symbol', 'ensemblID', 'logFC', 'adj.P.Val']]
# Tag the rows with their feature type.
juncs['Type'] = 'junction'
juncs.head()

Unnamed: 0,Feature,Symbol,ensemblID,logFC,adj.P.Val,Type
chr14:49853786-49862553(-),chr14:49853786-49862553(-),,,6.843164,0.002007,junction
chr18:31592940-31592993(+),chr18:31592940-31592993(+),,,3.726332,0.003891,junction
chr21:8219273-8402302(-),chr21:8219273-8402302(-),,,-3.263341,0.003891,junction
chrX:140784309-140784456(+),chrX:140784309-140784456(+),,,3.17827,0.046789,junction


#### The junction (chr21:8402231-8402287) lies within RNA45SN3; a lot of splicing is recorded there in the sorted BAM.