# Immune Circle Heatmap

This notebook takes the genes that are hits in the top immune-related pathways of the KEGG enrichment analysis (run below with gseapy's Enrichr) and maps them on a large circle heat map. 

In [2]:
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
import scipy.stats
import re
import sys 
import statsmodels.stats.multitest


import gseapy as gp
from gseapy.plot import barplot, dotplot

import cptac
import cptac.utils as u
import plot_utils as p 

  import pandas.util.testing as tm


Load the DataFrame with all of the genes that have at least 2 trans effects. Then get the list of gene names and use it to run a GSEA. 

In [3]:
# Read the table and key its rows by the 'Comparison' column.
df = pd.read_csv(
    "../Step3.3_Pos_Neg_Correlation_patterns/csv_files/pancan_EGFR_all_FDR_atleast2_same_corr.csv"
).set_index('Comparison')

# Once transposed, the 'Comparison' labels become the column headers;
# collect them as a plain Python list.
df1_transposed = df.transpose()
FDR_atleast2 = df1_transposed.columns.values.tolist()


In [4]:
# Remove the "_proteomics" tag from every label, leaving the bare gene names.
proteomics_tag = re.compile("_proteomics")
atleast2_sig = [proteomics_tag.sub("", label) for label in FDR_atleast2]
len(atleast2_sig)

731

Run the enrichment analysis using the KEGG 2016 gene set

In [5]:

# Run gseapy's Enrichr query for the gene list against the 'KEGG_2016'
# gene-set library; the result table is read from `tumor_enr.res2d` below.
tumor_enr = gp.enrichr(
    gene_list=atleast2_sig,
    description='Tumor_partition',
    gene_sets='KEGG_2016',
    outdir='test/enrichr_kegg',
)

In [7]:
# Preview the first five rows of the enrichment results table.
tumor_enr.res2d.iloc[:5]

Unnamed: 0,Gene_set,Term,Overlap,P-value,Adjusted P-value,Old P-value,Old Adjusted P-value,Odds Ratio,Combined Score,Genes
0,KEGG_2016,T cell receptor signaling pathway Homo sapiens...,18/104,3.843089e-08,1.1e-05,0,0,4.735347,80.853225,JUN;NFATC2;PIK3CD;CD3G;PIK3CG;VAV1;MAPK13;ZAP7...
1,KEGG_2016,B cell receptor signaling pathway Homo sapiens...,15/73,4.867319e-08,7e-06,0,0,5.621873,94.661868,CR2;JUN;SYK;PIK3CD;NFATC2;PIK3CG;VAV1;PPP3CC;I...
2,KEGG_2016,Natural killer cell mediated cytotoxicity Homo...,20/135,1.017982e-07,1e-05,0,0,4.053301,65.259253,SYK;IFNGR1;SH2D1A;NFATC2;PIK3CD;ITGAL;PIK3CG;V...
3,KEGG_2016,Glycolysis / Gluconeogenesis Homo sapiens hsa0...,14/67,1.089237e-07,8e-06,0,0,5.716969,91.657983,GPI;ADH1C;ADH1B;ENO1;HK2;PKM;ALDH1B1;PGK1;ALDO...
4,KEGG_2016,Fc gamma R-mediated phagocytosis Homo sapiens ...,16/93,2.376797e-07,1.4e-05,0,0,4.707059,71.793675,NCF1;SYK;MYO10;SPHK1;WAS;PIK3CD;PLD1;PIK3CG;VA...


In [35]:
# Get the genes for row 0 of the enrichment table (the T cell receptor
# signaling pathway term in the results preview shown in this notebook).
cptac_df = tumor_enr.res2d
# Select the 'Genes' column by name instead of by position (was column 9),
# so the lookup does not depend on the column order of the results table.
immune = cptac_df["Genes"].iloc[0]
# The cell holds the gene symbols as a single ';'-separated string.
immune = immune.split(';')

len(immune)


18

In [36]:

# Load the combined Pearson results and discard the 'Unnamed: 0' column
# (presumably an index saved with the CSV — confirm against the writer).
df_FDR_append_all = pd.read_csv(
    "../Step3.2_combining_pearson_dfs/csv_files/pancan_EGFR_pearson_all_prot_append_return_all.csv"
).drop(columns=['Unnamed: 0'])

In [37]:
# Re-attach the "_proteomics" tag so the names match the 'Comparison' labels.
immune_column_names = [symbol + "_proteomics" for symbol in immune]

# Keep only the rows whose 'Comparison' label is one of the selected genes.
is_selected = df_FDR_append_all["Comparison"].isin(immune_column_names)
df_FDR_immune_all = df_FDR_append_all[is_selected]


# T cell Receptor  

In [39]:
# Draw the circle heat map for the currently selected genes.
# NOTE(review): the four strings are column names passed positionally;
# their roles (size / colour / axes) are defined in plot_utils — confirm there.
p.plotCircleHeatMap(
    df_FDR_immune_all,
    "P_value",
    "Correlation",
    "Comparison",
    "Cancer Type",
    plot_width=800,
    plot_height=650,
)

# B cell Receptor

In [27]:
# Get the genes for row 1 of the enrichment table (the B cell receptor
# signaling pathway term in the results preview shown in this notebook).
cptac_df = tumor_enr.res2d
# Select the 'Genes' column by name instead of by position (was column 9),
# so the lookup does not depend on the column order of the results table.
immune = cptac_df["Genes"].iloc[1]
# The cell holds the gene symbols as a single ';'-separated string.
immune = immune.split(';')

len(immune)

15

In [28]:
# Re-attach the "_proteomics" tag so the names match the 'Comparison' labels.
immune_column_names = [symbol + "_proteomics" for symbol in immune]

# Keep only the rows whose 'Comparison' label is one of the selected genes.
is_selected = df_FDR_append_all["Comparison"].isin(immune_column_names)
df_FDR_immune_all = df_FDR_append_all[is_selected]

In [29]:
# Draw the circle heat map for the currently selected genes.
# NOTE(review): the four strings are column names passed positionally;
# their roles (size / colour / axes) are defined in plot_utils — confirm there.
p.plotCircleHeatMap(
    df_FDR_immune_all,
    "P_value",
    "Correlation",
    "Comparison",
    "Cancer Type",
    plot_width=600,
    plot_height=650,
)

In [31]:
# Get the genes for row 2 of the enrichment table (the Natural killer cell
# mediated cytotoxicity term in the results preview shown in this notebook).
cptac_df = tumor_enr.res2d
# Select the 'Genes' column by name instead of by position (was column 9),
# so the lookup does not depend on the column order of the results table.
immune = cptac_df["Genes"].iloc[2]
# The cell holds the gene symbols as a single ';'-separated string.
immune = immune.split(';')

len(immune)

20

In [32]:
# Re-attach the "_proteomics" tag so the names match the 'Comparison' labels.
immune_column_names = [symbol + "_proteomics" for symbol in immune]

# Keep only the rows whose 'Comparison' label is one of the selected genes.
is_selected = df_FDR_append_all["Comparison"].isin(immune_column_names)
df_FDR_immune_all = df_FDR_append_all[is_selected]

In [33]:
# Draw the circle heat map for the currently selected genes.
# NOTE(review): the four strings are column names passed positionally;
# their roles (size / colour / axes) are defined in plot_utils — confirm there.
p.plotCircleHeatMap(
    df_FDR_immune_all,
    "P_value",
    "Correlation",
    "Comparison",
    "Cancer Type",
    plot_width=600,
    plot_height=650,
)