# Examine Relation of Altered Transcriptomics and Proteomics when ARID1A is mutated in Ovarian Cancer

### Library Imports

In [2]:
import pandas as pd
import numpy as np
import scipy.stats
import collections
import re
import gseapy as gp
from gseapy.plot import barplot, dotplot
import matplotlib.pyplot as plt
import seaborn as sns

import cptac
import cptac.algorithms as al

# Instantiate cptac's Ovarian dataset object; later cells query it through
# ov.join_omics_to_mutations(...).
ov = cptac.Ovarian()

                                    

### Load Results of Trans Analysis

In [4]:
# Read the saved trans-analysis results table. Later cells filter it on the
# 'Cancer_Type', 'Mutation_Gene' and 'Omics' columns and read gene names from 'Protein'.
# The path is relative, so it is resolved against the current working directory.
Trans_Results = pd.read_csv("Formatted_Trans_Results.csv")

### Filter for only Ovarian Cancer Type, ARID1A Mutation, and Transcript or Proteomic Comparison

In [16]:
# Narrow the results step by step: ovarian rows first, then ARID1A-mutation rows.
Ovarian = Trans_Results[Trans_Results['Cancer_Type'].eq('Ovarian')]
ARID = Ovarian[Ovarian['Mutation_Gene'].eq('ARID1A')]

# Split the ARID1A rows by the omics layer in which the change was detected.
transcript, proteomic = (
    ARID[ARID['Omics'].eq(omics_type)]
    for omics_type in ('transcriptomics', 'proteomics')
)

# Plain Python lists of gene names, one entry per row (names may repeat).
transcript_proteins = transcript['Protein'].tolist()
proteomic_proteins = proteomic['Protein'].tolist()

### Print proteins whose proteomic levels are significantly altered when ARID1A is Mutated

In [19]:
# Display the 'Protein' values of the proteomics rows; there is one entry per
# row of the filtered table, so the same name can appear more than once.
proteomic_proteins

['ING1', 'OLFM4', 'TIMP1', 'PAXIP1', 'ING1', 'ZBTB40', 'PIGR', 'TMEM63A']

### Print proteins whose transcript levels are significantly altered when ARID1A is Mutated

In [18]:
# Display the 'Protein' values of the transcriptomics rows; there is one entry
# per row of the filtered table, so the same name can appear more than once.
transcript_proteins

['PGR',
 'MTNR1B',
 'CDK20',
 'HMX3',
 'RXFP1',
 'GPR97',
 'TUNAR',
 'SLC26A2',
 'PGAP2',
 'ANKRD20A12P',
 'TNFRSF18',
 'HGD',
 'C10orf71',
 'LOC100506526',
 'C2CD4B',
 'MFAP3L',
 'LINC00645',
 'OLFM4',
 'HES2',
 'RNF186',
 'SLC5A9',
 'CCAT1',
 'FGF14',
 'LOC158434',
 'GABRP',
 'ERMN',
 'SCGB2A1',
 'SERINC2',
 'HMX2',
 'CAPN6',
 'ELP3',
 'GUCA1C',
 'GJD3',
 'RCAN1',
 'PIGR',
 'LOC102723769',
 'ARSA',
 'LINC00485',
 'KLHDC7B',
 'C2orf16',
 'GDA',
 'LRRC26',
 'MOGAT1',
 'CRELD2',
 'NCMAP',
 'MSX1',
 'SCNN1B',
 'AGR2',
 'LINC01207',
 'TCN1',
 'LEFTY1',
 'MTRNR2L1',
 'SPATA21',
 'CSF3',
 'GNRHR',
 'RASD1',
 'SLC46A2',
 'SPRR2D',
 'ANKS4B',
 'BAIAP2L2',
 'SERPINA4',
 'PHYHIPL',
 'ANAPC4',
 'TFF3',
 'PEBP4',
 'C1orf64',
 'PGR',
 'OR8D4',
 'PRR15',
 'FAM150B',
 'UBTFL1',
 'FGL1',
 'CCAT2',
 'SERPINA3',
 'ZBTB25',
 'DUXA',
 'STX18',
 'MICALCL',
 'CREB3L1',
 'MSS51',
 'CLCA1',
 'SPDEF',
 'PLIN3',
 'FBXW10',
 'SCGB1D2',
 'PRAMEF12',
 'MMP26',
 'KRT24',
 'FAM149A',
 'MBD3L3',
 'SERPINA1',
 'MBD3L

### Find proteins in both lists

In [21]:
# Collect the genes that appear in BOTH the proteomic and the transcript lists.
# The source lists hold one entry per result row and can repeat a gene, so the
# proteomic list is de-duplicated first (dict.fromkeys keeps first-seen order).
# This guarantees each shared gene is printed and stored exactly once, which
# matters because in_both is later passed as the gene list for the omics joins.
transcript_lookup = set(transcript_proteins)  # constant-time membership checks
in_both = []
for pp in dict.fromkeys(proteomic_proteins):
    if pp in transcript_lookup:
        print(pp)
        in_both.append(pp)

OLFM4
PIGR


<b>OLFM4</b> and <b>PIGR</b> are the only proteins that show a significant change in both proteomic expression and transcript expression when ARID1A is mutated in Ovarian Cancer.

In [27]:
# Join the ARID1A mutation calls onto each omics table, restricted to the genes
# found in both lists. The same call is issued once per omics layer, in the
# order transcriptomics, then proteomics.
transcript_df, proteomic_df = (
    ov.join_omics_to_mutations(
        mutations_genes='ARID1A',
        omics_df_name=omics_name,
        omics_genes=in_both,
    )
    for omics_name in ('transcriptomics', 'proteomics')
)

# Show the transcript-level join as this cell's output.
transcript_df


Unnamed: 0_level_0,OLFM4_transcriptomics,PIGR_transcriptomics,ARID1A_Mutation,ARID1A_Location,ARID1A_Mutation_Status,Sample_Status
Sample_ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
S001,2.062720,147.178000,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S002,0.072102,0.041317,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S003,0.000000,0.027524,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S004,0.174432,10.052100,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S005,0.165579,0.325556,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S006,0.118844,10.660800,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S007,0.065489,0.593011,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S008,0.000000,0.579682,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S009,0.010962,0.942334,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor
S011,0.082004,0.015715,[Wildtype_Tumor],[No_mutation],Wildtype_Tumor,Tumor


In [28]:
# Keep every sample whose ARID1A status is anything other than 'Wildtype_Tumor'.
# NOTE(review): any other status label passes this filter - confirm that no
# non-mutated label besides 'Wildtype_Tumor' can occur in this column.
mutateddf = transcript_df[transcript_df['ARID1A_Mutation_Status'].ne('Wildtype_Tumor')]
mutateddf

Unnamed: 0_level_0,OLFM4_transcriptomics,PIGR_transcriptomics,ARID1A_Mutation,ARID1A_Location,ARID1A_Mutation_Status,Sample_Status
Sample_ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
S026,0.187611,71.2816,[Missense_Mutation],[p.I1625T],Single_mutation,Tumor
S044,0.142194,0.286387,[Missense_Mutation],[p.A1946P],Single_mutation,Tumor
S078,34.2684,25.1176,"[Frame_Shift_Del, Frame_Shift_Del]","[p.Q1519Rfs*8, p.F2141Sfs*59]",Multiple_mutation,Tumor
S080,174.078,224.109,"[Missense_Mutation, Nonsense_Mutation]","[p.S202Y, p.E992*]",Multiple_mutation,Tumor


There are very few ARID1A mutations in Ovarian Cancer (but they seem to have a large effect?)