# PIK3CA: Effects of Mutation

<b> Standard imports for playing with and plotting data frames. </b>

In [6]:
import pandas as pd
import numpy as np
import scipy.stats
from scipy.stats import pearsonr
import matplotlib.pyplot as plt
import seaborn as sns
#import altair as alt

#alt.renderers.enable('notebook')


<b> Import CPTAC </b>

In [7]:
import CPTAC

In [8]:
somatic_mutations = CPTAC.get_somatic()
proteomics = CPTAC.get_proteomics()
phos = CPTAC.get_phosphoproteomics()

<b> List of proteins that interact with PIK3R1 (according to STRING) </b>

In [17]:
protList = ['IRS1', 'IRS2', 'AKT1', 'AKT2', 'P55G', 'ERBB3', 'P85A', 'MRAS', 'PTEN', 'RPS6KB1','PI3KR1']

<b> Proteome abundance of proteins that interact with PIK3R1 </b>

In [18]:
pcutoff = 0.05 / len(protList)
gene = 'PIK3CA'

sigResults = [];
for protein in protList: 
    if protein in proteomics.columns:
        cross = CPTAC.merge_mutations(proteomics, protein, gene)
        cross = cross[["Mutation", protein]].dropna(axis=0)
        mutated = cross.loc[cross["Mutation"] == "Missense_Mutation"]
        wt = cross.loc[cross["Mutation"] == "Wildtype"]
        ttest = scipy.stats.ttest_ind(mutated[protein], wt[protein])
        if(ttest[1] <= pcutoff):
            sigResults.append(protein)
            print("Test for " + protein + ": ")
            print(ttest) 

Test for IRS1: 
Ttest_indResult(statistic=-3.5379526832870027, pvalue=0.00055342765400399)
Test for IRS2: 
Ttest_indResult(statistic=-4.172569544762063, pvalue=5.7556845433808284e-05)
Test for AKT2: 
Ttest_indResult(statistic=-4.475870221783481, pvalue=1.602813329063142e-05)
Test for PTEN: 
Ttest_indResult(statistic=-3.964063883981443, pvalue=0.00011889565588022356)


<b> Print the list of proteins with significant results </b>

In [11]:
print(sigResults)

['IRS1', 'IRS2', 'PTEN']


### Phosphoproteome abundance of interacting proteins

In [12]:
phosProtList = ['IRS1', 'ATK1', 'P55G', 'ERBB3', 'P85A', 'MRAS', 'PTEN', 'RPS6KB1']

In [16]:
sigResults = [];
pcutoff = 0.05/len(phosProtList)
print(pcutoff)

for protein in phosProtList: 
        cross = CPTAC.merge_mutations(phos, protein, gene)
        #print(cross.head())
        for loc in cross.columns:
            #print(loc)
            cross_site = cross[["Mutation", loc]].dropna(axis=0)
            #print(cross_site)
            mutated = cross_site.loc[cross_site["Mutation"] == "Missense_Mutation"]
            wt = cross_site.loc[cross_site["Mutation"] == "Wildtype"]
            ttest = scipy.stats.ttest_ind(mutated[loc], wt[loc])
            if(ttest[1] <= pcutoff):
                sigResults.append(loc)
                print("Test for " + loc + ": ")
                print(ttest)          

0.00625
Test for IRS1-S1100: 
Ttest_indResult(statistic=-4.622106285824137, pvalue=1.0484520589658975e-05)
Test for IRS1-S1101: 
Ttest_indResult(statistic=-4.385594568310565, pvalue=2.6789608760057653e-05)
Test for IRS1-S1134: 
Ttest_indResult(statistic=-2.9445313115058926, pvalue=0.003961148385953724)
Test for IRS1-S270: 
Ttest_indResult(statistic=-3.174535388441041, pvalue=0.001859256194718747)
Test for IRS1-S323: 
Ttest_indResult(statistic=-3.1585209409938275, pvalue=0.0020179736762149306)
Test for IRS1-S330: 
Ttest_indResult(statistic=-3.3292748915226333, pvalue=0.0012681260438923202)
Test for IRS1-S415: 
Ttest_indResult(statistic=-3.865988661402689, pvalue=0.0002073367241030126)
Test for IRS1-S531: 
Ttest_indResult(statistic=-3.3613860066999215, pvalue=0.0010270551532348862)
Test for IRS1-S629: 
Ttest_indResult(statistic=-3.1918506213584283, pvalue=0.001812000986004178)
Test for IRS1-S672: 
Ttest_indResult(statistic=-2.919065502670874, pvalue=0.004718653170379472)


ValueError: Cannot index with multidimensional key