# PIK3CA: Effects of Mutation on AKT2

<b> Standard imports for playing with and plotting data frames. </b>

In [None]:
import pandas as pd
import numpy as np
import scipy.stats
import matplotlib.pyplot as plt
import seaborn as sns

<b> Import CPTAC data </b>

In [None]:
import CPTAC

In [None]:
# Load the CPTAC tables used by the analyses below.
# NOTE(review): presumably each getter returns a pandas DataFrame with one row
# per sample -- confirm against the CPTAC package documentation.
somatic_mutations = CPTAC.get_somatic()  # not referenced by the cells visible in this notebook section
proteomics = CPTAC.get_proteomics()  # later checked via `.columns` and passed to CPTAC.merge_mutations
phos = CPTAC.get_phosphoproteomics()  # later passed to CPTAC.compare_mutations

# PIK3CA mutation and AKT2 proteome abundance

### Perform a t-test with mutated and non-mutated protein levels

In [None]:
# Compare protein abundance between samples carrying a PIK3CA missense
# mutation and wildtype samples with an independent two-sample t-test.
protList = ['AKT2']
# Bonferroni-style cutoff: alpha divided by the number of proteins tested.
pcutoff = 0.05 / len(protList)
gene = 'PIK3CA'

sigResults = []
for protein in protList:
    if protein not in proteomics.columns:
        # Report the skip instead of silently producing no output (and
        # leaving `cross` undefined for the plotting cell that follows).
        print("No proteomics data for " + protein)
        continue
    cross = CPTAC.merge_mutations(proteomics, protein, gene)
    # Keep only rows that have both a mutation label and a measured value.
    cross = cross[["Mutation", protein]].dropna(axis=0)
    mutated = cross.loc[cross["Mutation"] == "Missense_Mutation"]
    wt = cross.loc[cross["Mutation"] == "Wildtype"]
    ttest = scipy.stats.ttest_ind(mutated[protein], wt[protein])
    if ttest.pvalue <= pcutoff:
        sigResults.append(protein)
        print("Test for " + protein + ": ")
        print(ttest)
    else:
        # Always report the outcome, using the same wording as the
        # no-control analysis later in this notebook, so that an empty output
        # is never mistaken for a cell that did not run.
        print("Unsignificant results for " + protein + ":")
        print(ttest)

 ### We can now plot the data 

In [None]:
# Box plot of AKT2 abundance per PIK3CA mutation category, with the individual
# samples overlaid as a jittered strip plot. Uses `cross` from the t-test cell.
a4_dims = (11.7, 8.27)  # figure size in inches (A4 landscape)
fig, ax = plt.subplots(figsize=a4_dims)
somatic_boxplot = sns.boxplot(data=cross, x="Mutation", y='AKT2', ax=ax)
# Gene symbol is PIK3CA (matches the `gene` value used in the t-test).
somatic_boxplot.set_title("PIK3CA gene mutation AKT2 protein abundance")
# Draw the points on the same axes explicitly rather than relying on
# matplotlib's implicit "current axes".
somatic_boxplot = sns.stripplot(
    data=cross, x="Mutation", y='AKT2', jitter=True, color=".3", ax=ax
)
somatic_boxplot.set(xlabel="Somatic Gene Mutation", ylabel="Proteomics")
plt.show()

## PIK3CA mutation and AKT2 protein abundance (no control)

<b> Take out the control </b>

In [None]:
# Keep only the first 100 rows of the proteomics table (rebinds `proteomics`,
# so every later cell sees the truncated table).
# NOTE(review): presumably rows 0-99 are the tumor samples and the remaining
# rows are the controls -- confirm against the CPTAC sample ordering.
proteomics = proteomics[:100]

### Perform a t-test with mutated and non-mutated protein levels

In [None]:
# Re-run the missense-vs-wildtype t-test for each listed protein on the
# current `proteomics` table and always print the outcome.
gene = 'PIK3CA'
protList = ['AKT2']
pcutoff = 0.05 / len(protList)  # alpha split across the proteins tested

sigResults = []
for protein in protList:
    # Proteins without a proteomics column are skipped.
    if protein not in proteomics.columns:
        continue

    cross = CPTAC.merge_mutations(proteomics, protein, gene)
    cross = cross[["Mutation", protein]].dropna(axis=0)

    # Split the samples by mutation label.
    is_missense = cross["Mutation"] == "Missense_Mutation"
    is_wildtype = cross["Mutation"] == "Wildtype"
    mutated = cross.loc[is_missense]
    wt = cross.loc[is_wildtype]

    ttest = scipy.stats.ttest_ind(mutated[protein], wt[protein])
    significant = ttest[1] <= pcutoff
    if significant:
        sigResults.append(protein)

    # Same two lines of output as before; only the header depends on the result.
    header = (
        "Test for " + protein + ": "
        if significant
        else "Unsignificant results for " + protein + ":"
    )
    print(header)
    print(ttest)

# PIK3CA mutation and AKT2 phosphoproteome abundance

In [None]:
# For each protein in phosProtList, t-test every phosphoproteomics column
# returned by CPTAC.compare_mutations between missense-mutated and wildtype
# samples, printing the columns that pass the cutoff.
# Relies on `gene` ('PIK3CA') and `phos` defined in earlier cells.
phosProtList = ['AKT2']
sigResults = []
# NOTE(review): the cutoff is divided by the number of proteins, not by the
# number of phosphosite columns actually tested below -- confirm whether the
# correction should account for every site.
pcutoff = 0.05 / len(phosProtList)
print(pcutoff)

for protein in phosProtList:
    cross = CPTAC.compare_mutations(phos, protein, gene)
    for loc in cross.columns:
        # "Mutation" is the grouping label, not a measurement; testing it
        # against itself would select a duplicated column and break the
        # comparison, so skip it.
        if loc == "Mutation":
            continue
        # Keep only samples with both a mutation label and a value at this site.
        cross_site = cross[["Mutation", loc]].dropna(axis=0)
        mutated = cross_site.loc[cross_site["Mutation"] == "Missense_Mutation"]
        wt = cross_site.loc[cross_site["Mutation"] == "Wildtype"]
        ttest = scipy.stats.ttest_ind(mutated[loc], wt[loc])
        if ttest.pvalue <= pcutoff:
            sigResults.append(loc)
            print("Test for " + loc + ": ")
            print(ttest)