# Mutual Exclusivity: BRCA

In [1]:
import os
import os.path as op

os.chdir('../')

# os.listdir()

In [2]:
# SNV_PATHS
SNV_COMMON_PATH = "C:/Users/ibrah/Desktop/SNV_data/SNV_datasets/"
BRCA_SNV_PATH = op.join(SNV_COMMON_PATH, "SNV_BRCA_hg38_2021-09-22.csv")

# PATIENT INTERACTION DATA PATHS
BRCA_PATIENT_INTERACTION_DATA_PATH = "dev/BRCA_patient_interactions_analysis_table_2021-11-15.xlsx"

# Reflect changes in the modules immediately.
%load_ext autoreload
%autoreload 2

In [3]:
from helpers.helpers_analysis.mutual_exclusivity import MutualExclusivity
from helpers.helpers_analysis.protein_id_retrieval import ProteinIDFetcher

In [4]:
brca_mutex = MutualExclusivity(
    tcga="BRCA", 
    tcga_snv_path=BRCA_SNV_PATH, 
    patient_interaction_data_path=BRCA_PATIENT_INTERACTION_DATA_PATH
)

2021-11-15 15:13:26 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading SNV data simplified ..
2021-11-15 15:13:26 |[32m INFO     [0m| helpers.helpers_analysis.loaders | Loading BRCA SNV datasets ..
2021-11-15 15:13:33 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | BRCA SNV data size: (120988, 121)
2021-11-15 15:13:34 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | BRCA SNV data processed size: (60251, 121)
2021-11-15 15:13:34 |[32m INFO     [0m| helpers.helpers_analysis.loaders | BRCA SNV datasets are loaded.
2021-11-15 15:13:34 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient ids ..
2021-11-15 15:13:34 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient to snv_data ..


  0%|          | 0/985 [00:00<?, ?it/s]

2021-11-15 15:13:44 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | patient interaction data patient data ..


In [5]:
len(brca_mutex.patients)

985

In [6]:
len(brca_mutex.get_patients_with("P04637", identifier_type="protein"))

204

In [7]:
len(brca_mutex.get_patients_with("P04626", identifier_type="protein"))

27

In [8]:
ProteinIDFetcher().fetch("ERBB2")

['P04626', 'J3QLU9']

In [9]:
len(brca_mutex.get_patients_with("P04626", identifier_type="protein"))

27

In [10]:
len(brca_mutex.get_patients_with("J3QLU9", identifier_type="protein"))

0

Örneğin ERBB2 geni için en sık disrupt olan interactor SRPK1, ERBB2 ile SRPK1 arasındaki mutual exclusivity'yi hesaplayalım. 

S1 ERBB'nun mutasyona uğradığı hasta seti olsun. 
S2 SRPK1'nın mutasyona uğradığı hasta seti olsun. 

P04626 - ERBBR
Q96SB4 - SRPK1

|S1 union S2| / |S1| + |S2| değerini hesaplayalım. 

mutasyona uğradığı derken direk snv datasına bakabiliriz elaspic'i karıştırmadan. 

Aynı hesaplamayı ERBB2'nun bütün interactorları için tekrarlayalım. SRPK1 ile olan mutual exclusivity değeri daha mı iyi görelim.

Bunu analysis.docx'deki tablolarda bulunan genler için tekrarlayalım.

In [11]:
brca_mutex.calculate_mutual_exclusivity("P04626", "Q96SB4")

1.0

## Patient Interaction Data

In [12]:
brca_mutex.patient_interaction_data.head()

Unnamed: 0,PATIENT,PROTEIN_GENE,MUTATION,INTERACTORS,NUM_INTERACTORS,DISRUPTIVE_INTERACTORS,NUM_DISRUPTIVE_INTERACTORS,NON_DISRUPTIVE_INTERACTORS,NUM_NON_DISRUPTIVE_INTERACTORS,CORE_INTERFACE_VS_INTERFACE_STATUS
0,TCGA-D8-A1XY,Q9UKS6:PACSIN3,R24H,"Q9BY11:PACSIN1,Q9UNF0:PACSIN2,Q5TZC3:PACSIN1,Q...",4,"Q9BY11:PACSIN1:0.5,Q9UNF0:PACSIN2:0.59,Q6FIA3:...",3,Q5TZC3:PACSIN1,1,I
1,TCGA-AO-A0J5,Q9UBN7:HDAC6,D567Y,Q96DB2:HDAC11,1,Q96DB2:HDAC11:0.55,1,,0,I
2,TCGA-A8-A093,P28062:PSMB8,R216W,P40306:PSMB10,1,,0,P40306:PSMB10,1,I
3,TCGA-A8-A093,Q15842:KCNJ8,E237K,"Q14654:KCNJ11,P63252:KCNJ2",2,"Q14654:KCNJ11:0.52,P63252:KCNJ2:0.53",2,,0,I
4,TCGA-LD-A74U,O15041:SEMA3E,E364K,Q9Y4D7:PLXND1,1,,0,Q9Y4D7:PLXND1,1,I


In [None]:
    SRPK1

In [15]:
brca_mutex.get_disrupted_interactors(
    "ERBB2", identifier_type="gene", return_counter=True
)

Counter({'P21860:ERBB3': 1,
         'O60674:JAK2': 1,
         'P15153:RAC2': 1,
         'Q96SB4:SRPK1': 7,
         'Q9UJM3:ERRFI1': 1,
         'Q92625:ANKS1A': 1,
         'P23458:JAK1': 1,
         'P00533:EGFR': 2,
         'P51813:BMX': 2,
         'Q14289:PTK2B': 2,
         'P16591:FER': 2,
         'P06241:FYN': 2,
         'P08069:IGF1R': 2,
         'Q13153:PAK1': 2,
         'P42680:TEC': 2})

In [14]:
brca_mutex.get_disrupted_interactors("TP53", identifier_type="gene", return_counter=True)

Counter({'O15350:TP73': 13,
         'Q96KQ7:EHMT2': 14,
         'Q13625:TP53BP2': 42,
         'Q9H9B1:EHMT1': 9,
         'Q9H3D4:TP63': 18,
         'Q96KQ4:PPP1R13B': 42,
         'Q99728:BARD1': 8,
         'O75832:PSMD10': 8,
         'Q9ULT8:HECTD1': 8,
         'H2EHT1:TP53': 16,
         'K7PPA8:TP53': 16,
         'P62993:GRB2': 33,
         'P07948:LYN': 12,
         'Q8WUF5:PPP1R13L': 30,
         'Q06187:BTK': 31})

In [14]:
brca_mutex.get_disrupted_interactors("TP53", identifier_type="gene", return_counter=True)

Counter({'O15350:TP73': 13,
         'Q96KQ7:EHMT2': 14,
         'Q13625:TP53BP2': 42,
         'Q9H9B1:EHMT1': 9,
         'Q9H3D4:TP63': 18,
         'Q96KQ4:PPP1R13B': 42,
         'Q99728:BARD1': 8,
         'O75832:PSMD10': 8,
         'Q9ULT8:HECTD1': 8,
         'H2EHT1:TP53': 16,
         'K7PPA8:TP53': 16,
         'P62993:GRB2': 33,
         'P07948:LYN': 12,
         'Q8WUF5:PPP1R13L': 30,
         'Q06187:BTK': 31})

In [15]:
brca_mutex.get_disrupted_interactors("TP53", identifier_type="gene")

['Q13625:TP53BP2',
 'Q96KQ4:PPP1R13B',
 'P62993:GRB2',
 'Q06187:BTK',
 'Q8WUF5:PPP1R13L',
 'Q9H3D4:TP63',
 'H2EHT1:TP53',
 'K7PPA8:TP53',
 'Q96KQ7:EHMT2',
 'O15350:TP73',
 'P07948:LYN',
 'Q9H9B1:EHMT1',
 'Q99728:BARD1',
 'O75832:PSMD10',
 'Q9ULT8:HECTD1']

In [16]:
brca_mutex.get_disrupted_interactors("TP53", identifier_type="gene", return_counter=True)

Counter({'O15350:TP73': 13,
         'Q96KQ7:EHMT2': 14,
         'Q13625:TP53BP2': 42,
         'Q9H9B1:EHMT1': 9,
         'Q9H3D4:TP63': 18,
         'Q96KQ4:PPP1R13B': 42,
         'Q99728:BARD1': 8,
         'O75832:PSMD10': 8,
         'Q9ULT8:HECTD1': 8,
         'H2EHT1:TP53': 16,
         'K7PPA8:TP53': 16,
         'P62993:GRB2': 33,
         'P07948:LYN': 12,
         'Q8WUF5:PPP1R13L': 30,
         'Q06187:BTK': 31})

In [17]:
brca_mutex.get_disrupted_interactors("H3C1", identifier_type="gene", return_counter=True)

Counter({'P62805:H4C1': 6,
         'Q9UER7:DAXX': 4,
         'P04908:H2AC4': 4,
         'Q16777:H2AC20': 3,
         'P16104:H2AX': 4,
         'P0C0S8:H2AC11': 4,
         'O75367:MACROH2A1': 4,
         'P0C0S5:H2AZ1': 4,
         'Q9Y294:ASF1A': 1,
         'Q9NVP2:ASF1B': 1,
         'P49450:CENPA': 1})

In [18]:
brca_mutex.get_disrupted_interactors("H4C1", identifier_type="gene", return_counter=True)

Counter({'P84243:H3-3A': 7,
         'Q16695:H3-4': 5,
         'Q71DI3:H3C15': 7,
         'P49450:CENPA': 5,
         'P68431:H3C1': 8,
         'Q16514:TAF12': 2,
         'Q9UER7:DAXX': 3,
         'P06899:H2BC11': 1,
         'Q16778:H2BC21': 1,
         'B4E1C1:nan': 4,
         'Q53F85:nan': 3,
         'P04908:H2AC4': 2,
         'P16104:H2AX': 1,
         'P0C0S5:H2AZ1': 2,
         'Q16777:H2AC20': 2,
         'Q9Y294:ASF1A': 1})

In [19]:
brca_mutex.get_disrupted_interactors("MAP2K4", identifier_type="gene", return_counter=True)

Counter({'Q5S007:LRRK2': 6,
         'P52564:MAP2K6': 6,
         'P00533:EGFR': 1,
         'P35916:FLT4': 1,
         'Q99558:MAP3K14': 1,
         'P45984:MAPK9': 1,
         'Q16539:MAPK14': 2})

In [20]:
ProteinIDFetcher().fetch("TP53")

['H2EHT1', 'K7PPA8', 'P04637']

In [21]:
ProteinIDFetcher().fetch("MAP2K4")

['P45985']

In [22]:
ProteinIDFetcher().fetch("ERBB2")

['P04626', 'J3QLU9']

In [23]:
brca_mutex.calculate_mutual_exclusivity("Q96SB4", "P04626")

1.0

In [24]:
brca_mutex.calculate_mutual_exclusivity("P08069", "Q96SB4")

0.9285714285714286

In [25]:
brca_mutex.calculate_mutual_exclusivity("P08069", "P23458")

0.9375

In [26]:
brca_mutex.calculate_mutual_exclusivity("P23458", "P08069")

0.9375

## Analysis Genes

### ERBB2

In [27]:
ProteinIDFetcher().fetch("ERBB2")

['P04626', 'J3QLU9']

In [28]:
brca_mutex.get_disruptive_mutual_exclusivity_data("P04626")

2021-11-13 21:32:59 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04626's interactors ..
2021-11-13 21:32:59 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04626 have 15 interactors:
['Q96SB4:SRPK1', 'P00533:EGFR', 'P51813:BMX', 'Q14289:PTK2B', 'P16591:FER', 'P06241:FYN', 'P08069:IGF1R', 'Q13153:PAK1', 'P42680:TEC', 'P21860:ERBB3', 'O60674:JAK2', 'P15153:RAC2', 'Q9UJM3:ERRFI1', 'Q92625:ANKS1A', 'P23458:JAK1']


Unnamed: 0,PROTEIN:GENE,NUM_PATIENTS,INTERACTOR,NUM_PATIENTS_INTERACTOR,MUTUAL_EXCLUSIVITY
0,P04626:ERBB2,27,Q96SB4:SRPK1,5,1.0
1,P04626:ERBB2,27,P00533:EGFR,13,1.0
2,P04626:ERBB2,27,P51813:BMX,6,0.9697
3,P04626:ERBB2,27,Q14289:PTK2B,4,1.0
4,P04626:ERBB2,27,P16591:FER,6,0.9697
5,P04626:ERBB2,27,P06241:FYN,2,1.0
6,P04626:ERBB2,27,P08069:IGF1R,9,0.9722
7,P04626:ERBB2,27,Q13153:PAK1,4,0.9677
8,P04626:ERBB2,27,P42680:TEC,5,1.0
9,P04626:ERBB2,27,P21860:ERBB3,19,0.9565


In [29]:
brca_mutex.export_disruptive_mutual_exclusivity_data("dev/mutex", "P04626")

2021-11-13 21:33:00 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04626's interactors ..
2021-11-13 21:33:00 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04626 have 15 interactors:
['Q96SB4:SRPK1', 'P00533:EGFR', 'P51813:BMX', 'Q14289:PTK2B', 'P16591:FER', 'P06241:FYN', 'P08069:IGF1R', 'Q13153:PAK1', 'P42680:TEC', 'P21860:ERBB3', 'O60674:JAK2', 'P15153:RAC2', 'Q9UJM3:ERRFI1', 'Q92625:ANKS1A', 'P23458:JAK1']
2021-11-13 21:33:00 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Exporting Mutual Exclusivity BRCA P04626 ..
2021-11-13 21:33:00 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | dev/mutex\BRCA_P04626_ERBB2_2021-11-13.csv is exported successfully.


### TP53

In [30]:
ProteinIDFetcher().fetch("TP53")

['H2EHT1', 'K7PPA8', 'P04637']

In [31]:
brca_mutex.get_disruptive_mutual_exclusivity_data("P04637")

2021-11-13 21:33:00 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-13 21:33:00 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 15 interactors:
['Q13625:TP53BP2', 'Q96KQ4:PPP1R13B', 'P62993:GRB2', 'Q06187:BTK', 'Q8WUF5:PPP1R13L', 'Q9H3D4:TP63', 'H2EHT1:TP53', 'K7PPA8:TP53', 'Q96KQ7:EHMT2', 'O15350:TP73', 'P07948:LYN', 'Q9H9B1:EHMT1', 'Q99728:BARD1', 'O75832:PSMD10', 'Q9ULT8:HECTD1']


Unnamed: 0,PROTEIN:GENE,NUM_PATIENTS,INTERACTOR,NUM_PATIENTS_INTERACTOR,MUTUAL_EXCLUSIVITY
0,P04637:TP53,204,Q13625:TP53BP2,8,0.9953
1,P04637:TP53,204,Q96KQ4:PPP1R13B,5,1.0
2,P04637:TP53,204,P62993:GRB2,2,1.0
3,P04637:TP53,204,Q06187:BTK,7,0.9953
4,P04637:TP53,204,Q8WUF5:PPP1R13L,2,1.0
5,P04637:TP53,204,Q9H3D4:TP63,2,0.9951
6,P04637:TP53,204,H2EHT1:TP53,0,1.0
7,P04637:TP53,204,K7PPA8:TP53,0,1.0
8,P04637:TP53,204,Q96KQ7:EHMT2,2,1.0
9,P04637:TP53,204,O15350:TP73,3,1.0


In [32]:
brca_mutex.export_disruptive_mutual_exclusivity_data("dev/mutex", "P04637")

2021-11-13 21:33:00 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-13 21:33:00 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 15 interactors:
['Q13625:TP53BP2', 'Q96KQ4:PPP1R13B', 'P62993:GRB2', 'Q06187:BTK', 'Q8WUF5:PPP1R13L', 'Q9H3D4:TP63', 'H2EHT1:TP53', 'K7PPA8:TP53', 'Q96KQ7:EHMT2', 'O15350:TP73', 'P07948:LYN', 'Q9H9B1:EHMT1', 'Q99728:BARD1', 'O75832:PSMD10', 'Q9ULT8:HECTD1']
2021-11-13 21:33:00 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Exporting Mutual Exclusivity BRCA P04637 ..
2021-11-13 21:33:00 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | dev/mutex\BRCA_P04637_TP53_2021-11-13.csv is exported successfully.


### H3C1

In [33]:
ProteinIDFetcher().fetch("H3C1")

['P68431']

In [34]:
brca_mutex.get_disruptive_mutual_exclusivity_data("P68431")

2021-11-13 21:33:01 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P68431's interactors ..
2021-11-13 21:33:01 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P68431 have 11 interactors:
['P62805:H4C1', 'Q9UER7:DAXX', 'P04908:H2AC4', 'P16104:H2AX', 'P0C0S8:H2AC11', 'O75367:MACROH2A1', 'P0C0S5:H2AZ1', 'Q16777:H2AC20', 'Q9Y294:ASF1A', 'Q9NVP2:ASF1B', 'P49450:CENPA']


Unnamed: 0,PROTEIN:GENE,NUM_PATIENTS,INTERACTOR,NUM_PATIENTS_INTERACTOR,MUTUAL_EXCLUSIVITY
0,P68431:H3C1,29,P62805:H4C1,18,0.9787
1,P68431:H3C1,29,Q9UER7:DAXX,4,1.0
2,P68431:H3C1,29,P04908:H2AC4,14,0.9767
3,P68431:H3C1,29,P16104:H2AX,0,1.0
4,P68431:H3C1,29,P0C0S8:H2AC11,13,0.9762
5,P68431:H3C1,29,O75367:MACROH2A1,1,1.0
6,P68431:H3C1,29,P0C0S5:H2AZ1,3,0.9688
7,P68431:H3C1,29,Q16777:H2AC20,1,1.0
8,P68431:H3C1,29,Q9Y294:ASF1A,1,1.0
9,P68431:H3C1,29,Q9NVP2:ASF1B,1,1.0


In [35]:
brca_mutex.export_disruptive_mutual_exclusivity_data("dev/mutex", "P68431")

2021-11-13 21:33:01 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P68431's interactors ..
2021-11-13 21:33:01 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P68431 have 11 interactors:
['P62805:H4C1', 'Q9UER7:DAXX', 'P04908:H2AC4', 'P16104:H2AX', 'P0C0S8:H2AC11', 'O75367:MACROH2A1', 'P0C0S5:H2AZ1', 'Q16777:H2AC20', 'Q9Y294:ASF1A', 'Q9NVP2:ASF1B', 'P49450:CENPA']
2021-11-13 21:33:01 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Exporting Mutual Exclusivity BRCA P68431 ..
2021-11-13 21:33:01 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | dev/mutex\BRCA_P68431_H3C1_2021-11-13.csv is exported successfully.


### H4C1

In [36]:
ProteinIDFetcher().fetch("H4C1")

['P62805']

In [37]:
brca_mutex.get_disruptive_mutual_exclusivity_data("P62805")

2021-11-13 21:33:01 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P62805's interactors ..
2021-11-13 21:33:01 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P62805 have 16 interactors:
['P68431:H3C1', 'P84243:H3-3A', 'Q71DI3:H3C15', 'Q16695:H3-4', 'P49450:CENPA', 'B4E1C1:nan', 'Q9UER7:DAXX', 'Q53F85:nan', 'Q16514:TAF12', 'P04908:H2AC4', 'P0C0S5:H2AZ1', 'Q16777:H2AC20', 'P06899:H2BC11', 'Q16778:H2BC21', 'P16104:H2AX', 'Q9Y294:ASF1A']


Unnamed: 0,PROTEIN:GENE,NUM_PATIENTS,INTERACTOR,NUM_PATIENTS_INTERACTOR,MUTUAL_EXCLUSIVITY
0,P62805:H4C1,18,P68431:H3C1,29,0.9787
1,P62805:H4C1,18,P84243:H3-3A,3,1.0
2,P62805:H4C1,18,Q71DI3:H3C15,4,1.0
3,P62805:H4C1,18,Q16695:H3-4,2,1.0
4,P62805:H4C1,18,P49450:CENPA,0,1.0
5,P62805:H4C1,18,B4E1C1:nan,0,1.0
6,P62805:H4C1,18,Q9UER7:DAXX,4,0.9545
7,P62805:H4C1,18,Q53F85:nan,0,1.0
8,P62805:H4C1,18,Q16514:TAF12,1,1.0
9,P62805:H4C1,18,P04908:H2AC4,14,0.9688


In [38]:
brca_mutex.export_disruptive_mutual_exclusivity_data("dev/mutex", "P62805")

2021-11-13 21:33:01 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P62805's interactors ..
2021-11-13 21:33:01 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P62805 have 16 interactors:
['P68431:H3C1', 'P84243:H3-3A', 'Q71DI3:H3C15', 'Q16695:H3-4', 'P49450:CENPA', 'B4E1C1:nan', 'Q9UER7:DAXX', 'Q53F85:nan', 'Q16514:TAF12', 'P04908:H2AC4', 'P0C0S5:H2AZ1', 'Q16777:H2AC20', 'P06899:H2BC11', 'Q16778:H2BC21', 'P16104:H2AX', 'Q9Y294:ASF1A']
2021-11-13 21:33:02 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Exporting Mutual Exclusivity BRCA P62805 ..
2021-11-13 21:33:02 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | dev/mutex\BRCA_P62805_H4C1_2021-11-13.csv is exported successfully.


### MAP2K4

In [39]:
ProteinIDFetcher().fetch("MAP2K4")

['P45985']

In [40]:
brca_mutex.get_disruptive_mutual_exclusivity_data("P45985")

2021-11-13 21:33:02 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P45985's interactors ..
2021-11-13 21:33:02 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P45985 have 7 interactors:
['Q5S007:LRRK2', 'P52564:MAP2K6', 'Q16539:MAPK14', 'P00533:EGFR', 'P35916:FLT4', 'Q99558:MAP3K14', 'P45984:MAPK9']


Unnamed: 0,PROTEIN:GENE,NUM_PATIENTS,INTERACTOR,NUM_PATIENTS_INTERACTOR,MUTUAL_EXCLUSIVITY
0,P45985:MAP2K4,13,Q5S007:LRRK2,13,1.0
1,P45985:MAP2K4,13,P52564:MAP2K6,3,0.9375
2,P45985:MAP2K4,13,Q16539:MAPK14,2,1.0
3,P45985:MAP2K4,13,P00533:EGFR,13,1.0
4,P45985:MAP2K4,13,P35916:FLT4,2,1.0
5,P45985:MAP2K4,13,Q99558:MAP3K14,2,1.0
6,P45985:MAP2K4,13,P45984:MAPK9,0,1.0


In [41]:
brca_mutex.export_disruptive_mutual_exclusivity_data("dev/mutex", "P45985")

2021-11-13 21:33:02 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P45985's interactors ..
2021-11-13 21:33:02 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P45985 have 7 interactors:
['Q5S007:LRRK2', 'P52564:MAP2K6', 'Q16539:MAPK14', 'P00533:EGFR', 'P35916:FLT4', 'Q99558:MAP3K14', 'P45984:MAPK9']
2021-11-13 21:33:02 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Exporting Mutual Exclusivity BRCA P45985 ..
2021-11-13 21:33:02 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | dev/mutex\BRCA_P45985_MAP2K4_2021-11-13.csv is exported successfully.


---

In [47]:
ProteinIDFetcher().fetch("PIK3CA")

['P42336']

In [49]:
brca_mutex.get_patients_with("P42336", identifier_type="protein")

['TCGA-D8-A1XY',
 'TCGA-AO-A0J5',
 'TCGA-A8-A093',
 'TCGA-C8-A133',
 'TCGA-AQ-A54O',
 'TCGA-A8-A07G',
 'TCGA-LD-A74U',
 'TCGA-BH-A0W5',
 'TCGA-BH-A18F',
 'TCGA-HN-A2OB',
 'TCGA-BH-A2L8',
 'TCGA-E9-A1RD',
 'TCGA-EW-A6SC',
 'TCGA-AO-A0JF',
 'TCGA-AN-A0FS',
 'TCGA-AO-A03L',
 'TCGA-AN-A049',
 'TCGA-E2-A10C',
 'TCGA-E2-A15E',
 'TCGA-A2-A0CP',
 'TCGA-GM-A3NW',
 'TCGA-BH-A0HN',
 'TCGA-E9-A1R0',
 'TCGA-A2-A0YH',
 'TCGA-E9-A226',
 'TCGA-AN-A0FF',
 'TCGA-E2-A576',
 'TCGA-A8-A07B',
 'TCGA-GM-A2DH',
 'TCGA-A7-A5ZW',
 'TCGA-AN-A0AJ',
 'TCGA-A8-A09C',
 'TCGA-LD-A66U',
 'TCGA-EW-A1OV',
 'TCGA-AR-A0TR',
 'TCGA-AO-A0JA',
 'TCGA-A7-A6VX',
 'TCGA-D8-A27T',
 'TCGA-BH-A0GY',
 'TCGA-E9-A1NG',
 'TCGA-AC-A5EH',
 'TCGA-AC-A23E',
 'TCGA-EW-A1IW',
 'TCGA-BH-A0EE',
 'TCGA-BH-A203',
 'TCGA-A2-A0EO',
 'TCGA-LL-A50Y',
 'TCGA-A2-A0EW',
 'TCGA-A7-A0DB',
 'TCGA-AC-A3OD',
 'TCGA-BH-A0BM',
 'TCGA-E2-A1B4',
 'TCGA-BH-A0DK',
 'TCGA-D8-A1J8',
 'TCGA-BH-A18I',
 'TCGA-E2-A15C',
 'TCGA-AR-A24K',
 'TCGA-BH-A8FY',
 'TCGA-XX-A899

In [42]:
len(brca_mutex.snv_data)

60251

In [43]:
brca_mutex.snv_data

Unnamed: 0,Hugo_Symbol,SWISSPROT,HGVSp_Short,Tumor_Sample_Barcode
0,USP24,Q9UPU5,I342V,TCGA-D8-A1XY
1,ERICH3,Q5RHP9,E1406K,TCGA-D8-A1XY
2,SPHKAP,Q2M3C7,R1372S,TCGA-D8-A1XY
3,HRH1,P35367,M206V,TCGA-D8-A1XY
4,LRRC2,Q9BYS8,P359L,TCGA-D8-A1XY
...,...,...,...,...
60246,PCDH19,Q8TAB3,R284C,TCGA-E9-A1NI
60247,ARMCX3,Q9UH62,E310V,TCGA-E9-A1NI
60248,MUM1L1,Q5H9M0,V610L,TCGA-E9-A1NI
60249,L1CAM,P32004,V871L,TCGA-E9-A1NI
