# Mutual Exclusivity

## Setup

In [1]:
import os
import os.path as op

# Work from the parent of the notebook's directory (presumably so that the
# relative "../data/..." paths and the `helpers` package resolve - confirm
# against the repository layout).
# The starting directory is remembered the first time this cell runs, so that
# re-running the cell does not climb one more directory level each time.
if "NOTEBOOK_DIR" not in globals():
    NOTEBOOK_DIR = os.getcwd()
os.chdir(op.join(NOTEBOOK_DIR, os.pardir))

# os.listdir()
# Reflect changes in the modules immediately.
%load_ext autoreload
%autoreload 2

In [2]:
# SNV PATHS
# The SNV tables live outside the repository. Set the SNV_DATA_DIR environment
# variable to point at the directory that holds them; when it is not set, the
# location used by the original author is kept as the fallback.
SNV_COMMON_PATH = os.environ.get(
    "SNV_DATA_DIR", "C:/Users/ibrah/Desktop/SNV_data/SNV_datasets/"
)
BRCA_SNV_PATH = op.join(SNV_COMMON_PATH, "SNV_BRCA_hg38_2021-09-22.csv")
ESCA_SNV_PATH = op.join(SNV_COMMON_PATH, "SNV_ESCA_hg38_2021-09-22.csv")
GBM_SNV_PATH = op.join(SNV_COMMON_PATH, "SNV_GBM_hg38_2021-09-22.csv")
HNSC_SNV_PATH = op.join(SNV_COMMON_PATH, "SNV_HNSC_hg38_2021-09-22.csv")
OV_SNV_PATH = op.join(SNV_COMMON_PATH, "SNV_OV_hg38_2021-09-22.csv")

# PRELIMINARY DATA PATHS (one Excel workbook per cohort)
BRCA_PRELIMINARY_DATA_PATH = r"../data/predictions_datasets/brca_prediction_2021-11-17/558297b6/brca_preliminary_data_cgc_2021-11-17.xlsx"
ESCA_PRELIMINARY_DATA_PATH = r"../data/predictions_datasets/esca_prediction_2021-11-17/59544312/esca_preliminary_data_cgc_2021-11-17.xlsx"
GBM_PRELIMINARY_DATA_PATH = r"../data/predictions_datasets/gbm_prediction_2021-11-17/b9cfc7ea/gbm_preliminary_data_cgc_2021-11-17.xlsx"
HNSC_PRELIMINARY_DATA_PATH = r"../data/predictions_datasets/hnsc_prediction_2021-11-17/53930f30/hnsc_preliminary_data_cgc_2021-11-17.xlsx"
OV_PRELIMINARY_DATA_PATH = r"../data/predictions_datasets/ov_prediction_2021-11-17/37bf1637/ov_preliminary_data_cgc_2021-11-17.xlsx"

# PATIENT INTERACTION DATA PATHS (one Excel workbook per cohort)
BRCA_PATIENT_INTERACTION_DATA_PATH = "../data/patient_interaction_datasets/BRCA_patient_interactions_analysis_table_2021-11-17.xlsx"
ESCA_PATIENT_INTERACTION_DATA_PATH = "../data/patient_interaction_datasets/ESCA_patient_interactions_analysis_table_2021-11-17.xlsx"
GBM_PATIENT_INTERACTION_DATA_PATH = "../data/patient_interaction_datasets/GBM_patient_interactions_analysis_table_2021-11-17.xlsx"
HNSC_PATIENT_INTERACTION_DATA_PATH = "../data/patient_interaction_datasets/HNSC_patient_interactions_analysis_table_2021-11-17.xlsx"
OV_PATIENT_INTERACTION_DATA_PATH = "../data/patient_interaction_datasets/OV_patient_interactions_analysis_table_2021-11-17.xlsx"

# Reflect changes in the modules immediately.
%load_ext autoreload
%autoreload 2

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


In [3]:
def get_protein_gene_pairs(
    preliminary_data,
    min_elaspic_interface_entries=10,
    min_patient_interface_count=5,
):
    """
    Return the (PROTEIN, GENE) pairs of the rows that pass both filters.

    A row of `preliminary_data` is kept when
      - NUM_ELASPIC_INTERFACE_ENTRIES >= `min_elaspic_interface_entries`, and
      - PATIENT_INTERFACE_COUNT > `min_patient_interface_count`
        (strictly greater, unlike the first condition).

    Parameters
    ----------
    preliminary_data : pandas.DataFrame
        Table with at least the columns "PROTEIN", "GENE",
        "NUM_ELASPIC_INTERFACE_ENTRIES" and "PATIENT_INTERFACE_COUNT".
    min_elaspic_interface_entries : int, default 10
        Inclusive lower bound on NUM_ELASPIC_INTERFACE_ENTRIES.
    min_patient_interface_count : int, default 5
        Exclusive lower bound on PATIENT_INTERFACE_COUNT.

    Returns
    -------
    list of tuple
        One (protein, gene) tuple per retained row, in row order.
    """
    has_enough_entries = (
        preliminary_data["NUM_ELASPIC_INTERFACE_ENTRIES"] >= min_elaspic_interface_entries
    )
    has_enough_patients = (
        preliminary_data["PATIENT_INTERFACE_COUNT"] > min_patient_interface_count
    )
    data_filtered = preliminary_data[has_enough_entries & has_enough_patients]

    return list(zip(data_filtered["PROTEIN"], data_filtered["GENE"]))

In [4]:
import pandas as pd
from helpers.helpers_analysis.mutual_exclusivity import MutualExclusivity
from helpers.helpers_analysis.protein_id_retrieval import ProteinIDFetcher

## Instantiate `MutualExclusivity` Objects for Each Cohort

### BRCA

In [5]:
brca_mutex = MutualExclusivity(
    tcga="BRCA", 
    tcga_snv_path=BRCA_SNV_PATH, 
    patient_interaction_data_path=BRCA_PATIENT_INTERACTION_DATA_PATH
)

2021-11-20 02:49:45 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading SNV data simplified ..
2021-11-20 02:49:45 |[32m INFO     [0m| helpers.helpers_analysis.loaders | Loading BRCA SNV datasets ..
2021-11-20 02:49:50 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | BRCA SNV data size: (120988, 121)
2021-11-20 02:49:51 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | BRCA SNV data processed size: (60251, 121)
2021-11-20 02:49:51 |[32m INFO     [0m| helpers.helpers_analysis.loaders | BRCA SNV datasets are loaded.
2021-11-20 02:49:51 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient ids ..
2021-11-20 02:49:51 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient to snv_data ..


  0%|          | 0/985 [00:00<?, ?it/s]

2021-11-20 02:49:59 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | patient interaction data patient data ..


In [6]:
len(brca_mutex.patients)

985

### ESCA

In [7]:
esca_mutex = MutualExclusivity(
    tcga="ESCA", 
    tcga_snv_path=ESCA_SNV_PATH, 
    patient_interaction_data_path=ESCA_PATIENT_INTERACTION_DATA_PATH
)

2021-11-20 02:50:00 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading SNV data simplified ..
2021-11-20 02:50:00 |[32m INFO     [0m| helpers.helpers_analysis.loaders | Loading ESCA SNV datasets ..
2021-11-20 02:50:02 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | ESCA SNV data size: (45313, 121)
2021-11-20 02:50:02 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | ESCA SNV data processed size: (19497, 121)
2021-11-20 02:50:02 |[32m INFO     [0m| helpers.helpers_analysis.loaders | ESCA SNV datasets are loaded.
2021-11-20 02:50:02 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient ids ..
2021-11-20 02:50:02 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient to snv_data ..


  0%|          | 0/184 [00:00<?, ?it/s]

2021-11-20 02:50:03 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | patient interaction data patient data ..


In [8]:
len(esca_mutex.patients)

184

### GBM

In [9]:
gbm_mutex = MutualExclusivity(
    tcga="GBM", 
    tcga_snv_path=GBM_SNV_PATH, 
    patient_interaction_data_path=GBM_PATIENT_INTERACTION_DATA_PATH
)

2021-11-20 02:50:04 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading SNV data simplified ..
2021-11-20 02:50:04 |[32m INFO     [0m| helpers.helpers_analysis.loaders | Loading GBM SNV datasets ..
2021-11-20 02:50:07 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | GBM SNV data size: (82765, 121)
2021-11-20 02:50:08 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | GBM SNV data processed size: (46847, 121)
2021-11-20 02:50:08 |[32m INFO     [0m| helpers.helpers_analysis.loaders | GBM SNV datasets are loaded.
2021-11-20 02:50:08 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient ids ..
2021-11-20 02:50:08 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient to snv_data ..


  0%|          | 0/392 [00:00<?, ?it/s]

2021-11-20 02:50:09 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | patient interaction data patient data ..


In [10]:
len(gbm_mutex.patients)

392

### HNSC

In [11]:
hnsc_mutex = MutualExclusivity(
    tcga="HNSC", 
    tcga_snv_path=HNSC_SNV_PATH, 
    patient_interaction_data_path=HNSC_PATIENT_INTERACTION_DATA_PATH
)

2021-11-20 02:50:10 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading SNV data simplified ..
2021-11-20 02:50:10 |[32m INFO     [0m| helpers.helpers_analysis.loaders | Loading HNSC SNV datasets ..
2021-11-20 02:50:14 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | HNSC SNV data size: (102309, 121)
2021-11-20 02:50:15 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | HNSC SNV data processed size: (54883, 121)
2021-11-20 02:50:15 |[32m INFO     [0m| helpers.helpers_analysis.loaders | HNSC SNV datasets are loaded.
2021-11-20 02:50:15 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient ids ..
2021-11-20 02:50:15 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient to snv_data ..


  0%|          | 0/507 [00:00<?, ?it/s]

2021-11-20 02:50:17 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | patient interaction data patient data ..


In [12]:
len(hnsc_mutex.patients)

507

### OV

In [13]:
ov_mutex = MutualExclusivity(
    tcga="OV", 
    tcga_snv_path=OV_SNV_PATH, 
    patient_interaction_data_path=OV_PATIENT_INTERACTION_DATA_PATH
)

2021-11-20 02:50:18 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading SNV data simplified ..
2021-11-20 02:50:18 |[32m INFO     [0m| helpers.helpers_analysis.loaders | Loading OV SNV datasets ..
2021-11-20 02:50:21 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | OV SNV data size: (75168, 121)
2021-11-20 02:50:21 |[36m DEBUG    [0m| helpers.helpers_analysis.loaders | OV SNV data processed size: (38486, 121)
2021-11-20 02:50:21 |[32m INFO     [0m| helpers.helpers_analysis.loaders | OV SNV datasets are loaded.
2021-11-20 02:50:21 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient ids ..
2021-11-20 02:50:21 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Loading patient to snv_data ..


  0%|          | 0/436 [00:00<?, ?it/s]

2021-11-20 02:50:23 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | patient interaction data patient data ..


In [14]:
len(ov_mutex.patients)

436

## Export Mutual Exclusivity Data for Selected Genes

In [15]:
def export_mutex_data_for_selected_genes(preliminary_data_path, mutex_obj):
    """
    Export disruptive mutual-exclusivity data for every selected protein of a cohort.

    The preliminary-data workbook is read, filtered with `get_protein_gene_pairs`,
    and for each retained protein the mutual-exclusivity data is computed and
    exported twice: once with default arguments and once with `prob=True`
    (presumably the count table and the probability table - confirm against
    `MutualExclusivity.export_disruptive_mutual_exclusivity_data`).

    Parameters
    ----------
    preliminary_data_path : str
        Path of the cohort's preliminary-data Excel file.
    mutex_obj : MutualExclusivity
        Cohort object on which the computation and the exports are invoked.

    Returns
    -------
    None
        Progress is printed; results are written by `mutex_obj`.
    """
    # Built with `op.join` rather than the literal "dev\mutex_counts_and_probs":
    # "\m" is an invalid escape sequence (a warning on current Python versions)
    # and a hard-coded backslash is only a path separator on Windows. On Windows
    # the resulting string is identical to the original one.
    export_dir = op.join("dev", "mutex_counts_and_probs")

    preliminary_data = pd.read_excel(preliminary_data_path)

    for protein, gene in get_protein_gene_pairs(preliminary_data):
        print(f"PROTEIN_GENE: {protein}_{gene}")
        mutex_obj.get_disruptive_mutual_exclusivity_data(protein)
        mutex_obj.export_disruptive_mutual_exclusivity_data(export_dir, protein)
        mutex_obj.export_disruptive_mutual_exclusivity_data(export_dir, protein, prob=True)

    print("Completed.")

In [16]:
# BRCA
export_mutex_data_for_selected_genes(BRCA_PRELIMINARY_DATA_PATH, brca_mutex)

PROTEIN_GENE: O75582_RPS6KA5
2021-11-20 02:50:27 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over O75582's interactors ..
2021-11-20 02:50:27 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | O75582 have 6 interactors:
Counter({'Q15759:MAPK11': 2, 'Q15418:RPS6KA1': 2, 'Q16539:MAPK14': 1, 'L7RSM2:MAPK14': 1, 'Q9UK32:RPS6KA6': 1, 'P67870:CSNK2B': 1})
2021-11-20 02:50:27 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over O75582's interactors ..
2021-11-20 02:50:27 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | O75582 have 6 interactors:
Counter({'Q15759:MAPK11': 2, 'Q15418:RPS6KA1': 2, 'Q16539:MAPK14': 1, 'L7RSM2:MAPK14': 1, 'Q9UK32:RPS6KA6': 1, 'P67870:CSNK2B': 1})
2021-11-20 02:50:27 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | Exporting Mutual Exclusivity BRCA O75582 ..
2021-11-20 02:50:27 |[32m INFO     [0m| helpers

In [17]:
# ESCA
export_mutex_data_for_selected_genes(ESCA_PRELIMINARY_DATA_PATH, esca_mutex)

PROTEIN_GENE: P04637_TP53
2021-11-20 02:50:33 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-20 02:50:33 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 17 interactors:
Counter({'Q13625:TP53BP2': 30, 'Q96KQ4:PPP1R13B': 30, 'P62993:GRB2': 19, 'Q06187:BTK': 18, 'P07948:LYN': 18, 'Q8WUF5:PPP1R13L': 17, 'Q9H3D4:TP63': 13, 'H2EHT1:TP53': 11, 'K7PPA8:TP53': 11, 'Q96KQ7:EHMT2': 8, 'O15350:TP73': 6, 'O75832:PSMD10': 3, 'Q99466:NOTCH4': 2, 'Q9H9B1:EHMT1': 2, 'Q99728:BARD1': 2, 'Q9ULT8:HECTD1': 2, 'Q53GA5:nan': 1})
2021-11-20 02:50:33 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-20 02:50:33 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 17 interactors:
Counter({'Q13625:TP53BP2': 30, 'Q96KQ4:PPP1R13B': 30, 'P62993:GRB2': 19, 'Q06187:BTK': 18, 'P07948:LYN':

In [18]:
# GBM
export_mutex_data_for_selected_genes(GBM_PRELIMINARY_DATA_PATH, gbm_mutex)

PROTEIN_GENE: P04637_TP53
2021-11-20 02:50:37 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-20 02:50:37 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 19 interactors:
Counter({'Q13625:TP53BP2': 30, 'Q96KQ4:PPP1R13B': 30, 'P62993:GRB2': 22, 'P07948:LYN': 19, 'Q9H3D4:TP63': 18, 'Q8WUF5:PPP1R13L': 18, 'Q06187:BTK': 18, 'H2EHT1:TP53': 14, 'K7PPA8:TP53': 14, 'O15350:TP73': 7, 'Q96KQ7:EHMT2': 6, 'Q9H9B1:EHMT1': 5, 'Q99728:BARD1': 5, 'O75832:PSMD10': 5, 'Q9ULT8:HECTD1': 5, 'Q99466:NOTCH4': 2, 'Q9GZV1:ANKRD2': 1, 'P25963:NFKBIA': 1, 'Q53GA5:nan': 1})
2021-11-20 02:50:37 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-20 02:50:37 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 19 interactors:
Counter({'Q13625:TP53BP2': 30, 'Q96KQ4:PPP1R13B': 30, 'P62993:GR

In [19]:
# HNSC
export_mutex_data_for_selected_genes(HNSC_PRELIMINARY_DATA_PATH, hnsc_mutex)

PROTEIN_GENE: P01112_HRAS
2021-11-20 02:50:40 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P01112's interactors ..
2021-11-20 02:50:40 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P01112 have 18 interactors:
Counter({'Q07889:SOS1': 25, 'Q07890:SOS2': 25, 'G5E9C8:SOS1': 21, 'Q13972:RASGRF1': 16, 'Q9UJ41:RABGEF1': 15, 'Q13671:RIN1': 12, 'Q8IV61:RASGRP3': 11, 'Q9NZL6:RGL1': 9, 'Q12967:RALGDS': 3, 'Q15811:ITSN1': 3, 'P15498:VAV1': 3, 'Q13905:RAPGEF1': 3, 'Q13009:TIAM1': 3, 'Q9P212:PLCE1': 3, 'P10398:ARAF': 1, 'P08069:IGF1R': 1, 'P06239:LCK': 1, 'O95267:RASGRP1': 1})
2021-11-20 02:50:41 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P01112's interactors ..
2021-11-20 02:50:41 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P01112 have 18 interactors:
Counter({'Q07889:SOS1': 25, 'Q07890:SOS2': 25, 'G5E9C8:SOS1': 21, 'Q13972:RASGRF1': 1

In [20]:
# OV
export_mutex_data_for_selected_genes(OV_PRELIMINARY_DATA_PATH, ov_mutex)

PROTEIN_GENE: P04637_TP53
2021-11-20 02:50:48 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-20 02:50:48 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 19 interactors:
Counter({'Q13625:TP53BP2': 61, 'Q96KQ4:PPP1R13B': 61, 'P62993:GRB2': 46, 'Q8WUF5:PPP1R13L': 40, 'Q06187:BTK': 40, 'P07948:LYN': 33, 'Q9H3D4:TP63': 31, 'H2EHT1:TP53': 27, 'K7PPA8:TP53': 27, 'O15350:TP73': 21, 'Q96KQ7:EHMT2': 18, 'O75832:PSMD10': 8, 'Q9H9B1:EHMT1': 6, 'Q99728:BARD1': 6, 'Q9ULT8:HECTD1': 6, 'Q99466:NOTCH4': 3, 'Q53GA5:nan': 3, 'Q9GZV1:ANKRD2': 1, 'P25963:NFKBIA': 1})
2021-11-20 02:50:48 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Calculating Mutual Exclusivity over P04637's interactors ..
2021-11-20 02:50:48 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | P04637 have 19 interactors:
Counter({'Q13625:TP53BP2': 61, 'Q96KQ4:PPP1R13B': 61, 'P62993:

=======================================

# Code for Analysis.docx

## BRCA

### `ERBB2`

In [177]:
# NOTE(review): in the saved run this call failed with
# "ValueError: too many values to unpack (expected 2)". The failing unpack is
# inside MutualExclusivity.get_counts_summary_table, which is not visible from
# this notebook - TODO confirm the cause there before relying on this cell.
brca_mutex.get_counts_summary_table("ERBB2")

2021-12-07 21:49:52 |[36m DEBUG    [0m| helpers.helpers_analysis.mutual_exclusivity | interactors: ['Q96SB4:SRPK1', 'P00533:EGFR', 'P51813:BMX', 'Q14289:PTK2B', 'P16591:FER', 'P06241:FYN', 'P08069:IGF1R', 'Q13153:PAK1', 'P42680:TEC', 'P21860:ERBB3', 'O60674:JAK2', 'P15153:RAC2', 'Q9UJM3:ERRFI1', 'Q92625:ANKS1A', 'P23458:JAK1']


ValueError: too many values to unpack (expected 2)

In [169]:
interactor_count_pairs = brca_mutex.get_disrupted_interactors(
    "ERBB2", identifier_type="gene", return_counter=True, most_common=True
)
interactor_count_pairs

[('Q96SB4:SRPK1', 7),
 ('P00533:EGFR', 2),
 ('P51813:BMX', 2),
 ('Q14289:PTK2B', 2),
 ('P16591:FER', 2),
 ('P06241:FYN', 2),
 ('P08069:IGF1R', 2),
 ('Q13153:PAK1', 2),
 ('P42680:TEC', 2),
 ('P21860:ERBB3', 1),
 ('O60674:JAK2', 1),
 ('P15153:RAC2', 1),
 ('Q9UJM3:ERRFI1', 1),
 ('Q92625:ANKS1A', 1),
 ('P23458:JAK1', 1)]

In [170]:
# For every disrupted ERBB2 interactor, report the patients in which the
# interaction is disrupted in either direction.
# Identifiers have the form "<protein>:<gene>". The split is limited to the
# first ':' so the two-way unpacking cannot fail on an identifier containing a
# second colon, and the protein part goes to `_protein` instead of `_`, because
# assigning to `_` at cell level shadows IPython's last-output variable.
for interactor_protein_gene, count in interactor_count_pairs:
    _protein, interactor_gene = interactor_protein_gene.split(':', 1)
    brca_mutex.get_patients_with_disruptive_interaction(gene_A="ERBB2", gene_B=interactor_gene)

GENE_A: ERBB2
GENE_B: SRPK1
patients_gene_A_disrupts_B (7): 
 {'TCGA-A8-A0AB', 'TCGA-LL-A740', 'TCGA-D8-A1XM', 'TCGA-A8-A0A6', 'TCGA-A2-A0T6', 'TCGA-AC-A3YI', 'TCGA-BH-A18P'}
patients_gene_B_disrupts_A (0): 
 set()
Intersection (0): 
set()
- - - - - - - - - - - - - - - - - - - - - -
GENE_A: ERBB2
GENE_B: EGFR
patients_gene_A_disrupts_B (2): 
 {'TCGA-AN-A046', 'TCGA-A2-A3XV'}
patients_gene_B_disrupts_A (0): 
 set()
Intersection (0): 
set()
- - - - - - - - - - - - - - - - - - - - - -
GENE_A: ERBB2
GENE_B: BMX
patients_gene_A_disrupts_B (2): 
 {'TCGA-E9-A1R5', 'TCGA-BH-A1FE'}
patients_gene_B_disrupts_A (1): 
 {'TCGA-B6-A0RU'}
Intersection (0): 
set()
- - - - - - - - - - - - - - - - - - - - - -
GENE_A: ERBB2
GENE_B: PTK2B
patients_gene_A_disrupts_B (2): 
 {'TCGA-E9-A1R5', 'TCGA-BH-A1FE'}
patients_gene_B_disrupts_A (0): 
 set()
Intersection (0): 
set()
- - - - - - - - - - - - - - - - - - - - - -
GENE_A: ERBB2
GENE_B: FER
patients_gene_A_disrupts_B (2): 
 {'TCGA-E9-A1R5', 'TCGA-BH-A1FE'}
pat

In [139]:
ProteinIDFetcher().fetch("ERBB2")

['P04626', 'J3QLU9']

In [147]:
brca_mutex.get_patients_with_disruptive_interaction(gene_A="H3C1", gene_B="H4C1")

2021-12-07 20:01:55 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | patients_gene_A_disrupts_B (5): 
 {'TCGA-5L-AAT1', 'TCGA-AC-A62X', 'TCGA-A2-A0EQ', 'TCGA-E9-A226', 'TCGA-A8-A09I'}
2021-12-07 20:01:55 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | patients_gene_B_disrupts_A (8): 
 {'TCGA-LL-A73Y', 'TCGA-AR-A0TY', 'TCGA-A8-A06Y', 'TCGA-BH-A1F0', 'TCGA-A2-A0YM', 'TCGA-BH-A0H7', 'TCGA-D8-A1JA', 'TCGA-AN-A0AT'}
2021-12-07 20:01:55 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | Intersection (0): 
set()
2021-12-07 20:01:55 |[32m INFO     [0m| helpers.helpers_analysis.mutual_exclusivity | done.


In [160]:
brca_mutex.get_patients_with_disruptive_interaction(gene_A="TP53", gene_B="TP53BP2")

GENE_A: TP53
GENE_B: TP53BP2
patients_gene_A_disrupts_B (42): 
 {'TCGA-A7-A6VW', 'TCGA-A2-A0SW', 'TCGA-C8-A12O', 'TCGA-BH-A203', 'TCGA-C8-A1HF', 'TCGA-A8-A09X', 'TCGA-LL-A6FR', 'TCGA-A2-A04T', 'TCGA-OL-A5RY', 'TCGA-AR-A2LH', 'TCGA-AN-A0FX', 'TCGA-BH-A1FE', 'TCGA-EW-A1P4', 'TCGA-E2-A574', 'TCGA-BH-A0BC', 'TCGA-BH-A0AV', 'TCGA-AR-A1AW', 'TCGA-AR-A24T', 'TCGA-B6-A0WX', 'TCGA-BH-A0WA', 'TCGA-C8-A134', 'TCGA-B6-A0RS', 'TCGA-EW-A1P1', 'TCGA-C8-A26W', 'TCGA-D8-A1JM', 'TCGA-D8-A1XL', 'TCGA-BH-A1FN', 'TCGA-A8-A07W', 'TCGA-C8-A12P', 'TCGA-B6-A0I1', 'TCGA-A2-A0T1', 'TCGA-A2-A0CL', 'TCGA-LL-A8F5', 'TCGA-D8-A1JF', 'TCGA-EW-A6S9', 'TCGA-A2-A4S1', 'TCGA-BH-A5IZ', 'TCGA-AN-A04C', 'TCGA-C8-A278', 'TCGA-E9-A1NC', 'TCGA-AR-A1AJ', 'TCGA-AR-A0TP'}
patients_gene_B_disrupts_A (0): 
 set()
Intersection (0): 
set()



In [132]:
# brca_mutex.get_disrupted_interactors_unique_patients(
#     "ERBB2", identifier_type="gene"
# )

AttributeError: 'MutualExclusivity' object has no attribute 'get_disrupted_interactors_unique_patients'

In [44]:
brca_mutex.get_disrupted_interactors_probabilities("ERBB2", identifier_type="gene")

{'Q96SB4:SRPK1': 4.79,
 'P08069:IGF1R': 1.82,
 'Q14289:PTK2B': 1.62,
 'P16591:FER': 1.52,
 'P00533:EGFR': 1.49,
 'P42680:TEC': 1.4,
 'Q13153:PAK1': 1.4,
 'P51813:BMX': 1.38,
 'P06241:FYN': 1.3,
 'P21860:ERBB3': 0.84,
 'Q9UJM3:ERRFI1': 0.8,
 'P15153:RAC2': 0.75,
 'P23458:JAK1': 0.66,
 'O60674:JAK2': 0.63,
 'Q92625:ANKS1A': 0.55}

In [None]:
# Load the BRCA preliminary-data workbook and display the row(s) whose GENE is SRPK1.
brca_preliminary_data = pd.read_excel(BRCA_PRELIMINARY_DATA_PATH)
brca_preliminary_data.loc[lambda frame: frame["GENE"] == "SRPK1"]

Unnamed: 0,PROTEIN,GENE,NUM_ELASPIC_INTERFACE_ENTRIES,NUM_DISRUPTIVE_ENTRIES,NUM_INCR_NOEFF_ENTRIES,NUM_UNIQUE_INTERACTORS,PATIENT_CORE_COUNT,PATIENT_INTERFACE_COUNT,NUM_INTERFACE_PATIENTS_DISRUPTIVE_INTERACTOR,BASELINE,OUR_METHOD,OUR_METHOD/BASELINE,ELASPIC_COVERAGE,CGC_STATUS,CGC_STATUS (BRCA)
6533,Q96SB4,SRPK1,3,2,0,3,2,1,1,2,2,1.0,3,-,-


### `TP53`

In [49]:
brca_mutex.get_disrupted_interactors(
    "TP53", identifier_type="gene", return_counter=True, most_common=True
)

[('Q13625:TP53BP2', 42),
 ('Q96KQ4:PPP1R13B', 42),
 ('P62993:GRB2', 33),
 ('Q06187:BTK', 31),
 ('Q8WUF5:PPP1R13L', 30),
 ('Q9H3D4:TP63', 18),
 ('H2EHT1:TP53', 16),
 ('K7PPA8:TP53', 16),
 ('Q96KQ7:EHMT2', 14),
 ('O15350:TP73', 13),
 ('P07948:LYN', 12),
 ('Q9H9B1:EHMT1', 9),
 ('Q99728:BARD1', 8),
 ('O75832:PSMD10', 8),
 ('Q9ULT8:HECTD1', 8)]

In [50]:
brca_mutex.get_disrupted_interactors_probabilities("TP53", identifier_type="gene")

{'Q13625:TP53BP2': 35.9,
 'Q96KQ4:PPP1R13B': 34.07,
 'Q06187:BTK': 24.39,
 'P62993:GRB2': 24.14,
 'Q8WUF5:PPP1R13L': 21.68,
 'Q9H3D4:TP63': 13.65,
 'H2EHT1:TP53': 12.37,
 'K7PPA8:TP53': 12.190000000000001,
 'O15350:TP73': 10.41,
 'Q96KQ7:EHMT2': 9.3,
 'P07948:LYN': 8.69,
 'Q9H9B1:EHMT1': 5.97,
 'O75832:PSMD10': 5.9,
 'Q99728:BARD1': 5.79,
 'Q9ULT8:HECTD1': 5.78}

### `H3C1`

In [68]:
brca_mutex.get_disrupted_interactors(
    "H3C1", identifier_type="gene", return_counter=True, most_common=True
)

[('P62805:H4C1', 6),
 ('Q9UER7:DAXX', 6),
 ('P04908:H2AC4', 4),
 ('P16104:H2AX', 4),
 ('P0C0S8:H2AC11', 4),
 ('O75367:MACROH2A1', 4),
 ('P0C0S5:H2AZ1', 4),
 ('Q16777:H2AC20', 3),
 ('Q9Y294:ASF1A', 3),
 ('Q9NVP2:ASF1B', 3),
 ('P49450:CENPA', 3)]

In [69]:
brca_mutex.get_disrupted_interactors_probabilities("H3C1", identifier_type="gene")

{'Q9UER7:DAXX': 3.87,
 'P62805:H4C1': 3.6,
 'P0C0S5:H2AZ1': 2.58,
 'P0C0S8:H2AC11': 2.58,
 'P16104:H2AX': 2.58,
 'P49450:CENPA': 2.5700000000000003,
 'P04908:H2AC4': 2.5100000000000002,
 'O75367:MACROH2A1': 2.4699999999999998,
 'Q9NVP2:ASF1B': 2.22,
 'Q9Y294:ASF1A': 2.04,
 'Q16777:H2AC20': 1.96}

### `H4C1`

In [72]:
brca_mutex.get_disrupted_interactors(
    "H4C1", identifier_type="gene", return_counter=True, most_common=True
)

[('P68431:H3C1', 8),
 ('P84243:H3-3A', 7),
 ('Q71DI3:H3C15', 7),
 ('Q16695:H3-4', 5),
 ('P49450:CENPA', 5),
 ('B4E1C1:nan', 4),
 ('Q9UER7:DAXX', 3),
 ('Q53F85:nan', 3),
 ('Q16514:TAF12', 2),
 ('P04908:H2AC4', 2),
 ('P0C0S5:H2AZ1', 2),
 ('Q16777:H2AC20', 2),
 ('P06899:H2BC11', 1),
 ('Q16778:H2BC21', 1),
 ('P16104:H2AX', 1),
 ('Q9Y294:ASF1A', 1)]

In [73]:
brca_mutex.get_disrupted_interactors_probabilities("H4C1", identifier_type="gene")

{'P68431:H3C1': 5.74,
 'Q71DI3:H3C15': 4.34,
 'P84243:H3-3A': 4.29,
 'Q16695:H3-4': 3.14,
 'P49450:CENPA': 3.1,
 'B4E1C1:nan': 2.3899999999999997,
 'Q9UER7:DAXX': 2.02,
 'Q53F85:nan': 1.6800000000000002,
 'Q16777:H2AC20': 1.6,
 'P04908:H2AC4': 1.57,
 'P0C0S5:H2AZ1': 1.48,
 'Q16514:TAF12': 1.42,
 'Q16778:H2BC21': 0.95,
 'P06899:H2BC11': 0.86,
 'P16104:H2AX': 0.79,
 'Q9Y294:ASF1A': 0.67}

### `MAP2K4`

In [76]:
brca_mutex.get_disrupted_interactors(
    "MAP2K4", identifier_type="gene", return_counter=True, most_common=True
)

[('Q5S007:LRRK2', 6),
 ('P52564:MAP2K6', 6),
 ('Q16539:MAPK14', 2),
 ('P00533:EGFR', 1),
 ('P35916:FLT4', 1),
 ('Q99558:MAP3K14', 1),
 ('P45984:MAPK9', 1)]

In [77]:
brca_mutex.get_disrupted_interactors_probabilities("MAP2K4", identifier_type="gene")

{'P52564:MAP2K6': 4.35,
 'Q5S007:LRRK2': 3.46,
 'Q16539:MAPK14': 1.4500000000000002,
 'P00533:EGFR': 0.88,
 'Q99558:MAP3K14': 0.81,
 'P35916:FLT4': 0.66,
 'P45984:MAPK9': 0.66}

### `UBC`

In [85]:
brca_mutex.get_disrupted_interactors(
    "UBC", identifier_type="gene", return_counter=True, most_common=True
)

[('P21734:UBC1', 4),
 ('P61077:UBE2D3', 2),
 ('Q9UMX0:UBQLN1', 1),
 ('A8K3R3:nan', 1),
 ('Q99816:TSG101', 1)]

In [86]:
brca_mutex.get_disrupted_interactors_probabilities("UBC", identifier_type="gene")

{'P21734:UBC1': 2.42,
 'P61077:UBE2D3': 1.2,
 'Q99816:TSG101': 0.81,
 'Q9UMX0:UBQLN1': 0.7,
 'A8K3R3:nan': 0.56}

### `PIK3CA`

In [87]:
brca_mutex.get_disrupted_interactors(
    "PIK3CA", identifier_type="gene", return_counter=True, most_common=True
)

[('P27986:PIK3R1', 124),
 ('O00459:PIK3R2', 124),
 ('P43403:ZAP70', 119),
 ('Q92569:PIK3R3', 5)]

In [88]:
brca_mutex.get_disrupted_interactors_probabilities("PIK3CA", identifier_type="gene")

{'P27986:PIK3R1': 75.5,
 'O00459:PIK3R2': 74.36,
 'P43403:ZAP70': 65.45,
 'Q92569:PIK3R3': 3.15}

## OV

### `H4C1`

In [78]:
ov_mutex.get_disrupted_interactors(
    "H4C1", identifier_type="gene", return_counter=True, most_common=True
)

[('P84243:H3-3A', 4),
 ('P68431:H3C1', 3),
 ('P04908:H2AC4', 2),
 ('Q16695:H3-4', 2),
 ('Q71DI3:H3C15', 2),
 ('P49450:CENPA', 2),
 ('P0C0S5:H2AZ1', 2),
 ('Q16777:H2AC20', 2),
 ('Q9UER7:DAXX', 1),
 ('B4E1C1:nan', 1),
 ('Q53F85:nan', 1),
 ('Q8NCD3:HJURP', 1),
 ('Q16514:TAF12', 1),
 ('P06899:H2BC11', 1),
 ('Q16778:H2BC21', 1),
 ('P16104:H2AX', 1),
 ('Q9Y294:ASF1A', 1),
 ('Q9NVP2:ASF1B', 1)]

In [80]:
ov_mutex.get_disrupted_interactors_probabilities("H4C1", identifier_type="gene")

{'P84243:H3-3A': 2.3600000000000003,
 'P68431:H3C1': 2.01,
 'Q16777:H2AC20': 1.65,
 'P04908:H2AC4': 1.63,
 'P0C0S5:H2AZ1': 1.6099999999999999,
 'Q16695:H3-4': 1.2799999999999998,
 'Q71DI3:H3C15': 1.27,
 'P49450:CENPA': 1.22,
 'P16104:H2AX': 0.86,
 'P06899:H2BC11': 0.81,
 'Q9NVP2:ASF1B': 0.8,
 'Q16778:H2BC21': 0.79,
 'Q9Y294:ASF1A': 0.79,
 'Q8NCD3:HJURP': 0.7,
 'Q9UER7:DAXX': 0.67,
 'Q16514:TAF12': 0.66,
 'Q53F85:nan': 0.6,
 'B4E1C1:nan': 0.54}

### `TP53`

In [81]:
ov_mutex.get_disrupted_interactors(
    "TP53", identifier_type="gene", return_counter=True, most_common=True
)

[('Q13625:TP53BP2', 61),
 ('Q96KQ4:PPP1R13B', 61),
 ('P62993:GRB2', 46),
 ('Q8WUF5:PPP1R13L', 40),
 ('Q06187:BTK', 40),
 ('P07948:LYN', 33),
 ('Q9H3D4:TP63', 31),
 ('H2EHT1:TP53', 27),
 ('K7PPA8:TP53', 27),
 ('O15350:TP73', 21),
 ('Q96KQ7:EHMT2', 18),
 ('O75832:PSMD10', 8),
 ('Q9H9B1:EHMT1', 6),
 ('Q99728:BARD1', 6),
 ('Q9ULT8:HECTD1', 6),
 ('Q99466:NOTCH4', 3),
 ('Q53GA5:nan', 3),
 ('Q9GZV1:ANKRD2', 1),
 ('P25963:NFKBIA', 1)]

In [82]:
ov_mutex.get_disrupted_interactors_probabilities("TP53", identifier_type="gene")

{'Q13625:TP53BP2': 50.43,
 'Q96KQ4:PPP1R13B': 47.660000000000004,
 'P62993:GRB2': 34.0,
 'Q06187:BTK': 31.310000000000002,
 'Q8WUF5:PPP1R13L': 28.7,
 'Q9H3D4:TP63': 23.99,
 'P07948:LYN': 22.740000000000002,
 'K7PPA8:TP53': 21.39,
 'H2EHT1:TP53': 21.19,
 'O15350:TP73': 16.11,
 'Q96KQ7:EHMT2': 11.75,
 'O75832:PSMD10': 5.79,
 'Q9ULT8:HECTD1': 4.28,
 'Q99728:BARD1': 4.25,
 'Q9H9B1:EHMT1': 4.07,
 'Q53GA5:nan': 2.12,
 'Q99466:NOTCH4': 1.97,
 'P25963:NFKBIA': 0.73,
 'Q9GZV1:ANKRD2': 0.72}

### `ACTN2`

In [83]:
ov_mutex.get_disrupted_interactors(
    "ACTN2", identifier_type="gene", return_counter=True, most_common=True
)

[('Q9UQM7:CAMK2A', 1),
 ('Q13557:CAMK2D', 1),
 ('P12814:ACTN1', 1),
 ('Q08043:ACTN3', 1)]

In [84]:
ov_mutex.get_disrupted_interactors_probabilities("ACTN2", identifier_type="gene")

{'P12814:ACTN1': 0.69,
 'Q08043:ACTN3': 0.69,
 'Q13557:CAMK2D': 0.62,
 'Q9UQM7:CAMK2A': 0.52}

## HNSC

In [95]:
hnsc_protein_gene_pairs = get_protein_gene_pairs(pd.read_excel(HNSC_PRELIMINARY_DATA_PATH))

In [99]:
hnsc_protein_gene_pairs

[('P01112', 'HRAS'),
 ('P04637', 'TP53'),
 ('P05129', 'PRKCG'),
 ('P15056', 'BRAF'),
 ('P22607', 'FGFR3'),
 ('P42771', 'CDKN2A'),
 ('P61586', 'RHOA'),
 ('P62805', 'H4C1'),
 ('P63000', 'RAC1'),
 ('Q16288', 'NTRK3'),
 ('Q7Z6Z7', 'HUWE1'),
 ('Q969H0', 'FBXW7')]

### `FBXW7`

In [100]:
hnsc_mutex.get_disrupted_interactors(
    "FBXW7", identifier_type="gene", return_counter=True, most_common=True
)

[('P42345:MTOR', 11), ('A6NE52:WDR97', 10), ('P63244:RACK1', 5)]

In [101]:
hnsc_mutex.get_disrupted_interactors_probabilities("FBXW7", identifier_type="gene")

{'P42345:MTOR': 9.09, 'A6NE52:WDR97': 5.38, 'P63244:RACK1': 4.08}

### `TP53`

In [102]:
hnsc_mutex.get_disrupted_interactors(
    "TP53", identifier_type="gene", return_counter=True, most_common=True
)

[('Q96KQ4:PPP1R13B', 49),
 ('Q13625:TP53BP2', 48),
 ('P62993:GRB2', 36),
 ('Q06187:BTK', 32),
 ('Q8WUF5:PPP1R13L', 28),
 ('Q9H3D4:TP63', 26),
 ('P07948:LYN', 23),
 ('H2EHT1:TP53', 22),
 ('K7PPA8:TP53', 22),
 ('Q96KQ7:EHMT2', 18),
 ('O15350:TP73', 15),
 ('Q9H9B1:EHMT1', 9),
 ('Q99728:BARD1', 9),
 ('O75832:PSMD10', 9),
 ('Q9ULT8:HECTD1', 9),
 ('Q99466:NOTCH4', 1)]

In [103]:
hnsc_mutex.get_disrupted_interactors_probabilities("TP53", identifier_type="gene")

{'Q13625:TP53BP2': 38.95,
 'Q96KQ4:PPP1R13B': 38.51,
 'P62993:GRB2': 26.22,
 'Q06187:BTK': 24.8,
 'Q8WUF5:PPP1R13L': 20.93,
 'Q9H3D4:TP63': 19.78,
 'H2EHT1:TP53': 16.68,
 'K7PPA8:TP53': 16.54,
 'P07948:LYN': 16.15,
 'Q96KQ7:EHMT2': 11.85,
 'O15350:TP73': 11.72,
 'O75832:PSMD10': 6.54,
 'Q9ULT8:HECTD1': 6.38,
 'Q99728:BARD1': 6.34,
 'Q9H9B1:EHMT1': 6.22,
 'Q99466:NOTCH4': 0.57}

### `BRAF`

In [104]:
hnsc_mutex.get_disrupted_interactors(
    "BRAF", identifier_type="gene", return_counter=True, most_common=True
)

[('Q13177:PAK2', 3),
 ('P17252:PRKCA', 2),
 ('P53667:LIMK1', 2),
 ('P36507:MAP2K2', 1),
 ('A4QPA9:MAP2K1', 1)]

In [105]:
hnsc_mutex.get_disrupted_interactors_probabilities("BRAF", identifier_type="gene")

{'Q13177:PAK2': 2.08,
 'P17252:PRKCA': 1.4300000000000002,
 'P53667:LIMK1': 1.07,
 'A4QPA9:MAP2K1': 0.61,
 'P36507:MAP2K2': 0.61}

### `RAC1`

In [106]:
hnsc_mutex.get_disrupted_interactors(
    "RAC1", identifier_type="gene", return_counter=True, most_common=True
)

[('Q17R89:ARHGAP44', 8),
 ('Q8NF50:DOCK8', 2),
 ('Q13972:RASGRF1', 2),
 ('Q14185:DOCK1', 1),
 ('Q92608:DOCK2', 1),
 ('Q15286:RAB35', 1),
 ('O14559:ARHGAP33', 1)]

In [107]:
hnsc_mutex.get_disrupted_interactors_probabilities("RAC1", identifier_type="gene")

{'Q17R89:ARHGAP44': 4.88,
 'Q8NF50:DOCK8': 1.58,
 'Q13972:RASGRF1': 1.25,
 'Q92608:DOCK2': 0.79,
 'Q15286:RAB35': 0.76,
 'Q14185:DOCK1': 0.65,
 'O14559:ARHGAP33': 0.64}

### `HUWE1`

In [108]:
hnsc_mutex.get_disrupted_interactors(
    "HUWE1", identifier_type="gene", return_counter=True, most_common=True
)

[('P62837:UBE2D2', 4),
 ('P61077:UBE2D3', 4),
 ('P54725:RAD23A', 4),
 ('P11441:UBL4A', 4),
 ('Q969T4:UBE2E3', 3),
 ('P51668:UBE2D1', 3),
 ('P62253:UBE2G1', 3),
 ('P68036:UBE2L3', 2)]

In [109]:
hnsc_mutex.get_disrupted_interactors_probabilities("HUWE1", identifier_type="gene")

{'P11441:UBL4A': 3.26,
 'P62837:UBE2D2': 3.05,
 'P61077:UBE2D3': 2.52,
 'P54725:RAD23A': 2.5,
 'P51668:UBE2D1': 2.21,
 'Q969T4:UBE2E3': 1.94,
 'P62253:UBE2G1': 1.87,
 'P68036:UBE2L3': 1.2799999999999998}

### `H4C1`

In [111]:
hnsc_mutex.get_disrupted_interactors(
    "H4C1", identifier_type="gene", return_counter=True, most_common=True
)

[('P84243:H3-3A', 11),
 ('P68431:H3C1', 11),
 ('Q9UER7:DAXX', 11),
 ('Q53F85:nan', 10),
 ('Q16695:H3-4', 9),
 ('Q71DI3:H3C15', 9),
 ('P49450:CENPA', 9),
 ('B4E1C1:nan', 8),
 ('Q16514:TAF12', 5),
 ('P06899:H2BC11', 5),
 ('Q16778:H2BC21', 5),
 ('P04908:H2AC4', 2),
 ('P16104:H2AX', 2),
 ('P0C0S5:H2AZ1', 2),
 ('Q9Y294:ASF1A', 2),
 ('Q16777:H2AC20', 2),
 ('Q9NVP2:ASF1B', 2)]

In [112]:
hnsc_mutex.get_disrupted_interactors_probabilities("H4C1", identifier_type="gene")

{'P68431:H3C1': 8.2,
 'P84243:H3-3A': 7.09,
 'Q9UER7:DAXX': 6.77,
 'Q71DI3:H3C15': 6.14,
 'Q16695:H3-4': 6.13,
 'Q53F85:nan': 5.85,
 'P49450:CENPA': 5.32,
 'B4E1C1:nan': 4.64,
 'Q16778:H2BC21': 4.59,
 'P06899:H2BC11': 4.43,
 'Q16514:TAF12': 3.4899999999999998,
 'P16104:H2AX': 1.6600000000000001,
 'Q16777:H2AC20': 1.6600000000000001,
 'P04908:H2AC4': 1.6400000000000001,
 'P0C0S5:H2AZ1': 1.5899999999999999,
 'Q9NVP2:ASF1B': 1.58,
 'Q9Y294:ASF1A': 1.58}

### `CDKN2A`

In [113]:
hnsc_mutex.get_disrupted_interactors(
    "CDKN2A", identifier_type="gene", return_counter=True, most_common=True
)

[('P11802:CDK4', 15),
 ('P29320:EPHA3', 11),
 ('O14920:IKBKB', 11),
 ('P17252:PRKCA', 11),
 ('A4D1G0:CDK6', 9),
 ('Q00534:CDK6', 8),
 ('A1L4K2:MAPK8', 8),
 ('Q9UQ88:CDK11A', 7),
 ('P45983:MAPK8', 7),
 ('O14965:AURKA', 7),
 ('B2R6V2:nan', 7),
 ('P49760:CLK2', 6),
 ('P53779:MAPK10', 6),
 ('O00311:CDC7', 4),
 ('Q8NE63:HIPK4', 4),
 ('A8MWW6:nan', 3),
 ('Q14164:IKBKE', 3),
 ('Q9Y463:DYRK1B', 3),
 ('P07437:TUBB', 2),
 ('Q499Y8:MAPK10', 2),
 ('Q71U36:TUBA1A', 1),
 ('Q9BQE3:TUBA1C', 1),
 ('P68371:TUBB4B', 1)]

In [114]:
hnsc_mutex.get_disrupted_interactors_probabilities("CDKN2A", identifier_type="gene")

{'P11802:CDK4': 10.09,
 'O14920:IKBKB': 6.5,
 'P29320:EPHA3': 6.46,
 'P17252:PRKCA': 6.12,
 'A4D1G0:CDK6': 6.0,
 'Q00534:CDK6': 5.44,
 'A1L4K2:MAPK8': 5.22,
 'B2R6V2:nan': 5.140000000000001,
 'P45983:MAPK8': 4.53,
 'Q9UQ88:CDK11A': 4.51,
 'O14965:AURKA': 4.05,
 'P49760:CLK2': 3.52,
 'P53779:MAPK10': 3.46,
 'O00311:CDC7': 2.5,
 'Q8NE63:HIPK4': 2.1100000000000003,
 'A8MWW6:nan': 1.85,
 'Q14164:IKBKE': 1.83,
 'Q9Y463:DYRK1B': 1.75,
 'P07437:TUBB': 1.4,
 'Q499Y8:MAPK10': 1.24,
 'Q71U36:TUBA1A': 0.86,
 'Q9BQE3:TUBA1C': 0.86,
 'P68371:TUBB4B': 0.85}

### `HRAS`

In [121]:
# HRAS interactors from `hnsc_mutex`; the output below is a list of
# (interactor, count) tuples, largest count first.
hnsc_mutex.get_disrupted_interactors(
    "HRAS",
    identifier_type="gene",
    return_counter=True,
    most_common=True,
)

[('Q07889:SOS1', 25),
 ('Q07890:SOS2', 25),
 ('G5E9C8:SOS1', 21),
 ('Q13972:RASGRF1', 16),
 ('Q9UJ41:RABGEF1', 15),
 ('Q13671:RIN1', 12),
 ('Q8IV61:RASGRP3', 11),
 ('Q9NZL6:RGL1', 9),
 ('Q12967:RALGDS', 3),
 ('Q15811:ITSN1', 3),
 ('P15498:VAV1', 3),
 ('Q13905:RAPGEF1', 3),
 ('Q13009:TIAM1', 3),
 ('Q9P212:PLCE1', 3),
 ('P10398:ARAF', 1),
 ('P08069:IGF1R', 1),
 ('P06239:LCK', 1),
 ('O95267:RASGRP1', 1)]

In [119]:
# Per-interactor score for HRAS from `hnsc_mutex`; the output below is a dict
# ordered from highest to lowest value, and most values exceed 1.
# NOTE(review): presumably an aggregate of predicted disruption
# probabilities rather than a single probability - confirm in the mutex module.
hnsc_mutex.get_disrupted_interactors_probabilities(
    "HRAS",
    identifier_type="gene",
)

{'Q07889:SOS1': 16.84,
 'Q07890:SOS2': 15.36,
 'G5E9C8:SOS1': 14.9,
 'Q9UJ41:RABGEF1': 10.01,
 'Q13972:RASGRF1': 8.63,
 'Q13671:RIN1': 6.84,
 'Q8IV61:RASGRP3': 5.87,
 'Q9NZL6:RGL1': 4.82,
 'P15498:VAV1': 2.16,
 'Q13009:TIAM1': 1.8900000000000001,
 'Q15811:ITSN1': 1.83,
 'Q13905:RAPGEF1': 1.71,
 'Q9P212:PLCE1': 1.6500000000000001,
 'Q12967:RALGDS': 1.56,
 'P06239:LCK': 0.76,
 'P08069:IGF1R': 0.72,
 'P10398:ARAF': 0.65,
 'O95267:RASGRP1': 0.52}

## GBM

### `TP53`

In [123]:
# TP53 interactors from `gbm_mutex`; the output below is a list of
# (interactor, count) tuples, largest count first.
gbm_mutex.get_disrupted_interactors(
    "TP53",
    identifier_type="gene",
    return_counter=True,
    most_common=True,
)

[('Q13625:TP53BP2', 30),
 ('Q96KQ4:PPP1R13B', 30),
 ('P62993:GRB2', 22),
 ('P07948:LYN', 19),
 ('Q9H3D4:TP63', 18),
 ('Q8WUF5:PPP1R13L', 18),
 ('Q06187:BTK', 18),
 ('H2EHT1:TP53', 14),
 ('K7PPA8:TP53', 14),
 ('O15350:TP73', 7),
 ('Q96KQ7:EHMT2', 6),
 ('Q9H9B1:EHMT1', 5),
 ('Q99728:BARD1', 5),
 ('O75832:PSMD10', 5),
 ('Q9ULT8:HECTD1', 5),
 ('Q99466:NOTCH4', 2),
 ('Q9GZV1:ANKRD2', 1),
 ('P25963:NFKBIA', 1),
 ('Q53GA5:nan', 1)]

In [124]:
# Per-interactor score for TP53 from `gbm_mutex`; the output below is a dict
# ordered from highest to lowest value, and most values exceed 1.
# NOTE(review): presumably an aggregate of predicted disruption
# probabilities rather than a single probability - confirm in the mutex module.
gbm_mutex.get_disrupted_interactors_probabilities(
    "TP53",
    identifier_type="gene",
)

{'Q13625:TP53BP2': 24.52,
 'Q96KQ4:PPP1R13B': 23.21,
 'P62993:GRB2': 16.43,
 'Q06187:BTK': 13.98,
 'Q9H3D4:TP63': 13.91,
 'P07948:LYN': 13.03,
 'Q8WUF5:PPP1R13L': 12.94,
 'K7PPA8:TP53': 11.120000000000001,
 'H2EHT1:TP53': 11.06,
 'O15350:TP73': 5.34,
 'Q96KQ7:EHMT2': 3.9000000000000004,
 'O75832:PSMD10': 3.68,
 'Q99728:BARD1': 3.5700000000000003,
 'Q9ULT8:HECTD1': 3.45,
 'Q9H9B1:EHMT1': 3.37,
 'Q99466:NOTCH4': 1.4100000000000001,
 'Q53GA5:nan': 0.64,
 'P25963:NFKBIA': 0.63,
 'Q9GZV1:ANKRD2': 0.62}

## ESCA

### `TP53`

In [125]:
# TP53 interactors from `esca_mutex`; the output below is a list of
# (interactor, count) tuples, largest count first.
esca_mutex.get_disrupted_interactors(
    "TP53",
    identifier_type="gene",
    return_counter=True,
    most_common=True,
)

[('Q13625:TP53BP2', 30),
 ('Q96KQ4:PPP1R13B', 30),
 ('P62993:GRB2', 19),
 ('Q06187:BTK', 18),
 ('P07948:LYN', 18),
 ('Q8WUF5:PPP1R13L', 17),
 ('Q9H3D4:TP63', 13),
 ('H2EHT1:TP53', 11),
 ('K7PPA8:TP53', 11),
 ('Q96KQ7:EHMT2', 8),
 ('O15350:TP73', 6),
 ('O75832:PSMD10', 3),
 ('Q99466:NOTCH4', 2),
 ('Q9H9B1:EHMT1', 2),
 ('Q99728:BARD1', 2),
 ('Q9ULT8:HECTD1', 2),
 ('Q53GA5:nan', 1)]

In [126]:
# Per-interactor score for TP53 from `esca_mutex`; the output below is a dict
# ordered from highest to lowest value, and most values exceed 1.
# NOTE(review): presumably an aggregate of predicted disruption
# probabilities rather than a single probability - confirm in the mutex module.
esca_mutex.get_disrupted_interactors_probabilities(
    "TP53",
    identifier_type="gene",
)

{'Q13625:TP53BP2': 24.0,
 'Q96KQ4:PPP1R13B': 22.84,
 'P62993:GRB2': 14.02,
 'Q06187:BTK': 14.02,
 'Q8WUF5:PPP1R13L': 11.969999999999999,
 'P07948:LYN': 11.69,
 'Q9H3D4:TP63': 10.27,
 'K7PPA8:TP53': 8.56,
 'H2EHT1:TP53': 8.55,
 'Q96KQ7:EHMT2': 5.21,
 'O15350:TP73': 4.65,
 'O75832:PSMD10': 2.1,
 'Q9ULT8:HECTD1': 1.46,
 'Q99728:BARD1': 1.38,
 'Q9H9B1:EHMT1': 1.37,
 'Q99466:NOTCH4': 1.2,
 'Q53GA5:nan': 0.65}

### `H4C1`

In [127]:
# H4C1 interactors from `esca_mutex`; the output below is a list of
# (interactor, count) tuples, largest count first.
esca_mutex.get_disrupted_interactors(
    "H4C1",
    identifier_type="gene",
    return_counter=True,
    most_common=True,
)

[('P68431:H3C1', 3),
 ('Q9UER7:DAXX', 3),
 ('Q53F85:nan', 3),
 ('Q16514:TAF12', 2),
 ('P06899:H2BC11', 2),
 ('Q16778:H2BC21', 2),
 ('P84243:H3-3A', 2),
 ('Q16695:H3-4', 2),
 ('Q71DI3:H3C15', 2),
 ('P49450:CENPA', 2),
 ('B4E1C1:nan', 2)]

In [128]:
# Per-interactor score for H4C1 from `esca_mutex`; the output below is a dict
# ordered from highest to lowest value, and values exceed 1.
# NOTE(review): presumably an aggregate of predicted disruption
# probabilities rather than a single probability - confirm in the mutex module.
esca_mutex.get_disrupted_interactors_probabilities(
    "H4C1",
    identifier_type="gene",
)

{'P68431:H3C1': 2.17,
 'Q16778:H2BC21': 1.83,
 'P06899:H2BC11': 1.79,
 'Q53F85:nan': 1.78,
 'Q9UER7:DAXX': 1.75,
 'P84243:H3-3A': 1.45,
 'Q16695:H3-4': 1.45,
 'Q16514:TAF12': 1.4100000000000001,
 'Q71DI3:H3C15': 1.3900000000000001,
 'P49450:CENPA': 1.37,
 'B4E1C1:nan': 1.1}