# COVID-19 Related Queries for BTE Use Case Exploration 

In [42]:
import pandas as pd
## Load BTE
from biothings_explorer.user_query_dispatcher import FindConnection
from biothings_explorer.hint import Hint
# Shared Hint instance; a later cell calls ht.query("TMPRSS2") on it to resolve a name into a query input
ht = Hint()

## Functions that will be used
# Check for every intermediate node type in the Predict function
def predict_many(input_object, intermediate_node_list, output_type):
    """Run one FindConnection query per intermediate node type and stack the results.

    Parameters
    ----------
    input_object
        Start node, forwarded to ``FindConnection`` as ``input_obj``.
    intermediate_node_list
        Iterable of intermediate node types; each one is queried on its own
        (passed as a single-element ``intermediate_nodes`` list).
    output_type
        Forwarded to ``FindConnection`` as ``output_obj``.

    Returns
    -------
    pandas.DataFrame or None
        ``pd.concat`` of every non-empty table view (original row indices are
        kept), or ``None`` when no query produced any rows.

    Notes
    -----
    A query that raises is reported and skipped so the remaining node types
    still run. Only ``Exception`` subclasses are treated this way;
    ``KeyboardInterrupt`` and ``SystemExit`` propagate so a long run can still
    be stopped by the user.
    """
    df_list = []
    for inter in intermediate_node_list:
        print("Intermediate Node type running:")
        print(inter)
        try:
            fc = FindConnection(input_obj=input_object, output_obj=output_type, intermediate_nodes=[inter])
            fc.connect(verbose=False)
            df = fc.display_table_view()
            # Skip empty tables so they do not end up in the concatenation
            if df.shape[0] > 0:
                df_list.append(df)
        except Exception as exc:
            # Best-effort: keep going with the next node type, but say why this one failed
            print("FAILED ({}: {})".format(type(exc).__name__, exc))
    if df_list:
        return pd.concat(df_list)
    return None
    
# Every intermediate node type to try, one query per entry

node_type_list = [
    'Gene',
    'SequenceVariant',
    'ChemicalSubstance',
    'Disease',
    'MolecularActivity',
    'BiologicalProcess',
    'CellularComponent',
    'Pathway',
    'AnatomicalEntity',
    'PhenotypicFeature',
]

## 1.1 TMPRSS2 -> NAFAMOSTAT
### In what ways can the TMPRSS2 Gene be connected to NAFAMOSTAT?
### 1.1 Query 

In [43]:
# Use element 0 of the 'Gene' entry returned by the hint lookup for "TMPRSS2"
tmprss2 = ht.query("TMPRSS2")['Gene'][0]

# One query per intermediate node type, all with ChemicalSubstance as the output type
all_tmprss2_predictions = predict_many(
    input_object=tmprss2,
    intermediate_node_list=node_type_list,
    output_type='ChemicalSubstance',
)

Intermediate Node type running:
Gene
Intermediate Node type running:
SequenceVariant
Intermediate Node type running:
ChemicalSubstance
Intermediate Node type running:
Disease
API 8.7 pharos failed
API 8.4 pharos failed
API 8.15 pharos failed
API 8.1 pharos failed
API 8.14 pharos failed
API 8.12 pharos failed
API 8.2 pharos failed
API 8.6 pharos failed
API 8.13 pharos failed
API 8.10 pharos failed
API 8.3 pharos failed
API 8.5 pharos failed
API 8.11 pharos failed
API 8.8 pharos failed
API 8.9 pharos failed
API 8.17 pharos failed
API 8.22 pharos failed
API 8.16 pharos failed
API 8.18 pharos failed
API 8.21 pharos failed
API 8.23 pharos failed
API 8.20 pharos failed
API 8.25 pharos failed
API 8.19 pharos failed
API 8.36 pharos failed
API 8.31 pharos failed
API 8.32 pharos failed
API 8.33 pharos failed
API 8.26 pharos failed
API 8.35 pharos failed
API 8.29 pharos failed
API 8.34 pharos failed
API 8.37 pharos failed
API 8.24 pharos failed
API 8.27 pharos failed
API 8.30 pharos failed
API 8.

### 1.1 Results table 

In [44]:
## Nafamostat is listed under its other name, FUT 175 (Futhan)
all_tmprss2_predictions.loc[all_tmprss2_predictions["output_name"].eq("FUT 175")]

Unnamed: 0,input,input_type,pred1,pred1_source,pred1_api,pred1_pubmed,node1_type,node1_name,node1_id,pred2,pred2_source,pred2_api,pred2_pubmed,output_type,output_name,output_id
30984,TMPRSS2,Gene,physically_interacts_with,,BioLink API,32296183,Gene,TNF,NCBIGene:7124,physically_interacts_with,,DGIdb API,,ChemicalSubstance,FUT 175,name:FUT 175
2405,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT,negatively_regulates,SEMMED,SEMMED Chemical API,9322090.0,ChemicalSubstance,FUT 175,name:FUT 175
2406,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT,negatively_regulates,SEMMED,SEMMED Chemical API,9322090.0,ChemicalSubstance,FUT 175,name:FUT 175
2407,TMPRSS2,Gene,physically_interacts_with,drugbank,MyChem.info API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT,negatively_regulates,SEMMED,SEMMED Chemical API,9322090.0,ChemicalSubstance,FUT 175,name:FUT 175
43018,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,Disease,CORONAVINAE INFECTIOUS DISEASE,MONDO:MONDO:0005719,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,FUT 175,name:FUT 175
43019,TMPRSS2,Gene,related_to,CTD,CTD API,24027332|24227843|27550352|27733646|28778717,Disease,CORONAVINAE INFECTIOUS DISEASE,MONDO:MONDO:0005719,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,FUT 175,name:FUT 175


## 1.2 Question: Is the only way to get from TMPRSS2 to Blood Coagulation through Nafamostat (FUT 175)?

In [48]:
# Same sweep over every intermediate node type, this time with BiologicalProcess as the output type
tmprss2_to_blood_coagulation = predict_many(
    input_object=tmprss2,
    intermediate_node_list=node_type_list,
    output_type='BiologicalProcess',
)

Intermediate Node type running:
Gene
Intermediate Node type running:
SequenceVariant
Intermediate Node type running:
ChemicalSubstance
Intermediate Node type running:
Disease
Intermediate Node type running:
MolecularActivity
Intermediate Node type running:
BiologicalProcess
Intermediate Node type running:
CellularComponent
Intermediate Node type running:
Pathway
Intermediate Node type running:
AnatomicalEntity
Intermediate Node type running:
PhenotypicFeature


#### TMPRSS2 to Blood Coagulation through any node type:

In [50]:
# Keep rows whose output name contains the literal substring 'COAGULATION'
tmprss2_to_blood_coagulation.loc[
    tmprss2_to_blood_coagulation['output_name'].str.contains('COAGULATION', regex=False)
]

Unnamed: 0,input,input_type,pred1,pred1_source,pred1_api,pred1_pubmed,node1_type,node1_name,node1_id,pred2,pred2_source,pred2_api,pred2_pubmed,output_type,output_name,output_id
4950,TMPRSS2,Gene,physically_interacts_with,SEMMED,SEMMED Gene API,20713528,Gene,C0017337,UMLS:C0017337,affects,SEMMED,SEMMED Gene API,"11410270,11841337,16612563,16676068,16862193,1...",BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION
8807,TMPRSS2,Gene,physically_interacts_with,SEMMED,SEMMED Gene API,1850025928282546,Gene,PTEN,NCBIGene:5728,related_to,Translator Text Mining Provider,CORD Gene API,,BiologicalProcess,COAGULATION,GO:GO:0050817
8808,TMPRSS2,Gene,physically_interacts_with,,BioLink API,32296183,Gene,PLP2,NCBIGene:5355,related_to,Translator Text Mining Provider,CORD Gene API,,BiologicalProcess,COAGULATION,GO:GO:0050817
8809,TMPRSS2,Gene,physically_interacts_with,,BioLink API,32296183,Gene,TNF,NCBIGene:7124,related_to,Translator Text Mining Provider,CORD Gene API,,BiologicalProcess,COAGULATION,GO:GO:0050817
8810,TMPRSS2,Gene,physically_interacts_with,,BioLink API,32296183,Gene,IGFBP5,NCBIGene:3488,related_to,Translator Text Mining Provider,CORD Gene API,,BiologicalProcess,COAGULATION,GO:GO:0050817
364,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,CHEBI:35222,CHEBI:CHEBI:35222,related_to,Translator Text Mining Provider,CORD Chemical API,,BiologicalProcess,COAGULATION,GO:GO:0050817
1117,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,FUT 175,name:FUT 175,affects,SEMMED,SEMMED Chemical API,3443413,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION
1118,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,FUT 175,name:FUT 175,affects,SEMMED,SEMMED Chemical API,3443413,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION
1119,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,FUT 175,name:FUT 175,disrupts,SEMMED,SEMMED Chemical API,3443413,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION
1120,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,FUT 175,name:FUT 175,disrupts,SEMMED,SEMMED Chemical API,3443413,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION


#### TMPRSS2 to Blood Coagulation through any ChemicalSubstance type node:

In [55]:
# Rows that go through a ChemicalSubstance intermediate AND end at an output containing 'COAGULATION'
tmprss2_to_blood_coagulation.loc[
    tmprss2_to_blood_coagulation['node1_type'].eq("ChemicalSubstance")
    & tmprss2_to_blood_coagulation['output_name'].str.contains('COAGULATION', regex=False)
]

Unnamed: 0,input,input_type,pred1,pred1_source,pred1_api,pred1_pubmed,node1_type,node1_name,node1_id,pred2,pred2_source,pred2_api,pred2_pubmed,output_type,output_name,output_id
364,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,CHEBI:35222,CHEBI:CHEBI:35222,related_to,Translator Text Mining Provider,CORD Chemical API,,BiologicalProcess,COAGULATION,GO:GO:0050817
1117,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,FUT 175,name:FUT 175,affects,SEMMED,SEMMED Chemical API,3443413.0,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION
1118,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,FUT 175,name:FUT 175,affects,SEMMED,SEMMED Chemical API,3443413.0,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION
1119,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,FUT 175,name:FUT 175,disrupts,SEMMED,SEMMED Chemical API,3443413.0,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION
1120,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,FUT 175,name:FUT 175,disrupts,SEMMED,SEMMED Chemical API,3443413.0,BiologicalProcess,BLOOD COAGULATION,name:BLOOD COAGULATION


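1.2 NOTES: The tables show that Nafamostat (FUT 175) is not the only route: TMPRSS2 -> coagulation can also be reached through the 'CHEBI:35222' ChemicalSubstance node, as well as through intermediate nodes that are not drugs (for example, Gene nodes such as PTEN and TNF).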

## 1.3 TMPRSS2 -> Camostat
### In what ways can the TMPRSS2 Gene be connected to Camostat?

In [56]:
# Reuse the ChemicalSubstance predictions from section 1.1 and keep only the CAMOSTAT outputs
all_tmprss2_predictions.loc[all_tmprss2_predictions["output_name"].eq("CAMOSTAT")]

Unnamed: 0,input,input_type,pred1,pred1_source,pred1_api,pred1_pubmed,node1_type,node1_name,node1_id,pred2,pred2_source,pred2_api,pred2_pubmed,output_type,output_name,output_id
3172,TMPRSS2,Gene,negatively_regulates,SEMMED,SEMMED Gene API,25221645,Gene,C1710301,UMLS:C1710301,negatively_regulates,SEMMED,SEMMED Gene API,2402733225666761.0,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
3173,TMPRSS2,Gene,physically_interacts_with,SEMMED,SEMMED Gene API,25520876,Gene,C1710301,UMLS:C1710301,negatively_regulates,SEMMED,SEMMED Gene API,2402733225666761.0,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
3174,TMPRSS2,Gene,physically_interacts_with,,BioLink API,21068237,Gene,ACE2,NCBIGene:59272,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
3175,TMPRSS2,Gene,physically_interacts_with,,BioLink API,,Gene,TMPRSS4,NCBIGene:56649,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
3176,TMPRSS2,Gene,physically_interacts_with,,BioLink API,,Gene,TMPRSS4,NCBIGene:56649,related_to,scigraph,Automat CORD19 Scigraph API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
42864,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,Disease,SEVERE ACUTE RESPIRATORY SYNDROME,MONDO:MONDO:0005091,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
42865,TMPRSS2,Gene,related_to,scigraph,Automat CORD19 Scigraph API,,Disease,SEVERE ACUTE RESPIRATORY SYNDROME,MONDO:MONDO:0005091,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
42866,TMPRSS2,Gene,related_to,CTD,CTD API,22496216|24227843|30626688,Disease,SEVERE ACUTE RESPIRATORY SYNDROME,MONDO:MONDO:0005091,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
42867,TMPRSS2,Gene,related_to,DISEASE,DISEASES API,,Disease,SEVERE ACUTE RESPIRATORY SYNDROME,MONDO:MONDO:0005091,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
42868,TMPRSS2,Gene,related_to,scibite,Automat CORD19 Scibite API,,Disease,CORONAVINAE INFECTIOUS DISEASE,MONDO:MONDO:0005719,related_to,scibite,Automat CORD19 Scibite API,,ChemicalSubstance,CAMOSTAT,name:CAMOSTAT
