# Example: RDF workflow

This notebook demonstrates how an RDF graph is generated from the property table using the [rdf.py](../src/pyBiodatafuse/graph/rdf.py) module.

In [1]:
import os

# Switch the working directory to the sibling ``src`` folder (presumably so the
# in-repo pyBiodatafuse package can be imported below). Relative paths used in
# later cells are resolved from this directory as well.
os.chdir(
    os.path.abspath(os.path.join(os.getcwd(), '..', 'src'))
)

import pandas as pd
from pyBiodatafuse.graph import rdf
from pyBiodatafuse import constants

  from .autonotebook import tqdm as notebook_tqdm


### Load the sample property table

In [2]:
# Load the pickled property table. The path is relative to the current working
# directory, which the first cell changed to ``src``.
# NOTE(review): unpickling can execute arbitrary code, so this assumes
# combined_df.pkl is a trusted, locally generated file -- confirm.
data = pd.read_pickle('../combined_df.pkl')
# Preview the first three rows.
data.head(3)

Unnamed: 0,identifier,identifier.source,target,target.source,Bgee,DisGeNET,MINERVA,WikiPathways,OpenTargets_Reactome,OpenTargets_GO,OpenTargets_Location,OpenTargets_Diseases,OpenTargets_Compounds,MolMeDB_transporter_inhibitor,PubChem_Assays,StringDB
0,AHR,HGNC,ENSG00000106546,Ensembl,"[{'anatomical_entity_id': 'UBERON_0000178', 'a...","[{'disease_id': 'umls:C2350344', 'disease_name...","[{'pathway_id': 953.0, 'pathway_label': 'Kynur...","[{'pathway_id': 'WP5130', 'pathway_label': 'Th...","[{'pathway_label': 'Endogenous sterols', 'path...","[{'go_id': 'GO:0005667', 'go_name': 'transcrip...","[{'location_id': 'SL-0086', 'location': 'Cytop...","[{'disease_id': 'umls:C0033860', 'disease_name...","[{'chembl_id': 'CHEMBL259571', 'drugbank_id': ...","[{'compound_name': nan, 'InChIKey': nan, 'SMIL...","[{'pubchem_assay_id': nan, 'assay_type': nan, ...","[{'stringdb_link_to': 'CHRND', 'Ensembl': 'ENS..."
1,ALG14,HGNC,ENSG00000172339,Ensembl,"[{'anatomical_entity_id': 'UBERON_0000178', 'a...","[{'disease_id': 'umls:C0751882', 'disease_name...","[{'pathway_id': nan, 'pathway_label': nan, 'pa...","[{'pathway_id': 'WP5153', 'pathway_label': 'N-...",[{'pathway_label': 'Biosynthesis of the N-glyc...,"[{'go_id': 'GO:0043541', 'go_name': 'UDP-N-ace...","[{'location_id': 'SL-0097', 'location': 'Endop...","[{'disease_id': nan, 'disease_name': nan, 'the...","[{'chembl_id': nan, 'drugbank_id': nan, 'compo...","[{'compound_name': nan, 'InChIKey': nan, 'SMIL...","[{'pubchem_assay_id': nan, 'assay_type': nan, ...","[{'stringdb_link_to': 'GMPPB', 'Ensembl': 'ENS..."
2,ALG2,HGNC,ENSG00000119523,Ensembl,"[{'anatomical_entity_id': 'UBERON_0000178', 'a...","[{'disease_id': 'umls:C0751882', 'disease_name...","[{'pathway_id': nan, 'pathway_label': nan, 'pa...","[{'pathway_id': 'WP5153', 'pathway_label': 'N-...",[{'pathway_label': 'Biosynthesis of the N-glyc...,"[{'go_id': 'GO:0000033', 'go_name': 'alpha-1,3...","[{'location_id': 'SL-0162', 'location': 'Membr...","[{'disease_id': nan, 'disease_name': nan, 'the...","[{'chembl_id': nan, 'drugbank_id': nan, 'compo...","[{'compound_name': nan, 'InChIKey': nan, 'SMIL...","[{'pubchem_assay_id': nan, 'assay_type': nan, ...","[{'stringdb_link_to': 'SLC5A7', 'Ensembl': 'EN..."


### Generate the RDF graph from the table

In [3]:
# Build the RDF graph from the property table; as the output below shows,
# generate_rdf also reports every namespace prefix it binds.
g = rdf.generate_rdf(data)

Binding sio to http://semanticscience.org/resource/
Binding hgnc to http://bio2rdf.org/hgnc:
Binding obo to http://purl.obolibrary.org/obo/
Binding umls to https://uts-ws.nlm.nih.gov/rest/semantic-network/2015AB/CUI/
Binding ensembl to https://identifiers.org/ensembl:
Binding dcat to http://www.w3.org/ns/dcat#
Binding biodatafuse to https://biodatafuse.org/
Binding foaf to http://xmlns.com/foaf/0.1/
Binding skos to http://www.w3.org/2004/02/skos/core#
Binding owl to http://www.w3.org/2002/07/owl#
Binding rdf to http://www.w3.org/1999/02/22-rdf-syntax-ns#
Binding rdfs to http://www.w3.org/2000/01/rdf-schema#
Binding xsd to http://www.w3.org/2001/XMLSchema#


### Print the result

In [4]:
# Serialize the graph in Turtle syntax and print it, so the multi-line text is
# shown with real line breaks instead of as an escaped string repr.
# NOTE(review): presumably `g` is an rdflib Graph whose serialize() returns a
# str here -- confirm against the installed rdflib version.
print(g.serialize(format="turtle"))

@prefix dcat: <http://www.w3.org/ns/dcat#> .
@prefix life_cycle_base_node: <https://biodatafuse.org/rdf/life_cycle> .
@prefix obo: <http://purl.obolibrary.org/obo/> .
@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
@prefix sio: <http://semanticscience.org/resource/> .
@prefix skos: <http://www.w3.org/2004/02/skos/core#> .
@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .

<https://biodatafuse.org/rdf/experimental_process/000000/AHR> a sio:SIO_001077 ;
    sio:SIO_000229 <https://biodatafuse.org/rdf/gene_expression_value/000000/AHR_UBERON_0000178> ;
    sio:SIO_000230 obo:UBERON_0000178,
        <https://biodatafuse.org/rdf/gene/000000/> .

<https://biodatafuse.org/rdf/experimental_process/000001/ALG14> a sio:SIO_001077 ;
    sio:SIO_000229 <https://biodatafuse.org/rdf/gene_expression_value/000001/ALG14_UBERON_0000178> ;
    sio:SIO_000230 obo:UBERON_0000178,
        <https://biodatafuse.org/rdf/gene/000001/> .

<https://biodatafuse.org/rdf/experimental_process/000002/ALG2> a s