In [1]:
import json
import os
import sys
import rdflib
from SPARQLWrapper import SPARQLWrapper, JSON
import pandas as pd
import numpy as np

## Setup SPARQL / Python Interface

### Define SPARQL Request Function

In [2]:
#Credit - Doug Fils

def get_sparql_dataframe(service, query):
    """
    Run a SPARQL query against an endpoint and return the result as a Pandas data frame.

    Parameters
    ----------
    service : URL of the SPARQL endpoint handed to SPARQLWrapper.
    query : SPARQL query text.

    Returns
    -------
    pandas.DataFrame with one column per variable listed under head/vars in
    the JSON response and one row per entry under results/bindings. A variable
    that is absent from a given binding yields None in that cell.
    """
    endpoint = SPARQLWrapper(service)
    endpoint.setQuery(query)
    endpoint.setReturnFormat(JSON)
    raw_response = endpoint.query().response

    # Decode the HTTP response body directly as JSON.
    payload = json.load(raw_response)
    columns = payload['head']['vars']
    bindings = payload['results']['bindings']

    # Keep only the 'value' field of each bound term, in column order.
    records = [
        [binding.get(name, {}).get('value') for name in columns]
        for binding in bindings
    ]

    return pd.DataFrame(records, columns=columns)

### Set SPARQL Endpoint and base URIs

In [3]:
BCODMO_SERVE = "https://lod.bco-dmo.org/sparql"  # BCO-DMO SPARQL endpoint; passed as `service` to get_sparql_dataframe
BCODMO_PREF = "http://lod.bco-dmo.org/id/"       # BCO-DMO URI base (resource URIs look like <base>parameter/901)

## Basic SPARQL Queries
A SPARQL query is passed to the endpoint as a string. Variables are defined within the query itself, and the query result is returned as a dataframe that can be used like any other Python variable. Query results can also be returned in other formats (such as raw JSON or lists).

**NOTE:** The BCO-DMO SPARQL endpoint (like many public SPARQL endpoints) limits results to 10,000.

Helpful SPARQL Cheat Sheet: http://www.iro.umontreal.ca/~lapalme/ift6281/sparql-1_1-cheat-sheet.pdf

### Properties ("predicates" in Subject-Predicate-Object model) in BCO-DMO

Also see https://ocean-data.org/schema/ for the ontology.

#### List all the properties in the BCO-DMO Knowledge Graph

In [4]:
# Match every triple in the graph (subject and object are left anonymous with [])
# and return each distinct predicate once, sorted by its URI.
propertyQuery = '''
SELECT DISTINCT ?property
WHERE { [] ?property [] }
ORDER BY ?property
'''

In [5]:
# Send the query to the BCO-DMO endpoint; the result has one column per SELECT variable.
propertySearch = get_sparql_dataframe(BCODMO_SERVE, propertyQuery)

In [6]:
# Display the result through the pandas Styler with the CSS width of each cell set to 600px.
propertySearch.style.set_properties(**{'width': '600px'})

Unnamed: 0,property
0,http://digital-repositories.org/ontologies/dspace/0.1.0#checksum
1,http://digital-repositories.org/ontologies/dspace/0.1.0#checksumAlgorithm
2,http://digital-repositories.org/ontologies/dspace/0.1.0#hasBitstream
3,http://digital-repositories.org/ontologies/dspace/0.1.0#isPartOfCollection
4,http://digital-repositories.org/ontologies/dspace/0.1.0#isPartOfItem
5,http://digital-repositories.org/ontologies/dspace/0.1.0#mimeType
6,http://digital-repositories.org/ontologies/dspace/0.1.0#size
7,http://jena.hpl.hp.com/2003/03/result-set#binding
8,http://jena.hpl.hp.com/2003/03/result-set#resultVariable
9,http://jena.hpl.hp.com/2003/03/result-set#size


#### Get more information about the properties: dataset parameters and their master parameters

In [7]:
# List each dataset-level parameter together with the master parameter it is
# an instance of. The odo: prefix is declared inside the query so that the
# query does not rely on namespaces predefined by the endpoint.
propertyQuery = '''
PREFIX odo: <http://ocean-data.org/schema/>

SELECT DISTINCT ?dataset_parameter ?masterParam
WHERE { ?dataset_parameter odo:isInstanceOf ?masterParam  .
}
'''

In [8]:
# Run the dataset-parameter query. NOTE: this rebinds propertySearch, replacing
# the predicate list produced by the earlier query.
propertySearch = get_sparql_dataframe(BCODMO_SERVE, propertyQuery)

In [9]:
# Display the result through the pandas Styler with the CSS width of each cell set to 600px.
propertySearch.style.set_properties(**{'width': '600px'})

Unnamed: 0,dataset_parameter,masterParam
0,http://lod.bco-dmo.org/id/dataset-parameter/744650,http://lod.bco-dmo.org/id/parameter/830
1,http://lod.bco-dmo.org/id/dataset-parameter/744651,http://lod.bco-dmo.org/id/parameter/2009
2,http://lod.bco-dmo.org/id/dataset-parameter/744652,http://lod.bco-dmo.org/id/parameter/976
3,http://lod.bco-dmo.org/id/dataset-parameter/744653,http://lod.bco-dmo.org/id/parameter/1678
4,http://lod.bco-dmo.org/id/dataset-parameter/744654,http://lod.bco-dmo.org/id/parameter/542214
5,http://lod.bco-dmo.org/id/dataset-parameter/744655,http://lod.bco-dmo.org/id/parameter/806
6,http://lod.bco-dmo.org/id/dataset-parameter/744656,http://lod.bco-dmo.org/id/parameter/1741
7,http://lod.bco-dmo.org/id/dataset-parameter/744659,http://lod.bco-dmo.org/id/parameter/1740
8,http://lod.bco-dmo.org/id/dataset-parameter/744660,http://lod.bco-dmo.org/id/parameter/1740
9,http://lod.bco-dmo.org/id/dataset-parameter/744661,http://lod.bco-dmo.org/id/parameter/941


#### Find out more about "Monitored Properties"

In [10]:
# List every master parameter that has a short description and is flagged as
# not deprecated. The odo: and owl: prefixes are declared inside the query so
# that it does not rely on namespaces predefined by the endpoint.
monitoredPropertiesQuery = '''
PREFIX odo: <http://ocean-data.org/schema/>
PREFIX owl: <http://www.w3.org/2002/07/owl#>

SELECT DISTINCT ?masterParam ?shortDesc
WHERE { 
?masterParam odo:hasParameterShortDescription ?shortDesc .
?masterParam owl:deprecated 0 . # Binary flag - only show those that are not deprecated
}
ORDER BY ?masterParam'''

In [11]:
# Send the query to the BCO-DMO endpoint; the result has one column per SELECT variable.
monitoredPropertiesSearch = get_sparql_dataframe(BCODMO_SERVE, monitoredPropertiesQuery)

In [12]:
# Display the result through the pandas Styler with the CSS width of each cell set to 600px.
monitoredPropertiesSearch.style.set_properties(**{'width': '600px'})

Unnamed: 0,masterParam,shortDesc
0,http://lod.bco-dmo.org/id/parameter/1001,SST at 5m
1,http://lod.bco-dmo.org/id/parameter/1002,time_capture
2,http://lod.bco-dmo.org/id/parameter/1003,time_end
3,http://lod.bco-dmo.org/id/parameter/1004,time_end_local
4,http://lod.bco-dmo.org/id/parameter/1005,time_gmt
5,http://lod.bco-dmo.org/id/parameter/1006,time_of_day
6,http://lod.bco-dmo.org/id/parameter/1007,time_local
7,http://lod.bco-dmo.org/id/parameter/1008,time_release
8,http://lod.bco-dmo.org/id/parameter/1009,time_start
9,http://lod.bco-dmo.org/id/parameter/1010,time_start_local


#### DESCRIBE a monitored property

In [20]:
# DESCRIBE asks the endpoint for the statements it holds about one resource,
# here master parameter 901. NOTE: this rebinds monitoredPropertiesQuery,
# replacing the SELECT query defined earlier in the notebook.
monitoredPropertiesQuery = '''
DESCRIBE <http://lod.bco-dmo.org/id/parameter/901>
'''

In [24]:
# Run the DESCRIBE query through the same helper used for the SELECT queries.
monitoredPropertiesSearch = get_sparql_dataframe(BCODMO_SERVE, monitoredPropertiesQuery)
# Original author's note: ignore the error reported when this cell runs.
# NOTE(review): the message itself is not recorded here; presumably it comes from
# requesting JSON results for a DESCRIBE query - TODO confirm.



In [25]:
# Display the result through the pandas Styler with the CSS width of each cell set to 600px.
monitoredPropertiesSearch.style.set_properties(**{'width': '600px'})

Unnamed: 0,s,p,o
0,http://lod.bco-dmo.org/id/dataset-parameter/22017,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
1,http://lod.bco-dmo.org/id/dataset-parameter/8822,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
2,http://lod.bco-dmo.org/id/dataset-parameter/716564,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
3,http://lod.bco-dmo.org/id/dataset-parameter/739497,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
4,http://lod.bco-dmo.org/id/dataset-parameter/527228,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
5,http://lod.bco-dmo.org/id/dataset-parameter/551281,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
6,http://lod.bco-dmo.org/id/dataset-parameter/765614,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
7,http://lod.bco-dmo.org/id/dataset-parameter/560389,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
8,http://lod.bco-dmo.org/id/dataset-parameter/739495,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
9,http://lod.bco-dmo.org/id/dataset-parameter/724297,http://ocean-data.org/schema/isInstanceOf,http://lod.bco-dmo.org/id/parameter/901
