## Query Examples

Examples of bodies used in POST /search requests.

First, install the DCP python client:

In [3]:
import sys
!{sys.executable} -m pip install hca
import hca.dss
dss_client = hca.dss.DSSClient()



#### Bundles from Humans

In [4]:
es_query = {
    "query": {
        "bool": {
            "must": [
                {
                    "match": {
                        "files.donor_organism_json.genus_species.text": "Homo sapiens"
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

{'es_query': {'query': {'bool': {'must': [{'match': {'files.donor_organism_json.genus_species.text': 'Homo sapiens'}}]}}},
 'results': [{'bundle_fqid': '80a13e23-de15-4430-9cab-da355442238f.2018-12-11T232118.032657Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/80a13e23-de15-4430-9cab-da355442238f?version=2018-12-11T232118.032657Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '2ae40f28-5db1-4d9c-89c8-6ea23461cf40.2018-12-11T230120.798178Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/2ae40f28-5db1-4d9c-89c8-6ea23461cf40?version=2018-12-11T230120.798178Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '190040a8-339c-4de5-bfa2-286bc5e6cefb.2018-12-11T225932.024147Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/190040a8-339c-4de5-bfa2-286bc5e6cefb?version=2018-12-11T225932.024147Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '5083f7be-976d-4b72-8578-1ff517cd3341.2018-12-11T225454.369560Z',
  

#### Bundles from diseased organisms

In [9]:
es_query = {
    "query": {
        "bool": {
            "must_not": [
                {
                    "match": {
                        "files.donor_organism_json.diseases.ontology": "PATO:0000461"
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

# Or slightly worse (better to use the ontology term directly)
es_query = {
    "query": {
        "bool": {
            "must_not": [
                {
                    "match": {
                        "files.donor_organism_json.diseases.text": "normal"
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

{'es_query': {'query': {'bool': {'must_not': [{'match': {'files.donor_organism_json.diseases.text': 'normal'}}]}}},
 'results': [{'bundle_fqid': '419f7703-cbd7-42f6-bed5-7251279eb533.2018-12-10T221505.027443Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/419f7703-cbd7-42f6-bed5-7251279eb533?version=2018-12-10T221505.027443Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '5cebd56b-1829-47f2-936d-273517824512.2018-12-10T221353.618665Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/5cebd56b-1829-47f2-936d-273517824512?version=2018-12-10T221353.618665Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '8b265331-6bbb-4a8c-a464-96981537bac8.2018-12-10T221214.762762Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/8b265331-6bbb-4a8c-a464-96981537bac8?version=2018-12-10T221214.762762Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '61ab2ac4-34ea-4cf3-a699-88a8adf83088.2018-12-10T221132.231897Z',
   'bundl

#### Bundles from Contributors at Sanger

In [10]:
es_query = {
    "query": {
        "bool": {
            "must": [
                {
                    "regexp": {
                        "files.project_json.contributors.email": ".*@sanger.ac.uk"
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

{'es_query': {'query': {'bool': {'must': [{'regexp': {'files.project_json.contributors.email': '.*@sanger.ac.uk'}}]}}},
 'results': [{'bundle_fqid': '0f7528b8-8067-43bc-abb5-3115031c4d67.2018-12-11T023229.913065Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/0f7528b8-8067-43bc-abb5-3115031c4d67?version=2018-12-11T023229.913065Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '9d9c985b-e655-4646-8ff5-49dc2e768213.2018-12-11T022908.214893Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/9d9c985b-e655-4646-8ff5-49dc2e768213?version=2018-12-11T022908.214893Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '91cc94ec-7ba7-4db0-a7ca-6d1449a847ee.2018-12-11T013141.412846Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/91cc94ec-7ba7-4db0-a7ca-6d1449a847ee?version=2018-12-11T013141.412846Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '81f920f3-8645-439c-868e-1bf16ab9b0a7.2018-12-11T013132.284148Z',
   'b

#### Bundles from DroNc-seq or Drop-seq

In [11]:
es_query = {
    "query": {
        "bool": {
            "must": [
                {
                    "terms": {
                        "files.sequencing_protocol_json.sequencing_approach.text": [
                            "Drop-Seq",
                            "DroNc-Seq"
                        ]
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

{'es_query': {'query': {'bool': {'must': [{'terms': {'files.sequencing_protocol_json.sequencing_approach.text': ['Drop-Seq',
        'DroNc-Seq']}}]}}},
 'results': [{'bundle_fqid': 'a5c9f145-38e3-47a2-b45d-19257077115b.2018-12-05T230950.335985Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/a5c9f145-38e3-47a2-b45d-19257077115b?version=2018-12-05T230950.335985Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': 'ec67ee8c-7189-4955-8f09-93553713abfc.2018-12-05T230945.608726Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/ec67ee8c-7189-4955-8f09-93553713abfc?version=2018-12-05T230945.608726Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '72aec3e9-4b33-43f3-868f-4c51b23f5a22.2018-12-05T230927.286277Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/72aec3e9-4b33-43f3-868f-4c51b23f5a22?version=2018-12-05T230927.286277Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '9cc57169-cb1c-4760-9283-de862a55171e.

#### Analysis Bundles Produced by Secondary Analysis Service

In [12]:
es_query = {
    "query": {
        "bool": {
            "must": [
                {
                    "match": {
                        "files.analysis_protocol_json.protocol_type.text": "analysis"
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

{'es_query': {'query': {'bool': {'must': [{'match': {'files.analysis_protocol_json.protocol_type.text': 'analysis'}}]}}},
 'results': [{'bundle_fqid': '80a13e23-de15-4430-9cab-da355442238f.2018-12-11T232118.032657Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/80a13e23-de15-4430-9cab-da355442238f?version=2018-12-11T232118.032657Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '2ae40f28-5db1-4d9c-89c8-6ea23461cf40.2018-12-11T230120.798178Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/2ae40f28-5db1-4d9c-89c8-6ea23461cf40?version=2018-12-11T230120.798178Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '190040a8-339c-4de5-bfa2-286bc5e6cefb.2018-12-11T225932.024147Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/190040a8-339c-4de5-bfa2-286bc5e6cefb?version=2018-12-11T225932.024147Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '5083f7be-976d-4b72-8578-1ff517cd3341.2018-12-11T225454.369560Z',
   

#### Bundles Containing the File "E18_20160930_Neurons_Sample_71_S068_L007_I1_006.fastq.gz"

In [14]:
es_query = {
    "query": {
        "bool": {
            "must": [
                {
                    "match": {
                        "manifest.files.name": "E18_20160930_Neurons_Sample_71_S068_L007_I1_006.fastq.gz"
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

{'es_query': {'query': {'bool': {'must': [{'match': {'manifest.files.name': 'E18_20160930_Neurons_Sample_71_S068_L007_I1_006.fastq.gz'}}]}}},
 'results': [{'bundle_fqid': 'ead66505-a78b-44ee-81f6-418be859ab65.2018-12-06T043139.806469Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/ead66505-a78b-44ee-81f6-418be859ab65?version=2018-12-06T043139.806469Z&replica=aws',
   'search_score': None}],
 'total_hits': 1}

#### Bundles Created After July 4, 2018

In [17]:
es_query = {
    "query": {
        "bool": {
            "must": [
                {
                    "range": {
                        "manifest.version": {
                            "gte": "2018-07-04T100000.000000Z"
                        }
                    }
                }
            ]
        }
    }
}
dss_client.post_search(es_query=es_query, replica="aws")

{'es_query': {'query': {'bool': {'must': [{'range': {'manifest.version': {'gte': '2018-07-04T100000.000000Z'}}}]}}},
 'results': [{'bundle_fqid': '80a13e23-de15-4430-9cab-da355442238f.2018-12-11T232118.032657Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/80a13e23-de15-4430-9cab-da355442238f?version=2018-12-11T232118.032657Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '2ae40f28-5db1-4d9c-89c8-6ea23461cf40.2018-12-11T230120.798178Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/2ae40f28-5db1-4d9c-89c8-6ea23461cf40?version=2018-12-11T230120.798178Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '190040a8-339c-4de5-bfa2-286bc5e6cefb.2018-12-11T225932.024147Z',
   'bundle_url': 'https://dss.data.humancellatlas.org/v1/bundles/190040a8-339c-4de5-bfa2-286bc5e6cefb?version=2018-12-11T225932.024147Z&replica=aws',
   'search_score': None},
  {'bundle_fqid': '5083f7be-976d-4b72-8578-1ff517cd3341.2018-12-11T225454.369560Z',
   'bund