Knowing which data products have been released about a species helps us understand what is known about that species and where gaps in current knowledge may exist.  This notebook uses USGS ScienceBase (SB) to return official data release items that mention the species of interest.

In [1]:
#Import needed packages
import json
import bispy
from IPython.display import display
from joblib import Parallel, delayed
from sciencebasepy import SbSession

# ScienceBase session object used by the search cells below; no login call appears
# in this notebook, so the searches presumably run unauthenticated (TODO confirm)
sb = SbSession()
# bispy utility object; its doc_cache method is used later to cache the search results
bis_utils = bispy.bis.Utils()

In [2]:
# Load the cached ITIS species list produced by ITIS Exploration.ipynb;
# the search cell below reads each record's "scientific_name" key
with open("cache/itis_explore.json", "r") as f:
    itis_explore = json.load(f)

The next cell searches ScienceBase for items whose text contains each WLCI species' scientific name

In [3]:
# Query ScienceBase once per ITIS scientific name, spreading the requests across
# 8 joblib workers; each record contributes one search response to the result list
sb_results = Parallel(n_jobs=8)(
    delayed(sb.find_items_by_any_text)(record["scientific_name"])
    for record in itis_explore
)
sb_results

[{'total': 16,
  'took': '1s',
  'selflink': {'rel': 'self',
   'url': 'https://www.sciencebase.gov/catalog/items?q=Oncorhynchus+clarkii+pleuriticus&max=20'},
  'items': [{'link': {'rel': 'self',
     'url': 'https://www.sciencebase.gov/catalog/item/537f6b24e4b021317a86fa9c'},
    'relatedItems': {'link': {'url': 'https://www.sciencebase.gov/catalog/itemLinks?itemId=537f6b24e4b021317a86fa9c',
      'rel': 'related'}},
    'id': '537f6b24e4b021317a86fa9c',
    'title': 'Colorado river cutthroat (Oncorhynchus clarkii pleuriticus) distribution and status by HUC8',
    'summary': 'Colorado river cutthroat (Oncorhynchus clarkii pleuriticus) status data created for the Western Division of the American Fisheries Society (WDAFS)',
    'hasChildren': False,
    '_searchHit': {'_score': 930.1424}},
   {'link': {'rel': 'self',
     'url': 'https://www.sciencebase.gov/catalog/item/4f4e49d1e4b07f02db5db976'},
    'relatedItems': {'link': {'url': 'https://www.sciencebase.gov/catalog/itemLinks?itemId

In [4]:
# Cache the array of retrieved ScienceBase search responses to cache/sciencebase.json and
# display the summary the helper returns (cache file path, number of documents cached, and
# one sample document -- random, per the original note) as a quick verification
display(bis_utils.doc_cache("cache/sciencebase.json", sb_results))

{'Doc Cache File': 'cache/sciencebase.json',
 'Number of Documents in Cache': 170,
 'Document Number 167': {'total': 0,
  'took': '242ms',
  'selflink': {'rel': 'self',
   'url': 'https://www.sciencebase.gov/catalog/items?q=Puccinellia+rupestris&max=20'},
  'items': []}}

Check whether any invalid/not accepted ITIS species names match ScienceBase records

In [5]:
# Load the cached list of invalid/not accepted ITIS species names written by
# ITIS Exploration.ipynb; the next cell reads each record's "scientific_name" key
with open("cache/invalid_itis.json", "r") as f:
    invalid_itis = json.load(f)

In [6]:
# Query ScienceBase once per invalid/not accepted ITIS scientific name, spreading the
# requests across 8 joblib workers; each record contributes one search response
invalid_sb_result = Parallel(n_jobs=8)(
    delayed(sb.find_items_by_any_text)(record["scientific_name"])
    for record in invalid_itis
)
invalid_sb_result

[{'total': 65,
  'took': '5ms',
  'selflink': {'rel': 'self',
   'url': 'https://www.sciencebase.gov/catalog/items?q=Clupea+pallasi&max=20'},
  'nextlink': {'rel': 'next',
   'url': 'https://www.sciencebase.gov/catalog/items?q=Clupea+pallasi&max=20&offset=20'},
  'items': [{'link': {'rel': 'self',
     'url': 'https://www.sciencebase.gov/catalog/item/5053977be4b097cd4fce6091'},
    'relatedItems': {'link': {'url': 'https://www.sciencebase.gov/catalog/itemLinks?itemId=5053977be4b097cd4fce6091',
      'rel': 'related'}},
    'id': '5053977be4b097cd4fce6091',
    'title': "Reproductive biology of the Pacific herring Clupea pallasi pallasi in Lake Nerpich'e (Kamchatka).",
    'hasChildren': False,
    '_searchHit': {'_score': 686.2032}},
   {'link': {'rel': 'self',
     'url': 'https://www.sciencebase.gov/catalog/item/505380efe4b097cd4fce027d'},
    'relatedItems': {'link': {'url': 'https://www.sciencebase.gov/catalog/itemLinks?itemId=505380efe4b097cd4fce027d',
      'rel': 'related'}},
  