In [None]:
# ===================================================
# 1. IMPORTS
# ===================================================

# Can use the following commented out pip commands to install python libraries if needed:

#!python3 -m pip install configparser
#!python3 -m pip install psycopg2-binary
#!python3 -m pip install jinja2

#import all libraries, functions, and variables from run_queries.py
from src.run_queries import *

In [None]:
# ===================================================
# 2. INPUT VARIABLES
# ===================================================

# Schema where the PEDSnet clinical tables live.
schema = 'pedsnet_data'

# Schema where the OMOP/PEDSnet vocabulary tables live
# (in case it differs from the schema that holds the clinical data).
vocab_schema = 'vocabulary'

# Version tag used to differentiate results from different runs
# (e.g. "chop_v58_sub2").
version = 'chop_submission_1'

# Tables to run checks for.
# Comment out or remove any table that should not be checked.
# Keep a comma after EVERY entry (including the last): Python silently
# concatenates adjacent string literals, so a missing comma merges two table
# names into a single, non-existent one instead of raising an error.
tables = [
    'person',
    'death',
    'location',
    'care_site',
    'provider',
    'visit_occurrence',
    'condition_occurrence',
    'procedure_occurrence',
    'observation',
    'drug_exposure',
    'measurement',
    'measurement_organism',
    'immunization',
    'device_exposure',
    'adt_occurrence',
    'visit_payer',
    'specialty',
    'location_history',
    'location_fips',
    'hash_token',
    'fact_relationship',
]

In [None]:
# ===================================================
# 3. DDL For Results
# ===================================================

# Create empty tables to house data quality results.
# The SQL file is first read/rendered into `ddl`, then executed. Both helpers are
# presumably provided by the wildcard import from src.run_queries.
# NOTE(review): the SQL path is relative, so this likely assumes the notebook is
# run from the repository root - confirm.
# NOTE(review): whether re-running this cell is safe for already-populated result
# tables depends on create_tables.sql, which is not visible here - confirm.
ddl = read_and_render_sql_file('src/sql/create_tables.sql')
execute_sql_file(ddl)

In [None]:
# ===================================================
# 4. Run Data Quality Checks
# ===================================================

# Run every check for each table listed in the "tables" input variable,
# wrapping each table's run in a start banner and a completion banner.
# NOTE(review): "Assesment" is misspelled in the printed messages; it is left
# unchanged here so the emitted output stays identical.
for table in tables:
    # Blank lines, then the boxed "starting" message.
    print(
        '\n',
        "=" * 70,
        f"Starting Data Quality Assesment of the {table} table.",
        "=" * 70,
        sep='\n',
    )

    render_and_execute_checks_on_table(version, schema, vocab_schema, table)

    # Boxed "complete" message, then blank lines.
    print(
        "=" * 70,
        f"Data Quality Assesment of the {table} table is complete.",
        "=" * 70,
        '\n',
        sep='\n',
    )

In [None]:
# ===================================================
# 5. Export Results
# ===================================================

# Export the populated metric tables for this run.
# Per the original notes for this cell:
#   - results are written as a zip file containing one .csv per table
#   - the output is placed in the "results" sub directory
#   - the output file is named after the `version` tag set in the inputs cell
# NOTE(review): the export behavior lives in export_results (src.run_queries),
# which is not visible here - confirm the details above against that function.

export_results(version)