### This notebook shows examples of how to use the cyclops.query API on GEMINI.

## Example 1. Get all patient encounters from delirium cohort, join with labs, limit to 100 rows.

In [1]:
from cyclops.processors.constants import SMH
from cyclops.query import gemini

# Build the delirium-cohort encounter query, then the lab-events query on top of it.
patients = gemini.patients(delirium_cohort=True)
patients_labs = gemini.events(
    category="lab",
    patients=patients,
)

# Execute with a 100-row limit and report how many rows came back.
patients_labs.run(limit=100)
print(f"{len(patients_labs.data)} rows extracted!")

2022-04-28 04:21:51,952 [1;37mINFO[0m cyclops.config  - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-28 04:21:53,019 [1;37mINFO[0m cyclops.query.utils - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-28 04:21:53,029 [1;37mINFO[0m cyclops.utils.profile - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-28 04:21:53,034 [1;37mINFO[0m cyclops.orm     - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-28 04:21:53,040 [1;37mINFO[0m cyclops.query.interface - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-28 04:21:53,697 [1;37mINFO[0m cyclops.orm     - Database setup, ready to run queries!
2022-04-28 04:21:54,136 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:21:54,139 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.428156 s


100 rows extracted!


## Example 2. Get all patient encounters from delirium cohort, join with diagnosis codes, keep only responsible diagnoses (diagnosis type "M"), limit to 100 rows.

In [2]:
# Delirium-cohort encounters, joined with diagnoses restricted to type "M".
patients = gemini.patients(delirium_cohort=True)
patients_diagnoses = gemini.diagnoses(
    patients=patients,
    diagnosis_types=["M"],
)

# Execute with a 100-row limit and report how many rows came back.
patients_diagnoses.run(limit=100)
print(f"{len(patients_diagnoses.data)} rows extracted!")

2022-04-28 04:21:54,514 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:21:54,517 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.355859 s


100 rows extracted!


## Example 3. Get all patient encounters from year 2020, join with labs, filter only sodium tests, limit to 100 rows.

In [3]:
# Encounters from 2020, joined with lab events labelled "sodium".
patients = gemini.patients(years=[2020])
patients_labs = gemini.events(
    category="lab",
    labels=["sodium"],
    patients=patients,
)

# Execute with a 100-row limit and report how many rows came back.
patients_labs.run(limit=100)
print(f"{len(patients_labs.data)} rows extracted!")

2022-04-28 04:21:54,711 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:21:54,713 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.175184 s


100 rows extracted!


## Example 4. Get all patient encounters from year 2019, from the months of July and August, join with interventions, limit to 1000 rows.

In [4]:
# Encounters from July and August 2019, joined with intervention events.
patients = gemini.patients(
    months=[7, 8],
    years=[2019],
)
patients_interventions = gemini.events(
    category="intervention",
    patients=patients,
)

# Execute with a 1000-row limit and report how many rows came back.
patients_interventions.run(limit=1000)
print(f"{len(patients_interventions.data)} rows extracted!")

2022-04-28 04:21:55,124 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:21:55,127 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.392923 s


1000 rows extracted!


## Example 5. Get all patient encounters from St. Michael's Hospital from Jan 2020 to June 2020, join with vitals, filter Systolic BP measurements (substring match).

In [5]:
# Encounters at SMH between 2020-01-01 and 2020-06-30.
patients = gemini.patients(
    from_date="2020-01-01",
    to_date="2020-06-30",
    hospitals=[SMH],
)

# Vitals for those encounters; `labels` is a plain string here (not a list),
# which the example heading describes as a substring match.
patients_vitals = gemini.events(
    category="vitals",
    labels="systolic",
    patients=patients,
)

# No row limit on this one: run the full query and report the row count.
patients_vitals.run()
print(f"{len(patients_vitals.data)} rows extracted!")

2022-04-28 04:21:58,993 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:21:58,999 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 3.848576 s


44774 rows extracted!


## Example 6. Get all patient encounters from all hospitals, from years [2018, 2019, 2020], join with labs and vitals (large query!!).

In [6]:
# Build the three queries up front: encounters for 2018-2020 (with
# include_er_data enabled), plus lab and vitals events for those encounters.
patients = gemini.patients(
    include_er_data=True,
    years=[2018, 2019, 2020],
)
patients_labs = gemini.events(category="lab", patients=patients)
patients_vitals = gemini.events(category="vitals", patients=patients)

# Pair each query with the file name it is saved under.
extractions = (
    (patients, "admin_er_2018_2020"),
    (patients_labs, "labs_2018_2020"),
    (patients_vitals, "vitals_2018_2020"),
)

# Run every query first (no row limit: this is the large one) ...
for extraction, _ in extractions:
    extraction.run()

# ... then report the row counts in the same order ...
for extraction, _ in extractions:
    print(f"{len(extraction.data)} rows extracted!")

# ... and finally persist each result under SAVE_PATH.
SAVE_PATH = "/mnt/nfs/project/delirium/sprint_demo/APR-28-2022"
for extraction, file_stem in extractions:
    extraction.save(SAVE_PATH, file_stem)

2022-04-28 04:22:02,099 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:22:02,104 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 3.010244 s
2022-04-28 04:33:45,579 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:33:45,593 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 703.485801 s
2022-04-28 04:37:20,455 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-28 04:37:20,464 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 214.867849 s
2022-04-28 04:37:20,469 [1;37mINFO[0m cyclops.query.interface - Saving queried data to /mnt/nfs/project/delirium/sprint_demo/APR-28-2022/admin_er_2018_2020.gzip


90699 rows extracted!
10684768 rows extracted!
5831063 rows extracted!


2022-04-28 04:37:21,189 [1;37mINFO[0m cyclops.query.interface - Saving queried data to /mnt/nfs/project/delirium/sprint_demo/APR-28-2022/labs_2018_2020.gzip
2022-04-28 04:38:18,093 [1;37mINFO[0m cyclops.query.interface - Saving queried data to /mnt/nfs/project/delirium/sprint_demo/APR-28-2022/vitals_2018_2020.gzip
