### This notebook shows examples of how to use the cyclops.query API on GEMINI.

## Example 1. Get all patient encounters from the delirium cohort, join with labs, limit to 100 rows.

In [1]:
from cyclops.processors.constants import SMH
from cyclops.query import gemini

# Build a query for patient encounters, restricted to the delirium cohort.
patients = gemini.patients(delirium_cohort=True)
# Join events of category "lab" onto those encounters.
patients_labs = gemini.events(patients=patients, category="lab")
# Execute the query, capping the result at 100 rows.
patients_labs.run(limit=100)
# After run(), the result is read from `.data`; report how many rows came back.
print(f"{len(patients_labs.data)} rows extracted!")

2022-04-27 08:50:42,770 [1;37mINFO[0m cyclops.config  - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-27 08:50:43,613 [1;37mINFO[0m cyclops.query.utils - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-27 08:50:43,620 [1;37mINFO[0m cyclops.utils.profile - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-27 08:50:43,632 [1;37mINFO[0m cyclops.orm     - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-27 08:50:43,638 [1;37mINFO[0m cyclops.query.interface - Log file is /mnt/nfs/home/krishnanam/vector-delirium/log.log
2022-04-27 08:50:44,627 [1;37mINFO[0m cyclops.orm     - Database setup, ready to run queries!
2022-04-27 08:50:44,824 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 08:50:44,827 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.187703 s


100 rows extracted!


## Example 2. Get all patient encounters from the delirium cohort, join with diagnosis codes, keep only responsible diagnoses (diagnosis type "M"), limit to 100 rows.

In [2]:
# Build a query for patient encounters, restricted to the delirium cohort.
patients = gemini.patients(delirium_cohort=True)
# Join diagnosis codes onto those encounters, keeping only diagnosis type "M".
# NOTE(review): "M" presumably denotes the (most) responsible diagnosis --
# confirm against the GEMINI data dictionary.
patients_diagnoses = gemini.diagnoses(diagnosis_types=["M"], patients=patients)
# Execute the query, capping the result at 100 rows.
patients_diagnoses.run(limit=100)
# After run(), the result is read from `.data`; report how many rows came back.
print(f"{len(patients_diagnoses.data)} rows extracted!")

2022-04-27 08:50:45,180 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 08:50:45,183 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.334929 s


100 rows extracted!


## Example 3. Get all patient encounters from year 2020, join with labs, filter only sodium tests, limit to 100 rows.

In [3]:
# Build a query for patient encounters from the year 2020.
patients = gemini.patients(years=[2020])
# Join lab events onto those encounters, filtered to the "sodium" label.
# Labels are passed as a list here.
patients_labs = gemini.events(patients=patients, labels=["sodium"], category="lab")
# Execute the query, capping the result at 100 rows.
patients_labs.run(limit=100)
# After run(), the result is read from `.data`; report how many rows came back.
print(f"{len(patients_labs.data)} rows extracted!")

2022-04-27 08:50:45,411 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 08:50:45,415 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.212241 s


100 rows extracted!


## Example 4. Get all patient encounters from July and August of 2019, join with interventions, limit to 1000 rows.

In [4]:
# Build a query for patient encounters from 2019, months 7 and 8 (July, August).
patients = gemini.patients(years=[2019], months=[7, 8])
# Join events of category "intervention" onto those encounters.
patients_interventions = gemini.events(patients=patients, category="intervention")
# Execute the query, capping the result at 1000 rows.
patients_interventions.run(limit=1000)
# After run(), the result is read from `.data`; report how many rows came back.
print(f"{len(patients_interventions.data)} rows extracted!")

2022-04-27 08:50:45,942 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 08:50:45,946 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 0.509603 s


1000 rows extracted!


## Example 5. Get all patient encounters from St. Michael's Hospital from Jan 2020 to June 2020, join with vitals, filter systolic BP measurements (substring match).

In [5]:
# Build a query for patient encounters at a single hospital (the SMH constant)
# within the date window 2020-01-01 .. 2020-06-30.
patients = gemini.patients(
    hospitals=[SMH], from_date="2020-01-01", to_date="2020-06-30"
)
# Join vitals events onto those encounters, filtered on the label "systolic".
# The label is a plain string here (not a list); the example title describes
# this as a substring match.
# NOTE(review): confirm the str-vs-list semantics of `labels` in gemini.events.
patients_vitals = gemini.events(patients=patients, labels="systolic", category="vitals")
# Execute the query; no `limit` is passed, so no row cap is requested.
patients_vitals.run()
# After run(), the result is read from `.data`; report how many rows came back.
print(f"{len(patients_vitals.data)} rows extracted!")

2022-04-27 08:50:49,845 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 08:50:49,850 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 3.877923 s


44774 rows extracted!


## Example 6. Get all patient encounters (including ER data) from all hospitals, from years [2018, 2019, 2020], join with labs and vitals, and save the results (large query!!).

In [6]:
# Encounter-level query: no hospital filter, years 2018-2020, ER data included.
patients = gemini.patients(include_er_data=True, years=[2018, 2019, 2020])
# Event-level queries (labs and vitals) joined onto that same set of encounters.
patients_labs = gemini.events(category="lab", patients=patients)
patients_vitals = gemini.events(category="vitals", patients=patients)

# Execute the three queries in order, without a row limit. These are large:
# the recorded run took several minutes for the labs and vitals queries.
for query in (patients, patients_labs, patients_vitals):
    query.run()

# Report the size of each result.
print(f"{len(patients.data)} rows extracted!")
print(f"{len(patients_labs.data)} rows extracted!")
print(f"{len(patients_vitals.data)} rows extracted!")

# Persist each result under SAVE_PATH using a per-query file name.
# NOTE(review): SAVE_PATH is an absolute, machine-specific location.
SAVE_PATH = "/mnt/nfs/project/delirium/drift_exp"
for query, file_name in (
    (patients, "admin_er_allhosp_2018_2020"),
    (patients_labs, "labs_allhosp_2018_2020"),
    (patients_vitals, "vitals_allhosp_2018_2020"),
):
    query.save(SAVE_PATH, file_name)

2022-04-27 08:50:52,896 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 08:50:52,900 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 2.977458 s
2022-04-27 09:01:16,234 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 09:01:16,254 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 623.351256 s
2022-04-27 09:04:53,780 [1;37mINFO[0m cyclops.orm     - Query returned successfully!
2022-04-27 09:04:53,792 [1;37mINFO[0m cyclops.utils.profile - Finished executing function run_query in 217.532059 s
2022-04-27 09:04:53,798 [1;37mINFO[0m cyclops.query.interface - Saving queried data to /mnt/nfs/project/delirium/drift_exp/admin_er_allhosp_2018_2020.gzip


90699 rows extracted!
10684768 rows extracted!
5831063 rows extracted!


2022-04-27 09:04:54,894 [1;37mINFO[0m cyclops.query.interface - Saving queried data to /mnt/nfs/project/delirium/drift_exp/labs_allhosp_2018_2020.gzip
2022-04-27 09:05:51,502 [1;37mINFO[0m cyclops.query.interface - Saving queried data to /mnt/nfs/project/delirium/drift_exp/vitals_allhosp_2018_2020.gzip
