In [1]:
# data wrangling
import pandas as pd

# plotting
import matplotlib.pyplot as plt

# other
import time

# sklearn
from sklearn.model_selection import train_test_split

# local files
from sofascores import compute_sofa

In [2]:
# Location of the HDF5 file that holds every table loaded below
# (relative path, so it is resolved against the current working directory).
DATA_FILEPATH = "all_hourly_data.h5"


def _load_table(key):
    """Read the object stored under `key` in the HDF5 file at DATA_FILEPATH.

    Thin wrapper around `pd.read_hdf` so every table is loaded the same way.
    """
    return pd.read_hdf(DATA_FILEPATH, key)


# One frame per key in the store; the variable names mirror the key names.
patients = _load_table("patients")
vitals_labs = _load_table("vitals_labs")
vitals_labs_mean = _load_table("vitals_labs_mean")
interventions = _load_table("interventions")

In [3]:
# Print the column index of the `patients` frame, then of the `interventions` frame.
for frame in (patients, interventions):
    print(frame.columns)

Index(['gender', 'ethnicity', 'age', 'insurance', 'admittime',
       'diagnosis_at_admission', 'dischtime', 'discharge_location',
       'fullcode_first', 'dnr_first', 'fullcode', 'dnr', 'dnr_first_charttime',
       'cmo_first', 'cmo_last', 'cmo', 'deathtime', 'intime', 'outtime',
       'los_icu', 'admission_type', 'first_careunit', 'mort_icu', 'mort_hosp',
       'hospital_expire_flag', 'hospstay_seq', 'readmission_30', 'max_hours'],
      dtype='object')
Index(['vent', 'vaso', 'adenosine', 'dobutamine', 'dopamine', 'epinephrine',
       'isuprel', 'milrinone', 'norepinephrine', 'phenylephrine',
       'vasopressin', 'colloid_bolus', 'crystalloid_bolus', 'nivdurations'],
      dtype='object')


In [4]:
# Echo every column label of `vitals_labs` on its own line
# (the recorded output shows each label printing as a two-element tuple).
for label in vitals_labs.columns:
    print(label)

# A blank separator line followed by the frame's shape, emitted in one call.
print(f"\n{vitals_labs.shape}")

('alanine aminotransferase', 'count')
('alanine aminotransferase', 'mean')
('alanine aminotransferase', 'std')
('albumin', 'count')
('albumin', 'mean')
('albumin', 'std')
('albumin ascites', 'count')
('albumin ascites', 'mean')
('albumin ascites', 'std')
('albumin pleural', 'count')
('albumin pleural', 'mean')
('albumin pleural', 'std')
('albumin urine', 'count')
('albumin urine', 'mean')
('albumin urine', 'std')
('alkaline phosphate', 'count')
('alkaline phosphate', 'mean')
('alkaline phosphate', 'std')
('anion gap', 'count')
('anion gap', 'mean')
('anion gap', 'std')
('asparate aminotransferase', 'count')
('asparate aminotransferase', 'mean')
('asparate aminotransferase', 'std')
('basophils', 'count')
('basophils', 'mean')
('basophils', 'std')
('bicarbonate', 'count')
('bicarbonate', 'mean')
('bicarbonate', 'std')
('bilirubin', 'count')
('bilirubin', 'mean')
('bilirubin', 'std')
('blood urea nitrogen', 'count')
('blood urea nitrogen', 'mean')
('blood urea nitrogen', 'std')
('co2', 'c

In [5]:
# Echo every column label of `vitals_labs_mean` on its own line
# (the recorded output shows each label printing as a two-element tuple).
for label in vitals_labs_mean.columns:
    print(label)

# A blank separator line followed by the frame's shape, emitted in one call.
print(f"\n{vitals_labs_mean.shape}")

('alanine aminotransferase', 'mean')
('albumin', 'mean')
('albumin ascites', 'mean')
('albumin pleural', 'mean')
('albumin urine', 'mean')
('alkaline phosphate', 'mean')
('anion gap', 'mean')
('asparate aminotransferase', 'mean')
('basophils', 'mean')
('bicarbonate', 'mean')
('bilirubin', 'mean')
('blood urea nitrogen', 'mean')
('co2', 'mean')
('co2 (etco2, pco2, etc.)', 'mean')
('calcium', 'mean')
('calcium ionized', 'mean')
('calcium urine', 'mean')
('cardiac index', 'mean')
('cardiac output thermodilution', 'mean')
('cardiac output fick', 'mean')
('central venous pressure', 'mean')
('chloride', 'mean')
('chloride urine', 'mean')
('cholesterol', 'mean')
('cholesterol hdl', 'mean')
('cholesterol ldl', 'mean')
('creatinine', 'mean')
('creatinine ascites', 'mean')
('creatinine body fluid', 'mean')
('creatinine pleural', 'mean')
('creatinine urine', 'mean')
('diastolic blood pressure', 'mean')
('eosinophils', 'mean')
('fibrinogen', 'mean')
('fraction inspired oxygen', 'mean')
('fraction 