# DL Survival - Ventilation Outcomes
 Updated 21/11/21

In [1]:
import pandas as pd
import numpy as np
import math
import statistics
from datetime import datetime
import datetime as dt
from datetime import timedelta
import json
import miceforest as mf
from sklearn.experimental import enable_iterative_imputer
from sklearn.impute import IterativeImputer

pd.set_option('display.max_columns', None)

## 1. Data cleaning

- Import MIMIC III data
- Review column unique values, assign correct data types
- Impute missing values


### 1.1: Importing data

In [2]:
df = pd.read_csv('mimic_combined.csv')

#### 1.1.1: Column lists

In [3]:
#view and reorder columns
cols = list(df.columns)
new_cols = ['Unnamed: 0','hadm_id','subject_id','gender','ethnicity','marital_status','insurance','language','aortic','mit','tricuspid',
            'pulmonary','cabg','temp','bg_temp','hr','spo2','rr','sbp','dbp','meanbp','weight','height','cardiac_index','pt','ptt',
            'inr','inr_1','fibrinogen','hb','hematocrit','plts','wcc','lymphocytes','neutrophils','alp','ast','alt','ggt',
            'bilirubin_indirect','bilirubin_direct','bilirubin_total','chloride','magnesium','potassium','crp','bleed_time','albumin',
            'creatinine','free_calcium','sodium','bicarb','bun','hba1c','glucose','lactate','po2','pco2','baseexcess','ph','aado2',
            'fio2','ffp','insulin','cryo','prbc','infection','ventrate','tidalvol','vent_array','reintubation','liver_severe','liver_mild',
            'rheum','cvd','aids','ckd','copd','arrhythmia','pud','smoking','pvd','paraplegia','ccf','met_ca','t2dm','t1dm','malig','mi',
            'dementia','first_careunit','last_careunit','admission_location','admission_type','hospital_expire_flag','admittime',
            'dischtime','intime','outtime','ext_time','reint_time','los','icustay_seq','deathtime','plt','diab_un','diab_cc',
            'dtoutput','specimen','dod']

ptinfo=['Unnamed: 0','hadm_id','subject_id']

demographics=['gender','ethnicity','marital_status','insurance','language']

proceduretype=['aortic','mit','tricuspid','pulmonary','cabg']

vitals=['temp','bg_temp','hr','spo2','rr','sbp','dbp','meanbp','weight','height','cardiac_index']

labs=['pt','ptt','inr','inr_1','fibrinogen','hb','hematocrit','plts','wcc','lymphocytes','neutrophils','alp','ast','alt','ggt',
'bilirubin_indirect','bilirubin_direct','bilirubin_total','chloride','magnesium','potassium','crp','bleed_time',
'albumin','creatinine','free_calcium','sodium','bicarb','bun','hba1c','glucose','lactate']

bloodgases=['po2','pco2','baseexcess','ph','aado2','fio2']

products=['ffp','insulin','cryo','prbc','infection']

ventilation=['ventrate','tidalvol','vent_array','reintubation']

comorbidities=['liver_severe','liver_mild','rheum','cvd','aids','ckd','copd','arrhythmia','pud','smoking','pvd',
'paraplegia','ccf','met_ca','t2dm','t1dm','malig','mi','dementia']

adm_cat=['first_careunit','last_careunit','admission_location','admission_type','hospital_expire_flag']

adm_num=['admittime','dischtime','intime','outtime','ext_time','reint_time','los','icustay_seq','deathtime']

others=['plt','diab_un','diab_cc','dtoutput','specimen','dod']

timeseries=[*vitals,*labs,*bloodgases,*products,*ventilation,'plt','dtoutput']
timeseries = [i for i in timeseries if i not in ('weight','height','reintubation', 'infection', 'vent_array')]
    
timeseries_valuenames = {'cardiac_index':'ci',
                         'plts':'bloodproduct',
                         'ffp':'bloodproduct',
                         'insulin':'amount',
                         'cryo':'bloodproduct',
                         'prbc':'bloodproduct',
                         'dtoutput':'output'}

In [4]:
df = df[new_cols]
df.head(10)

Unnamed: 0.1,Unnamed: 0,hadm_id,subject_id,gender,ethnicity,marital_status,insurance,language,aortic,mit,tricuspid,pulmonary,cabg,temp,bg_temp,hr,spo2,rr,sbp,dbp,meanbp,weight,height,cardiac_index,pt,ptt,inr,inr_1,fibrinogen,hb,hematocrit,plts,wcc,lymphocytes,neutrophils,alp,ast,alt,ggt,bilirubin_indirect,bilirubin_direct,bilirubin_total,chloride,magnesium,potassium,crp,bleed_time,albumin,creatinine,free_calcium,sodium,bicarb,bun,hba1c,glucose,lactate,po2,pco2,baseexcess,ph,aado2,fio2,ffp,insulin,cryo,prbc,infection,ventrate,tidalvol,vent_array,reintubation,liver_severe,liver_mild,rheum,cvd,aids,ckd,copd,arrhythmia,pud,smoking,pvd,paraplegia,ccf,met_ca,t2dm,t1dm,malig,mi,dementia,first_careunit,last_careunit,admission_location,admission_type,hospital_expire_flag,admittime,dischtime,intime,outtime,ext_time,reint_time,los,icustay_seq,deathtime,plt,diab_un,diab_cc,dtoutput,specimen,dod
0,0,173798,29491,M,white,DIVORCED,Private,ENGL,1,0,0,0,0,"[{'charttime': datetime.datetime(2111, 2, 16, ...",[],"[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...",69.5,167.64,[],[],[],"[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...",[],"[{'charttime': datetime.datetime(2111, 2, 17, ...",[],[],"[{'charttime': datetime.datetime(2111, 2, 17, ...",[],[],[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2111, 2, 17, ...",[],"[{'charttime': datetime.datetime(2111, 2, 16, ...",[],[],[],"[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...",[],"[{'charttime': datetime.datetime(2111, 2, 16, ...",[],"[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...",[],[],[],[],[],[],"[{'suspected_infection_time': None, 'antibioti...",[],[],"[{'starttime': datetime.datetime(2111, 2, 16, ...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYS REFERRAL/NORMAL DELI,ELECTIVE,0,2111-02-16 07:15:00,2111-02-21 15:49:00,2111-02-16 10:20:19,2111-02-17 11:21:23,2111-02-16 13:00:00,,1.0424,1,,"[{'charttime': datetime.datetime(2111, 2, 17, ...",0,0,[],[],
1,1,197759,26775,M,white,WIDOWED,Medicare,ENGL,1,0,0,0,1,"[{'charttime': datetime.datetime(2192, 4, 20, ...",[],"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",82.0,157.48,"[{'charttime': datetime.datetime(2192, 4, 20, ...",[],"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",[],"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2192, 4, 20, ...",[],"[{'charttime': datetime.datetime(2192, 4, 20, ...",[],[],[],"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",[],"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",[],[],[],[],[],[],"[{'suspected_infection_time': None, 'antibioti...",[],[],"[{'starttime': datetime.datetime(2192, 4, 20, ...",0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYS REFERRAL/NORMAL DELI,ELECTIVE,0,2192-04-20 07:15:00,2192-04-24 13:23:00,2192-04-20 09:59:48,2192-04-21 16:50:54,2192-04-20 15:00:00,,1.2855,1,,"[{'charttime': datetime.datetime(2192, 4, 20, ...",0,0,[],[],
2,2,193167,23782,F,unknown,MARRIED,Medicare,,0,0,0,0,1,"[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 2, 8...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",66.2,162.56,"[{'charttime': datetime.datetime(2170, 1, 1, 2...",[],"[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",[],"[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",[],"[{'charttime': datetime.datetime(2170, 1, 2, 3...",[],[],"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 2, 3...",[],[],[],"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 2, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",[],[],"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",[],"[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",[],"[{'charttime': datetime.datetime(2170, 1, 2, 8...",[],[],[],[],"[{'suspected_infection_time': None, 'antibioti...",[],"[{'charttime': datetime.datetime(2170, 1, 2, 8...","[{'starttime': datetime.datetime(2170, 1, 1, 2...",0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,TRANSFER FROM HOSP/EXTRAM,EMERGENCY,0,2169-12-29 17:57:00,2170-01-11 14:00:00,2170-01-01 19:06:41,2170-01-08 10:10:13,2170-01-02 13:30:00,,6.6275,1,,"[{'charttime': datetime.datetime(2170, 1, 1, 2...",0,0,[],[],
3,3,127967,32056,F,other,DIVORCED,Private,ENGL,0,1,0,0,0,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",[],"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...",70.0,154.94,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",[],"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",[],"[{'charttime': datetime.datetime(2141, 4, 3, 1...",[],[],[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 4, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",[],[],[],"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...",[],"[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",[],[],[],[],[],[],"[{'suspected_infection_time': None, 'antibioti...",[],[],"[{'starttime': datetime.datetime(2141, 4, 3, 1...",0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,CSRU,CSRU,PHYS REFERRAL/NORMAL DELI,ELECTIVE,0,2141-04-03 07:15:00,2141-04-08 14:46:00,2141-04-03 09:54:55,2141-04-04 11:17:58,2141-04-03 19:00:00,,1.0577,1,,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",0,0,[],[],
4,4,115784,2907,F,white,MARRIED,Private,ENGL,0,0,0,0,1,"[{'charttime': datetime.datetime(2188, 1, 15, ...",[],"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",72.1,167.64,[],[],"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",[],"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",[],"[{'charttime': datetime.datetime(2188, 1, 16, ...",[],[],[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",[],[],[],"[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...",[],"[{'charttime': datetime.datetime(2188, 1, 15, ...",[],"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",[],[],[],[],[],"[{'charttime': datetime.datetime(2188, 1, 17, ...","[{'suspected_infection_time': None, 'antibioti...",[],"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'starttime': datetime.datetime(2188, 1, 15, ...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,CLINIC REFERRAL/PREMATURE,EMERGENCY,0,2188-01-14 17:13:00,2188-01-20 15:24:00,2188-01-15 11:56:32,2188-01-18 11:17:26,2188-01-15 23:30:00,,2.9728,1,,"[{'charttime': datetime.datetime(2188, 1, 15, ...",0,0,[],[],
5,5,155783,26071,M,white,MARRIED,Private,ENGL,1,0,0,0,0,"[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...",127.3,175.26,"[{'charttime': datetime.datetime(2174, 10, 21,...",[],"[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...",[],"[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 30,...","[{'charttime': datetime.datetime(2174, 10, 30,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...",[],[],[],"[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 22,...","[{'charttime': datetime.datetime(2174, 10, 21,...",[],[],"[{'charttime': datetime.datetime(2174, 10, 27,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...",[],"[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...","[{'charttime': datetime.datetime(2174, 10, 21,...",[],[],[],[],[],"[{'charttime': datetime.datetime(2174, 10, 22,...","[{'suspected_infection_time': None, 'antibioti...",[],[],"[{'starttime': datetime.datetime(2174, 10, 21,...",0,0,0,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,0,0,CSRU,CSRU,EMERGENCY ROOM ADMIT,EMERGENCY,0,2174-10-21 10:01:00,2174-11-12 15:25:00,2174-10-21 10:01:55,2174-11-01 19:20:48,2174-10-31 03:35:00,,11.3881,1,,"[{'charttime': datetime.datetime(2174, 10, 21,...",1,0,[],[],
6,6,108745,29931,M,white,MARRIED,Private,,0,0,0,0,1,"[{'charttime': datetime.datetime(2156, 6, 25, ...",[],"[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...",78.8,172.72,"[{'charttime': datetime.datetime(2156, 6, 25, ...",[],"[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...",[],"[{'charttime': datetime.datetime(2156, 6, 25, ...",[],[],[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 26, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...",[],[],[],"[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 17, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'charttime': datetime.datetime(2156, 6, 25, ...",[],[],[],[],[],[],"[{'suspected_infection_time': None, 'antibioti...",[],"[{'charttime': datetime.datetime(2156, 6, 25, ...","[{'starttime': datetime.datetime(2156, 6, 25, ...",0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYS REFERRAL/NORMAL DELI,ELECTIVE,0,2156-06-25 07:15:00,2156-06-29 13:10:00,2156-06-25 11:19:49,2156-06-26 16:25:04,2156-06-25 15:00:00,,1.212,1,,"[{'charttime': datetime.datetime(2156, 6, 25, ...",0,0,[],[],
7,7,129543,5455,M,white,MARRIED,Medicare,,0,0,0,0,1,"[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 19, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...",103.6,182.88,"[{'charttime': datetime.datetime(2178, 8, 18, ...",[],"[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...",[],"[{'charttime': datetime.datetime(2178, 8, 18, ...",[],[],[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...",[],[],[],"[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 11, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 19, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...","[{'charttime': datetime.datetime(2178, 8, 18, ...",[],[],[],[],[],[],"[{'suspected_infection_time': None, 'antibioti...",[],[],"[{'starttime': datetime.datetime(2178, 8, 18, ...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYS REFERRAL/NORMAL DELI,ELECTIVE,0,2178-08-18 07:15:00,2178-08-24 14:50:00,2178-08-18 10:15:20,2178-08-20 12:03:21,2178-08-18 18:00:00,,2.075,1,,"[{'charttime': datetime.datetime(2178, 8, 18, ...",1,0,[],[],
8,8,129900,17708,M,white,MARRIED,Medicare,,0,0,0,0,1,"[{'charttime': datetime.datetime(2199, 12, 4, ...",[],"[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...",98.18,179.07,"[{'charttime': datetime.datetime(2199, 12, 4, ...",[],"[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...",[],"[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...",[],"[{'charttime': datetime.datetime(2199, 12, 5, ...",[],[],[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2199, 12, 5, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...",[],[],[],"[{'charttime': datetime.datetime(2199, 12, 5, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 5, ...","[{'charttime': datetime.datetime(2199, 12, 5, ...","[{'charttime': datetime.datetime(2199, 9, 15, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...",[],"[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...","[{'charttime': datetime.datetime(2199, 12, 4, ...",[],[],[],[],[],[],"[{'suspected_infection_time': None, 'antibioti...",[],[],"[{'starttime': datetime.datetime(2199, 12, 4, ...",0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,CSRU,CSRU,PHYS REFERRAL/NORMAL DELI,ELECTIVE,0,2199-12-04 08:00:00,2199-12-09 18:49:00,2199-12-04 11:48:21,2199-12-05 09:51:39,2199-12-04 21:00:00,,0.919,1,,"[{'charttime': datetime.datetime(2199, 12, 4, ...",0,0,[],[],
9,9,179048,30553,F,black,SINGLE,Private,ENGL,1,0,0,0,0,"[{'charttime': datetime.datetime(2193, 7, 23, ...",[],"[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...",67.4,157.48,"[{'charttime': datetime.datetime(2193, 7, 23, ...",[],"[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...",[],"[{'charttime': datetime.datetime(2193, 7, 23, ...",[],[],"[{'charttime': datetime.datetime(2193, 7, 23, ...",[],[],[],[],[],[],[],[],[],"[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 24, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...",[],[],[],"[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 1, 1...","[{'charttime': datetime.datetime(2193, 7, 23, ...",[],"[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'charttime': datetime.datetime(2193, 7, 23, ...",[],[],[],[],[],"[{'charttime': datetime.datetime(2193, 7, 23, ...","[{'suspected_infection_time': None, 'antibioti...",[],[],"[{'starttime': datetime.datetime(2193, 7, 23, ...",0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYS REFERRAL/NORMAL DELI,ELECTIVE,0,2193-07-23 11:00:00,2193-07-29 16:30:00,2193-07-23 10:19:06,2193-07-24 12:07:15,2193-07-23 19:00:00,,1.0751,1,,"[{'charttime': datetime.datetime(2193, 7, 23, ...",1,0,[],[],


### 1.2: Cleaning data types

#### 1.2.0: NaN assignment

In [5]:
df = df.replace('NaT',np.datetime64('NaT'))
df = df.replace(['[]','NaN',np.datetime64('NaT')],np.NaN)

#### 1.2.1: Datetime columns

In [6]:
# set column types as datetime
time_cols = ['admittime','dischtime','intime','outtime','reint_time','ext_time','deathtime']
for col in time_cols:
    df[col] = pd.to_datetime(df[col], format='%Y-%m-%d %H:%M:%S')

#dod
df['dod'] = pd.to_datetime(df['dod'], format='%Y-%m-%d')

In [7]:
## CHECK FOR ROWS WHERE DEATHTIME < INTIME OR ADMITTIME

In [8]:
df[time_cols].dtypes

admittime     datetime64[ns]
dischtime     datetime64[ns]
intime        datetime64[ns]
outtime       datetime64[ns]
reint_time    datetime64[ns]
ext_time      datetime64[ns]
deathtime     datetime64[ns]
dtype: object

#### 1.2.2: Demographics

In [9]:
for x in demographics:
    print(x,': ',df[x].unique())

gender :  ['M' 'F']
ethnicity :  ['white' 'unknown' 'other' 'black' 'asian' 'hispanic' 'native' 'WHITE'
 'OTHER' 'UNKNOWN' 'UNABLE TO OBTAIN' 'ASIAN' 'HISPANIC/LATINO'
 'BLACK/AFRICAN AMERICAN' 'AMERICAN INDIAN/ALASKA NATIVE']
marital_status :  ['DIVORCED' 'WIDOWED' 'MARRIED' 'SINGLE' nan 'UNKNOWN (DEFAULT)'
 'SEPARATED']
insurance :  ['Private' 'Medicare' 'Medicaid' 'Government' 'Self Pay' 'Other']
language :  ['ENGL' nan 'CAPE' 'RUSS' 'MAND' 'PORT' 'CAMB' 'SPAN' 'PTUN' 'CANT' 'ITAL'
 'POLI' 'PERS' 'VIET' '*GUJ' 'URDU' '*BEN' 'KORE' 'ALBA' '*LEB' 'AMER'
 'GREE' 'HAIT' 'THAI' 'HIND' 'TURK' 'GERM' 'ARAB' 'ETHI' 'ENGLISH' '?']


In [10]:
#ethnicity
df.replace({'ethnicity':
                {'unknown': np.NaN,'UNKNOWN':np.NaN,'UNABLE TO OBTAIN':np.NaN,
                'OTHER':'other','WHITE':'white','BLACK/AFRICAN AMERICAN':'black','ASIAN':'asian',
                'HISPANIC/LATINO':'hispanic','AMERICAN INDIAN/ALASKA NATIVE':'native'
                }
            }, 
            inplace=True)
print(df['ethnicity'].unique())

['white' nan 'other' 'black' 'asian' 'hispanic' 'native']


In [11]:
#marital_status
df.replace({'marital_status':
                {'UNKNOWN (DEFAULT)': np.NaN
                }
            }, 
            inplace=True)
print(df['marital_status'].unique())

['DIVORCED' 'WIDOWED' 'MARRIED' 'SINGLE' nan 'SEPARATED']


In [12]:
#language
df.replace({'language':
                {'ENGLISH':'ENGL','?':np.NaN
                }
            }, 
            inplace=True)
print(df['marital_status'].unique())

['DIVORCED' 'WIDOWED' 'MARRIED' 'SINGLE' nan 'SEPARATED']


#### 1.2.3: ✔Procedure type

In [13]:
for x in proceduretype:
    print(x,': ',df[x].unique())

aortic :  [1 0]
mit :  [0 1]
tricuspid :  [0 1]
pulmonary :  [0 1]
cabg :  [0 1]


#### 1.2.4: **Vitals / Blood Gases / Products + infection / Ventilation


In [14]:
# wait for Jahan/others
# ventrate seems to be empty

#### 1.2.5: ✔Comorbidities

In [15]:
for x in comorbidities:
    print(x,': ',df[x].unique())

liver_severe :  [0 1]
liver_mild :  [0 1]
rheum :  [0 1]
cvd :  [0 1]
aids :  [0 1]
ckd :  [0 1]
copd :  [0 1]
arrhythmia :  [0 1]
pud :  [0 1]
smoking :  [0 1]
pvd :  [0 1]
paraplegia :  [0 1]
ccf :  [0 1]
met_ca :  [0 1]
t2dm :  [0 1]
t1dm :  [0 1]
malig :  [0 1]
mi :  [0 1]
dementia :  [0 1]


#### 1.2.6: Admissions (categorical)

In [16]:
for x in adm_cat:
    print(x,': ',df[x].unique())

first_careunit :  ['CSRU' 'CCU' 'SICU' 'MICU' 'TSICU'
 'Cardiac Vascular Intensive Care Unit (CVICU)' 'Coronary Care Unit (CCU)'
 'Medical Intensive Care Unit (MICU)'
 'Medical/Surgical Intensive Care Unit (MICU/SICU)' 'Trauma SICU (TSICU)'
 'Surgical Intensive Care Unit (SICU)'
 'Neuro Surgical Intensive Care Unit (Neuro SICU)' 'Neuro Intermediate']
last_careunit :  ['CSRU' 'TSICU' 'CCU' 'MICU' 'SICU'
 'Cardiac Vascular Intensive Care Unit (CVICU)' 'Coronary Care Unit (CCU)'
 'Medical Intensive Care Unit (MICU)'
 'Medical/Surgical Intensive Care Unit (MICU/SICU)' 'Trauma SICU (TSICU)'
 'Surgical Intensive Care Unit (SICU)'
 'Neuro Surgical Intensive Care Unit (Neuro SICU)']
admission_location :  ['PHYS REFERRAL/NORMAL DELI' 'TRANSFER FROM HOSP/EXTRAM'
 'CLINIC REFERRAL/PREMATURE' 'EMERGENCY ROOM ADMIT'
 'TRANSFER FROM OTHER HEALT' 'TRANSFER FROM SKILLED NUR'
 'PHYSICIAN REFERRAL' 'TRANSFER FROM HOSPITAL' 'EMERGENCY ROOM'
 'PROCEDURE SITE' 'WALK-IN/SELF REFERRAL' 'PACU'
 'INFORMATION N

In [17]:
#first_careunit
df.replace({'first_careunit':
                {'Cardiac Vascular Intensive Care Unit (CVICU)':'CVICU',
                'Coronary Care Unit (CCU)':'CCU',
                'Medical Intensive Care Unit (MICU)':'MICU',
                'Surgical Intensive Care Unit (SICU)':'SICU',
                'Neuro Intermediate':'Neuro Inter',
                'Medical/Surgical Intensive Care Unit (MICU/SICU)':'MICU/SICU',
                'Trauma SICU (TSICU)':'TSICU',
                'Neuro Surgical Intensive Care Unit (Neuro SICU)':'Neuro SICU'
                }
            }, 
            inplace=True)
print(df['first_careunit'].unique())

['CSRU' 'CCU' 'SICU' 'MICU' 'TSICU' 'CVICU' 'MICU/SICU' 'Neuro SICU'
 'Neuro Inter']


In [18]:
#last_careunit
df.replace({'last_careunit':
                {'Cardiac Vascular Intensive Care Unit (CVICU)':'CVICU',
                'Coronary Care Unit (CCU)':'CCU',
                'Medical Intensive Care Unit (MICU)':'MICU',
                'Surgical Intensive Care Unit (SICU)':'SICU',
                'Neuro Intermediate':'Neuro Inter',
                'Medical/Surgical Intensive Care Unit (MICU/SICU)':'MICU/SICU',
                'Trauma SICU (TSICU)':'TSICU',
                'Neuro Surgical Intensive Care Unit (Neuro SICU)':'Neuro SICU'
                }
            }, 
            inplace=True)
print(df['last_careunit'].unique())

['CSRU' 'TSICU' 'CCU' 'MICU' 'SICU' 'CVICU' 'MICU/SICU' 'Neuro SICU']


In [19]:
#admission_location
df.replace({'admission_location':
                {'TRANSFER FROM HOSP/EXTRAM':'TRANSFER FROM HOSPITAL',
                'PHYS REFERRAL/NORMAL DELI':'PHYSICIAN REFERRAL',
                'TRANSFER FROM SKILLED NUR':'TRANSFER FROM SKILLED NURSING FACILITY',
                'INFORMATION NOT AVAILABLE':np.NaN,
                'CLINIC REFERRAL':'CLINIC REFERRAL/PREMATURE',
                'EMERGENCY ROOM ADMIT':'EMERGENCY ROOM',
                }
            }, 
            inplace=True)
print(df['admission_location'].unique())

['PHYSICIAN REFERRAL' 'TRANSFER FROM HOSPITAL' 'CLINIC REFERRAL/PREMATURE'
 'EMERGENCY ROOM' 'TRANSFER FROM OTHER HEALT'
 'TRANSFER FROM SKILLED NURSING FACILITY' 'PROCEDURE SITE'
 'WALK-IN/SELF REFERRAL' 'PACU' nan 'AMBULATORY SURGERY TRANSFER'
 'INTERNAL TRANSFER TO OR FROM PSYCH']


#### 1.2.7: Others

In [20]:
# for x in others:
#     print(x,': ',df[x].unique())

### 1.3: Parsing time series data

In [21]:
df['vent_array'][14]

"[{'starttime': datetime.datetime(2138, 7, 25, 18, 0), 'endtime': datetime.datetime(2138, 7, 28, 6, 0), 'duration_hours': 60.0}\n {'starttime': datetime.datetime(2138, 7, 29, 12, 0), 'endtime': datetime.datetime(2138, 8, 5, 11, 30), 'duration_hours': 167.5}]"

In [22]:
def va_parser(row, output=6):
    """
    Takes row from `df` returns a list of starttime, endtime, vent duration 
    for first and (if applicable) second intubations

    Parameters
    ----------
    row : row in df
    output_ : select which output you want (use list index below) - e.g. args=[6] for all output when using df.apply()

    Returns
    -------
    single list variable containing  
        [0] int_time1: first intubation starttime
        [1] ext_time1: first intubation endtime
        [2] duration1: first intubation duration
        [3] int_time2: second intubation starttime
        [4] ext_time2: second intubation endtime 
        [5] duration2: second intubation duration
        [6] all

    """
    int_time1=np.NaN
    ext_time1=np.NaN
    duration1=np.NaN
    int_time2=np.NaN
    ext_time2=np.NaN
    duration2=np.NaN
    value = row['vent_array']
    list=[]
    '''a = value
    print(value)'''
    if value == np.NaN or pd.isna(value):
        return np.NaN
    a = value.replace("'",'"')
    a = a.replace('\n ...\n',',').replace('\n', ',').replace('...', '')
    a = a.replace('datetime.','"dt.')
    a = a.replace('),', ')",')
    a = json.loads(a)
    b = [(i['starttime'], i['endtime'], i['duration_hours']) for i in a]
    int_time1=dt.datetime.strptime(b[0][0],'dt.datetime(%Y, %m, %d, %H, %M)')
    ext_time1=dt.datetime.strptime(b[0][1],'dt.datetime(%Y, %m, %d, %H, %M)')
    duration1=b[0][2]
    
    if output==0:
        return int_time1
    if output==1:
        return ext_time1
    if output==2:
        return duration1

    if len(b)>=2:
        int_time2=dt.datetime.strptime(b[1][0],'dt.datetime(%Y, %m, %d, %H, %M)')
        ext_time2=dt.datetime.strptime(b[1][1],'dt.datetime(%Y, %m, %d, %H, %M)')
        duration2=b[1][2]
    if output==3:
        return int_time2
    if output==4:
        return ext_time2
    if output==5:
        return duration2
    if output==6:
        return int_time1, ext_time1, duration1, int_time2, ext_time2, duration2

In [23]:
df['int_time1']=df.apply(va_parser, args=[0], axis=1)
df['ext_time1']=df.apply(va_parser, args=[1], axis=1)
df['duration1']=df.apply(va_parser, args=[2], axis=1)
df['int_time2']=df.apply(va_parser, args=[3], axis=1)
df['ext_time2']=df.apply(va_parser, args=[4], axis=1)
df['duration2']=df.apply(va_parser, args=[5], axis=1)
df.head()

Unnamed: 0.1,Unnamed: 0,hadm_id,subject_id,gender,ethnicity,marital_status,insurance,language,aortic,mit,tricuspid,pulmonary,cabg,temp,bg_temp,hr,spo2,rr,sbp,dbp,meanbp,weight,height,cardiac_index,pt,ptt,inr,inr_1,fibrinogen,hb,hematocrit,plts,wcc,lymphocytes,neutrophils,alp,ast,alt,ggt,bilirubin_indirect,bilirubin_direct,bilirubin_total,chloride,magnesium,potassium,crp,bleed_time,albumin,creatinine,free_calcium,sodium,bicarb,bun,hba1c,glucose,lactate,po2,pco2,baseexcess,ph,aado2,fio2,ffp,insulin,cryo,prbc,infection,ventrate,tidalvol,vent_array,reintubation,liver_severe,liver_mild,rheum,cvd,aids,ckd,copd,arrhythmia,pud,smoking,pvd,paraplegia,ccf,met_ca,t2dm,t1dm,malig,mi,dementia,first_careunit,last_careunit,admission_location,admission_type,hospital_expire_flag,admittime,dischtime,intime,outtime,ext_time,reint_time,los,icustay_seq,deathtime,plt,diab_un,diab_cc,dtoutput,specimen,dod,int_time1,ext_time1,duration1,int_time2,ext_time2,duration2
0,0,173798,29491,M,white,DIVORCED,Private,ENGL,1,0,0,0,0,"[{'charttime': datetime.datetime(2111, 2, 16, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...",69.5,167.64,,,,"[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...",,"[{'charttime': datetime.datetime(2111, 2, 17, ...",,,"[{'charttime': datetime.datetime(2111, 2, 17, ...",,,,,,,,,,"[{'charttime': datetime.datetime(2111, 2, 17, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...",,,,"[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...",,,,,,,"[{'suspected_infection_time': None, 'antibioti...",,,"[{'starttime': datetime.datetime(2111, 2, 16, ...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,2111-02-16 07:15:00,2111-02-21 15:49:00,2111-02-16 10:20:19,2111-02-17 11:21:23,2111-02-16 13:00:00,NaT,1.0424,1,NaT,"[{'charttime': datetime.datetime(2111, 2, 17, ...",0,0,,,NaT,2111-02-16 10:00:00,2111-02-16 13:00:00,3.0,NaT,NaT,
1,1,197759,26775,M,white,WIDOWED,Medicare,ENGL,1,0,0,0,1,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",82.0,157.48,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,,,,,,,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,,,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,,,,,,"[{'suspected_infection_time': None, 'antibioti...",,,"[{'starttime': datetime.datetime(2192, 4, 20, ...",0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,2192-04-20 07:15:00,2192-04-24 13:23:00,2192-04-20 09:59:48,2192-04-21 16:50:54,2192-04-20 15:00:00,NaT,1.2855,1,NaT,"[{'charttime': datetime.datetime(2192, 4, 20, ...",0,0,,,NaT,2192-04-20 12:00:00,2192-04-20 15:00:00,3.0,NaT,NaT,
2,2,193167,23782,F,,MARRIED,Medicare,,0,0,0,0,1,"[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 2, 8...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",66.2,162.56,"[{'charttime': datetime.datetime(2170, 1, 1, 2...",,"[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",,"[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",,"[{'charttime': datetime.datetime(2170, 1, 2, 3...",,,"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 2, 3...",,,,"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 2, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",,,"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",,"[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",,"[{'charttime': datetime.datetime(2170, 1, 2, 8...",,,,,"[{'suspected_infection_time': None, 'antibioti...",,"[{'charttime': datetime.datetime(2170, 1, 2, 8...","[{'starttime': datetime.datetime(2170, 1, 1, 2...",0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,TRANSFER FROM HOSPITAL,EMERGENCY,0,2169-12-29 17:57:00,2170-01-11 14:00:00,2170-01-01 19:06:41,2170-01-08 10:10:13,2170-01-02 13:30:00,NaT,6.6275,1,NaT,"[{'charttime': datetime.datetime(2170, 1, 1, 2...",0,0,,,NaT,2170-01-01 20:00:00,2170-01-02 13:30:00,17.5,NaT,NaT,
3,3,127967,32056,F,other,DIVORCED,Private,ENGL,0,1,0,0,0,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...",70.0,154.94,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",,,,,,,,,,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 4, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",,,,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...",,"[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",,,,,,,"[{'suspected_infection_time': None, 'antibioti...",,,"[{'starttime': datetime.datetime(2141, 4, 3, 1...",0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,2141-04-03 07:15:00,2141-04-08 14:46:00,2141-04-03 09:54:55,2141-04-04 11:17:58,2141-04-03 19:00:00,NaT,1.0577,1,NaT,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",0,0,,,NaT,2141-04-03 12:00:00,2141-04-03 19:00:00,7.0,NaT,NaT,
4,4,115784,2907,F,white,MARRIED,Private,ENGL,0,0,0,0,1,"[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",72.1,167.64,,,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 16, ...",,,,,,,,,,"[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,,,"[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,,,,,"[{'charttime': datetime.datetime(2188, 1, 17, ...","[{'suspected_infection_time': None, 'antibioti...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'starttime': datetime.datetime(2188, 1, 15, ...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,CLINIC REFERRAL/PREMATURE,EMERGENCY,0,2188-01-14 17:13:00,2188-01-20 15:24:00,2188-01-15 11:56:32,2188-01-18 11:17:26,2188-01-15 23:30:00,NaT,2.9728,1,NaT,"[{'charttime': datetime.datetime(2188, 1, 15, ...",0,0,,,NaT,2188-01-15 18:00:00,2188-01-15 23:30:00,5.5,NaT,NaT,


In [24]:
def inf_parser(value, timeLimits=None):
    if value == np.NaN or pd.isna(value):
        return 0
    a = value.replace("'", '"')
    a = a.replace('\n ...\n',',').replace('\n', ',').replace('...', '')
    a = a.replace('datetime.', '"dt.')
    a = a.replace('": None', '": "None"')
    for valuename in ['antibiotic','antibiotic_time']:
        a = a.replace(f'), "{valuename}"', f')", "{valuename}"')
    a = json.loads(a)
    b = [(eval(i['suspected_infection_time']), eval(i['antibiotic_time']), i['antibiotic'], i['specimen'], 
               i['positiveculture']) for i in a]
    sus = [i[0] for i in b]
    abx = [i[1] for i in b]
    pos = [i[4] for i in b]
    inf_ = 0
    for i in range(len(sus)):
        if sus[i]==None:
            sus[i]=dt.datetime(1000, 1, 1, 0, 0)
        if abx[i]==None:
            abx[i]=dt.datetime(1000, 1, 1, 0, 0)
        if ((sus[i]>= timeLimits[0] and sus[i]<=timeLimits[1]) or (abx[i]>= timeLimits[0] and abx[i]<=timeLimits[1])) and pos[i] == 1.0:
            temp = 1
            break
        else:
            continue
    return inf_

In [25]:
def ts_parser(value, timeDelta=None, timeLimits=None, valuename='value'):
    # timeDelta is timedelta in hours from earliest entry
    # timeLimits = (startTime, endTime)
    # if both timeDelta and timeLimits are provided, timeDelta overrules.
    # if both are None, then all timepoints are accepted
    if value == np.NaN or pd.isna(value):
        return np.NaN, np.NaN, np.NaN
    a = value.replace("'", '"')
    a = a.replace('\n ...\n',',').replace('\n', ',').replace('...', '')
    a = a.replace('datetime.', '"dt.')
    a = a.replace(f'), "{valuename}"', f')", "{valuename}"')
    a = a.replace('"unit": None', '"unit": "None"')
    a = a.replace('starttime', 'charttime')
    a = json.loads(a)
    b = [(eval(i['charttime']), i[valuename]) for i in a]
    
    if timeDelta:
        startTime = min(b, key=lambda x:x[0])[0]
        inc_b = [i[1] for i in b if i[0] <= startTime + dt.timedelta(hours=timeDelta)]
    else:
        if timeLimits:
            inc_b = [i[1] for i in b if i[0] >= timeLimits[0] and i[0] <= timeLimits[1]]
        else:
            inc_b = [i[1] for i in b]
    if len(inc_b) == 0:
        return np.NaN, np.NaN, np.NaN
    
    return sum(inc_b) / len(inc_b), max(inc_b), min(inc_b)

In [26]:
# delete all rows where int_time1 OR ext_time1 are missing
df = df[~(pd.isnull(df['int_time1']) | pd.isnull(df['ext_time1']))]
df = df.reset_index()
df = df.drop(axis=1, columns=['index', 'Unnamed: 0'], inplace=False)
df

Unnamed: 0,hadm_id,subject_id,gender,ethnicity,marital_status,insurance,language,aortic,mit,tricuspid,pulmonary,cabg,temp,bg_temp,hr,spo2,rr,sbp,dbp,meanbp,weight,height,cardiac_index,pt,ptt,inr,inr_1,fibrinogen,hb,hematocrit,plts,wcc,lymphocytes,neutrophils,alp,ast,alt,ggt,bilirubin_indirect,bilirubin_direct,bilirubin_total,chloride,magnesium,potassium,crp,bleed_time,albumin,creatinine,free_calcium,sodium,bicarb,bun,hba1c,glucose,lactate,po2,pco2,baseexcess,ph,aado2,fio2,ffp,insulin,cryo,prbc,infection,ventrate,tidalvol,vent_array,reintubation,liver_severe,liver_mild,rheum,cvd,aids,ckd,copd,arrhythmia,pud,smoking,pvd,paraplegia,ccf,met_ca,t2dm,t1dm,malig,mi,dementia,first_careunit,last_careunit,admission_location,admission_type,hospital_expire_flag,admittime,dischtime,intime,outtime,ext_time,reint_time,los,icustay_seq,deathtime,plt,diab_un,diab_cc,dtoutput,specimen,dod,int_time1,ext_time1,duration1,int_time2,ext_time2,duration2
0,173798,29491,M,white,DIVORCED,Private,ENGL,1,0,0,0,0,"[{'charttime': datetime.datetime(2111, 2, 16, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...",69.50,167.64,,,,"[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...",,"[{'charttime': datetime.datetime(2111, 2, 17, ...",,,"[{'charttime': datetime.datetime(2111, 2, 17, ...",,,,,,,,,,"[{'charttime': datetime.datetime(2111, 2, 17, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...",,,,"[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...","[{'charttime': datetime.datetime(2111, 2, 17, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...",,"[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...","[{'charttime': datetime.datetime(2111, 2, 16, ...",,,,,,,"[{'suspected_infection_time': None, 'antibioti...",,,"[{'starttime': datetime.datetime(2111, 2, 16, ...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,2111-02-16 07:15:00,2111-02-21 15:49:00,2111-02-16 10:20:19,2111-02-17 11:21:23,2111-02-16 13:00:00,NaT,1.042400,1,NaT,"[{'charttime': datetime.datetime(2111, 2, 17, ...",0,0,,,NaT,2111-02-16 10:00:00,2111-02-16 13:00:00,3.0,NaT,NaT,
1,197759,26775,M,white,WIDOWED,Medicare,ENGL,1,0,0,0,1,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",82.00,157.48,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,,,,,,,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...",,,,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,"[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...","[{'charttime': datetime.datetime(2192, 4, 20, ...",,,,,,,"[{'suspected_infection_time': None, 'antibioti...",,,"[{'starttime': datetime.datetime(2192, 4, 20, ...",0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,2192-04-20 07:15:00,2192-04-24 13:23:00,2192-04-20 09:59:48,2192-04-21 16:50:54,2192-04-20 15:00:00,NaT,1.285500,1,NaT,"[{'charttime': datetime.datetime(2192, 4, 20, ...",0,0,,,NaT,2192-04-20 12:00:00,2192-04-20 15:00:00,3.0,NaT,NaT,
2,193167,23782,F,,MARRIED,Medicare,,0,0,0,0,1,"[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 2, 8...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",66.20,162.56,"[{'charttime': datetime.datetime(2170, 1, 1, 2...",,"[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",,"[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",,"[{'charttime': datetime.datetime(2170, 1, 2, 3...",,,"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 2, 3...",,,,"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 2, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",,,"[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 2, 3...","[{'charttime': datetime.datetime(2170, 1, 1, 2...",,"[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 2...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...","[{'charttime': datetime.datetime(2170, 1, 1, 1...",,"[{'charttime': datetime.datetime(2170, 1, 2, 8...",,,,,"[{'suspected_infection_time': None, 'antibioti...",,"[{'charttime': datetime.datetime(2170, 1, 2, 8...","[{'starttime': datetime.datetime(2170, 1, 1, 2...",0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,TRANSFER FROM HOSPITAL,EMERGENCY,0,2169-12-29 17:57:00,2170-01-11 14:00:00,2170-01-01 19:06:41,2170-01-08 10:10:13,2170-01-02 13:30:00,NaT,6.627500,1,NaT,"[{'charttime': datetime.datetime(2170, 1, 1, 2...",0,0,,,NaT,2170-01-01 20:00:00,2170-01-02 13:30:00,17.5,NaT,NaT,
3,127967,32056,F,other,DIVORCED,Private,ENGL,0,1,0,0,0,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...",70.00,154.94,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",,,,,,,,,,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 4, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",,,,"[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 1...",,"[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 1...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...","[{'charttime': datetime.datetime(2141, 4, 3, 9...",,,,,,,"[{'suspected_infection_time': None, 'antibioti...",,,"[{'starttime': datetime.datetime(2141, 4, 3, 1...",0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,2141-04-03 07:15:00,2141-04-08 14:46:00,2141-04-03 09:54:55,2141-04-04 11:17:58,2141-04-03 19:00:00,NaT,1.057700,1,NaT,"[{'charttime': datetime.datetime(2141, 4, 3, 1...",0,0,,,NaT,2141-04-03 12:00:00,2141-04-03 19:00:00,7.0,NaT,NaT,
4,115784,2907,F,white,MARRIED,Private,ENGL,0,0,0,0,1,"[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",72.10,167.64,,,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 16, ...",,,,,,,,,,"[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,,,"[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...","[{'charttime': datetime.datetime(2188, 1, 16, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'charttime': datetime.datetime(2188, 1, 15, ...",,,,,,"[{'charttime': datetime.datetime(2188, 1, 17, ...","[{'suspected_infection_time': None, 'antibioti...",,"[{'charttime': datetime.datetime(2188, 1, 15, ...","[{'starttime': datetime.datetime(2188, 1, 15, ...",0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,CLINIC REFERRAL/PREMATURE,EMERGENCY,0,2188-01-14 17:13:00,2188-01-20 15:24:00,2188-01-15 11:56:32,2188-01-18 11:17:26,2188-01-15 23:30:00,NaT,2.972800,1,NaT,"[{'charttime': datetime.datetime(2188, 1, 15, ...",0,0,,,NaT,2188-01-15 18:00:00,2188-01-15 23:30:00,5.5,NaT,NaT,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9469,22392962,18862411,M,white,SINGLE,Medicare,ENGL,0,1,0,0,1,"[{'charttime': datetime.datetime(2138, 2, 20, ...",,"[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...",80.60,170.00,,"[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...",,"[{'charttime': datetime.datetime(2138, 2, 19, ...",,,"[{'charttime': datetime.datetime(2138, 2, 19, ...",,,,,,,,,,"[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 21, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...",,,,"[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 18, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...",,"[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...","[{'charttime': datetime.datetime(2138, 2, 19, ...",,,,"[{'charttime': datetime.datetime(2138, 2, 19, ...",,,[{'suspected_infection_time': datetime.datetim...,,,"[{'starttime': datetime.datetime(2138, 2, 19, ...",0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,CVICU,CVICU,PHYSICIAN REFERRAL,ELECTIVE,0,2138-02-18 14:00:00,2138-02-26 15:00:00,2138-02-19 13:09:54,2138-02-22 17:25:25,2138-02-19 16:00:00,NaT,3.177442,1,NaT,"[{'charttime': datetime.datetime(2138, 2, 19, ...",0,0,,,NaT,2138-02-19 13:09:00,2138-02-19 16:00:00,3.0,NaT,NaT,
9470,22890957,17196174,F,white,MARRIED,Other,ENGL,1,0,0,0,1,"[{'charttime': datetime.datetime(2195, 4, 15, ...",,"[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...",67.60,163.00,,"[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...",,"[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...",,,,,,,,"[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 16, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...",,,,"[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 14, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...","[{'charttime': datetime.datetime(2195, 4, 15, ...",,,,"[{'charttime': datetime.datetime(2195, 4, 15, ...",,,[{'suspected_infection_time': datetime.datetim...,,,"[{'starttime': datetime.datetime(2195, 4, 15, ...",0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,CVICU,CVICU,PHYSICIAN REFERRAL,ELECTIVE,0,2195-04-14 10:30:00,2195-04-20 14:38:00,2195-04-15 08:49:09,2195-04-18 22:25:35,2195-04-15 22:00:00,NaT,3.566968,1,NaT,"[{'charttime': datetime.datetime(2195, 4, 15, ...",0,1,,,NaT,2195-04-15 12:00:00,2195-04-15 22:00:00,10.0,NaT,NaT,
9471,23679187,18771362,M,white,SINGLE,Other,ENGL,0,0,0,0,1,"[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...",75.95,169.00,,"[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...",,"[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 18, ...","[{'charttime': datetime.datetime(2132, 2, 18, ...","[{'charttime': datetime.datetime(2132, 2, 18, ...",,,,"[{'charttime': datetime.datetime(2132, 2, 18, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 18, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...",,,,"[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 6, 2...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...","[{'charttime': datetime.datetime(2132, 2, 17, ...",,,,"[{'charttime': datetime.datetime(2132, 2, 17, ...",,,[{'suspected_infection_time': datetime.datetim...,,,"[{'starttime': datetime.datetime(2132, 2, 17, ...",0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CVICU,CVICU,TRANSFER FROM HOSPITAL,URGENT,0,2132-02-06 18:53:00,2132-02-21 16:06:00,2132-02-17 14:27:20,2132-02-20 18:08:08,2132-02-18 00:00:00,NaT,3.153333,1,NaT,"[{'charttime': datetime.datetime(2132, 2, 17, ...",0,0,,,NaT,2132-02-17 16:21:00,2132-02-18 00:00:00,8.0,NaT,NaT,
9472,29365550,19243474,M,white,DIVORCED,Medicare,ENGL,1,0,0,0,1,"[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 30, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...",84.30,178.00,,"[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...",,"[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 2, 2, 1...","[{'charttime': datetime.datetime(2118, 2, 2, 1...","[{'charttime': datetime.datetime(2118, 2, 2, 1...",,,,"[{'charttime': datetime.datetime(2118, 2, 2, 1...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 30, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...",,,,"[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2116, 9, 14, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'charttime': datetime.datetime(2118, 1, 29, ...",,"[{'charttime': datetime.datetime(2118, 1, 29, ...",,"[{'charttime': datetime.datetime(2118, 1, 29, ...",,"[{'starttime': datetime.datetime(2118, 1, 29, ...",[{'suspected_infection_time': datetime.datetim...,,"[{'charttime': datetime.datetime(2118, 1, 29, ...","[{'starttime': datetime.datetime(2118, 1, 29, ...",0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,CVICU,CVICU,TRANSFER FROM HOSPITAL,URGENT,0,2118-01-22 14:17:00,2118-02-11 14:55:00,2118-01-29 10:12:54,2118-02-02 16:37:09,2118-01-30 00:00:00,NaT,4.266840,1,NaT,"[{'charttime': datetime.datetime(2118, 1, 29, ...",0,0,,,2119-11-25,2118-01-29 12:00:00,2118-01-30 00:00:00,12.0,NaT,NaT,


### 1.4: Handling missing data

#### 1.4.0 Assessing for missing data

In [27]:
# check % missing values
def missing_values_table(df): 
    mis_val = df.isnull().sum()
    mis_val_percent = 100 * df.isnull().sum() / len(df)
    mis_val_table = pd.concat([mis_val, mis_val_percent], axis=1)
    mis_val_table_ren_columns = mis_val_table.rename(columns = {0: 'Missing Values', 1: '% Missing Values'})
    return mis_val_table_ren_columns

missing_data = missing_values_table(df)

In [28]:
#set limit and get list of variables missing above limit in `missing_cols`
# missing_limit = 50 #allen
missing_limit = 80 #marcel
missing_cols = missing_data.loc[missing_data['% Missing Values']>missing_limit].index.tolist()
print(missing_cols)
missing_data = missing_data.loc[missing_data['% Missing Values']>missing_limit]
missing_data = missing_data.sort_values(by=['% Missing Values'])
pd.set_option('display.max_rows', None)
missing_data

['plts', 'ggt', 'bilirubin_indirect', 'bilirubin_direct', 'crp', 'bleed_time', 'albumin', 'aado2', 'ffp', 'cryo', 'ventrate', 'reint_time', 'deathtime', 'dtoutput', 'specimen', 'dod', 'int_time2', 'ext_time2', 'duration2']


Unnamed: 0,Missing Values,% Missing Values
plts,7785,82.172261
albumin,7879,83.16445
ffp,7928,83.681655
aado2,8018,84.631623
dod,8059,85.064387
cryo,8567,90.42643
ext_time2,8845,93.360777
reint_time,8845,93.360777
int_time2,8845,93.360777
duration2,8845,93.360777


In [29]:
pd.reset_option('display.max_rows')

In [30]:
#df = df.drop(axis=1, columns=list(missing_data.index), inplace=False) #allen
df = df.drop(axis=1, columns=[i for i in list(missing_data.index) if i not in ['duration2','int_time2','ext_time2','aado2','fio2']], inplace=False) #marcel
print(list(df.columns))

['hadm_id', 'subject_id', 'gender', 'ethnicity', 'marital_status', 'insurance', 'language', 'aortic', 'mit', 'tricuspid', 'pulmonary', 'cabg', 'temp', 'bg_temp', 'hr', 'spo2', 'rr', 'sbp', 'dbp', 'meanbp', 'weight', 'height', 'cardiac_index', 'pt', 'ptt', 'inr', 'inr_1', 'fibrinogen', 'hb', 'hematocrit', 'wcc', 'lymphocytes', 'neutrophils', 'alp', 'ast', 'alt', 'bilirubin_total', 'chloride', 'magnesium', 'potassium', 'creatinine', 'free_calcium', 'sodium', 'bicarb', 'bun', 'hba1c', 'glucose', 'lactate', 'po2', 'pco2', 'baseexcess', 'ph', 'aado2', 'fio2', 'insulin', 'prbc', 'infection', 'tidalvol', 'vent_array', 'reintubation', 'liver_severe', 'liver_mild', 'rheum', 'cvd', 'aids', 'ckd', 'copd', 'arrhythmia', 'pud', 'smoking', 'pvd', 'paraplegia', 'ccf', 'met_ca', 't2dm', 't1dm', 'malig', 'mi', 'dementia', 'first_careunit', 'last_careunit', 'admission_location', 'admission_type', 'hospital_expire_flag', 'admittime', 'dischtime', 'intime', 'outtime', 'ext_time', 'los', 'icustay_seq', 'pl

#### 1.4.1 Beginning imputation

In [31]:
dfForImpute = pd.DataFrame([0 for i in range(df.shape[0])])

# generating timeseries summary values
for column in timeseries:
    if column not in df.columns:
        continue
    x = timeseries_valuenames[column] if column in timeseries_valuenames else "value"
    meanList = []
    maxList = []
    minList = []
    for i in range(len(df[column])):
        y = ts_parser(df[column][i], timeLimits=(df['int_time1'][i].to_pydatetime(), df['ext_time1'][i].to_pydatetime()), valuename=x)
        meanList.append(y[0])
        maxList.append(y[1])
        minList.append(y[2])
    dfForImpute[column+'_mean'] = meanList
    dfForImpute[column+'_max'] = maxList
    dfForImpute[column+'_min'] = minList

  dfForImpute[column+'_mean'] = meanList
  dfForImpute[column+'_max'] = maxList
  dfForImpute[column+'_min'] = minList


In [32]:
# generating infection during ventilation binary values

x = timeseries_valuenames[column] if column in timeseries_valuenames else "value"
infList = []
column='infection'
for i in range(len(df[column])):
    y = inf_parser(df[column][i], timeLimits=(df['int_time1'][i].to_pydatetime(), df['ext_time1'][i].to_pydatetime()))
    infList.append(y)
dfForImpute['infection_vent'] = infList

  dfForImpute['infection_vent'] = infList


In [39]:
# add on non-time data for imputation

#extraColumns = [i for i in df.columns if i not in list(dfForImpute.columns) + timeseries + ['infection', 'vent_array', 'int_time1', 'ext_time1'] + ptinfo + adm_num] #allen
extraColumns = [i for i in df.columns if i not in list(dfForImpute.columns) + timeseries + ['vent_array','infection'] + ptinfo + adm_num] #marcel

for i in extraColumns:
    if i in ('weight', 'height', 'duration1','duration2'):
        dfForImpute[i] = df[i]
    else:
        dfForImpute[i] = df[i].astype('category')
dfForImpute.drop(axis=1, columns=[0], inplace=True)
dfForImpute2 = dfForImpute.copy()

In [40]:
# before imputation again
dfForImpute

Unnamed: 0,temp_mean,temp_max,temp_min,bg_temp_mean,bg_temp_max,bg_temp_min,hr_mean,hr_max,hr_min,spo2_mean,spo2_max,spo2_min,rr_mean,rr_max,rr_min,sbp_mean,sbp_max,sbp_min,dbp_mean,dbp_max,dbp_min,meanbp_mean,meanbp_max,meanbp_min,cardiac_index_mean,cardiac_index_max,cardiac_index_min,pt_mean,pt_max,pt_min,ptt_mean,ptt_max,ptt_min,inr_mean,inr_max,inr_min,inr_1_mean,inr_1_max,inr_1_min,fibrinogen_mean,fibrinogen_max,fibrinogen_min,hb_mean,hb_max,hb_min,hematocrit_mean,hematocrit_max,hematocrit_min,wcc_mean,wcc_max,wcc_min,lymphocytes_mean,lymphocytes_max,lymphocytes_min,neutrophils_mean,neutrophils_max,neutrophils_min,alp_mean,alp_max,alp_min,ast_mean,ast_max,ast_min,alt_mean,alt_max,alt_min,bilirubin_total_mean,bilirubin_total_max,bilirubin_total_min,chloride_mean,chloride_max,chloride_min,magnesium_mean,magnesium_max,magnesium_min,potassium_mean,potassium_max,potassium_min,creatinine_mean,creatinine_max,creatinine_min,free_calcium_mean,free_calcium_max,free_calcium_min,sodium_mean,sodium_max,sodium_min,bicarb_mean,bicarb_max,bicarb_min,bun_mean,bun_max,bun_min,hba1c_mean,hba1c_max,hba1c_min,glucose_mean,glucose_max,glucose_min,lactate_mean,lactate_max,lactate_min,po2_mean,po2_max,po2_min,pco2_mean,pco2_max,pco2_min,baseexcess_mean,baseexcess_max,baseexcess_min,ph_mean,ph_max,ph_min,aado2_mean,aado2_max,aado2_min,fio2_mean,fio2_max,fio2_min,insulin_mean,insulin_max,insulin_min,prbc_mean,prbc_max,prbc_min,tidalvol_mean,tidalvol_max,tidalvol_min,plt_mean,plt_max,plt_min,infection_vent,gender,ethnicity,marital_status,insurance,language,aortic,mit,tricuspid,pulmonary,cabg,weight,height,reintubation,liver_severe,liver_mild,rheum,cvd,aids,ckd,copd,arrhythmia,pud,smoking,pvd,paraplegia,ccf,met_ca,t2dm,t1dm,malig,mi,dementia,first_careunit,last_careunit,admission_location,admission_type,hospital_expire_flag,diab_un,diab_cc,int_time1,ext_time1,duration1,int_time2,ext_time2,duration2
0,36.031745,36.444444,35.611110,,,,89.000000,98.0,79.0,100.000000,100.0,100.0,14.230769,16.0,14.0,111.166667,123.0,90.0,54.750000,59.0,44.0,68.333333,74.0,55.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,3.900000,3.9,3.9,,,,1.2800,1.28,1.28,137.0,137.0,137.0,,,,,,,,,,95.000000,159.0,79.0,,,,2.000000,2.0,2.0,45.000000,45.0,45.0,2.000000,2.0,2.0,7.390000,7.39,7.39,,,,,,,,,,,,,,,,,,,0,M,white,DIVORCED,Private,ENGL,1,0,0,0,0,69.50,167.64,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,2111-02-16 10:00:00,2111-02-16 13:00:00,3.0,NaT,NaT,
1,36.376923,36.500000,36.099998,,,,84.538462,90.0,78.0,99.923077,100.0,99.0,15.576923,24.5,11.0,106.384615,123.0,81.0,51.000000,59.0,41.0,65.538462,76.0,52.0,2.293039,4.05128,1.84615,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,4.200000,4.2,4.2,,,,1.2700,1.28,1.26,136.5,137.0,136.0,,,,,,,,,,100.500000,103.0,98.0,,,,0.000000,0.0,0.0,44.000000,47.0,41.0,0.000000,0.0,0.0,7.365000,7.38,7.35,,,,,,,,,,,,,,,,,,,0,M,white,WIDOWED,Medicare,ENGL,1,0,0,0,1,82.00,157.48,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,2192-04-20 12:00:00,2192-04-20 15:00:00,3.0,NaT,NaT,
2,36.235714,36.799999,35.400002,36.3,36.6,36.0,84.910714,93.0,71.0,98.785714,100.0,96.0,19.071429,38.0,10.0,125.196429,194.0,76.0,54.642857,73.0,40.0,78.053571,113.0,53.0,2.346591,3.35227,1.35795,,,,46.133333,73.2,32.2,1.60,2.0,1.3,1.60,2.0,1.3,,,,12.450000,12.7,12.2,38.0,38.0,38.0,20.7,20.7,20.7,,,,,,,49.0,49.0,49.0,81.0,81.0,81.0,33.0,33.0,33.0,0.5,0.5,0.5,110.500000,111.0,110.0,2.500000,2.6,2.4,4.475000,5.1,3.4,0.95,1.1,0.8,1.1125,1.18,0.95,136.0,137.0,135.0,22.0,22.0,22.0,18.0,19.0,17.0,,,,129.760000,181.0,87.0,1.650000,1.8,1.5,-4.000000,-1.0,-7.0,36.000000,44.0,31.0,-4.000000,-1.0,-7.0,7.353750,7.40,7.28,,,,40.0,40.0,40.0,,,,,,,415.0,490.0,340.0,62.0,63.0,61.0,0,F,,MARRIED,Medicare,,0,0,0,0,1,66.20,162.56,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,TRANSFER FROM HOSPITAL,EMERGENCY,0,0,0,2170-01-01 20:00:00,2170-01-02 13:30:00,17.5,NaT,NaT,
3,35.726316,36.799999,34.500000,,,,71.190476,83.0,58.0,99.772727,100.0,98.0,12.500000,17.0,10.0,120.545455,152.0,96.0,53.136364,66.0,39.0,76.285714,98.0,58.0,2.498595,2.92135,1.85393,,,,41.500000,41.5,41.5,1.20,1.2,1.2,1.20,1.2,1.2,,,,11.000000,11.0,11.0,,,,10.4,10.4,10.4,,,,,,,,,,,,,,,,,,,112.000000,112.0,112.0,,,,4.166667,4.6,3.6,0.90,0.9,0.9,1.2050,1.25,1.16,139.0,139.0,139.0,26.0,26.0,26.0,17.0,17.0,17.0,,,,125.722222,165.0,74.0,,,,-0.500000,0.0,-1.0,49.000000,51.0,44.0,-0.500000,0.0,-1.0,7.330000,7.38,7.30,,,,,,,,,,,,,,,,136.0,136.0,136.0,0,F,other,DIVORCED,Private,ENGL,0,1,0,0,0,70.00,154.94,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,2141-04-03 12:00:00,2141-04-03 19:00:00,7.0,NaT,NaT,
4,36.194445,36.388889,36.000002,,,,82.153846,88.0,74.0,100.000000,100.0,100.0,13.153846,26.0,10.0,107.615385,126.0,94.0,59.538462,67.0,47.0,93.307692,277.0,63.0,,,,,,,32.200000,32.2,32.2,1.50,1.5,1.5,1.50,1.5,1.5,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,3.650000,3.8,3.5,,,,1.2800,1.28,1.28,,,,,,,,,,,,,110.000000,115.0,105.0,,,,-2.750000,0.0,-5.0,41.000000,44.0,38.0,-2.750000,0.0,-5.0,7.337500,7.39,7.31,,,,,,,,,,,,,,,,102.0,102.0,102.0,0,F,white,MARRIED,Private,ENGL,0,0,0,0,1,72.10,167.64,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,CLINIC REFERRAL/PREMATURE,EMERGENCY,0,0,0,2188-01-15 18:00:00,2188-01-15 23:30:00,5.5,NaT,NaT,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9469,,,,,,,80.000000,81.0,79.0,99.833333,100.0,99.0,14.000000,14.0,14.0,118.666667,139.0,103.0,69.916667,80.0,57.0,87.500000,103.0,72.0,,,,,,,,,,,,,,,,,,,12.100000,12.1,12.1,,,,12.3,12.3,12.3,,,,,,,,,,,,,,,,,,,113.000000,113.0,113.0,,,,3.900000,3.9,3.9,0.70,0.7,0.7,1.1200,1.12,1.12,137.0,137.0,137.0,22.0,22.0,22.0,13.0,13.0,13.0,,,,138.000000,138.0,138.0,,,,218.000000,218.0,218.0,38.000000,38.0,38.0,-1.000000,-1.0,-1.0,7.380000,7.38,7.38,,,,,,,,,,,,,,,,84.0,84.0,84.0,0,M,white,SINGLE,Medicare,ENGL,0,1,0,0,1,80.60,170.00,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,CVICU,CVICU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,2138-02-19 13:09:00,2138-02-19 16:00:00,3.0,NaT,NaT,
9470,35.431667,37.390000,34.100000,,,,78.400000,100.0,59.0,99.800000,100.0,98.0,15.500000,25.0,10.0,109.000000,125.0,76.0,58.066667,70.0,41.0,77.200000,91.0,54.0,,,,,,,,,,,,,,,,,,,11.000000,11.5,10.5,33.5,35.0,32.0,,,,,,,,,,,,,,,,,,,,,,108.000000,108.0,108.0,,,,3.780000,3.9,3.5,,,,1.1675,1.27,1.10,137.0,137.0,137.0,,,,,,,,,,123.250000,138.0,104.0,,,,186.750000,280.0,134.0,38.000000,43.0,32.0,-0.250000,0.0,-1.0,7.402500,7.46,7.37,,,,,,,14.381326,26.677310,6.666667,,,,,,,,,,0,F,white,MARRIED,Other,ENGL,1,0,0,0,1,67.60,163.00,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,CVICU,CVICU,PHYSICIAN REFERRAL,ELECTIVE,0,0,1,2195-04-15 12:00:00,2195-04-15 22:00:00,10.0,NaT,NaT,
9471,36.666667,36.720000,36.610000,36.7,36.7,36.7,77.416667,86.0,68.0,99.888889,100.0,99.0,16.923077,25.0,14.0,102.916667,120.0,87.0,69.916667,82.0,61.0,82.250000,94.0,72.0,,,,13.500000,13.5,13.5,31.000000,31.0,31.0,1.20,1.2,1.2,1.20,1.2,1.2,,,,13.500000,13.5,13.5,,,,11.4,11.4,11.4,,,,,,,,,,,,,,,,,,,106.000000,106.0,106.0,,,,4.325000,4.5,4.2,0.70,0.7,0.7,1.2000,1.27,1.15,136.5,137.0,136.0,24.0,24.0,24.0,12.0,12.0,12.0,,,,131.333333,150.0,120.0,1.100000,1.1,1.1,205.250000,417.0,120.0,47.750000,52.0,43.0,-1.750000,0.0,-3.0,7.315000,7.38,7.29,,,,,,,3.107415,7.470447,0.166724,,,,,,,142.0,142.0,142.0,0,M,white,SINGLE,Other,ENGL,0,0,0,0,1,75.95,169.00,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CVICU,CVICU,TRANSFER FROM HOSPITAL,URGENT,0,0,0,2132-02-17 16:21:00,2132-02-18 00:00:00,8.0,NaT,NaT,
9472,37.281667,38.390000,36.100000,,,,70.294118,80.0,64.0,98.625000,100.0,95.0,22.764706,27.5,17.0,109.470588,128.0,79.0,48.235294,54.0,37.0,67.235294,76.0,50.0,,,,15.900000,15.9,15.9,30.000000,30.0,30.0,1.50,1.5,1.5,1.50,1.5,1.5,,,,9.400000,9.6,9.2,29.0,29.0,29.0,12.2,12.2,12.2,,,,,,,,,,,,,,,,,,,100.333333,103.0,97.0,,,,4.962500,5.7,3.9,5.20,5.2,5.2,1.1725,1.31,1.09,136.0,138.0,134.0,25.0,25.0,25.0,24.0,24.0,24.0,,,,114.666667,152.0,91.0,1.550000,1.8,1.3,106.800000,143.0,82.0,42.000000,45.0,40.0,1.600000,4.0,0.0,7.411667,7.45,7.37,,,,40.0,40.0,40.0,10.000000,10.000000,10.000000,906.000000,906.0,906.00000,450.0,450.0,450.0,133.0,133.0,133.0,0,M,white,DIVORCED,Medicare,ENGL,1,0,0,0,1,84.30,178.00,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,CVICU,CVICU,TRANSFER FROM HOSPITAL,URGENT,0,0,0,2118-01-29 12:00:00,2118-01-30 00:00:00,12.0,NaT,NaT,


In [43]:
dfForImpute2 = dfForImpute.drop(axis=1, columns=['int_time1', 'ext_time1', 'duration1','int_time2', 'ext_time2','duration2'])

kds = mf.ImputationKernel(
  dfForImpute2,
  datasets=1,
  save_all_iterations=True,
  random_state=1991
)

# Run the MICE algorithm for 3 iterations
kds.mice(3)

print(kds)

dfImputed = kds.complete_data(dataset=0, inplace=False)
print(dfImputed.isnull().sum(0))

# after imputation
dfImputed.head(10)

              Class: ImputationKernel
           Datasets: 1
         Iterations: 3
  Imputed Variables: 138
save_all_iterations: True
temp_mean               0
temp_max                0
temp_min                0
bg_temp_mean            0
bg_temp_max             0
                       ..
admission_location      0
admission_type          0
hospital_expire_flag    0
diab_un                 0
diab_cc                 0
Length: 172, dtype: int64


Unnamed: 0,temp_mean,temp_max,temp_min,bg_temp_mean,bg_temp_max,bg_temp_min,hr_mean,hr_max,hr_min,spo2_mean,spo2_max,spo2_min,rr_mean,rr_max,rr_min,sbp_mean,sbp_max,sbp_min,dbp_mean,dbp_max,dbp_min,meanbp_mean,meanbp_max,meanbp_min,cardiac_index_mean,cardiac_index_max,cardiac_index_min,pt_mean,pt_max,pt_min,ptt_mean,ptt_max,ptt_min,inr_mean,inr_max,inr_min,inr_1_mean,inr_1_max,inr_1_min,fibrinogen_mean,fibrinogen_max,fibrinogen_min,hb_mean,hb_max,hb_min,hematocrit_mean,hematocrit_max,hematocrit_min,wcc_mean,wcc_max,wcc_min,lymphocytes_mean,lymphocytes_max,lymphocytes_min,neutrophils_mean,neutrophils_max,neutrophils_min,alp_mean,alp_max,alp_min,ast_mean,ast_max,ast_min,alt_mean,alt_max,alt_min,bilirubin_total_mean,bilirubin_total_max,bilirubin_total_min,chloride_mean,chloride_max,chloride_min,magnesium_mean,magnesium_max,magnesium_min,potassium_mean,potassium_max,potassium_min,creatinine_mean,creatinine_max,creatinine_min,free_calcium_mean,free_calcium_max,free_calcium_min,sodium_mean,sodium_max,sodium_min,bicarb_mean,bicarb_max,bicarb_min,bun_mean,bun_max,bun_min,hba1c_mean,hba1c_max,hba1c_min,glucose_mean,glucose_max,glucose_min,lactate_mean,lactate_max,lactate_min,po2_mean,po2_max,po2_min,pco2_mean,pco2_max,pco2_min,baseexcess_mean,baseexcess_max,baseexcess_min,ph_mean,ph_max,ph_min,aado2_mean,aado2_max,aado2_min,fio2_mean,fio2_max,fio2_min,insulin_mean,insulin_max,insulin_min,prbc_mean,prbc_max,prbc_min,tidalvol_mean,tidalvol_max,tidalvol_min,plt_mean,plt_max,plt_min,infection_vent,gender,ethnicity,marital_status,insurance,language,aortic,mit,tricuspid,pulmonary,cabg,weight,height,reintubation,liver_severe,liver_mild,rheum,cvd,aids,ckd,copd,arrhythmia,pud,smoking,pvd,paraplegia,ccf,met_ca,t2dm,t1dm,malig,mi,dementia,first_careunit,last_careunit,admission_location,admission_type,hospital_expire_flag,diab_un,diab_cc
0,36.031745,36.444444,35.61111,37.45,37.8,37.0,89.0,98.0,79.0,100.0,100.0,100.0,14.230769,16.0,14.0,111.166667,123.0,90.0,54.75,59.0,44.0,68.333333,74.0,55.0,3.370576,3.9235,2.78488,14.45,15.0,14.3,28.85,29.1,29.2,1.283333,1.3,1.3,1.29,1.3,1.3,136.0,139.0,138.0,11.05,11.0,11.2,32.666667,33.0,32.0,16.1,17.5,14.8,10.4,13.3,8.5,85.0,86.0,83.7,100.5,109.0,85.0,25.0,26.0,28.0,17.75,18.0,17.0,0.5,0.5,0.5,110.5,112.0,109.0,1.9,2.1,1.7,3.9,3.9,3.9,0.9,1.0,0.8,1.28,1.28,1.28,137.0,137.0,137.0,23.0,23.0,23.0,16.666667,18.0,15.0,6.4,6.4,6.1,95.0,159.0,79.0,1.95,2.1,1.9,2.0,2.0,2.0,45.0,45.0,45.0,2.0,2.0,2.0,7.39,7.39,7.39,482.0,490.0,478.0,46.666667,50.0,40.0,202.666667,291.0,184.0,466.666673,800.0,275.00001,800.0,800.0,800.0,143.0,153.0,129.0,0,M,white,DIVORCED,Private,ENGL,1,0,0,0,0,69.5,167.64,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0
1,36.376923,36.5,36.099998,36.675,37.0,36.3,84.538462,90.0,78.0,99.923077,100.0,99.0,15.576923,24.5,11.0,106.384615,123.0,81.0,51.0,59.0,41.0,65.538462,76.0,52.0,2.293039,4.05128,1.84615,15.8,16.4,15.6,38.7,38.7,39.2,1.4,1.5,1.4,1.4,1.5,1.4,179.0,179.0,179.0,12.35,13.1,11.7,30.5,29.0,30.0,6.8,6.9,6.4,9.8,12.5,7.5,69.2,69.4,69.0,53.0,54.0,52.0,82.0,90.0,74.0,70.0,70.0,65.0,0.65,0.7,0.6,107.666667,111.0,105.0,1.98,2.2,1.9,4.2,4.2,4.2,0.7,0.7,0.7,1.27,1.28,1.26,136.5,137.0,136.0,23.0,24.0,22.0,13.0,14.0,12.0,6.0,6.0,6.0,100.5,103.0,98.0,2.7,2.7,2.1,0.0,0.0,0.0,44.0,47.0,41.0,0.0,0.0,0.0,7.365,7.38,7.35,352.0,357.0,356.0,50.0,50.0,50.0,232.4,357.0,0.0,300.0,551.0,0.0,800.0,800.0,800.0,117.333333,135.0,120.0,0,M,white,WIDOWED,Medicare,ENGL,1,0,0,0,1,82.0,157.48,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0
2,36.235714,36.799999,35.400002,36.3,36.6,36.0,84.910714,93.0,71.0,98.785714,100.0,96.0,19.071429,38.0,10.0,125.196429,194.0,76.0,54.642857,73.0,40.0,78.053571,113.0,53.0,2.346591,3.35227,1.35795,16.9,22.1,13.8,46.133333,73.2,32.2,1.6,2.0,1.3,1.6,2.0,1.3,187.0,203.0,175.0,12.45,12.7,12.2,38.0,38.0,38.0,20.7,20.7,20.7,9.72,11.9,9.0,82.3,85.0,80.2,49.0,49.0,49.0,81.0,81.0,81.0,33.0,33.0,33.0,0.5,0.5,0.5,110.5,111.0,110.0,2.5,2.6,2.4,4.475,5.1,3.4,0.95,1.1,0.8,1.1125,1.18,0.95,136.0,137.0,135.0,22.0,22.0,22.0,18.0,19.0,17.0,5.4,5.4,5.4,129.76,181.0,87.0,1.65,1.8,1.5,-4.0,-1.0,-7.0,36.0,44.0,31.0,-4.0,-1.0,-7.0,7.35375,7.4,7.28,487.0,567.0,400.0,40.0,40.0,40.0,226.5,635.0,24.266668,700.000006,1400.0,350.0,415.0,490.0,340.0,62.0,63.0,61.0,0,F,hispanic,MARRIED,Medicare,HIND,0,0,0,0,1,66.2,162.56,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,TRANSFER FROM HOSPITAL,EMERGENCY,0,0,0
3,35.726316,36.799999,34.5,36.74,36.8,36.6,71.190476,83.0,58.0,99.772727,100.0,98.0,12.5,17.0,10.0,120.545455,152.0,96.0,53.136364,66.0,39.0,76.285714,98.0,58.0,2.498595,2.92135,1.85393,13.3,13.3,13.3,41.5,41.5,41.5,1.2,1.2,1.2,1.2,1.2,1.2,143.0,144.0,143.0,11.0,11.0,11.0,33.0,33.0,33.0,10.4,10.4,10.4,13.6,13.6,13.3,81.3,82.0,81.5,246.0,354.0,194.0,499.4,564.0,434.0,122.0,236.0,140.0,0.9,1.2,0.8,112.0,112.0,112.0,2.65,2.9,2.4,4.166667,4.6,3.6,0.9,0.9,0.9,1.205,1.25,1.16,139.0,139.0,139.0,26.0,26.0,26.0,17.0,17.0,17.0,5.7,5.7,5.7,125.722222,165.0,74.0,1.05,1.3,0.9,-0.5,0.0,-1.0,49.0,51.0,44.0,-0.5,0.0,-1.0,7.33,7.38,7.3,467.25,546.0,398.0,40.0,40.0,40.0,207.333333,319.0,0.0,216.666667,375.0,0.0,685.714286,717.0,600.0,136.0,136.0,136.0,0,F,other,DIVORCED,Private,ENGL,0,1,0,0,0,70.0,154.94,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0
4,36.194445,36.388889,36.000002,35.7,35.9,35.4,82.153846,88.0,74.0,100.0,100.0,100.0,13.153846,26.0,10.0,107.615385,126.0,94.0,59.538462,67.0,47.0,93.307692,277.0,63.0,3.25392,6.43243,2.295,16.3,16.3,16.3,32.2,32.2,32.2,1.5,1.5,1.5,1.5,1.5,1.5,274.0,285.0,249.0,10.466667,11.6,9.2,31.25,33.0,29.0,16.05,17.6,14.6,21.3,21.0,22.3,72.0,71.0,71.6,37.0,38.0,37.0,46.0,50.0,43.0,33.0,38.0,32.0,3.6,3.5,3.3,108.0,108.0,108.0,3.075,3.5,2.7,3.65,3.8,3.5,1.25,1.3,1.2,1.28,1.28,1.28,137.0,139.0,135.0,18.75,19.0,18.0,21.5,22.0,21.0,5.05,5.1,5.0,110.0,115.0,105.0,1.45,1.9,1.0,-2.75,0.0,-5.0,41.0,44.0,38.0,-2.75,0.0,-5.0,7.3375,7.39,7.31,360.0,356.0,335.0,70.0,100.0,50.0,350.0,700.0,242.0,800.0,1400.0,626.0,533.333333,600.0,400.0,102.0,102.0,102.0,0,F,white,MARRIED,Private,ENGL,0,0,0,0,1,72.1,167.64,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,CLINIC REFERRAL/PREMATURE,EMERGENCY,0,0,0
5,37.676623,39.666668,35.599998,37.3,37.9,36.7,77.592949,110.0,57.0,94.810811,100.0,89.0,21.285075,37.5,11.5,131.819489,178.0,83.0,49.565495,77.0,29.0,69.021972,116.0,42.0,3.159012,4.57031,2.10938,16.45,21.3,13.5,34.5,52.3,29.7,1.511111,1.9,1.2,1.511111,1.9,1.2,241.0,241.0,241.0,10.8,11.9,9.8,32.5,35.0,30.0,12.241667,16.1,7.8,8.5,8.5,8.5,83.5,83.5,83.5,87.0,121.0,53.0,66.666667,118.0,34.0,60.333333,92.0,24.0,0.466667,0.5,0.4,112.357143,119.0,106.0,3.0,3.1,2.7,3.961224,4.5,3.2,2.28,3.1,1.5,1.133488,1.23,1.05,145.647059,152.0,140.0,23.846154,29.0,20.0,60.866667,85.0,28.0,5.5,5.5,5.5,109.974684,189.0,58.0,1.525,2.1,1.3,0.145161,4.0,-2.0,38.419355,54.0,26.0,0.145161,4.0,-2.0,7.416308,7.5,7.3,360.0,364.0,364.0,43.333333,60.0,40.0,120.0,50.0,2.0,187.5,375.0,0.0,600.0,700.0,500.0,189.416667,245.0,137.0,0,M,white,MARRIED,Private,ENGL,1,0,0,0,0,127.3,175.26,0,0,0,0,0,0,0,0,1,0,0,1,0,1,0,0,0,0,0,0,CSRU,CSRU,EMERGENCY ROOM,EMERGENCY,0,1,0
6,36.781818,37.299999,36.400002,36.666667,36.7,36.2,93.666667,97.0,89.0,99.25,100.0,99.0,16.769231,26.0,14.0,116.5,141.0,91.0,56.833333,67.0,46.0,75.666667,93.0,59.0,2.88325,3.25381,2.51269,13.8,13.8,13.8,40.9,40.9,40.9,1.2,1.2,1.2,1.2,1.2,1.2,312.166667,422.0,365.0,12.5,12.5,12.5,35.0,36.0,33.0,20.5,20.5,20.5,10.0,9.8,9.9,87.1,87.4,87.0,34.0,37.0,34.0,85.25,74.0,77.0,82.0,76.0,81.0,1.3,1.4,1.3,115.0,115.0,115.0,2.18,2.3,2.2,3.9,4.2,3.6,0.7,0.7,0.7,1.25,1.25,1.25,139.0,139.0,139.0,25.0,25.0,25.0,15.0,15.0,15.0,10.0,8.1,7.9,102.5,118.0,87.0,1.5,1.5,1.4,0.0,0.0,0.0,43.0,43.0,43.0,0.0,0.0,0.0,7.37,7.37,7.37,486.0,506.0,456.0,62.5,92.0,40.0,185.333333,286.0,0.0,370.0,370.0,370.0,625.0,700.0,550.0,218.0,218.0,218.0,0,M,white,MARRIED,Private,ENGL,0,0,0,0,1,78.8,172.72,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0
7,36.195455,37.200001,35.900002,37.0,37.5,36.5,80.363636,87.0,79.0,100.0,100.0,100.0,15.75,24.0,12.0,112.681818,142.0,84.0,64.545455,76.0,49.0,80.545455,100.0,62.0,2.280173,3.12069,1.95259,14.9,14.9,14.9,28.1,28.1,28.1,1.3,1.3,1.3,1.3,1.3,1.3,572.0,630.0,497.0,11.3,11.3,11.3,29.5,30.0,29.0,34.8,35.7,34.5,8.05,8.0,8.0,85.6,86.9,86.0,37.0,37.0,37.0,236.0,229.0,245.0,191.666667,154.0,233.0,1.05,1.1,0.9,111.0,111.0,111.0,2.2,2.6,1.8,4.05,4.2,3.9,0.9,0.9,0.9,1.19,1.23,1.15,142.0,142.0,142.0,22.0,22.0,22.0,11.0,11.0,11.0,6.2,6.3,6.6,148.4,172.0,123.0,5.544444,6.7,4.5,-2.666667,-2.0,-3.0,38.0,43.0,35.0,-2.666667,-2.0,-3.0,7.363333,7.38,7.33,473.0,477.0,475.0,45.0,50.0,40.0,227.0,300.0,0.0,375.0,375.0,375.0,565.0,600.0,500.0,232.0,232.0,232.0,0,M,white,MARRIED,Medicare,CAPE,0,0,0,0,1,103.6,182.88,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,1,0
8,37.821053,38.200001,37.5,37.275,37.6,37.2,84.210526,104.0,75.0,98.0,100.0,92.0,14.805556,20.0,10.0,117.842105,150.0,100.0,56.315789,69.0,49.0,76.842105,94.0,64.0,2.53125,2.53125,2.53125,14.8125,14.9,14.8,30.2,30.7,29.9,1.333333,1.3,1.4,1.35,1.3,1.4,268.25,280.0,266.0,12.2,13.0,11.6,37.166667,38.0,36.0,11.4,15.6,7.2,7.2,9.0,6.8,79.8,82.0,78.9,37.5,44.0,45.0,55.0,54.0,49.0,52.0,85.0,30.0,0.7,0.7,0.7,104.5,107.0,103.0,2.15,2.4,1.9,4.4,4.5,4.3,6.7,7.7,5.9,1.16,1.19,1.13,139.5,140.0,138.0,26.5,27.0,26.0,20.0,22.0,18.0,6.0,5.9,6.0,140.833333,150.0,120.0,1.3,1.4,1.0,-1.25,1.0,-3.0,44.75,59.0,35.0,-1.25,1.0,-3.0,7.345,7.42,7.3,383.0,385.0,384.0,70.0,100.0,50.0,177.666667,260.0,0.0,420.0,700.0,270.0,540.0,600.0,400.0,134.666667,157.0,110.0,0,M,white,MARRIED,Medicare,PTUN,0,0,0,0,1,98.18,179.07,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0
9,36.529412,37.599998,35.299999,38.05,38.2,37.9,86.055556,99.0,79.0,100.0,100.0,100.0,14.222222,16.0,14.0,116.888889,147.0,85.0,60.5,76.0,49.0,80.444444,99.0,64.0,2.178978,2.80114,1.66477,15.4,15.7,15.1,51.0,51.0,51.0,1.4,1.4,1.4,1.4,1.4,1.4,292.0,295.0,283.0,8.3,8.3,8.3,25.5,26.0,26.0,10.2,10.2,10.2,12.9,12.9,12.9,70.4,70.7,70.4,40.0,41.0,40.0,712.6,594.0,625.0,276.25,341.0,181.0,0.6,0.7,0.5,119.0,119.0,119.0,2.333333,2.5,2.0,3.95,4.3,3.6,0.5,0.5,0.5,1.065,1.12,1.01,139.0,139.0,139.0,23.0,23.0,23.0,15.0,15.0,15.0,5.3,5.3,5.3,116.857143,167.0,67.0,2.633333,2.7,2.5,1.0,1.0,1.0,37.0,37.0,37.0,1.0,1.0,1.0,7.44,7.44,7.44,450.0,465.0,438.0,50.0,50.0,50.0,159.0,286.0,0.0,272.0,272.0,272.0,470.0,500.0,450.0,127.0,127.0,127.0,0,F,black,SINGLE,Private,ENGL,1,0,0,0,0,67.4,157.48,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,1,0


In [45]:
y = np.asarray([i.to_pydatetime() for i in df["int_time1"]])
z = np.asarray([i.to_pydatetime() for i in df["outtime"]])
dfImputed['icu_stay_duration'] = [i.total_seconds() for i in z-y]
dfImputed[['hadm_id','subject_id']] = df[['hadm_id','subject_id']]
dfImputed[['int_time1', 'ext_time1', 'duration1','int_time2', 'ext_time2','duration2']] = df[['int_time1', 'ext_time1', 'duration1','int_time2', 'ext_time2','duration2']] #marcel not #allen
dfImputed

Unnamed: 0,temp_mean,temp_max,temp_min,bg_temp_mean,bg_temp_max,bg_temp_min,hr_mean,hr_max,hr_min,spo2_mean,spo2_max,spo2_min,rr_mean,rr_max,rr_min,sbp_mean,sbp_max,sbp_min,dbp_mean,dbp_max,dbp_min,meanbp_mean,meanbp_max,meanbp_min,cardiac_index_mean,cardiac_index_max,cardiac_index_min,pt_mean,pt_max,pt_min,ptt_mean,ptt_max,ptt_min,inr_mean,inr_max,inr_min,inr_1_mean,inr_1_max,inr_1_min,fibrinogen_mean,fibrinogen_max,fibrinogen_min,hb_mean,hb_max,hb_min,hematocrit_mean,hematocrit_max,hematocrit_min,wcc_mean,wcc_max,wcc_min,lymphocytes_mean,lymphocytes_max,lymphocytes_min,neutrophils_mean,neutrophils_max,neutrophils_min,alp_mean,alp_max,alp_min,ast_mean,ast_max,ast_min,alt_mean,alt_max,alt_min,bilirubin_total_mean,bilirubin_total_max,bilirubin_total_min,chloride_mean,chloride_max,chloride_min,magnesium_mean,magnesium_max,magnesium_min,potassium_mean,potassium_max,potassium_min,creatinine_mean,creatinine_max,creatinine_min,free_calcium_mean,free_calcium_max,free_calcium_min,sodium_mean,sodium_max,sodium_min,bicarb_mean,bicarb_max,bicarb_min,bun_mean,bun_max,bun_min,hba1c_mean,hba1c_max,hba1c_min,glucose_mean,glucose_max,glucose_min,lactate_mean,lactate_max,lactate_min,po2_mean,po2_max,po2_min,pco2_mean,pco2_max,pco2_min,baseexcess_mean,baseexcess_max,baseexcess_min,ph_mean,ph_max,ph_min,aado2_mean,aado2_max,aado2_min,fio2_mean,fio2_max,fio2_min,insulin_mean,insulin_max,insulin_min,prbc_mean,prbc_max,prbc_min,tidalvol_mean,tidalvol_max,tidalvol_min,plt_mean,plt_max,plt_min,infection_vent,gender,ethnicity,marital_status,insurance,language,aortic,mit,tricuspid,pulmonary,cabg,weight,height,reintubation,liver_severe,liver_mild,rheum,cvd,aids,ckd,copd,arrhythmia,pud,smoking,pvd,paraplegia,ccf,met_ca,t2dm,t1dm,malig,mi,dementia,first_careunit,last_careunit,admission_location,admission_type,hospital_expire_flag,diab_un,diab_cc,icu_stay_duration,hadm_id,subject_id,int_time1,ext_time1,duration1,int_time2,ext_time2,duration2
0,36.031745,36.444444,35.611110,37.450000,37.8,37.0,89.000000,98.0,79.0,100.000000,100.0,100.0,14.230769,16.0,14.0,111.166667,123.0,90.0,54.750000,59.0,44.0,68.333333,74.0,55.0,3.370576,3.92350,2.78488,14.450000,15.0,14.3,28.850000,29.1,29.2,1.283333,1.3,1.3,1.29,1.3,1.3,136.0,139.0,138.0,11.050000,11.0,11.2,32.666667,33.0,32.0,16.10,17.5,14.8,10.400000,13.3,8.5,85.00,86.0,83.7,100.500000,109.0,85.0,25.00,26.0,28.0,17.750000,18.0,17.0,0.500000,0.5,0.5,110.500000,112.0,109.0,1.900000,2.1,1.7,3.900000,3.9,3.9,0.90,1.0,0.8,1.2800,1.28,1.28,137.0,137.0,137.0,23.00,23.0,23.0,16.666667,18.0,15.0,6.40,6.4,6.1,95.000000,159.0,79.0,1.950000,2.1,1.9,2.000000,2.0,2.0,45.000000,45.0,45.0,2.000000,2.0,2.0,7.390000,7.39,7.39,482.00,490.0,478.0,46.666667,50.0,40.0,202.666667,291.000000,184.000000,466.666673,800.000000,275.000010,800.000000,800.0,800.0,143.000000,153.0,129.0,0,M,white,DIVORCED,Private,ENGL,1,0,0,0,0,69.50,167.64,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,91283.0,173798,29491,2111-02-16 10:00:00,2111-02-16 13:00:00,3.0,NaT,NaT,
1,36.376923,36.500000,36.099998,36.675000,37.0,36.3,84.538462,90.0,78.0,99.923077,100.0,99.0,15.576923,24.5,11.0,106.384615,123.0,81.0,51.000000,59.0,41.0,65.538462,76.0,52.0,2.293039,4.05128,1.84615,15.800000,16.4,15.6,38.700000,38.7,39.2,1.400000,1.5,1.4,1.40,1.5,1.4,179.0,179.0,179.0,12.350000,13.1,11.7,30.500000,29.0,30.0,6.80,6.9,6.4,9.800000,12.5,7.5,69.20,69.4,69.0,53.000000,54.0,52.0,82.00,90.0,74.0,70.000000,70.0,65.0,0.650000,0.7,0.6,107.666667,111.0,105.0,1.980000,2.2,1.9,4.200000,4.2,4.2,0.70,0.7,0.7,1.2700,1.28,1.26,136.5,137.0,136.0,23.00,24.0,22.0,13.000000,14.0,12.0,6.00,6.0,6.0,100.500000,103.0,98.0,2.700000,2.7,2.1,0.000000,0.0,0.0,44.000000,47.0,41.0,0.000000,0.0,0.0,7.365000,7.38,7.35,352.00,357.0,356.0,50.000000,50.0,50.0,232.400000,357.000000,0.000000,300.000000,551.000000,0.000000,800.000000,800.0,800.0,117.333333,135.0,120.0,0,M,white,WIDOWED,Medicare,ENGL,1,0,0,0,1,82.00,157.48,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,103854.0,197759,26775,2192-04-20 12:00:00,2192-04-20 15:00:00,3.0,NaT,NaT,
2,36.235714,36.799999,35.400002,36.300000,36.6,36.0,84.910714,93.0,71.0,98.785714,100.0,96.0,19.071429,38.0,10.0,125.196429,194.0,76.0,54.642857,73.0,40.0,78.053571,113.0,53.0,2.346591,3.35227,1.35795,16.900000,22.1,13.8,46.133333,73.2,32.2,1.600000,2.0,1.3,1.60,2.0,1.3,187.0,203.0,175.0,12.450000,12.7,12.2,38.000000,38.0,38.0,20.70,20.7,20.7,9.720000,11.9,9.0,82.30,85.0,80.2,49.000000,49.0,49.0,81.00,81.0,81.0,33.000000,33.0,33.0,0.500000,0.5,0.5,110.500000,111.0,110.0,2.500000,2.6,2.4,4.475000,5.1,3.4,0.95,1.1,0.8,1.1125,1.18,0.95,136.0,137.0,135.0,22.00,22.0,22.0,18.000000,19.0,17.0,5.40,5.4,5.4,129.760000,181.0,87.0,1.650000,1.8,1.5,-4.000000,-1.0,-7.0,36.000000,44.0,31.0,-4.000000,-1.0,-7.0,7.353750,7.40,7.28,487.00,567.0,400.0,40.000000,40.0,40.0,226.500000,635.000000,24.266668,700.000006,1400.000000,350.000000,415.000000,490.0,340.0,62.000000,63.0,61.0,0,F,hispanic,MARRIED,Medicare,HIND,0,0,0,0,1,66.20,162.56,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,TRANSFER FROM HOSPITAL,EMERGENCY,0,0,0,569413.0,193167,23782,2170-01-01 20:00:00,2170-01-02 13:30:00,17.5,NaT,NaT,
3,35.726316,36.799999,34.500000,36.740000,36.8,36.6,71.190476,83.0,58.0,99.772727,100.0,98.0,12.500000,17.0,10.0,120.545455,152.0,96.0,53.136364,66.0,39.0,76.285714,98.0,58.0,2.498595,2.92135,1.85393,13.300000,13.3,13.3,41.500000,41.5,41.5,1.200000,1.2,1.2,1.20,1.2,1.2,143.0,144.0,143.0,11.000000,11.0,11.0,33.000000,33.0,33.0,10.40,10.4,10.4,13.600000,13.6,13.3,81.30,82.0,81.5,246.000000,354.0,194.0,499.40,564.0,434.0,122.000000,236.0,140.0,0.900000,1.2,0.8,112.000000,112.0,112.0,2.650000,2.9,2.4,4.166667,4.6,3.6,0.90,0.9,0.9,1.2050,1.25,1.16,139.0,139.0,139.0,26.00,26.0,26.0,17.000000,17.0,17.0,5.70,5.7,5.7,125.722222,165.0,74.0,1.050000,1.3,0.9,-0.500000,0.0,-1.0,49.000000,51.0,44.0,-0.500000,0.0,-1.0,7.330000,7.38,7.30,467.25,546.0,398.0,40.000000,40.0,40.0,207.333333,319.000000,0.000000,216.666667,375.000000,0.000000,685.714286,717.0,600.0,136.000000,136.0,136.0,0,F,other,DIVORCED,Private,ENGL,0,1,0,0,0,70.00,154.94,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,CSRU,CSRU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,83878.0,127967,32056,2141-04-03 12:00:00,2141-04-03 19:00:00,7.0,NaT,NaT,
4,36.194445,36.388889,36.000002,35.700000,35.9,35.4,82.153846,88.0,74.0,100.000000,100.0,100.0,13.153846,26.0,10.0,107.615385,126.0,94.0,59.538462,67.0,47.0,93.307692,277.0,63.0,3.253920,6.43243,2.29500,16.300000,16.3,16.3,32.200000,32.2,32.2,1.500000,1.5,1.5,1.50,1.5,1.5,274.0,285.0,249.0,10.466667,11.6,9.2,31.250000,33.0,29.0,16.05,17.6,14.6,21.300000,21.0,22.3,72.00,71.0,71.6,37.000000,38.0,37.0,46.00,50.0,43.0,33.000000,38.0,32.0,3.600000,3.5,3.3,108.000000,108.0,108.0,3.075000,3.5,2.7,3.650000,3.8,3.5,1.25,1.3,1.2,1.2800,1.28,1.28,137.0,139.0,135.0,18.75,19.0,18.0,21.500000,22.0,21.0,5.05,5.1,5.0,110.000000,115.0,105.0,1.450000,1.9,1.0,-2.750000,0.0,-5.0,41.000000,44.0,38.0,-2.750000,0.0,-5.0,7.337500,7.39,7.31,360.00,356.0,335.0,70.000000,100.0,50.0,350.000000,700.000000,242.000000,800.000000,1400.000000,626.000000,533.333333,600.0,400.0,102.000000,102.0,102.0,0,F,white,MARRIED,Private,ENGL,0,0,0,0,1,72.10,167.64,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CSRU,CSRU,CLINIC REFERRAL/PREMATURE,EMERGENCY,0,0,0,235046.0,115784,2907,2188-01-15 18:00:00,2188-01-15 23:30:00,5.5,NaT,NaT,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
9469,36.940000,37.670000,36.330000,36.750000,36.8,36.7,80.000000,81.0,79.0,99.833333,100.0,99.0,14.000000,14.0,14.0,118.666667,139.0,103.0,69.916667,80.0,57.0,87.500000,103.0,72.0,3.194444,3.47150,2.18972,13.166667,15.4,11.9,41.500000,47.6,34.7,1.200000,1.4,1.1,1.20,1.4,1.1,225.0,232.0,217.0,12.100000,12.1,12.1,35.000000,35.0,35.0,12.30,12.3,12.3,6.233333,6.7,5.6,68.50,69.3,68.0,52.000000,54.0,50.0,90.75,90.0,75.0,23.000000,22.0,15.0,3.520000,3.5,3.5,113.000000,113.0,113.0,1.700000,1.8,1.6,3.900000,3.9,3.9,0.70,0.7,0.7,1.1200,1.12,1.12,137.0,137.0,137.0,22.00,22.0,22.0,13.000000,13.0,13.0,5.70,5.5,5.5,138.000000,138.0,138.0,1.750000,1.9,1.5,218.000000,218.0,218.0,38.000000,38.0,38.0,-1.000000,-1.0,-1.0,7.380000,7.38,7.38,453.00,472.0,439.0,67.500000,100.0,50.0,2.791667,4.500000,2.000000,312.499995,349.999987,300.000000,766.666667,800.0,700.0,84.000000,84.0,84.0,0,M,white,SINGLE,Medicare,ENGL,0,1,0,0,1,80.60,170.00,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,CVICU,CVICU,PHYSICIAN REFERRAL,ELECTIVE,0,0,0,274585.0,22392962,18862411,2138-02-19 13:09:00,2138-02-19 16:00:00,3.0,NaT,NaT,
9470,35.431667,37.390000,34.100000,36.537500,37.1,36.0,78.400000,100.0,59.0,99.800000,100.0,98.0,15.500000,25.0,10.0,109.000000,125.0,76.0,58.066667,70.0,41.0,77.200000,91.0,54.0,3.076382,6.09442,1.79558,15.566667,16.1,15.8,44.900000,48.9,41.0,1.416667,1.4,1.4,1.40,1.4,1.4,257.0,258.0,252.0,11.000000,11.5,10.5,33.500000,35.0,32.0,20.30,23.0,18.6,8.750000,8.8,8.6,87.45,88.4,86.0,34.000000,39.0,26.0,59.00,65.0,57.0,17.000000,18.0,17.0,3.100000,4.1,3.4,108.000000,108.0,108.0,2.163158,2.6,1.9,3.780000,3.9,3.5,0.60,0.6,0.6,1.1675,1.27,1.10,137.0,137.0,137.0,24.00,25.0,23.0,14.500000,17.0,12.0,6.50,6.5,6.5,123.250000,138.0,104.0,2.133333,2.6,1.5,186.750000,280.0,134.0,38.000000,43.0,32.0,-0.250000,0.0,-1.0,7.402500,7.46,7.37,416.00,419.0,402.0,63.333333,100.0,60.0,14.381326,26.677310,6.666667,187.500000,150.000000,175.000000,500.000000,500.0,500.0,104.500000,100.0,104.0,0,F,white,MARRIED,Other,ENGL,1,0,0,0,1,67.60,163.00,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,1,0,0,0,0,CVICU,CVICU,PHYSICIAN REFERRAL,ELECTIVE,0,0,1,296735.0,22890957,17196174,2195-04-15 12:00:00,2195-04-15 22:00:00,10.0,NaT,NaT,
9471,36.666667,36.720000,36.610000,36.700000,36.7,36.7,77.416667,86.0,68.0,99.888889,100.0,99.0,16.923077,25.0,14.0,102.916667,120.0,87.0,69.916667,82.0,61.0,82.250000,94.0,72.0,2.094444,2.38756,1.93069,13.500000,13.5,13.5,31.000000,31.0,31.0,1.200000,1.2,1.2,1.20,1.2,1.2,207.0,195.0,204.0,13.500000,13.5,13.5,33.111111,34.0,31.0,11.40,11.4,11.4,12.500000,14.0,12.9,76.00,75.0,76.0,50.000000,58.0,45.0,188.00,233.0,104.0,219.333333,173.0,217.0,0.450000,0.5,0.4,106.000000,106.0,106.0,3.000000,3.8,2.4,4.325000,4.5,4.2,0.70,0.7,0.7,1.2000,1.27,1.15,136.5,137.0,136.0,24.00,24.0,24.0,12.000000,12.0,12.0,6.40,6.4,6.6,131.333333,150.0,120.0,1.100000,1.1,1.1,205.250000,417.0,120.0,47.750000,52.0,43.0,-1.750000,0.0,-3.0,7.315000,7.38,7.29,279.00,285.0,282.0,41.111111,50.0,40.0,3.107415,7.470447,0.166724,300.000000,350.000010,247.000008,750.000000,752.0,700.0,142.000000,142.0,142.0,0,M,white,SINGLE,Other,ENGL,0,0,0,0,1,75.95,169.00,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,CVICU,CVICU,TRANSFER FROM HOSPITAL,URGENT,0,0,0,265628.0,23679187,18771362,2132-02-17 16:21:00,2132-02-18 00:00:00,8.0,NaT,NaT,
9472,37.281667,38.390000,36.100000,37.550000,37.8,37.1,70.294118,80.0,64.0,98.625000,100.0,95.0,22.764706,27.5,17.0,109.470588,128.0,79.0,48.235294,54.0,37.0,67.235294,76.0,50.0,2.407500,3.31395,1.83838,15.900000,15.9,15.9,30.000000,30.0,30.0,1.500000,1.5,1.5,1.50,1.5,1.5,234.0,257.0,212.0,9.400000,9.6,9.2,29.000000,29.0,29.0,12.20,12.2,12.2,16.900000,17.1,16.8,53.00,56.0,53.0,46.666667,51.0,43.0,58.00,57.0,60.0,7.000000,10.0,3.0,0.433333,0.5,0.4,100.333333,103.0,97.0,2.433333,2.6,2.4,4.962500,5.7,3.9,5.20,5.2,5.2,1.1725,1.31,1.09,136.0,138.0,134.0,25.00,25.0,25.0,24.000000,24.0,24.0,5.10,5.1,5.1,114.666667,152.0,91.0,1.550000,1.8,1.3,106.800000,143.0,82.0,42.000000,45.0,40.0,1.600000,4.0,0.0,7.411667,7.45,7.37,473.50,482.0,471.0,40.000000,40.0,40.0,10.000000,10.000000,10.000000,906.000000,906.000000,906.000000,450.000000,450.0,450.0,133.000000,133.0,133.0,0,M,white,DIVORCED,Medicare,ENGL,1,0,0,0,1,84.30,178.00,0,0,1,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,CVICU,CVICU,TRANSFER FROM HOSPITAL,URGENT,0,0,0,362229.0,29365550,19243474,2118-01-29 12:00:00,2118-01-30 00:00:00,12.0,NaT,NaT,


In [46]:
#dfImputed.to_csv('imputed.csv') #allen
dfImputed.to_csv('imputed_m.csv')  #marcel