## Import Libraries

In [1121]:
import pandas as pd
import numpy as np
from sklearn.utils import resample

## Import Tables

In [1122]:
# Doug's Path
diagnoses_icd = pd.read_csv('data/mimic-iv-0.4/hosp/diagnoses_icd.csv.gz', compression='gzip')
d_icd_diagnoses = pd.read_csv('data/mimic-iv-0.4/hosp/d_icd_diagnoses.csv.gz', compression='gzip')
admissions = pd.read_csv('data/mimic-iv-0.4/core/admissions.csv.gz', compression='gzip')
d_labitems = pd.read_csv('data/mimic-iv-0.4/hosp/d_labitems.csv.gz', compression='gzip')

# # Stephen's Path
# path = "D:\\Bootcamp\\MIMIC IV\\"
# admissions = pd.read_csv(path + "core\\admissions.csv.gz", compression='gzip')
# diagnoses_icd = pd.read_csv(path + "hosp\\diagnoses_icd.csv.gz", compression='gzip')
# d_icd_diagnoses = pd.read_csv(path + "hosp\\d_icd_diagnoses.csv.gz", compression='gzip')
# d_labitems = pd.read_csv(path + "hosp\\d_labitems.csv.gz", compression='gzip')

## Pull codes related to Acute Kidney Failure

In [1123]:
# Congestive Heart Failure
# chf_codes = list(map(str, d_icd_diagnoses[(d_icd_diagnoses['long_title'].str.lower().str.contains('congestive')) & (d_icd_diagnoses['long_title'].str.lower().str.contains('heart'))]['icd_code']))

kidney_list = list(d_icd_diagnoses[(d_icd_diagnoses['long_title'].str.lower().str.contains('kidney')) & (d_icd_diagnoses['long_title'].str.lower().str.contains('failure'))]['icd_code'])
pd.DataFrame(diagnoses_icd[diagnoses_icd['icd_code'].isin(kidney_list)].icd_code.value_counts()).reset_index().head(20).merge(d_icd_diagnoses, left_index = True, left_on = "index", right_on = 'icd_code', how = 'left')

# ICD Codes we care about
# 5849, N179, 5845, N170
akf_codes = ['5849   ', 'N179   ', '5845   ', 'N170   ']


## Start filtering down to only records where AKF is True

In [1124]:
diagnoses_icd_akf = diagnoses_icd[diagnoses_icd['icd_code'].isin(akf_codes)]


In [1125]:
diagnoses_icd_akf.head()

Unnamed: 0,subject_id,hadm_id,seq_num,icd_code,icd_version
76,19586042,23279761,2,5849,9
517,16108683,21607477,4,5845,9
537,14411859,24976204,12,5845,9
826,17752053,24437021,2,5849,9
893,16569548,24870770,5,5849,9


## Generate new Admissions table with hospital stay duration and AKF flag

In [1126]:
admissions_akf = admissions[['subject_id', 'hadm_id', 'admittime', 'dischtime', 'ethnicity']]

admissions_akf['AKF_subj'] = np.where(admissions_akf.subject_id.isin(diagnoses_icd_akf.subject_id), 1, 0)
admissions_akf['AKF_adm'] = np.where(admissions_akf.hadm_id.isin(diagnoses_icd_akf.hadm_id), 1, 0)
admissions_akf['time_spent'] = pd.to_datetime(admissions_akf['dischtime']) - pd.to_datetime(admissions_akf['admittime'])


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  This is separate from the ipykernel package so we can avoid doing imports until
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  after removing the cwd from sys.path.
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  """


In [1127]:
admissions_akf.head(10)

Unnamed: 0,subject_id,hadm_id,admittime,dischtime,ethnicity,AKF_subj,AKF_adm,time_spent
0,12427812,21593330,2184-01-06 11:51:00,2184-01-10 11:45:00,UNKNOWN,0,0,3 days 23:54:00
1,14029832,22059088,2120-01-18 01:28:00,2120-01-20 16:13:00,OTHER,0,0,2 days 14:45:00
2,14495017,22484010,2175-01-28 15:41:00,2175-01-29 16:00:00,WHITE,0,0,1 days 00:19:00
3,13676048,23865469,2193-01-19 05:27:00,2193-01-24 18:59:00,WHITE,0,0,5 days 13:32:00
4,13831972,27763544,2131-01-27 04:03:00,2131-01-27 05:39:00,WHITE,0,0,0 days 01:36:00
5,18523038,25414328,2142-08-26 17:14:00,2142-08-27 10:00:00,WHITE,0,0,0 days 16:46:00
6,16705931,20580522,2174-10-24 11:30:00,2174-10-24 18:45:00,WHITE,1,0,0 days 07:15:00
7,19963742,24951506,2171-07-04 15:58:00,2171-07-05 13:37:00,UNKNOWN,0,0,0 days 21:39:00
8,10903424,22568585,2181-01-31 13:09:00,2181-01-31 13:42:00,WHITE,0,0,0 days 00:33:00
9,15030422,21975876,2149-09-21 23:54:00,2149-09-22 03:59:00,WHITE,0,0,0 days 04:05:00


## Sample Target Patients for Modeling

In [1128]:
target_sample = admissions_akf[['subject_id', 'AKF_subj']].drop_duplicates()

target_sample = resample(target_sample, n_samples = 10000, replace = False, stratify = target_sample.AKF_subj, random_state = 0)

print('Number of unique Patients: ', target_sample.subject_id.nunique())
print('\nSample Breakdown:')
print(target_sample.AKF_subj.value_counts())

Number of unique Patients:  10000

Sample Breakdown:
0    8846
1    1154
Name: AKF_subj, dtype: int64


In [1129]:
# identify first akf visit for NON-AKF patients
sample_non = target_sample[target_sample.AKF_subj==0]
admissions_non = admissions[admissions.subject_id.isin(sample_non.subject_id)]
admissions_non['admittime'] = pd.to_datetime(admissions_non.admittime)
first_non = admissions_non.loc[admissions_non.groupby('subject_id').admittime.idxmin()]
# sanity checks
print(first_non.shape)                 # number of rows
print(first_non.subject_id.nunique())  # matches number of patients
print(first_non.hadm_id.nunique())     # matches number of visits

# pull out hospital visits for target non-akf samples
sample_non = sample_non.merge(first_non, how='inner', on='subject_id')
sample_non = sample_non[['subject_id', 'hadm_id', 'AKF_subj']]
sample_non = sample_non.rename({'AKF_subj':'AKF'}, axis=1)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  after removing the cwd from sys.path.


(8846, 15)
8846
8846


In [1130]:
# identify first akf visit for all AKF patients
sample_akf = target_sample[target_sample.AKF_subj==1]
first_akf = admissions_akf[admissions_akf.subject_id.isin(sample_akf.subject_id)]
first_akf['admittime'] = pd.to_datetime(first_akf.admittime)
first_akf = first_akf.loc[first_akf[first_akf.AKF_adm==1].groupby('subject_id').admittime.idxmin()]
first_akf = first_akf[['subject_id', 'hadm_id', 'AKF_adm']]
# sanity checks
print(np.mean(first_akf.AKF_adm))   # make sure everyone has AKF
print(first_akf.shape)                 # make sure number of rows...
print(first_akf.subject_id.nunique())  # ...matches number of patients
print(first_akf.hadm_id.nunique())     # ...matches number of visits

# pull out hospital visits for target akf samples
sample_akf = sample_akf.merge(first_akf, how='inner', on='subject_id')
sample_akf = sample_akf[['subject_id', 'hadm_id', 'AKF_adm']]
sample_akf = sample_akf.rename({'AKF_adm':'AKF'}, axis=1)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  after removing the cwd from sys.path.


1.0
(1154, 3)
1154
1154


In [1131]:
# merge back together and write to file
admissions_sample = pd.concat([sample_akf, sample_non])
admissions_sample = admissions_sample.reset_index(drop=True)
print(admissions_sample.shape)                  # sanity check
print(admissions_sample.subject_id.nunique())   # sanity check

(10000, 3)
10000


Generate pickle file so we all work on the exact same data

In [1132]:
admissions_sample.to_pickle('admissions_sample.pkl')

In [13]:
# admissions_sample = pd.read_pickle("admissions_sample.pkl")

## Pull Chart and Lab data only where it matches our sample patient list

## We have Decided not to use Chart data after exploring it further

In [14]:
# %%time #run this for next time

# chunksize = 3*(10 ** 6)
# counter=0
# chartevents_sample = []
# for chunk in pd.read_csv('data/mimic-iv-0.4/icu/chartevents.csv.gz', compression='gzip', chunksize=chunksize):
#     chartevents_sample.append(chunk[chunk['subject_id'].isin(list(admissions_sample.subject_id))])
#     counter+=1
#     print(f'chunk {counter} processed')

# chartevents_final = pd.concat(chartevents_sample)


In [15]:
# chartevents_final.to_pickle("chartevents_final.pkl")

In [16]:
# chartevents_final = pd.read_pickle("chartevents_final.pkl")

In [17]:
# chartevents_final.shape

(7602370, 10)

Load Lab Events table

In [1133]:
%%time

chunksize = 3*(10 ** 6)
counter=0
lab_events_sample = []
for chunk in pd.read_csv('data/mimic-iv-0.4/hosp/labevents.csv.gz', compression='gzip', chunksize=chunksize):
    lab_events_sample.append(chunk[chunk['subject_id'].isin(list(admissions_sample.subject_id))])
    counter+=1
    print(f'chunk {counter} processed')

lab_events_final = pd.concat(lab_events_sample)
# 3min 52s


chunk 1 processed
chunk 2 processed
chunk 3 processed




chunk 4 processed
chunk 5 processed
chunk 6 processed
chunk 7 processed
chunk 8 processed
chunk 9 processed




chunk 10 processed




chunk 11 processed
chunk 12 processed
chunk 13 processed
chunk 14 processed
chunk 15 processed




chunk 16 processed
chunk 17 processed
chunk 18 processed
chunk 19 processed
chunk 20 processed
chunk 21 processed
chunk 22 processed
chunk 23 processed




chunk 24 processed
chunk 25 processed
chunk 26 processed
chunk 27 processed
chunk 28 processed
chunk 29 processed
chunk 30 processed
chunk 31 processed
chunk 32 processed
chunk 33 processed
chunk 34 processed
chunk 35 processed
chunk 36 processed
chunk 37 processed
chunk 38 processed
chunk 39 processed
chunk 40 processed
chunk 41 processed
CPU times: user 4min 25s, sys: 24.3 s, total: 4min 49s
Wall time: 4min 52s


In [1134]:
# lab_events_final.to_pickle("lab_events_final.pkl")

In [20]:
lab_events_final = pd.read_pickle("lab_events_final.pkl")

In [1135]:
lab_events_final.shape

(4570117, 15)

## Manipulating the Data

Take only records related to our sample patients

Filter lab events based on first hospital visit of our sample population

In [1136]:
admissions_sample = pd.read_pickle("admissions_sample.pkl")

In [1137]:
# lab_events_sampled = lab_events_final.copy()
%time lab_events_sampled = lab_events_final[lab_events_final['hadm_id'].isin(admissions_sample.hadm_id)]


CPU times: user 1.32 s, sys: 913 ms, total: 2.24 s
Wall time: 2.75 s


Check how many patients have had each test done

In [1138]:
lab_events_sampled.groupby('itemid')['subject_id'].nunique().sort_values(ascending = False).head(10)

itemid
51221    6119
51265    6002
51222    5956
51301    5949
51248    5948
51249    5948
51250    5948
51279    5948
51277    5948
50971    5397
Name: subject_id, dtype: int64

Most common tests performed on patients with AKF

In [1139]:
lab_events_sampled[lab_events_sampled['subject_id'].isin(list(admissions_sample[admissions_sample['AKF'] == 1].subject_id))].groupby('itemid')['subject_id'].nunique().sort_values(ascending = False).head(10)


itemid
50912    1140
50971    1139
50902    1138
50983    1138
51006    1138
50882    1137
50868    1137
50931    1136
51221    1135
51265    1134
Name: subject_id, dtype: int64

Item Black List

In [1257]:
item_black_list = [50920]
# 50920 - test results are text in comments - need to come back and figure out how to handle this


Take only the X most commonly performed tests

In [1258]:
top_test_num = 40

lab_events_valid = lab_events_sampled[~lab_events_sampled['itemid'].isin(item_black_list)]

# On patients with AKF
itemid_sub_sample = lab_events_valid[lab_events_valid['subject_id'].isin(list(admissions_sample[admissions_sample['AKF'] == 1].subject_id))].groupby('itemid')['subject_id'].nunique().sort_values(ascending = False).head(top_test_num).reset_index().rename(columns = {'index' : 'itemid'}).itemid.to_list()
# On all sample patients
# itemid_sub_sample = lab_events_sampled.groupby('itemid')['subject_id'].nunique().sort_values(ascending = False).head(top_test_num).reset_index().rename(columns = {'index' : 'itemid'}).itemid.to_list()

lab_events_sampled_sub = lab_events_sampled[lab_events_sampled['itemid'].isin(itemid_sub_sample)]
# lab_events_sampled_sub = lab_events_sampled[lab_events_sampled['itemid'].isin([51466])]

lab_events_sampled_sub


Unnamed: 0,labevent_id,subject_id,hadm_id,specimen_id,itemid,charttime,storetime,value,valuenum,valueuom,ref_range_lower,ref_range_upper,flag,priority,comments
1695,30338499,12455866,24494044.0,13622007,51221,2135-02-16 04:07:00,2135-02-16 04:50:00,34.7,34.7,%,34.0,45.0,,ROUTINE,
1696,30338500,12455866,24494044.0,13622007,51222,2135-02-16 04:07:00,2135-02-16 04:50:00,11.1,11.1,g/dL,11.2,15.7,abnormal,ROUTINE,
1697,30338501,12455866,24494044.0,13622007,51248,2135-02-16 04:07:00,2135-02-16 04:50:00,31.4,31.4,pg,26.0,32.0,,ROUTINE,
1698,30338502,12455866,24494044.0,13622007,51249,2135-02-16 04:07:00,2135-02-16 04:50:00,32.0,32.0,g/dL,32.0,37.0,,ROUTINE,
1699,30338503,12455866,24494044.0,13622007,51250,2135-02-16 04:07:00,2135-02-16 04:50:00,98,98.0,fL,82.0,98.0,,ROUTINE,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
122202390,29500021,12390274,26496227.0,62980950,51275,2183-10-23 06:25:00,2183-10-23 08:14:00,94.6,94.6,sec,22.0,35.0,abnormal,ROUTINE,
122202391,29500022,12390274,26496227.0,80463807,51237,2183-10-24 06:50:00,2183-10-24 08:44:00,2.5,2.5,,0.9,1.1,abnormal,ROUTINE,
122202392,29500023,12390274,26496227.0,80463807,51274,2183-10-24 06:50:00,2183-10-24 08:44:00,26.0,26.0,sec,10.4,13.4,abnormal,ROUTINE,
122202393,29500024,12390274,26496227.0,80463807,51275,2183-10-24 06:50:00,2183-10-24 08:44:00,95.4,95.4,sec,22.0,35.0,abnormal,ROUTINE,


In [1259]:
lab_events_sampled_sub[lab_events_sampled_sub['itemid'] == 50920].comments.value_counts()

Series([], Name: comments, dtype: int64)

## Code to look into specific test values

In [1260]:
# lab_events_sampled_sub.groupby(['subject_id', 'hadm_id', 'itemid']).count()


In [1261]:
lab_events_sampled_sub_tiny = lab_events_sampled_sub[(lab_events_sampled_sub['subject_id'] == 19988493) & (lab_events_sampled_sub['hadm_id'] == 25600709.0) & (lab_events_sampled_sub['itemid'].isin([51237]))]#.valuenum.describe()
# lab_events_sampled_sub.loc[(lab_events_sampled_sub['subject_id'] == 19988493) & (lab_events_sampled_sub['hadm_id'] == 25600709.0) & (lab_events_sampled_sub['itemid'].isin([51478, 51484])),]



In [1262]:
# lab_events_sampled_sub_tiny['comments'] = lab_events_sampled_sub_tiny['comments'].replace(np.nan, 'NA')

lab_events_sampled_sub_tiny


Unnamed: 0,labevent_id,subject_id,hadm_id,specimen_id,itemid,charttime,storetime,value,valuenum,valueuom,ref_range_lower,ref_range_upper,flag,priority,comments
116765206,124205250,19988493,25600709.0,29865343,51237,2116-09-26 23:36:00,2116-09-27 00:26:00,1.1,1.1,,0.9,1.1,,STAT,
116765231,124205276,19988493,25600709.0,1870784,51237,2116-09-27 13:35:00,2116-09-27 14:09:00,1.2,1.2,,0.9,1.1,abnormal,STAT,
116765292,124205338,19988493,25600709.0,57401788,51237,2116-09-28 03:53:00,2116-09-28 05:02:00,1.0,1.0,,0.9,1.1,,ROUTINE,
116765394,124205451,19988493,25600709.0,75955093,51237,2116-09-30 06:20:00,2116-09-30 08:16:00,1.0,1.0,,0.9,1.1,,ROUTINE,


## Special updates for Urine sample tests

In [1263]:
print(lab_events_sampled_sub[(lab_events_sampled_sub['itemid'] == 51484)].value.unique())

print(lab_events_sampled_sub[(lab_events_sampled_sub['itemid'] == 51478)].value.unique())


['10' '40' '150' '80' '15' '50' nan 'TR' 'NEG' '20' '100' ' ']
['100' '300' '250' '70' '1000' '150' nan '200' 'NEG' 'TR' '>1000' '500'
 ' ']


In [1264]:
# lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51237) & (lab_events_sampled_sub['value'].isin(['>21.8', '>19.2', 'ERROR', 'UNABLE TO REPORT'])), ]


In [1265]:
# Other invalid value imputation
# For now set them all to normal/most common value
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51237) & (lab_events_sampled_sub['value'].isin([np.nan, 'ERROR', 'UNABLE TO REPORT'])), ['value', 'valuenum']] = 1.1
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51237) & (lab_events_sampled_sub['value'].isin(['>21.8'])), ['value', 'valuenum']] = 22
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51237) & (lab_events_sampled_sub['value'].isin(['>19.2'])), ['value', 'valuenum']] = 20

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51275) &  (lab_events_sampled_sub['value'].isin(['>150'])), ['value', 'valuenum']] = 175

# Should we just delete these?
# For 5k patients there are 6 records here
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51274) &  (lab_events_sampled_sub['value'].isin(['ERROR'])), ['value', 'valuenum']] = 11

# Should we just delete these?
# For 5k patients there are 1 records here
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51275) &  (lab_events_sampled_sub['value'].isin(['UNABLE TO REPORT'])), ['value', 'valuenum']] = 31

# Clumsy..
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51275) &  (lab_events_sampled_sub['value'].isin(['34..3'])), ['value', 'valuenum']] = 34.3


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self.obj[item] = s


In [1292]:
# Used to investigate bad data

lab_events_sampled_sub[lab_events_sampled_sub['value'] == 'Hazy']


Unnamed: 0,labevent_id,subject_id,hadm_id,specimen_id,itemid,charttime,storetime,value,valuenum,valueuom,ref_range_lower,ref_range_upper,flag,priority,comments
29206683,837862,10071770,20058526.0,43821983,51506,2167-12-06 22:35:00,2167-12-07 00:38:00,Hazy,,,,,,STAT,
29209799,3778019,10308297,27825244.0,21148621,51506,2189-01-23 15:32:00,2189-01-23 15:50:00,Hazy,,,,,,STAT,
29209840,3812668,10312004,28618375.0,27772278,51506,2111-11-08 00:44:00,2111-11-08 01:14:00,Hazy,,,,,,STAT,
29211496,5514860,10455613,27463431.0,69865966,51506,2192-04-12 15:42:00,2192-04-12 16:36:00,Hazy,,,,,,STAT,
29211497,5514877,10455613,27463431.0,31718314,51506,2192-04-12 16:05:00,2192-04-12 16:35:00,Hazy,,,,,,STAT,
29212511,6565399,10543835,29816199.0,12733735,51506,2193-01-19 08:28:00,2193-01-19 09:17:00,Hazy,,,,,,STAT,
29216171,10099394,10831490,25326327.0,33086536,51506,2127-01-20 02:18:00,2127-01-20 02:29:00,Hazy,,,,,,STAT,
29219268,13163543,11071368,26751790.0,7552103,51506,2137-11-14 20:36:00,2137-11-14 21:18:00,Hazy,,,,,,STAT,
29222726,16549016,11343910,26218486.0,65301522,51506,2190-09-07 22:25:00,2190-09-07 22:40:00,Hazy,,,,,,STAT,
29223489,17226732,11398464,27871803.0,19429645,51506,2116-02-20 23:38:00,2116-02-21 00:51:00,Hazy,,,,,,STAT,


In [1315]:
# Used to investigate bad data
pd.set_option('display.max_rows', 200)

# lab_events_sampled_sub[lab_events_sampled_sub['itemid'] == 51237].value.value_counts().reset_index().sort_values(by = 'index')
# lab_events_sampled_sub[lab_events_sampled_sub['itemid'] == 51514][['value', 'comments']].drop_duplicates()
lab_events_sampled_sub[lab_events_sampled_sub['itemid'] == 51506][['flag', 'comments', 'value', 'valuenum', 'ref_range_lower', 'ref_range_upper']].drop_duplicates()


# 51466 - measures blood in urine; value and comments sometimes differ; need to add mapping
# 51486 - same as above, leukocytes in the urine
# 51487 - same as above, nitrite in the urine
# 51464 - same as above, bilirubin in the urine
# 51484 - same as above, ketone in the urine
# 51478 - same as above, glucose in the urine
# 51514 - same as above, urobilinogen in the urine
# 51492 - same as above, protein in the urine
# 51506 - same as above, urine appearance

# lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
# lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0


Unnamed: 0,flag,comments,value,valuenum,ref_range_lower,ref_range_upper
83770,,Clear.,0.0,0.0,,
1149471,,Hazy.,1.0,1.0,,
9637718,,CLEAR.,0.0,0.0,,
9639299,abnormal,Cloudy*.,2.0,2.0,,
9639950,,Cloudy.,2.0,2.0,,
9740128,abnormal,Hazy*.,1.0,1.0,,
29206683,,,1.0,1.0,,
29206684,,,2.0,2.0,,
29206703,,,0.0,0.0,,
29210338,abnormal,,2.0,2.0,,


In [1316]:
%%time

# 51466
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['value'].isin([np.nan])), ['value']] = lab_events_sampled_sub['comments']
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['value'].isin(['NEG.  ', 'NEG', ' '])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['value'].isin(['TR', 'TR.  ', 'TR*.  '])), ['value', 'valuenum']] = 1
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['value'].isin(['SM', 'SM .  ', 'SM*.  '])), ['value', 'valuenum']] = 2
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['value'].isin(['MOD', 'MOD.  ', 'MOD*.  '])), ['value', 'valuenum']] = 3
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['value'].isin(['LG', 'LG.  ', 'LG*.  ', 'LGE'])), ['value', 'valuenum']] = 4

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0

# 51514
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51514) & (lab_events_sampled_sub['value'].isin([np.nan])), ['value']] = lab_events_sampled_sub['comments']
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51514) & (lab_events_sampled_sub['value'].isin(['NEG.  ', 'NEG', 'NORMAL.  ', ' '])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51514) & (lab_events_sampled_sub['value'].isin(['>8'])), ['value', 'valuenum']] = 10
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51514) & (lab_events_sampled_sub['value'].isin(['>12.  '])), ['value', 'valuenum']] = 15

# 51464
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51464) & (lab_events_sampled_sub['value'].isin([np.nan])), ['value']] = lab_events_sampled_sub['comments']
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51464) & (lab_events_sampled_sub['value'].isin(['NEG.  ', 'NEG', ' '])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51464) & (lab_events_sampled_sub['value'].isin(['SM', 'SM .  ', 'SM*.  '])), ['value', 'valuenum']] = 1
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51464) & (lab_events_sampled_sub['value'].isin(['MOD', 'MOD.  ', 'MOD*.  '])), ['value', 'valuenum']] = 2
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51464) & (lab_events_sampled_sub['value'].isin(['LG', 'LG.  ', 'LG*.  ', 'LGE'])), ['value', 'valuenum']] = 3

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51464) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51464) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0

# 51487
# Should Pos be marked abnormal?
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51487) & (lab_events_sampled_sub['value'].isin([np.nan])), ['value']] = lab_events_sampled_sub['comments']
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51487) & (lab_events_sampled_sub['value'].isin(['NEG.  ', 'NEG', ' '])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51487) & (lab_events_sampled_sub['value'].isin(['POS.  ', 'POS', 'POS*.  '])), ['value', 'valuenum']] = 1

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51487) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51487) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0

# 51492
# Should Pos be marked abnormal?
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['value'].isin([np.nan])), ['value']] = lab_events_sampled_sub['comments']
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['value'].isin(['NEG.  ', 'NEG', ' '])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['value'].isin(['TR', 'TR.  ', 'TR*.  '])), ['value', 'valuenum']] = 10
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['value'].str.contains('TR.')), ['value', 'valuenum']] = 10
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['value'].isin(['>300'])), ['value', 'valuenum']] = 350
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['value'].isin(['>600.  ', '>600*.  '])), ['value', 'valuenum']] = 700

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51492) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0

# 51486
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['value'].isin([np.nan])), ['value']] = lab_events_sampled_sub['comments']
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['value'].isin(['NEG.  ', 'NEG', ' '])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['value'].isin(['TR', 'TR.  ', 'TR*.  '])), ['value', 'valuenum']] = 1
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['value'].isin(['SM', 'SM .  ', 'SM*.  '])), ['value', 'valuenum']] = 2
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['value'].isin(['MOD', 'MOD.  ', 'MOD*.  '])), ['value', 'valuenum']] = 3
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['value'].isin(['LG', 'LG.  ', 'LG*.  ', 'LGE'])), ['value', 'valuenum']] = 4

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51486) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0

# 51506
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['value'].isin([np.nan])), ['value']] = lab_events_sampled_sub['comments']
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['value'].isin(['Clear.  ', 'CLEAR.  ', 'Clear', ' '])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['value'].isin(['SlHazy'])), ['value', 'valuenum']] = 0.5
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['value'].isin(['Hazy.  ', 'Hazy*.  ', 'Hazy', 'HAZY', 'HAZY*.  '])), ['value', 'valuenum']] = 1
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['value'].isin(['Cloudy*.  ', 'Cloudy.  ', 'Cloudy', 'CLO', 'CLOUDY'])), ['value', 'valuenum']] = 2

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51506) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  self.obj[item] = s


CPU times: user 3.97 s, sys: 108 ms, total: 4.08 s
Wall time: 4.11 s


In [1269]:
# lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466)]['value'].map({'' : 0.0, 'NEG' : 0.0, 'TR' : 1.0, 'SM' : 2.0, 'MOD' : 3.0, 'LG' : 4.0, 'LGE' : 4.0}).fillna(0.0)
# lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466)]['value']
# = lab_events_sampled_sub['GarageFinish'].map({'NA' : 0.0, 'Unf' : 1.0, 'RFn' : 2.0, 'Fin' : 3.0})


In [1317]:
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51484) & (lab_events_sampled_sub['value'].isin([np.nan, ' ', 'TR', 'NEG'])), ['value', 'valuenum']] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51478) & (lab_events_sampled_sub['value'].isin([np.nan, ' ', 'TR', 'NEG'])), ['value', 'valuenum']] = 0

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51484) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51478) & (lab_events_sampled_sub['ref_range_lower'].isnull()), 'ref_range_lower'] = 0

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51484) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51478) & (lab_events_sampled_sub['ref_range_upper'].isnull()), 'ref_range_upper'] = 0

# What are good replacement values for these?
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51484) & (lab_events_sampled_sub['value'].isin(['>80'])), ['value', 'valuenum']] = 120
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51478) & (lab_events_sampled_sub['value'].isin(['>1000'])), ['value', 'valuenum']] = 1250

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin(['<1.005'])), ['value', 'valuenum']] = 1.000
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin(['<=1.005'])), ['value', 'valuenum']] = 1.000
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin(['>1.030'])), ['value', 'valuenum']] = 1.035
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin(['>1.035'])), ['value', 'valuenum']] = 1.040
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin(['>1.050'])), ['value', 'valuenum']] = 1.055
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin(['>=1.035'])), ['value', 'valuenum']] = 1.040
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin([' '])), ['value', 'valuenum']] = 1.015

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51237) & (lab_events_sampled_sub['value'].isin(['>13.4'])), ['value', 'valuenum']] = 15

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51491) & (lab_events_sampled_sub['value'].isin([' '])), ['value', 'valuenum']] = 6.0

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51498) & (lab_events_sampled_sub['value'].isin(['>1.070'])), ['value', 'valuenum']] = 1.080

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51484) & (lab_events_sampled_sub['value'].astype(float) > 0), 'flag'] = 'abnormal'
lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51478) & (lab_events_sampled_sub['value'].astype(float) > 0), 'flag'] = 'abnormal'

lab_events_sampled_sub.loc[(lab_events_sampled_sub['itemid'] == 51466) & (lab_events_sampled_sub['value'].astype(float) > 0), 'flag'] = 'abnormal'


In [1318]:
# Check on differences between value and valuenum columns

lab_events_sampled_sub.loc[((lab_events_sampled_sub['value'].astype(str) + str('.0')) != lab_events_sampled_sub['valuenum'].astype(str)) & ((lab_events_sampled_sub['value'].astype(str) + str('0')) != lab_events_sampled_sub['valuenum'].astype(str)) & ((lab_events_sampled_sub['value'].astype(str)) != lab_events_sampled_sub['valuenum'].astype(str)) & ((lab_events_sampled_sub['value'].astype(str)) != lab_events_sampled_sub['valuenum'].astype(str) + str('0')) & ((str('0') + lab_events_sampled_sub['value'].astype(str)) != lab_events_sampled_sub['valuenum'].astype(str)), ]


Unnamed: 0,labevent_id,subject_id,hadm_id,specimen_id,itemid,charttime,storetime,value,valuenum,valueuom,ref_range_lower,ref_range_upper,flag,priority,comments
336856,33996144,12745561,20731073.0,57802208,51498,2181-01-08 20:52:00,2181-01-08 20:59:00,1.007,1.007,,1.001,1.035,,STAT,
381840,34543514,12785796,24422068.0,27729972,51498,2169-10-08 21:50:00,2169-10-08 22:32:00,1.007,1.007,,1.001,1.035,,STAT,
459851,35481972,12868507,28608077.0,5597239,51498,2149-02-22 13:08:00,2149-02-22 14:10:00,1.017,1.017,,1.001,1.035,,ROUTINE,
517552,35979020,12907424,25601761.0,54048977,51498,2117-10-22 11:08:00,2117-10-22 12:41:00,1.009,1.009,,1.001,1.035,,STAT,
565211,36414065,12945367,26553474.0,47170199,51498,2166-07-20 03:28:00,2166-07-20 04:29:00,1.019,1.019,,1.001,1.035,,ROUTINE,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
120951761,16272155,11319328,29695432.0,17340353,51498,2142-06-18 22:06:00,2142-06-18 22:43:00,1.017,1.017,,1.001,1.035,,STAT,
121164400,18401469,11500075,29528054.0,53881996,51498,2130-02-06 23:57:00,2130-02-07 04:10:00,1.027,1.027,,1.001,1.035,,ROUTINE,
121405813,20996771,11706286,26677566.0,76625408,51498,2200-12-20 11:41:00,2200-12-20 12:02:00,1.017,1.017,,1.001,1.035,,ROUTINE,
121517405,22034085,11791735,26645051.0,65960542,51498,2181-02-22 10:03:00,2181-02-22 10:46:00,1.019,1.019,,1.001,1.035,,ROUTINE,


In [1200]:
# lab_events_sampled_sub.loc[(lab_events_sampled_sub['subject_id'] == 19988493) & (lab_events_sampled_sub['hadm_id'] == 25600709.0) & (lab_events_sampled_sub['itemid'].isin([51478, 51484])),]


## Get Aggregate Test Values

In [1319]:
%time lab_events_sampled_sub_grouped = lab_events_sampled_sub.groupby(['subject_id', 'hadm_id', 'itemid']).agg({'itemid' : ['count'], 'valuenum' : ['min', 'max', 'mean'], 'flag' : ['count'], 'ref_range_lower' : ['min'], 'ref_range_upper' : ['min']})
# 'comments' : ['unique'], 


CPU times: user 299 ms, sys: 41.4 ms, total: 341 ms
Wall time: 341 ms


In [1320]:
lab_events_sampled_sub_grouped.reset_index(inplace = True)
lab_events_sampled_sub_grouped.columns = ['subject_id', 'hadm_id', 'itemid', 'count', 'min', 'max', 'mean', 'abn_percent', 'range_min', 'range_max']
# 'comments', 


In [1321]:
# lab_events_sampled_sub_grouped[lab_events_sampled_sub_grouped['itemid'] == 51221]

missing_vals = lab_events_sampled_sub_grouped.isnull().sum(axis = 0) 
missing_vals[missing_vals > 0].sort_values()

min     84
max     84
mean    84
dtype: int64

In [1322]:
lab_events_sampled_sub_grouped['below_min'] = np.where(lab_events_sampled_sub_grouped['min'] < lab_events_sampled_sub_grouped['range_min'], lab_events_sampled_sub_grouped['range_min'] - lab_events_sampled_sub_grouped['min'], 0)
lab_events_sampled_sub_grouped['above_max'] = np.where(lab_events_sampled_sub_grouped['max'] > lab_events_sampled_sub_grouped['range_max'], lab_events_sampled_sub_grouped['max'] - lab_events_sampled_sub_grouped['range_max'], 0)
lab_events_sampled_sub_grouped['abn_percent'] = lab_events_sampled_sub_grouped['abn_percent'] / lab_events_sampled_sub_grouped['count']


In [1323]:
lab_events_sampled_sub_grouped

Unnamed: 0,subject_id,hadm_id,itemid,count,min,max,mean,abn_percent,range_min,range_max,below_min,above_max
0,10001877,21320596.0,50868,2,11.00,13.00,12.000,0.0,8.0,20.0,0.00,0.0
1,10001877,21320596.0,50882,2,28.00,32.00,30.000,0.0,22.0,32.0,0.00,0.0
2,10001877,21320596.0,50902,2,103.00,106.00,104.500,0.0,96.0,108.0,0.00,0.0
3,10001877,21320596.0,50912,2,1.30,1.40,1.350,1.0,0.5,1.2,0.00,0.2
4,10001877,21320596.0,50931,1,116.00,116.00,116.000,1.0,70.0,100.0,0.00,16.0
...,...,...,...,...,...,...,...,...,...,...,...,...
163150,19999565,20486927.0,51250,2,90.00,91.00,90.500,0.0,82.0,98.0,0.00,0.0
163151,19999565,20486927.0,51265,2,320.00,354.00,337.000,0.0,150.0,440.0,0.00,0.0
163152,19999565,20486927.0,51277,2,12.90,13.30,13.100,0.0,10.5,15.5,0.00,0.0
163153,19999565,20486927.0,51279,2,3.33,3.98,3.655,1.0,4.2,5.4,0.87,0.0


## Merge Admissions data so we can group by ethnicity/gender to grab average range min and max

In [46]:
# Here is where we merge Admissions

# lab_events_sampled_sub_grouped.merge(d_icd_diagnoses, left_index = True, left_on = "index", right_on = 'icd_code', how = 'left')


In [1324]:
# For now aggregate all patients together

lab_range_min_max = lab_events_sampled_sub_grouped.groupby('itemid').agg({'range_min' : 'mean', 'range_max' : 'mean'})
lab_range_min_max.reset_index(inplace = True)

lab_range_dic = dict(zip(lab_range_min_max['itemid'], zip(lab_range_min_max['range_min'], lab_range_min_max['range_max'])))
lab_range_dic


{50861: (0.0, 40.0),
 50863: (37.513502285002076, 126.29663481512256),
 50868: (8.372040586245772, 19.560315670800453),
 50878: (0.0, 40.0),
 50882: (22.0, 32.0),
 50885: (0.0, 4.160468031759298),
 50893: (8.40543572044939, 10.289322691976224),
 50902: (96.0, 108.0),
 50912: (0.44546661608499916, 1.1454666160849576),
 50931: (69.89815902859381, 100.82941637289463),
 50960: (1.5984241908008092, 2.5936967632029453),
 50970: (2.7192450360027816, 4.530045821514294),
 50971: (3.3293866963124787, 5.144080044468837),
 50983: (133.36922503725782, 145.36922503725782),
 51006: (6.0, 20.0),
 51146: (0.0, 1.588577291381669),
 51221: (37.32194803072397, 49.36509233534891),
 51222: (12.54833781061071, 16.729415715245025),
 51237: (0.9000000000000562, 1.0999999999999375),
 51244: (20.01812585499316, 48.47127222982216),
 51248: (26.296065904505717, 31.90652320107599),
 51249: (31.32901815736382, 35.65803631472764),
 51250: (81.62609280430397, 98.37390719569603),
 51265: (150.0, 425.1449516827724),
 51

Pivot the table so we have feature columns related to test results

In [1207]:
lab_events_sampled_sub_grouped[lab_events_sampled_sub_grouped['hadm_id'] == 23248240.0]

Unnamed: 0,subject_id,hadm_id,itemid,count,min,max,mean,abn_percent,range_min,range_max,below_min,above_max


In [1325]:
lab_events_sampled_sub_grouped['new_index'] = list(zip(lab_events_sampled_sub_grouped['subject_id'], lab_events_sampled_sub_grouped['hadm_id']))


In [1326]:
%time lab_events_sampled_pivot = lab_events_sampled_sub_grouped.pivot(index = 'new_index', columns = 'itemid', values = ['min', 'max', 'mean', 'abn_percent', 'below_min', 'above_max'])
# 'comments', 


CPU times: user 78.7 ms, sys: 15.3 ms, total: 93.9 ms
Wall time: 96 ms


In [1327]:
pd.options.display.max_columns = 500

lab_events_sampled_pivot = lab_events_sampled_pivot.reset_index()
lab_events_sampled_pivot['subject_id'], lab_events_sampled_pivot['hadm_id'] = zip(*lab_events_sampled_pivot['new_index'])
lab_events_sampled_pivot.drop(['new_index'], axis = 1, inplace = True)


  obj = obj._drop_axis(labels, axis, level=level, errors=errors)


In [52]:
# missing_vals = lab_events_sampled_pivot.isnull().sum(axis = 0) 
# missing_vals[missing_vals > 0].sort_values()

## Start Data Imputation

Copy table, retain original for Random Forest

In [1328]:
lab_events_impute = lab_events_sampled_pivot.copy()

In [54]:
# lab_events_sampled_pivot = lab_events_impute

In [55]:
# d_labitems = pd.read_csv('data/mimic-iv-0.4/hosp/d_labitems.csv.gz', compression='gzip')


In [1329]:
# lab_events_impute.columns

d_labitems[d_labitems['itemid'].isin(itemid_sub_sample)]

Unnamed: 0,itemid,label,fluid,category,loinc_code
52,50861,Alanine Aminotransferase (ALT),Blood,Chemistry,1742-6
76,50863,Alkaline Phosphatase,Blood,Chemistry,6768-6
115,50868,Anion Gap,Blood,Chemistry,1863-0
153,50878,Asparate Aminotransferase (AST),Blood,Chemistry,1920-8
190,51146,Basophils,Blood,Hematology,704-7
212,50882,Bicarbonate,Blood,Chemistry,1963-8
222,51464,Bilirubin,Urine,Hematology,5770-3
229,50885,"Bilirubin, Total",Blood,Chemistry,1975-2
258,51466,Blood,Urine,Hematology,
282,50893,"Calcium, Total",Blood,Chemistry,2000-8


In [1332]:
%%time

np.random.seed(0)

for labitem in lab_range_dic:
    for ind in lab_events_sampled_pivot[lab_events_sampled_pivot[('mean', labitem)].isnull()].index:
        val_max = lab_range_dic[labitem][1]
        val_min = lab_range_dic[labitem][0]

        val_ave = (val_max + val_min) / 2
        val_std = (val_max - val_ave) * .333

        ran_vals = np.random.normal(val_ave, val_std, 50)
        impute_min = min(ran_vals)
        impute_max = max(ran_vals)
        impute_mean = np.mean(ran_vals)
        
        val_min = lab_events_sampled_pivot[('min', labitem)][ind]
        val_max = lab_events_sampled_pivot[('max', labitem)][ind]
        val_mean = lab_events_sampled_pivot[('mean', labitem)][ind]
        
        lab_events_sampled_pivot[('min', labitem)][ind] = np.where(np.isnan(val_min), impute_min, val_min)
        lab_events_sampled_pivot[('max', labitem)][ind] = np.where(np.isnan(val_max), impute_max, val_max)
        lab_events_sampled_pivot[('mean', labitem)][ind] = np.where(np.isnan(val_mean), impute_mean, val_mean)
#         patient[('mean', labitem)].replace(np.nan, impute_mean)
#         patient[('abn_count', labitem)].replace(np.nan, 0)
# 5k patients
# 10 items - 2.5s
# 20 items - 6s
# 30 items - 28.6s

# 10k patients
# 40 items - 1m 34s

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy


CPU times: user 1min 33s, sys: 621 ms, total: 1min 33s
Wall time: 1min 34s


In [1333]:
for lab_itemid in lab_range_dic:
    lab_events_sampled_pivot[( 'above_max', lab_itemid)] = lab_events_sampled_pivot[( 'above_max', lab_itemid)].replace(np.nan, 0)
    lab_events_sampled_pivot[( 'below_min', lab_itemid)] = lab_events_sampled_pivot[( 'below_min', lab_itemid)].replace(np.nan, 0)
    lab_events_sampled_pivot[( 'abn_percent', lab_itemid)] = lab_events_sampled_pivot[( 'abn_percent', lab_itemid)].replace(np.nan, 0)
#     lab_events_sampled_pivot[( 'comments', lab_itemid)] = lab_events_sampled_pivot[( 'comments', lab_itemid)].replace(np.nan, np.array(np.nan))


In [1334]:
missing_vals = lab_events_sampled_pivot.isnull().sum(axis = 0) 
missing_vals[missing_vals > 0].sort_values()

Series([], dtype: int64)

In [1335]:
lab_events_sampled_pivot

Unnamed: 0_level_0,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,subject_id,hadm_id
itemid,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,Unnamed: 241_level_1,Unnamed: 242_level_1
0,2.997088,51.875587,11.000000,7.192662,28.000000,-0.030222,8.712124,103.000000,1.300000,116.000000,1.720807,2.909850,3.500000,140.000000,40.000000,0.390133,39.300000,12.900000,2.900000,22.769974,31.500000,32.900000,96.000000,95.000000,29.400000,35.500000,14.600000,4.100000,4.900000,0.0,0.0,0.0,0.0,0.0,0.0,5.458682,0.0,1.004187,0.0,0.253369,35.116566,107.659947,13.000000,36.444315,32.000000,3.243196,9.972855,106.000000,1.400000,116.000000,2.519348,4.152207,3.600000,145.000000,47.000000,1.322023,39.300000,12.900000,3.000000,44.175318,31.500000,32.900000,96.000000,95.000000,30.600000,35.500000,14.600000,4.100000,4.900000,0.0,0.0,0.0,0.0,0.0,0.0,7.813433,0.0,1.029526,0.0,0.919134,20.936125,82.895319,12.000000,20.170673,30.000000,2.100599,9.414059,104.500000,1.350000,116.000000,2.068347,3.585984,3.550000,142.500000,43.500000,0.818097,39.300000,12.900000,2.950000,33.768759,31.500000,32.900000,96.000000,95.000000,30.000000,35.500000,14.600000,4.100000,4.900000,0.0,0.0,0.0,0.0,0.0,0.0,6.451515,0.0,1.017424,0.0,0.608275,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.000000,0.000,0.0,0.00,0.0,1.000000,0.0,1.00,1.0,1.0,0.0,0.0,0.000000,0.0,1.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.7,1.1,0.0,0.0,0.0,0.0,0.0,55.0,0.0,0.0,0.0,0.50,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.2,16.0,0.0,0.0,0.0,0.0,27.0,0.0,0.0,0.0,1.9,0.0,0.0,0.0,0.0,0.0,17.2,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10001877,21320596.0
1,8.502958,42.563595,10.193396,3.329270,24.033822,9.500000,8.849326,97.341420,0.555639,71.902029,1.735081,3.079829,3.602654,134.225802,7.276216,0.199821,39.464173,13.487843,0.906960,24.327817,26.762869,31.574106,80.745531,199.690059,10.097198,26.580360,11.441106,4.344073,5.333141,0.0,0.0,0.0,0.0,0.0,0.0,5.752620,0.0,1.005363,0.0,0.289124,32.626622,113.369253,17.922574,34.519860,30.749347,9.500000,10.289063,107.197838,1.009893,97.083726,2.590251,4.147307,4.770449,144.222954,17.214012,1.233413,47.605115,16.049808,1.067653,48.720870,30.868970,34.908220,94.673671,396.003821,12.475355,34.342181,14.765301,5.588843,10.342467,0.0,0.0,0.0,0.0,0.0,0.0,7.510084,0.0,1.031955,0.0,0.804833,19.860518,82.902413,14.133664,20.863701,27.310695,9.500000,9.322523,101.935952,0.777818,84.950583,2.091110,3.645794,4.226222,138.849958,12.733493,0.766628,43.948501,14.639790,0.993173,34.235197,29.130385,33.377137,89.074325,291.329743,11.230896,30.430946,12.920632,5.036211,7.596984,0.0,0.0,0.0,0.0,0.0,0.0,6.543635,0.0,1.018809,0.0,0.588818,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10002305,29924799.0
2,10.068224,45.124179,10.000000,6.207528,23.000000,0.134158,7.700000,103.000000,0.700000,78.000000,1.500000,1.500000,3.600000,135.000000,17.000000,0.293749,34.600000,11.800000,1.300000,19.710321,29.400000,34.100000,86.000000,215.000000,14.800000,32.200000,13.700000,4.010000,11.300000,0.0,0.0,0.0,0.0,0.0,0.0,5.388687,0.0,0.999706,0.0,0.367356,35.871744,116.273930,14.000000,33.587622,27.000000,3.990090,8.200000,106.000000,0.900000,131.000000,2.400000,3.600000,4.600000,141.000000,24.000000,1.343694,39.200000,13.600000,1.300000,42.518730,30.300000,35.300000,87.000000,414.000000,14.800000,32.200000,14.200000,4.560000,15.600000,0.0,0.0,0.0,0.0,0.0,0.0,7.710818,0.0,1.033396,0.0,0.829843,21.708522,84.468800,12.714286,21.270116,25.428571,2.175172,8.014286,104.750000,0.800000,101.857143,1.950000,2.466667,4.125000,138.500000,20.285714,0.802675,37.262500,12.814286,1.300000,33.512477,29.771429,34.585714,86.142857,291.857143,14.800000,32.200000,13.842857,4.300000,13.142857,0.0,0.0,0.0,0.0,0.0,0.0,6.593207,0.0,1.019267,0.0,0.598061,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.428571,0.125,0.5,0.00,0.0,0.428571,0.0,1.00,1.0,1.0,0.0,0.0,0.285714,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.7,0.0,0.0,0.0,0.1,1.2,0.0,0.0,0.0,0.0,5.4,2.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.59,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,31.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.2,0.0,0.0,0.3,0.0,0.0,1.4,0.0,0.0,0.0,4.6,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10003046,26048429.0
3,5.192135,46.960747,10.285499,7.885413,23.519880,7.000000,8.571769,97.662939,0.546662,73.690120,1.711040,3.021489,3.497371,132.807198,8.349347,0.330113,39.397553,12.860433,0.943063,21.112103,26.958905,31.332047,84.588624,136.373125,10.222489,26.746379,11.482002,4.416524,4.961947,0.0,0.0,0.0,0.0,0.0,0.0,5.485266,0.0,1.007352,0.0,0.294764,34.407151,117.746618,17.590545,31.647699,30.219652,7.000000,10.075479,105.486049,1.016000,96.310622,2.623454,4.385983,4.833780,144.094278,19.795792,1.557683,48.666197,15.920874,1.049453,44.981012,31.487523,34.810884,97.883102,354.804109,12.419864,33.814800,14.358810,5.577389,9.493844,0.0,0.0,0.0,0.0,0.0,0.0,7.476731,0.0,1.027497,0.0,0.932848,19.383891,82.213672,14.015614,20.726256,26.526470,7.000000,9.381088,102.146848,0.815436,85.520123,2.124743,3.669531,4.174752,139.380182,13.438019,0.801909,43.246255,14.620847,0.991510,34.270489,29.242339,33.440477,89.881860,272.539297,11.233248,29.810369,13.030749,4.991010,7.549923,0.0,0.0,0.0,0.0,0.0,0.0,6.471691,0.0,1.017066,0.0,0.600110,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10003619,22029522.0
4,6.213900,38.967323,9.665789,-5.968614,23.368636,9.100000,8.715162,98.577412,0.567741,73.373483,1.823347,2.865983,3.523774,135.817396,7.949785,0.413042,36.929292,13.047198,0.909149,26.195502,27.077019,31.592700,85.221055,148.943883,9.973353,23.527726,11.056237,4.408653,4.581118,0.0,0.0,0.0,0.0,0.0,0.0,5.641294,0.0,1.006180,0.0,0.416629,35.046998,108.382078,17.442492,32.004954,32.276601,9.100000,10.212273,106.649646,1.065124,93.109747,2.568620,4.143643,5.026288,144.459133,19.485053,1.334336,47.576082,17.612370,1.056959,43.341469,31.018576,35.449698,97.230070,414.837140,12.541499,34.448200,14.383967,5.439404,10.334049,0.0,0.0,0.0,0.0,0.0,0.0,7.675755,0.0,1.027870,0.0,0.950611,19.169242,78.287915,13.647137,18.238603,27.178056,9.100000,9.396506,102.623303,0.813325,85.420539,2.143240,3.589295,4.280528,139.599349,12.607573,0.823044,43.004801,14.728392,0.999509,34.334367,29.051363,33.447208,89.735927,276.650764,11.292039,29.851395,12.918443,4.979181,7.500039,0.0,0.0,0.0,0.0,0.0,0.0,6.445369,0.0,1.018689,0.0,0.658282,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10003939,22561709.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8109,6.416863,51.625240,9.681436,10.373504,23.510786,5.900000,8.270673,97.266194,0.519337,72.999882,1.655599,2.873887,3.625218,134.687267,8.662937,0.135768,38.812549,13.079045,0.940601,27.073886,27.139609,32.234841,82.105933,172.711736,10.268260,24.536180,11.080318,4.314118,3.484800,0.0,0.0,0.0,0.0,0.0,0.0,5.124408,0.0,1.009482,0.0,0.265568,31.421360,122.045011,18.802476,34.682301,31.002901,5.900000,10.002229,105.913992,1.047043,96.999959,2.492746,4.222231,4.876310,142.945095,17.968089,1.366485,47.247595,16.740744,1.084053,43.997687,30.840806,35.441410,96.676333,380.543192,12.676653,35.310368,14.899079,5.485214,11.052365,0.0,0.0,0.0,0.0,0.0,0.0,7.517992,0.0,1.031913,0.0,0.897921,18.651249,85.155625,14.453087,22.082737,27.167588,5.900000,9.311518,102.006612,0.774500,85.668451,2.102091,3.571794,4.259626,139.379366,12.501138,0.810273,43.218617,14.645108,1.006120,34.117331,28.946836,33.562173,89.405157,285.633693,11.205778,29.956128,12.906096,4.993155,7.871360,0.0,0.0,0.0,0.0,0.0,0.0,6.457806,0.0,1.018112,0.0,0.584025,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19992732,26054225.0
8110,2.647704,46.201928,15.000000,3.026479,25.000000,0.478166,9.000000,106.000000,0.900000,106.000000,2.300000,4.200000,4.300000,142.000000,14.000000,-0.077239,43.800000,14.700000,0.917266,26.532383,28.900000,33.600000,86.000000,181.000000,10.342111,26.459899,15.000000,5.080000,6.600000,0.0,0.0,0.0,0.0,0.0,0.0,4.895399,0.0,0.994633,0.0,0.373001,34.996085,109.545270,15.000000,33.300532,25.000000,3.269628,9.000000,106.000000,0.900000,106.000000,2.300000,4.200000,4.300000,142.000000,14.000000,1.254840,43.800000,14.700000,1.076884,43.058540,28.900000,33.600000,86.000000,181.000000,12.315285,34.563190,15.000000,5.080000,6.600000,0.0,0.0,0.0,0.0,0.0,0.0,7.276665,0.0,1.028252,0.0,0.848010,20.015116,85.308048,15.000000,19.473612,25.000000,1.945947,9.000000,106.000000,0.900000,106.000000,2.300000,4.200000,4.300000,142.000000,14.000000,0.823788,43.800000,14.700000,1.003315,34.690025,28.900000,33.600000,86.000000,181.000000,11.300130,30.079784,15.000000,5.080000,6.600000,0.0,0.0,0.0,0.0,0.0,0.0,6.430284,0.0,1.018342,0.0,0.627433,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19993501,29469659.0
8111,2.107809,49.482091,9.512278,3.506271,22.796961,8.100000,8.611315,98.796909,0.377824,73.245093,1.784712,2.844369,3.792310,135.306818,8.838752,0.337455,39.960258,13.267441,0.912956,23.237294,26.750093,32.055179,83.256674,179.775561,10.212243,25.262227,11.397791,4.572239,5.287445,0.0,0.0,0.0,0.0,0.0,0.0,5.263032,0.0,1.003079,0.0,0.294892,38.483430,115.147427,19.353132,30.966201,29.820915,8.100000,9.899158,104.993242,1.005288,96.191956,2.567219,4.151670,4.966684,143.664262,17.519976,1.428553,47.883590,15.985655,1.090858,46.114719,31.308057,34.976675,97.809682,378.234164,12.227934,33.759630,15.112118,5.548716,10.359374,0.0,0.0,0.0,0.0,0.0,0.0,7.383318,0.0,1.028776,0.0,0.823796,19.627579,85.132792,13.868937,19.832656,26.401906,8.100000,9.333959,101.732765,0.805182,85.623946,2.089200,3.607557,4.243464,139.445306,13.201811,0.741716,43.373549,14.657867,0.990615,34.422652,29.093080,33.517320,89.922277,285.728675,11.204807,29.915370,13.142710,5.006642,7.710596,0.0,0.0,0.0,0.0,0.0,0.0,6.403438,0.0,1.017003,0.0,0.589674,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19993967,21550111.0
8112,27.000000,211.000000,11.000000,27.000000,29.000000,1.200000,8.400000,97.000000,1.000000,90.000000,2.000000,3.300000,3.900000,135.000000,16.000000,0.200000,44.400000,14.000000,1.100000,24.200000,26.200000,31.200000,83.000000,321.000000,12.200000,30.700000,14.200000,5.320000,6.100000,0.0,0.0,0.0,0.0,0.0,0.0,5.282076,0.0,1.007125,0.0,0.244298,27.000000,211.000000,14.000000,27.000000,35.000000,1.200000,8.800000,99.000000,1.100000,109.000000,2.100000,4.000000,5.300000,141.000000,21.000000,0.200000,48.800000,15.200000,1.100000,24.200000,26.500000,31.900000,84.000000,355.000000,12.200000,30.700000,14.600000,5.810000,7.700000,0.0,0.0,0.0,0.0,0.0,0.0,7.307679,0.0,1.029810,0.0,0.836206,27.000000,211.000000,12.750000,27.000000,31.750000,1.200000,8.566667,98.000000,1.025000,96.250000,2.066667,3.666667,4.400000,138.250000,18.000000,0.200000,46.100000,14.525000,1.100000,24.200000,26.350000,31.550000,83.750000,335.250000,12.200000,30.700000,14.450000,5.515000,7.100000,0.0,0.0,0.0,0.0,0.0,0.0,6.423791,0.0,1.018455,0.0,0.588578,0.0,1.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.250000,0.000,0.0,0.25,0.0,0.250000,0.0,0.00,0.0,0.0,0.0,1.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.8,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,81.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,9.0,0.0,0.0,0.2,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19995127,21801907.0


In [1336]:
lab_events_impute_KNN = lab_events_impute.copy()

In [1337]:
lab_events_impute_KNN

Unnamed: 0_level_0,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,subject_id,hadm_id
itemid,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,Unnamed: 241_level_1,Unnamed: 242_level_1
0,,,11.0,,28.0,,,103.0,1.3,116.0,,,3.5,140.0,40.0,,39.3,12.9,2.9,,31.5,32.9,96.0,95.0,29.4,35.5,14.6,4.10,4.9,,,,,,,,,,,,,,13.0,,32.0,,,106.0,1.4,116.0,,,3.6,145.0,47.0,,39.3,12.9,3.0,,31.5,32.9,96.0,95.0,30.6,35.5,14.6,4.10,4.9,,,,,,,,,,,,,,12.000000,,30.000000,,,104.50,1.350,116.000000,,,3.550,142.50,43.500000,,39.3000,12.900000,2.95,,31.500000,32.900000,96.000000,95.000000,30.0,35.5,14.600000,4.100,4.900000,,,,,,,,,,,,,,0.0,,0.0,,,0.0,1.0,1.000000,,,0.00,0.0,1.000000,,1.00,1.0,1.0,,0.0,0.000000,0.0,1.0,1.0,1.0,0.0,1.0,0.0,,,,,,,,,,,,,,0.0,,0.0,,,0.0,0.0,0.0,,,0.0,0.0,0.0,,0.7,1.1,0.0,,0.0,0.0,0.0,55.0,0.0,0.0,0.0,0.50,0.0,,,,,,,,,,,,,,0.0,,0.0,,,0.0,0.2,16.0,,,0.0,0.0,27.0,,0.0,0.0,1.9,,0.0,0.0,0.0,0.0,17.2,0.5,0.0,0.0,0.0,,,,,,,,,,,,10001877,21320596.0
1,,,,,,9.5,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,9.5,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,9.5,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.5,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10002305,29924799.0
2,,,10.0,,23.0,,7.7,103.0,0.7,78.0,1.5,1.5,3.6,135.0,17.0,,34.6,11.8,1.3,,29.4,34.1,86.0,215.0,14.8,32.2,13.7,4.01,11.3,,,,,,,,,,,,,,14.0,,27.0,,8.2,106.0,0.9,131.0,2.4,3.6,4.6,141.0,24.0,,39.2,13.6,1.3,,30.3,35.3,87.0,414.0,14.8,32.2,14.2,4.56,15.6,,,,,,,,,,,,,,12.714286,,25.428571,,8.014286,104.75,0.800,101.857143,1.950000,2.466667,4.125,138.50,20.285714,,37.2625,12.814286,1.30,,29.771429,34.585714,86.142857,291.857143,14.8,32.2,13.842857,4.300,13.142857,,,,,,,,,,,,,,0.0,,0.0,,1.0,0.0,0.0,0.428571,0.125,0.5,0.00,0.0,0.428571,,1.00,1.0,1.0,,0.0,0.285714,0.0,0.0,1.0,0.0,0.0,1.0,1.0,,,,,,,,,,,,,,0.0,,0.0,,0.7,0.0,0.0,0.0,0.1,1.2,0.0,0.0,0.0,,5.4,2.2,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.59,0.0,,,,,,,,,,,,,,0.0,,0.0,,0.0,0.0,0.0,31.0,0.0,0.0,0.0,0.0,4.0,,0.0,0.0,0.2,,0.0,0.3,0.0,0.0,1.4,0.0,0.0,0.0,4.6,,,,,,,,,,,,10003046,26048429.0
3,,,,,,7.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,7.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,7.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10003619,22029522.0
4,,,,,,9.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,9.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,9.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,2.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,10003939,22561709.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8109,,,,,,5.9,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,5.9,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,5.9,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,19992732,26054225.0
8110,,,15.0,,25.0,,9.0,106.0,0.9,106.0,2.3,4.2,4.3,142.0,14.0,,43.8,14.7,,,28.9,33.6,86.0,181.0,,,15.0,5.08,6.6,,,,,,,,,,,,,,15.0,,25.0,,9.0,106.0,0.9,106.0,2.3,4.2,4.3,142.0,14.0,,43.8,14.7,,,28.9,33.6,86.0,181.0,,,15.0,5.08,6.6,,,,,,,,,,,,,,15.000000,,25.000000,,9.000000,106.00,0.900,106.000000,2.300000,4.200000,4.300,142.00,14.000000,,43.8000,14.700000,,,28.900000,33.600000,86.000000,181.000000,,,15.000000,5.080,6.600000,,,,,,,,,,,,,,0.0,,0.0,,0.0,0.0,0.0,1.000000,0.000,0.0,0.00,0.0,0.000000,,0.00,0.0,,,0.0,0.000000,0.0,0.0,,,0.0,0.0,0.0,,,,,,,,,,,,,,0.0,,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.0,0.0,0.0,0.0,,,0.0,0.00,0.0,,,,,,,,,,,,,,0.0,,0.0,,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,,0.0,0.0,,,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,,,,,,,,,,,,19993501,29469659.0
8111,,,,,,8.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,8.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,8.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,1.1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,19993967,21550111.0
8112,27.0,211.0,11.0,27.0,29.0,1.2,8.4,97.0,1.0,90.0,2.0,3.3,3.9,135.0,16.0,0.2,44.4,14.0,1.1,24.2,26.2,31.2,83.0,321.0,12.2,30.7,14.2,5.32,6.1,,,,,,,,,,,,27.0,211.0,14.0,27.0,35.0,1.2,8.8,99.0,1.1,109.0,2.1,4.0,5.3,141.0,21.0,0.2,48.8,15.2,1.1,24.2,26.5,31.9,84.0,355.0,12.2,30.7,14.6,5.81,7.7,,,,,,,,,,,,27.0,211.0,12.750000,27.0,31.750000,1.2,8.566667,98.00,1.025,96.250000,2.066667,3.666667,4.400,138.25,18.000000,0.2,46.1000,14.525000,1.10,24.2,26.350000,31.550000,83.750000,335.250000,12.2,30.7,14.450000,5.515,7.100000,,,,,,,,,,,,0.0,1.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.250000,0.000,0.0,0.25,0.0,0.250000,0.0,0.00,0.0,0.0,0.0,1.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.8,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,,,,,,,,,,,,0.0,81.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,9.0,0.0,0.0,0.2,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,19995127,21801907.0


In [1338]:
missing_vals = lab_events_impute_KNN.isnull().sum(axis = 0) 
missing_vals[missing_vals > 0].sort_values()

             itemid
above_max    51221     1995
below_min    51221     1995
abn_percent  51221     1995
max          51221     1996
mean         51221     1996
                       ... 
abn_percent  51466     5872
above_max    51514     5872
min          51498     5900
mean         51498     5900
max          51498     5900
Length: 240, dtype: int64

In [1339]:
%%time

from sklearn.impute import KNNImputer
imputer = KNNImputer(n_neighbors=10)
lab_events_impute_KNN_imputed = imputer.fit_transform(lab_events_impute_KNN)

# 3min 8s

CPU times: user 2min 41s, sys: 30.5 s, total: 3min 12s
Wall time: 3min 8s


In [1340]:
lab_events_impute_KNN_imputed = pd.DataFrame(lab_events_impute_KNN_imputed)
lab_events_impute_KNN_imputed.columns = lab_events_impute_KNN.columns
lab_events_impute_KNN_imputed

Unnamed: 0_level_0,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,subject_id,hadm_id
itemid,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,Unnamed: 241_level_1,Unnamed: 242_level_1
0,25.8,77.0,11.0,49.4,28.0,2.76,7.80,103.0,1.30,116.0,1.80,2.37,3.50,140.0,40.0,0.16,39.30,12.90,2.90,17.32,31.50,32.90,96.0,95.0,29.40,35.50,14.60,4.100,4.90,0.2,1.1,110.0,0.0,1.2,0.1,5.60,80.0,1.0167,0.7,0.30,35.7,98.5,13.0,64.7,32.0,3.97,8.66,106.0,1.40,116.0,2.35,4.38,3.60,145.0,47.0,0.29,39.30,12.90,3.00,21.23,31.50,32.90,96.0,95.0,30.60,35.50,14.60,4.100,4.90,0.2,1.9,120.0,0.0,1.8,0.1,6.00,116.5,1.0201,1.1,0.3,31.383333,88.180000,12.000000,55.663333,30.000000,3.398000,8.227745,104.500000,1.350000,116.000000,2.073045,3.258286,3.550000,142.500000,43.500000,0.221667,39.300000,12.900000,2.950000,19.123333,31.500000,32.900000,96.000000,95.000000,30.000000,35.500000,14.600000,4.100000,4.900000,0.200000,1.541667,113.333333,0.0,1.400000,0.100000,5.762500,97.000000,1.018442,0.875000,0.300000,0.226667,0.176667,0.000000,0.333333,0.000000,0.475000,0.480546,0.000000,1.000000,1.000000,0.008696,0.334851,0.000000,0.000000,1.000000,0.000000,1.000000,1.000000,1.000000,0.516667,0.000000,0.000000,0.000000,1.000000,1.000000,1.000000,0.000000,1.000000,0.000000,0.0,0.550000,0.233333,0.050000,0.100000,0.0,0.0,0.10,0.00,0.100000,0.100000,0.0,0.7,0.0,0.0,0.0,0.0,0.62,0.0,0.0,0.0,0.02,0.41,0.00,0.0,0.0,0.0,0.70,1.10,0.0,8.90,0.00,0.00,0.0,55.0,0.0,0.00,0.0,0.500,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.16,8.5,6.8,0.0,31.5,0.0,2.12,0.0,0.0,0.20,16.0,0.02,0.44,0.00,0.0,27.0,0.0,0.00,0.00,1.90,0.0,0.00,0.00,0.0,0.0,17.20,0.50,0.00,0.000,0.00,0.2,1.9,120.0,0.0,1.8,0.1,0.0,116.5,0.0000,1.1,0.1,10001877.0,21320596.0
1,29.2,77.3,13.7,42.5,22.3,9.50,8.54,95.9,2.36,86.4,1.75,2.91,3.70,132.5,24.9,0.23,33.93,11.44,1.12,21.68,30.09,33.19,89.6,170.6,12.45,28.54,14.43,3.760,5.96,0.2,1.6,10.0,2.0,0.4,0.1,6.40,72.0,1.0171,0.2,1.20,37.0,86.3,18.6,60.1,25.7,9.50,9.31,104.3,2.55,143.0,3.96,3.74,4.28,139.7,32.2,0.55,38.43,13.03,1.53,24.43,31.21,34.41,92.2,351.7,16.27,57.33,14.82,4.253,9.32,0.2,2.0,10.0,2.0,0.7,0.1,6.60,73.0,1.0179,0.2,1.2,33.030000,82.340000,16.009697,51.566667,23.991284,9.500000,8.939333,100.434610,2.448894,101.716699,2.027061,3.302917,4.003325,136.466429,27.731667,0.353667,36.131095,12.205000,1.250238,22.987000,30.681000,33.771667,90.826667,230.615000,13.761976,41.077383,14.612833,3.992300,7.503333,0.200000,1.800000,10.000000,2.0,0.500000,0.100000,6.537500,72.250000,1.017475,0.200000,1.200000,0.133333,0.200000,0.110526,0.200000,0.206579,1.000000,0.081250,0.326623,0.185000,0.397241,0.046316,0.326250,0.050000,0.216558,0.265000,0.033333,0.550000,0.495000,0.436905,0.600000,0.260000,0.205000,0.050000,0.193333,0.436905,0.342628,0.220000,0.650000,0.085000,0.0,0.675000,0.100000,0.200000,0.000000,0.0,0.0,0.10,0.10,0.000000,0.200000,0.0,0.6,0.1,0.0,0.8,0.0,0.15,2.8,0.0,0.1,0.03,0.16,0.06,3.6,0.0,0.0,4.87,1.63,0.0,4.05,0.00,0.00,0.0,20.8,0.0,0.00,0.0,0.647,0.26,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.16,9.1,17.4,1.3,34.0,0.0,2.50,0.0,0.6,1.60,46.4,1.84,0.10,0.00,0.0,14.2,0.1,0.00,0.00,0.45,0.0,0.80,0.38,0.3,90.5,3.88,24.72,0.19,0.000,0.51,0.2,2.0,10.0,2.0,0.7,0.1,0.0,73.0,0.0008,0.2,1.0,10002305.0,29924799.0
2,18.4,114.1,10.0,25.7,23.0,1.60,7.70,103.0,0.70,78.0,1.50,1.50,3.60,135.0,17.0,0.35,34.60,11.80,1.30,13.36,29.40,34.10,86.0,215.0,14.80,32.20,13.70,4.010,11.30,0.1,0.9,100.0,2.0,0.8,0.1,5.85,22.0,1.0194,0.5,0.20,26.5,136.2,14.0,30.2,27.0,1.77,8.20,106.0,0.90,131.0,2.40,3.60,4.60,141.0,24.0,0.43,39.20,13.60,1.30,15.60,30.30,35.30,87.0,414.0,14.80,32.20,14.20,4.560,15.60,0.1,1.7,100.0,3.0,1.4,0.2,6.05,26.0,1.0207,0.7,0.2,22.414935,124.908874,12.714286,27.850649,25.428571,1.691364,8.014286,104.750000,0.800000,101.857143,1.950000,2.466667,4.125000,138.500000,20.285714,0.386667,37.262500,12.814286,1.300000,14.483333,29.771429,34.585714,86.142857,291.857143,14.800000,32.200000,13.842857,4.300000,13.142857,0.100000,1.300000,100.000000,2.5,1.100000,0.150000,5.950000,24.000000,1.020050,0.600000,0.200000,0.072727,0.436364,0.000000,0.100000,0.000000,0.200000,1.000000,0.000000,0.000000,0.428571,0.125000,0.500000,0.000000,0.000000,0.428571,0.000000,1.000000,1.000000,1.000000,0.833333,0.000000,0.285714,0.000000,0.000000,1.000000,0.000000,0.000000,1.000000,1.000000,0.0,0.650000,0.100000,0.250000,0.000000,0.0,0.0,0.30,0.00,0.200000,0.100000,0.0,0.0,0.0,0.0,0.0,0.0,0.70,0.0,0.0,0.0,0.10,1.20,0.00,0.0,0.0,0.0,5.40,2.20,0.0,7.96,0.00,0.00,0.0,0.0,0.0,0.00,0.0,0.590,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.18,5.2,40.5,0.0,4.1,0.0,0.40,0.0,0.0,0.00,31.0,0.00,0.00,0.00,0.0,4.0,0.0,0.00,0.00,0.20,0.0,0.00,0.30,0.0,0.0,1.40,0.00,0.00,0.000,4.60,0.1,1.7,100.0,3.0,1.4,0.2,0.0,26.0,0.0000,0.7,0.1,10003046.0,26048429.0
3,61.5,92.3,10.6,33.2,19.7,7.00,8.42,100.4,0.76,82.6,1.82,3.29,4.01,134.9,13.3,0.48,33.14,11.36,1.12,24.68,31.65,32.62,93.5,179.4,12.39,29.53,14.40,3.466,10.01,0.2,1.3,10.0,16.0,1.5,0.1,5.65,51.0,1.0112,0.6,0.30,312.9,124.7,16.9,477.2,26.3,7.00,9.10,109.6,1.17,172.5,2.34,4.98,4.87,141.4,32.2,0.65,42.81,14.41,1.66,29.69,33.82,34.61,101.1,297.9,17.86,60.06,15.61,4.339,16.58,0.4,2.0,70.0,30.0,2.1,0.2,6.00,102.0,1.0173,0.9,0.5,204.185606,106.962121,13.659783,233.025000,23.355399,7.000000,8.790433,104.561907,0.900102,121.061235,2.018886,3.967113,4.415845,138.073576,22.233441,0.517724,37.249505,12.725788,1.310585,27.142236,32.689977,33.592273,97.371095,227.966464,14.314395,43.336787,15.016525,3.856309,12.455569,0.233333,1.666667,40.500000,23.0,1.672222,0.122222,5.836111,71.333333,1.013933,0.716667,0.333333,0.438636,0.404545,0.049255,0.391667,0.212192,0.000000,0.315873,0.297170,0.205455,0.651581,0.016246,0.193343,0.137566,0.112880,0.433954,0.000000,0.788095,0.916667,0.662576,0.645122,0.582133,0.224657,0.317552,0.341206,0.662576,0.413285,0.300000,0.666667,0.304205,0.0,0.683333,0.277778,0.250000,0.233333,0.0,0.0,0.20,0.00,0.200000,0.111111,0.0,0.5,1.0,0.0,2.8,0.0,0.42,0.7,0.0,5.0,0.02,0.19,0.00,1.4,0.5,0.0,8.45,2.84,0.0,6.19,0.00,0.16,0.0,32.9,0.0,0.00,0.0,1.044,0.21,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.16,284.8,15.9,0.6,445.7,0.0,0.00,0.0,3.1,0.25,71.9,0.11,0.51,0.22,0.4,17.2,0.0,1.18,0.90,0.57,1.7,2.62,0.37,3.4,20.5,5.48,25.46,0.84,0.076,5.66,0.4,2.0,70.0,30.0,2.1,0.2,0.0,102.0,0.0000,0.9,0.2,10003619.0,22029522.0
4,39.3,86.8,9.9,28.2,23.5,9.10,8.12,102.0,1.18,86.4,1.83,2.85,3.83,137.5,16.2,0.15,32.21,11.25,1.19,17.99,29.90,33.16,87.1,182.9,13.21,30.23,14.72,3.665,6.80,0.0,0.3,0.0,14.5,0.3,0.0,5.80,6.0,1.0134,0.1,0.00,247.6,114.3,15.3,452.5,29.0,9.10,8.81,109.5,2.57,185.7,2.44,4.66,4.58,143.1,43.8,0.34,38.13,12.91,1.77,19.81,31.17,35.04,92.0,232.7,18.87,55.58,15.91,4.243,12.62,0.2,0.9,45.0,21.5,1.3,0.1,6.10,37.0,1.0183,0.5,0.2,161.818939,98.562121,12.603095,220.125000,26.227884,9.100000,8.456924,105.301944,1.733100,127.862408,2.070180,3.555709,4.190397,140.228796,28.147446,0.199390,35.147367,12.072849,1.400903,18.803902,30.568354,34.097904,89.664341,207.544207,15.282986,41.085906,15.387130,3.948880,9.291700,0.033333,0.616667,23.000000,18.0,0.672222,0.022222,5.961111,16.333333,1.015483,0.266667,0.033333,0.438636,0.137879,0.044907,0.225000,0.120701,1.000000,0.516667,0.197222,0.338182,0.528333,0.025038,0.329678,0.001852,0.135648,0.586190,0.000000,0.832143,0.875000,0.650000,0.595122,0.478561,0.349476,0.317552,0.364156,0.650000,0.352899,0.485714,0.765000,0.215944,0.0,0.283333,0.127778,0.400000,0.033333,0.0,0.0,0.00,0.00,0.000000,0.011111,0.0,0.0,1.0,0.0,1.1,0.0,0.48,0.1,0.0,7.6,0.01,0.19,0.00,0.6,0.1,0.0,9.07,3.19,0.0,5.67,0.39,0.12,1.1,32.9,0.0,0.00,0.0,1.021,0.21,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.20,220.5,8.2,0.3,425.6,0.3,2.10,0.0,3.1,1.59,85.2,0.14,0.81,0.02,1.0,27.1,0.0,1.14,0.65,0.68,0.0,1.03,0.72,1.3,0.7,6.23,21.39,1.66,0.104,2.40,0.2,0.9,45.0,21.5,1.3,0.1,0.0,37.0,0.0000,0.5,0.1,10003939.0,22561709.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8109,80.2,112.0,12.3,191.1,23.1,5.90,8.36,100.4,1.07,114.2,1.99,3.28,3.81,135.9,20.5,0.13,32.29,10.85,1.20,23.10,29.25,33.10,87.0,193.3,14.70,26.91,13.29,3.699,9.11,0.1,0.7,0.0,0.0,0.1,0.0,6.10,18.0,1.0183,0.1,0.20,305.6,119.6,15.4,856.2,25.9,5.90,8.75,104.9,1.64,189.5,2.22,3.96,4.47,139.7,34.4,0.55,35.82,11.90,1.96,35.07,29.67,33.95,88.8,216.0,21.43,34.68,13.51,4.061,13.91,0.1,1.7,7.0,1.0,0.6,0.0,6.60,29.0,1.0243,0.5,0.6,220.283333,115.661667,13.611250,525.825000,24.571250,5.900000,8.559583,102.450833,1.302429,152.068333,2.122917,3.615417,4.101458,137.671667,26.831667,0.303333,33.443762,11.218667,1.558125,28.674167,29.422000,33.507833,87.888333,204.750000,17.591250,30.493333,13.408167,3.825750,11.069000,0.100000,1.212121,2.333333,0.5,0.200606,0.000000,6.329242,22.915152,1.020866,0.323030,0.327273,0.508333,0.200000,0.022917,0.441667,0.131250,0.000000,0.350000,0.090000,0.370000,0.708333,0.016667,0.156250,0.064583,0.130000,0.478571,0.000000,0.580000,0.655000,0.687500,0.558333,0.000000,0.240000,0.000000,0.200000,0.587500,0.200000,0.086667,0.580000,0.475000,0.0,0.483030,0.033333,0.177273,0.009091,0.0,0.0,0.20,0.12,0.036364,0.054545,0.0,0.0,0.0,0.0,1.0,0.0,0.36,1.2,0.0,0.0,0.03,0.04,0.00,1.1,0.0,0.0,5.76,2.07,0.0,4.06,0.00,0.19,0.0,10.2,0.0,0.22,0.0,0.724,0.16,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.16,274.2,34.3,0.5,826.0,0.0,0.00,0.0,0.0,0.66,89.4,0.00,0.41,0.19,0.0,17.3,0.0,0.00,0.00,0.86,4.7,0.00,0.14,0.0,0.0,8.51,3.48,0.09,0.000,5.05,0.1,1.7,7.0,1.0,0.6,0.0,0.0,29.0,0.0016,0.5,0.3,19992732.0,26054225.0
8110,36.4,71.5,15.0,37.2,25.0,2.21,9.00,106.0,0.90,106.0,2.30,4.20,4.30,142.0,14.0,0.25,43.80,14.70,1.23,18.87,28.90,33.60,86.0,181.0,13.73,30.27,15.00,5.080,6.60,0.0,0.5,0.0,14.5,0.6,0.0,6.00,43.5,1.0201,0.3,0.40,47.4,82.2,15.0,49.0,25.0,2.68,9.00,106.0,0.90,106.0,2.30,4.20,4.30,142.0,14.0,0.35,43.80,14.70,1.52,20.67,28.90,33.60,86.0,181.0,16.94,32.47,15.00,5.080,6.60,0.0,1.1,15.0,15.5,1.2,0.0,6.05,50.0,1.0210,0.5,0.4,40.720000,75.600000,15.000000,42.028333,25.000000,2.391667,9.000000,106.000000,0.900000,106.000000,2.300000,4.200000,4.300000,142.000000,14.000000,0.300000,43.800000,14.700000,1.362750,19.770000,28.900000,33.600000,86.000000,181.000000,15.223667,31.161667,15.000000,5.080000,6.600000,0.000000,0.816667,10.000000,15.0,0.966667,0.000000,6.025000,46.750000,1.020533,0.416667,0.400000,0.333333,0.160000,0.000000,0.507500,0.000000,0.033333,0.000000,0.000000,0.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.787500,0.550000,0.000000,0.000000,0.000000,0.000000,0.770833,0.278571,0.000000,0.000000,0.000000,0.0,0.416667,0.066667,0.400000,0.166667,0.0,0.0,0.30,0.10,0.200000,0.100000,0.0,0.4,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.00,0.00,0.00,0.0,0.0,0.0,0.00,0.00,0.0,4.17,0.00,0.00,0.0,0.0,0.0,0.02,0.0,0.000,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.14,17.2,0.9,0.0,15.6,0.0,0.43,0.0,0.0,0.00,6.0,0.00,0.00,0.00,0.0,0.0,0.0,0.00,0.00,0.42,0.0,0.00,0.00,0.0,0.0,4.14,1.52,0.00,0.000,0.00,0.0,1.1,15.0,15.5,1.2,0.0,0.0,50.0,0.0014,0.5,0.1,19993501.0,29469659.0
8111,45.2,104.1,12.3,32.4,25.3,8.10,8.25,99.8,1.65,86.6,1.90,3.14,3.47,137.8,14.8,0.35,36.42,12.07,1.20,18.85,29.64,32.79,89.3,298.8,13.40,29.01,14.35,4.059,9.50,0.1,1.3,15.0,1.0,0.9,0.0,6.20,16.0,1.0175,0.3,0.00,49.4,112.6,15.1,40.1,28.9,8.10,8.75,103.4,1.96,124.6,2.29,3.87,4.18,140.4,20.6,0.36,39.98,13.25,1.32,19.18,30.10,33.53,90.8,341.4,14.49,55.61,14.64,4.471,12.59,0.1,1.5,15.0,1.0,1.0,0.0,6.25,18.0,1.0182,0.4,0.4,47.300000,107.978571,13.513929,36.250000,27.296667,8.100000,8.503000,101.579206,1.811294,99.751484,2.062738,3.528500,3.795833,138.992143,17.527778,0.355000,38.213403,12.673086,1.262222,19.015000,29.871484,33.182143,90.013919,320.127564,14.007222,40.832059,14.488013,4.267741,10.701758,0.100000,1.400000,15.000000,1.0,0.950000,0.000000,6.225000,17.000000,1.017850,0.350000,0.200000,0.300000,0.328571,0.000000,0.250000,0.079167,1.000000,0.333333,0.033333,0.203333,0.356758,0.014286,0.102500,0.231250,0.000000,0.298333,0.000000,0.395588,0.536538,0.361111,0.600000,0.200000,0.296154,0.200000,0.177839,0.361111,0.304902,0.200000,0.586538,0.237363,0.0,0.450000,0.100000,0.100000,0.100000,0.0,0.0,0.10,0.10,0.100000,0.050000,0.0,0.0,0.0,0.0,0.1,0.0,0.37,0.0,0.0,1.4,0.00,0.11,0.10,0.0,0.0,0.0,3.83,1.50,0.0,4.08,0.08,0.11,0.2,3.8,0.0,0.17,0.0,0.526,0.02,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.20,24.3,12.8,0.0,11.8,0.5,1.10,0.0,0.2,0.93,27.2,0.07,0.08,0.02,0.0,3.2,0.0,0.00,0.05,0.22,0.0,0.81,0.25,0.6,22.2,1.70,24.47,0.43,0.039,2.37,0.1,1.5,15.0,1.0,1.0,0.0,0.0,18.0,0.0011,0.4,0.3,19993967.0,21550111.0
8112,27.0,211.0,11.0,27.0,29.0,1.20,8.40,97.0,1.00,90.0,2.00,3.30,3.90,135.0,16.0,0.20,44.40,14.00,1.10,24.20,26.20,31.20,83.0,321.0,12.20,30.70,14.20,5.320,6.10,0.0,1.2,15.0,1.0,0.8,0.0,6.10,13.0,1.0161,0.3,0.00,27.0,211.0,14.0,27.0,35.0,1.20,8.80,99.0,1.10,109.0,2.10,4.00,5.30,141.0,21.0,0.20,48.80,15.20,1.10,24.20,26.50,31.90,84.0,355.0,12.20,30.70,14.60,5.810,7.70,0.0,1.2,15.0,1.0,0.8,0.0,6.15,13.0,1.0165,0.3,0.0,27.000000,211.000000,12.750000,27.000000,31.750000,1.200000,8.566667,98.000000,1.025000,96.250000,2.066667,3.666667,4.400000,138.250000,18.000000,0.200000,46.100000,14.525000,1.100000,24.200000,26.350000,31.550000,83.750000,335.250000,12.200000,30.700000,14.450000,5.515000,7.100000,0.000000,1.200000,15.000000,1.0,0.800000,0.000000,6.125000,13.000000,1.016300,0.300000,0.000000,0.000000,1.000000,0.000000,0.000000,0.500000,0.000000,0.000000,0.000000,0.000000,0.250000,0.000000,0.000000,0.250000,0.000000,0.250000,0.000000,0.000000,0.000000,0.000000,0.000000,1.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.0,0.400000,0.100000,0.100000,0.100000,0.0,0.0,0.10,0.10,0.100000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.00,0.00,0.00,0.0,0.0,0.0,0.00,0.00,0.0,0.00,0.80,0.00,0.0,0.0,0.0,0.00,0.0,0.000,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.20,0.0,81.0,0.0,0.0,3.0,0.00,0.0,0.0,0.00,9.0,0.00,0.00,0.20,0.0,1.0,0.0,0.00,0.00,0.00,0.0,0.00,0.00,0.0,0.0,0.00,0.00,0.00,0.000,0.00,0.0,1.2,15.0,1.0,0.8,0.0,0.0,13.0,0.0011,0.3,0.0,19995127.0,21801907.0


## Standardize the Data for use in Models

In [1341]:
from sklearn.preprocessing import StandardScaler

scaler = StandardScaler()


In [1342]:
labs_scaled = lab_events_sampled_pivot
labs_scaled_KNN = lab_events_impute_KNN_imputed


In [1343]:
labs_scaled

Unnamed: 0_level_0,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,subject_id,hadm_id
itemid,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,Unnamed: 241_level_1,Unnamed: 242_level_1
0,2.997088,51.875587,11.000000,7.192662,28.000000,-0.030222,8.712124,103.000000,1.300000,116.000000,1.720807,2.909850,3.500000,140.000000,40.000000,0.390133,39.300000,12.900000,2.900000,22.769974,31.500000,32.900000,96.000000,95.000000,29.400000,35.500000,14.600000,4.100000,4.900000,0.0,0.0,0.0,0.0,0.0,0.0,5.458682,0.0,1.004187,0.0,0.253369,35.116566,107.659947,13.000000,36.444315,32.000000,3.243196,9.972855,106.000000,1.400000,116.000000,2.519348,4.152207,3.600000,145.000000,47.000000,1.322023,39.300000,12.900000,3.000000,44.175318,31.500000,32.900000,96.000000,95.000000,30.600000,35.500000,14.600000,4.100000,4.900000,0.0,0.0,0.0,0.0,0.0,0.0,7.813433,0.0,1.029526,0.0,0.919134,20.936125,82.895319,12.000000,20.170673,30.000000,2.100599,9.414059,104.500000,1.350000,116.000000,2.068347,3.585984,3.550000,142.500000,43.500000,0.818097,39.300000,12.900000,2.950000,33.768759,31.500000,32.900000,96.000000,95.000000,30.000000,35.500000,14.600000,4.100000,4.900000,0.0,0.0,0.0,0.0,0.0,0.0,6.451515,0.0,1.017424,0.0,0.608275,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.000000,0.000,0.0,0.00,0.0,1.000000,0.0,1.00,1.0,1.0,0.0,0.0,0.000000,0.0,1.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.7,1.1,0.0,0.0,0.0,0.0,0.0,55.0,0.0,0.0,0.0,0.50,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.2,16.0,0.0,0.0,0.0,0.0,27.0,0.0,0.0,0.0,1.9,0.0,0.0,0.0,0.0,0.0,17.2,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10001877,21320596.0
1,8.502958,42.563595,10.193396,3.329270,24.033822,9.500000,8.849326,97.341420,0.555639,71.902029,1.735081,3.079829,3.602654,134.225802,7.276216,0.199821,39.464173,13.487843,0.906960,24.327817,26.762869,31.574106,80.745531,199.690059,10.097198,26.580360,11.441106,4.344073,5.333141,0.0,0.0,0.0,0.0,0.0,0.0,5.752620,0.0,1.005363,0.0,0.289124,32.626622,113.369253,17.922574,34.519860,30.749347,9.500000,10.289063,107.197838,1.009893,97.083726,2.590251,4.147307,4.770449,144.222954,17.214012,1.233413,47.605115,16.049808,1.067653,48.720870,30.868970,34.908220,94.673671,396.003821,12.475355,34.342181,14.765301,5.588843,10.342467,0.0,0.0,0.0,0.0,0.0,0.0,7.510084,0.0,1.031955,0.0,0.804833,19.860518,82.902413,14.133664,20.863701,27.310695,9.500000,9.322523,101.935952,0.777818,84.950583,2.091110,3.645794,4.226222,138.849958,12.733493,0.766628,43.948501,14.639790,0.993173,34.235197,29.130385,33.377137,89.074325,291.329743,11.230896,30.430946,12.920632,5.036211,7.596984,0.0,0.0,0.0,0.0,0.0,0.0,6.543635,0.0,1.018809,0.0,0.588818,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10002305,29924799.0
2,10.068224,45.124179,10.000000,6.207528,23.000000,0.134158,7.700000,103.000000,0.700000,78.000000,1.500000,1.500000,3.600000,135.000000,17.000000,0.293749,34.600000,11.800000,1.300000,19.710321,29.400000,34.100000,86.000000,215.000000,14.800000,32.200000,13.700000,4.010000,11.300000,0.0,0.0,0.0,0.0,0.0,0.0,5.388687,0.0,0.999706,0.0,0.367356,35.871744,116.273930,14.000000,33.587622,27.000000,3.990090,8.200000,106.000000,0.900000,131.000000,2.400000,3.600000,4.600000,141.000000,24.000000,1.343694,39.200000,13.600000,1.300000,42.518730,30.300000,35.300000,87.000000,414.000000,14.800000,32.200000,14.200000,4.560000,15.600000,0.0,0.0,0.0,0.0,0.0,0.0,7.710818,0.0,1.033396,0.0,0.829843,21.708522,84.468800,12.714286,21.270116,25.428571,2.175172,8.014286,104.750000,0.800000,101.857143,1.950000,2.466667,4.125000,138.500000,20.285714,0.802675,37.262500,12.814286,1.300000,33.512477,29.771429,34.585714,86.142857,291.857143,14.800000,32.200000,13.842857,4.300000,13.142857,0.0,0.0,0.0,0.0,0.0,0.0,6.593207,0.0,1.019267,0.0,0.598061,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.428571,0.125,0.5,0.00,0.0,0.428571,0.0,1.00,1.0,1.0,0.0,0.0,0.285714,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.7,0.0,0.0,0.0,0.1,1.2,0.0,0.0,0.0,0.0,5.4,2.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.59,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,31.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.2,0.0,0.0,0.3,0.0,0.0,1.4,0.0,0.0,0.0,4.6,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10003046,26048429.0
3,5.192135,46.960747,10.285499,7.885413,23.519880,7.000000,8.571769,97.662939,0.546662,73.690120,1.711040,3.021489,3.497371,132.807198,8.349347,0.330113,39.397553,12.860433,0.943063,21.112103,26.958905,31.332047,84.588624,136.373125,10.222489,26.746379,11.482002,4.416524,4.961947,0.0,0.0,0.0,0.0,0.0,0.0,5.485266,0.0,1.007352,0.0,0.294764,34.407151,117.746618,17.590545,31.647699,30.219652,7.000000,10.075479,105.486049,1.016000,96.310622,2.623454,4.385983,4.833780,144.094278,19.795792,1.557683,48.666197,15.920874,1.049453,44.981012,31.487523,34.810884,97.883102,354.804109,12.419864,33.814800,14.358810,5.577389,9.493844,0.0,0.0,0.0,0.0,0.0,0.0,7.476731,0.0,1.027497,0.0,0.932848,19.383891,82.213672,14.015614,20.726256,26.526470,7.000000,9.381088,102.146848,0.815436,85.520123,2.124743,3.669531,4.174752,139.380182,13.438019,0.801909,43.246255,14.620847,0.991510,34.270489,29.242339,33.440477,89.881860,272.539297,11.233248,29.810369,13.030749,4.991010,7.549923,0.0,0.0,0.0,0.0,0.0,0.0,6.471691,0.0,1.017066,0.0,0.600110,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10003619,22029522.0
4,6.213900,38.967323,9.665789,-5.968614,23.368636,9.100000,8.715162,98.577412,0.567741,73.373483,1.823347,2.865983,3.523774,135.817396,7.949785,0.413042,36.929292,13.047198,0.909149,26.195502,27.077019,31.592700,85.221055,148.943883,9.973353,23.527726,11.056237,4.408653,4.581118,0.0,0.0,0.0,0.0,0.0,0.0,5.641294,0.0,1.006180,0.0,0.416629,35.046998,108.382078,17.442492,32.004954,32.276601,9.100000,10.212273,106.649646,1.065124,93.109747,2.568620,4.143643,5.026288,144.459133,19.485053,1.334336,47.576082,17.612370,1.056959,43.341469,31.018576,35.449698,97.230070,414.837140,12.541499,34.448200,14.383967,5.439404,10.334049,0.0,0.0,0.0,0.0,0.0,0.0,7.675755,0.0,1.027870,0.0,0.950611,19.169242,78.287915,13.647137,18.238603,27.178056,9.100000,9.396506,102.623303,0.813325,85.420539,2.143240,3.589295,4.280528,139.599349,12.607573,0.823044,43.004801,14.728392,0.999509,34.334367,29.051363,33.447208,89.735927,276.650764,11.292039,29.851395,12.918443,4.979181,7.500039,0.0,0.0,0.0,0.0,0.0,0.0,6.445369,0.0,1.018689,0.0,0.658282,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10003939,22561709.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8109,6.416863,51.625240,9.681436,10.373504,23.510786,5.900000,8.270673,97.266194,0.519337,72.999882,1.655599,2.873887,3.625218,134.687267,8.662937,0.135768,38.812549,13.079045,0.940601,27.073886,27.139609,32.234841,82.105933,172.711736,10.268260,24.536180,11.080318,4.314118,3.484800,0.0,0.0,0.0,0.0,0.0,0.0,5.124408,0.0,1.009482,0.0,0.265568,31.421360,122.045011,18.802476,34.682301,31.002901,5.900000,10.002229,105.913992,1.047043,96.999959,2.492746,4.222231,4.876310,142.945095,17.968089,1.366485,47.247595,16.740744,1.084053,43.997687,30.840806,35.441410,96.676333,380.543192,12.676653,35.310368,14.899079,5.485214,11.052365,0.0,0.0,0.0,0.0,0.0,0.0,7.517992,0.0,1.031913,0.0,0.897921,18.651249,85.155625,14.453087,22.082737,27.167588,5.900000,9.311518,102.006612,0.774500,85.668451,2.102091,3.571794,4.259626,139.379366,12.501138,0.810273,43.218617,14.645108,1.006120,34.117331,28.946836,33.562173,89.405157,285.633693,11.205778,29.956128,12.906096,4.993155,7.871360,0.0,0.0,0.0,0.0,0.0,0.0,6.457806,0.0,1.018112,0.0,0.584025,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19992732,26054225.0
8110,2.647704,46.201928,15.000000,3.026479,25.000000,0.478166,9.000000,106.000000,0.900000,106.000000,2.300000,4.200000,4.300000,142.000000,14.000000,-0.077239,43.800000,14.700000,0.917266,26.532383,28.900000,33.600000,86.000000,181.000000,10.342111,26.459899,15.000000,5.080000,6.600000,0.0,0.0,0.0,0.0,0.0,0.0,4.895399,0.0,0.994633,0.0,0.373001,34.996085,109.545270,15.000000,33.300532,25.000000,3.269628,9.000000,106.000000,0.900000,106.000000,2.300000,4.200000,4.300000,142.000000,14.000000,1.254840,43.800000,14.700000,1.076884,43.058540,28.900000,33.600000,86.000000,181.000000,12.315285,34.563190,15.000000,5.080000,6.600000,0.0,0.0,0.0,0.0,0.0,0.0,7.276665,0.0,1.028252,0.0,0.848010,20.015116,85.308048,15.000000,19.473612,25.000000,1.945947,9.000000,106.000000,0.900000,106.000000,2.300000,4.200000,4.300000,142.000000,14.000000,0.823788,43.800000,14.700000,1.003315,34.690025,28.900000,33.600000,86.000000,181.000000,11.300130,30.079784,15.000000,5.080000,6.600000,0.0,0.0,0.0,0.0,0.0,0.0,6.430284,0.0,1.018342,0.0,0.627433,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19993501,29469659.0
8111,2.107809,49.482091,9.512278,3.506271,22.796961,8.100000,8.611315,98.796909,0.377824,73.245093,1.784712,2.844369,3.792310,135.306818,8.838752,0.337455,39.960258,13.267441,0.912956,23.237294,26.750093,32.055179,83.256674,179.775561,10.212243,25.262227,11.397791,4.572239,5.287445,0.0,0.0,0.0,0.0,0.0,0.0,5.263032,0.0,1.003079,0.0,0.294892,38.483430,115.147427,19.353132,30.966201,29.820915,8.100000,9.899158,104.993242,1.005288,96.191956,2.567219,4.151670,4.966684,143.664262,17.519976,1.428553,47.883590,15.985655,1.090858,46.114719,31.308057,34.976675,97.809682,378.234164,12.227934,33.759630,15.112118,5.548716,10.359374,0.0,0.0,0.0,0.0,0.0,0.0,7.383318,0.0,1.028776,0.0,0.823796,19.627579,85.132792,13.868937,19.832656,26.401906,8.100000,9.333959,101.732765,0.805182,85.623946,2.089200,3.607557,4.243464,139.445306,13.201811,0.741716,43.373549,14.657867,0.990615,34.422652,29.093080,33.517320,89.922277,285.728675,11.204807,29.915370,13.142710,5.006642,7.710596,0.0,0.0,0.0,0.0,0.0,0.0,6.403438,0.0,1.017003,0.0,0.589674,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.000000,0.000,0.0,0.00,0.0,0.000000,0.0,0.00,0.0,0.0,0.0,0.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19993967,21550111.0
8112,27.000000,211.000000,11.000000,27.000000,29.000000,1.200000,8.400000,97.000000,1.000000,90.000000,2.000000,3.300000,3.900000,135.000000,16.000000,0.200000,44.400000,14.000000,1.100000,24.200000,26.200000,31.200000,83.000000,321.000000,12.200000,30.700000,14.200000,5.320000,6.100000,0.0,0.0,0.0,0.0,0.0,0.0,5.282076,0.0,1.007125,0.0,0.244298,27.000000,211.000000,14.000000,27.000000,35.000000,1.200000,8.800000,99.000000,1.100000,109.000000,2.100000,4.000000,5.300000,141.000000,21.000000,0.200000,48.800000,15.200000,1.100000,24.200000,26.500000,31.900000,84.000000,355.000000,12.200000,30.700000,14.600000,5.810000,7.700000,0.0,0.0,0.0,0.0,0.0,0.0,7.307679,0.0,1.029810,0.0,0.836206,27.000000,211.000000,12.750000,27.000000,31.750000,1.200000,8.566667,98.000000,1.025000,96.250000,2.066667,3.666667,4.400000,138.250000,18.000000,0.200000,46.100000,14.525000,1.100000,24.200000,26.350000,31.550000,83.750000,335.250000,12.200000,30.700000,14.450000,5.515000,7.100000,0.0,0.0,0.0,0.0,0.0,0.0,6.423791,0.0,1.018455,0.0,0.588578,0.0,1.0,0.0,0.0,0.5,0.0,0.0,0.0,0.0,0.250000,0.000,0.0,0.25,0.0,0.250000,0.0,0.00,0.0,0.0,0.0,1.0,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.8,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,81.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,9.0,0.0,0.0,0.2,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19995127,21801907.0


In [1344]:
scaler.fit(labs_scaled.loc[:, ('min', 50861) : ('above_max', 51514)])
labs_scaled.loc[:, ('min', 50861) : ('above_max', 51514)] = scaler.transform(labs_scaled.loc[:, ('min', 50861) : ('above_max', 51514)])

scaler.fit(labs_scaled_KNN.loc[:, ('min', 50861) : ('above_max', 51514)])
labs_scaled_KNN.loc[:, ('min', 50861) : ('above_max', 51514)] = scaler.transform(labs_scaled_KNN.loc[:, ('min', 50861) : ('above_max', 51514)])


In [1345]:
pd.DataFrame(labs_scaled_KNN)

Unnamed: 0_level_0,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,min,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,max,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,mean,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,abn_percent,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,below_min,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,above_max,subject_id,hadm_id
itemid,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,50861,50863,50868,50878,50882,50885,50893,50902,50912,50931,50960,50970,50971,50983,51006,51146,51221,51222,51237,51244,51248,51249,51250,51265,51274,51275,51277,51279,51301,51464,51466,51478,51484,51486,51487,51491,51492,51498,51506,51514,Unnamed: 241_level_1,Unnamed: 242_level_1
0,-0.266859,-0.397199,-0.347562,0.087319,1.469562,-0.065554,-0.868565,0.581629,0.508489,0.684559,-0.126524,-0.723958,-0.636273,0.937203,2.761055,-0.600666,0.784658,0.634403,7.453598,-0.198872,0.475357,0.073734,0.750795,-1.429922,5.712699,0.823431,0.211976,0.568440,-0.844949,0.592599,0.245036,0.875654,-0.406964,0.746537,0.821233,-0.819146,1.591234,0.244589,1.564859,-0.131228,-0.271184,-0.360081,-0.928519,-0.224798,1.437159,0.046059,-0.524113,0.020250,0.020320,-0.391343,0.174096,0.237692,-1.461298,1.158297,1.204005,-0.401487,0.211476,0.111665,1.881529,-0.192500,0.171238,-0.745423,0.384443,-1.654598,1.855042,-0.517983,-0.146785,-0.072146,-0.791246,0.187223,0.562910,0.585443,-0.541573,0.792888,0.345560,-0.535144,1.475628,0.202771,1.662266,-0.402683,-0.292120,-0.369517,-0.822334,-0.179322,1.752732,0.015326,-0.982584,0.385100,0.245502,-0.165935,0.234019,-0.319648,-1.524260,1.300483,1.988815,-0.538917,0.577427,0.433017,4.911614,-0.208133,0.332770,-0.344901,0.585653,-1.718883,4.170173,-0.101860,0.020915,0.323463,-0.912270,0.421779,0.503475,0.777205,-0.493033,0.723911,0.647279,-0.787257,1.683313,0.261488,1.737773,-0.268792,-0.288515,-0.325235,-0.454838,-0.038182,-0.732729,0.585625,0.607251,-0.707924,2.546810,1.225460,-0.418394,0.222477,-0.510323,-0.522470,1.942260,-0.231259,0.871995,0.800025,1.483308,-0.246986,-0.839965,-0.716654,-0.646092,2.638083,1.513518,2.616925,-0.710926,0.793106,-0.990920,-0.200033,0.397273,0.833453,-0.603839,0.228242,-0.13741,-0.139778,-0.183291,-0.440472,0.276428,-0.162790,0.0,0.433267,-0.310823,0.0,-0.622196,0.0,0.676104,-0.391819,-0.1662,-0.267616,-0.146983,0.456330,-0.419848,-0.407061,-0.311850,0.0,-0.963299,-0.527833,-0.07608,0.693285,-0.245430,-0.419084,-0.243990,1.859676,-0.074274,-0.404260,0.0,-0.399565,-0.276411,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,-0.342768,-0.270626,-0.422091,-0.336559,-0.229636,-0.269395,0.297441,-0.068217,-0.491223,-0.215081,-0.404041,-0.105849,0.186100,-0.318823,-0.264181,1.101513,-0.124576,-0.219946,-0.282657,1.874558,-0.304237,-0.545284,-0.397458,-0.424705,-0.245233,1.754979,-0.697723,-0.495859,-0.159080,-0.335487,0.187223,0.562910,0.585443,-0.541573,0.792888,0.345560,-0.165043,1.475628,-0.377813,1.662266,-0.454730,10001877.0,21320596.0
1,-0.222071,-0.391690,0.774897,-0.031307,-0.154531,2.070029,0.295981,-1.065383,2.053808,-0.476959,-0.321136,-0.002565,-0.165694,-1.046233,1.081170,-0.319866,0.040925,0.057151,-0.283621,0.256838,-0.055582,0.280128,-0.167762,-0.471561,-0.266796,-0.205069,0.108194,0.103351,-0.581010,0.592599,0.878913,-0.221164,-0.231458,-0.345255,0.821233,0.980289,1.372199,0.319940,-0.126779,0.891398,-0.267533,-0.497602,0.789563,-0.233402,-0.510749,1.511717,0.293110,-0.391068,0.997919,-0.154817,2.953270,-0.383799,-0.407501,-0.415739,0.371436,0.144513,0.064973,0.173965,-0.063213,0.108536,0.062580,0.419477,-0.135679,0.738324,-0.117719,0.398639,-0.038986,0.188585,-0.331688,0.187223,0.671485,-0.372319,-0.404239,-0.462005,0.345560,0.729439,0.643194,-0.166025,-0.658075,0.375444,-0.282114,-0.457645,1.037351,-0.201320,-0.426105,1.822461,0.477059,-0.793131,1.504737,-0.612903,0.040975,-0.253772,-0.305280,-0.839391,0.664093,-0.073114,0.073333,0.121291,-0.223968,0.193637,0.020588,0.353023,-0.157021,-0.062116,-0.227992,0.402853,0.028136,0.151686,-0.452300,0.421779,0.822681,-0.305423,-0.327916,-0.474922,0.647279,1.016030,1.068173,0.077529,-0.432596,0.694999,-0.640443,-0.231808,0.373233,-0.534984,0.123365,2.063262,-0.746284,0.686573,-0.118943,-0.711642,-0.145972,0.188870,-0.180947,0.745879,-0.230398,0.206842,-0.328072,-0.585844,-0.293848,0.028660,-0.161616,-0.068450,-0.497320,-0.033237,-0.265358,0.157855,-0.090163,-0.171690,-0.744195,-0.200033,0.850279,0.008017,0.108800,-0.486417,-0.13741,-0.139778,-0.183291,0.400298,-0.489482,0.393743,0.0,0.328517,-0.146618,0.0,-0.228362,0.0,-0.453732,1.189013,-0.1662,-0.236832,-0.005727,-0.316978,0.110879,1.457431,-0.311850,0.0,-0.152989,-0.241690,-0.07608,-0.451352,-0.245430,-0.419084,-0.243990,0.389858,-0.074274,-0.404260,0.0,-0.163923,0.406065,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,-0.342768,-0.268935,-0.287838,0.460051,-0.224951,-0.269395,0.438875,-0.068217,-0.215657,1.050299,-0.135991,3.492821,-0.292091,-0.318823,-0.264181,0.301194,0.154030,-0.219946,-0.282657,-0.059279,-0.304237,-0.035516,0.558978,-0.321516,1.530068,-0.110714,0.391636,-0.357681,-0.159080,-0.278560,0.187223,0.671485,-0.372319,-0.404239,-0.462005,0.345560,-0.165043,0.643194,0.124709,-0.658075,0.443682,10002305.0,29924799.0
2,-0.364340,0.284059,-0.763287,-0.320137,0.044919,-0.433103,-1.025936,0.581629,-0.366219,-0.806578,-1.294195,-1.886203,-0.400984,-0.385087,0.202290,0.161505,0.133719,0.199487,0.498794,-0.612773,-0.315403,0.927776,-0.684451,0.091286,0.562219,0.335780,-0.337460,0.445328,0.748642,0.111235,-0.008515,0.765972,-0.231458,0.200641,0.821233,-0.256823,0.003229,0.753208,0.888204,-0.244853,-0.297017,0.064883,-0.621719,-0.289323,-0.108800,-0.537023,-1.102456,0.020250,-0.404724,-0.259940,0.260406,-0.519751,0.088404,-0.029655,-0.089853,-0.107487,0.194636,0.447122,-0.367492,-0.722136,-0.278378,1.106074,-0.847425,1.319076,-0.320089,-0.656547,-0.342783,0.711753,0.321258,-0.167051,0.345758,0.411304,-0.335571,0.336563,1.098278,-0.429762,-0.256218,0.303352,0.631003,-0.489142,-0.346613,0.184735,-0.491050,-0.328670,0.095073,-0.490102,-1.420441,0.457555,-0.384749,-0.608508,-0.282537,-1.488104,0.021903,-0.118162,0.038547,0.043336,0.253311,0.394572,-0.073620,-0.690631,-0.326118,1.004813,-0.829419,0.686061,0.053163,-0.400486,-0.405075,0.642455,0.544120,-0.018927,0.204862,0.637511,-0.286637,0.324300,1.149502,-0.350978,-0.131039,0.567558,0.853548,-0.375880,-0.868967,0.714595,-0.454838,-0.907586,-0.732729,-0.188376,2.368099,-0.707924,-0.724052,-0.610954,0.423811,0.867760,-0.510323,-0.522470,0.253118,-0.231259,0.871995,0.800025,1.483308,0.800469,-0.839965,0.186766,-0.646092,-0.673471,1.513518,-1.123835,-0.710926,0.793106,1.911732,-0.200033,0.759678,0.008017,0.346346,-0.486417,-0.13741,-0.139778,0.844631,-0.440472,1.042337,-0.162790,0.0,-0.299986,-0.310823,0.0,-0.622196,0.0,0.868416,-0.391819,-0.1662,-0.267616,0.983058,2.899984,-0.419848,-0.407061,-0.311850,0.0,-0.050000,0.066049,-0.07608,0.471438,-0.245430,-0.419084,-0.243990,-0.504067,-0.074274,-0.404260,0.0,-0.255295,-0.276411,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,0.161167,-0.279929,0.004734,-0.336559,-0.280984,-0.269395,-0.342729,-0.068217,-0.491223,-0.395850,-0.271780,-0.145394,-0.432735,-0.318823,-0.264181,-0.336560,-0.124576,-0.219946,-0.282657,-0.392700,-0.304237,-0.545284,0.357623,-0.424705,-0.245233,-0.458080,-0.720212,-0.495859,-0.159080,0.177975,-0.167051,0.345758,0.411304,-0.335571,0.336563,1.098278,-0.165043,-0.256218,-0.377813,0.631003,-0.454730,10003046.0,26048429.0
3,0.203419,-0.116249,-0.513852,-0.191195,-0.895345,1.277899,0.107136,-0.021502,-0.278748,-0.626072,-0.048679,0.505082,0.563703,-0.411533,-0.209337,0.682990,-0.068488,0.025521,-0.283621,0.570399,0.531840,-0.125543,0.391983,-0.360006,-0.287963,-0.058773,0.089879,-0.298813,0.427434,0.592599,0.498587,-0.221164,0.997086,1.155959,0.821233,-0.706682,0.797231,-0.791488,1.226532,-0.131228,0.507196,-0.064748,0.268002,0.546697,-0.325234,0.849123,0.029084,0.891276,-0.175200,0.103610,0.156834,0.820340,0.506824,0.089140,0.371436,0.354512,0.802538,0.835293,0.108771,0.603365,1.040495,0.573769,1.082502,0.236807,0.101171,0.513269,0.348109,0.335141,0.423151,0.895773,0.671485,0.150096,1.518443,1.135131,1.098278,-0.535144,1.198150,-0.266606,1.146635,-0.229766,0.757848,-0.086088,-0.052532,0.773072,-0.656685,1.082075,0.171628,0.403042,-0.270041,-0.007554,0.006653,0.726603,0.803980,-0.269398,0.202178,0.505811,0.251244,0.354878,-0.041640,0.625726,0.786359,0.209386,0.782484,-0.094472,-0.078366,0.607313,0.255264,-0.065214,0.422686,0.568681,0.657929,0.014127,1.405804,1.086521,0.870489,-0.615977,1.045390,-0.596458,1.228674,-0.233096,0.510750,0.587195,-0.085814,0.179169,0.146626,-0.751286,0.049043,0.560826,-0.052039,0.105737,-0.363715,-0.330436,0.395898,0.138649,0.269031,-0.231259,0.306884,0.571334,0.418380,0.177912,0.678839,-0.006297,0.298767,0.456450,0.447560,0.422165,0.135569,-0.125747,-0.107919,-0.200033,0.880479,1.108598,0.346346,1.181120,-0.13741,-0.139778,0.330670,-0.440472,1.042337,-0.100953,0.0,0.223766,1.331221,0.0,0.756223,0.0,0.195323,0.003389,-0.1662,1.271558,-0.146983,-0.224181,-0.419848,0.318019,0.733577,0.0,0.542673,0.411579,-0.07608,0.053704,-0.245430,-0.129944,-0.243990,0.909881,-0.074274,-0.404260,0.0,0.472468,0.274820,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,-0.342768,0.508307,-0.306836,0.031107,0.546590,-0.269395,-0.491606,-0.068217,0.932534,-0.169889,0.088853,0.072108,0.284551,0.285882,0.025637,0.488769,-0.124576,0.862296,1.234283,0.100762,0.204455,1.124207,0.533809,0.744767,0.156907,0.113394,0.424920,0.115035,0.921612,0.296294,0.895773,0.671485,0.150096,1.518443,1.135131,1.098278,-0.165043,1.198150,-0.377813,1.146635,-0.354906,10003619.0,22029522.0
4,-0.089023,-0.217244,-0.804860,-0.277156,0.187384,1.943288,-0.364977,0.349656,0.333548,-0.476959,-0.009757,-0.082720,0.140182,0.276058,0.113289,-0.640780,-0.197291,-0.017971,0.020652,-0.128843,-0.127127,0.258777,-0.526574,-0.315637,0.001311,0.044668,0.285234,-0.026600,-0.371851,-0.370129,-0.769168,-0.330846,0.865456,-0.481729,-0.262966,-0.369287,-0.434841,-0.377057,-0.465107,-0.472103,0.323833,-0.181979,-0.222878,0.500501,0.509583,1.405702,-0.335523,0.867081,1.014921,0.219245,0.329454,0.509595,0.057410,0.594020,1.023990,-0.296487,0.014455,0.116458,0.254296,-0.326085,0.047593,0.905495,-0.163054,-0.370978,0.240214,0.325158,0.495108,0.171544,0.011420,0.187223,-0.522846,-0.067577,0.934772,0.222482,0.345560,-0.324380,-0.045717,-0.098971,0.115372,-0.489142,0.500423,-0.212847,-0.542620,0.703801,0.384914,1.703999,-0.512482,0.617519,0.684500,0.205275,0.221991,0.119357,0.197755,0.494975,0.699023,-0.617526,-0.083154,0.062018,0.231243,-0.241350,-0.022350,0.614234,-0.323882,-0.343964,0.183982,0.403624,0.463777,0.082433,-0.136322,-0.312731,-0.639490,-0.169221,0.993014,-0.245516,-0.133956,-0.325125,-0.321587,-0.301490,-0.218239,-0.554360,0.510750,-0.480542,-0.118389,-0.441834,-0.232526,2.063262,0.729694,0.134103,0.382094,-0.290346,-0.300055,0.202263,-0.498124,0.272000,0.719040,-0.231259,0.424351,0.456988,0.378691,0.012525,0.408618,0.388377,0.298767,0.532451,0.407832,0.196274,0.659590,0.145315,-0.364110,-0.200033,-0.569139,0.179983,1.058984,-0.248198,-0.13741,-0.139778,-0.697252,-0.440472,-0.489482,-0.657487,0.0,-0.299986,1.331221,0.0,-0.080674,0.0,0.339557,-0.335361,-0.1662,2.071929,-0.288238,-0.224181,-0.419848,-0.096313,-0.102765,0.0,0.663151,0.600542,-0.07608,-0.069020,0.262389,-0.202229,0.381554,0.909881,-0.074274,-0.404260,0.0,0.435599,0.274820,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,0.665103,0.327035,-0.404359,-0.152726,0.508922,0.025900,0.289998,-0.068217,0.932534,1.041261,0.206124,0.131426,0.706483,-0.263850,0.460364,1.107765,-0.124576,0.825610,0.812911,0.247467,-0.304237,0.111042,1.414737,0.022446,-0.231501,0.218444,0.241860,0.711385,1.319762,-0.067594,0.187223,-0.522846,-0.067577,0.934772,0.222482,0.345560,-0.165043,-0.045717,-0.377813,0.115372,-0.454730,10003939.0,22561709.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8109,0.449755,0.245498,0.192881,2.523458,0.073412,0.929361,0.012713,-0.021502,0.173185,0.613926,0.613001,0.491723,0.093124,-0.147075,0.591667,-0.721009,-0.186211,-0.176122,0.064119,0.405257,-0.371886,0.216074,-0.540926,-0.183799,0.526942,-0.445939,-0.587759,0.019909,0.203335,0.111235,-0.262066,-0.330846,-0.406964,-0.754677,-0.262966,0.305501,-0.106288,0.545993,-0.465107,-0.244853,0.486698,-0.122237,-0.192198,1.255537,-0.448911,0.557582,-0.410959,-0.245897,0.224340,0.252533,-0.050309,-0.170162,-0.113057,-0.415739,0.495196,0.144513,-0.374535,-0.367558,0.505657,1.109482,-0.514426,0.064607,-0.601052,-0.526653,0.592640,-0.552414,-0.680879,-0.138607,0.145545,-0.167051,0.345758,-0.398440,-0.472906,-0.576086,-0.407158,0.729439,-0.198809,0.906836,0.115372,-0.143308,0.855660,0.045192,-0.075041,2.345344,-0.215802,0.756305,-0.301902,-0.208790,0.190990,0.962751,0.443387,0.207488,-0.041400,-0.411940,0.588483,-0.250731,-0.354155,-0.321105,0.706267,0.785026,-0.459312,0.141778,-0.578842,-0.378100,0.809189,-0.554928,-0.649644,-0.113954,0.177700,-0.018927,0.096276,-0.385747,-0.451754,-0.873726,-0.357166,0.531451,-0.158002,0.722856,-0.037009,-0.239586,0.773553,-0.231808,-0.283145,0.365470,-0.188809,-0.751286,0.164726,-0.323675,0.486167,0.288124,-0.360673,-0.475369,-0.084878,0.238920,0.400918,-0.231259,-0.248068,-0.146757,0.497042,-0.109163,-0.839965,0.042219,-0.646092,-0.011160,0.210388,-0.375683,-0.466383,-0.364649,0.387840,-0.200033,0.154572,-0.404701,0.000824,-0.421448,-0.13741,-0.139778,0.330670,0.568452,-0.210969,-0.415760,0.0,-0.299986,-0.310823,0.0,-0.129904,0.0,0.051088,0.285680,-0.1662,-0.267616,-0.005727,-0.688166,-0.419848,0.162645,-0.311850,0.0,0.019955,-0.004137,-0.07608,-0.448992,-0.245430,-0.075730,-0.243990,-0.065700,-0.074274,-0.003373,0.0,-0.040492,0.143574,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,-0.342768,0.478423,-0.073792,-0.030171,1.259285,-0.269395,-0.491606,-0.068217,-0.491223,0.200687,0.243158,-0.145394,0.143906,0.203423,-0.264181,0.495021,-0.124576,-0.219946,-0.282657,0.487530,1.102146,-0.545284,-0.045087,-0.424705,-0.245233,0.537797,-0.563690,-0.430406,-0.159080,0.228205,-0.167051,0.345758,-0.398440,-0.472906,-0.576086,-0.407158,-0.165043,-0.198809,0.627232,0.115372,-0.255083,19992732.0,26054225.0
8110,-0.127225,-0.498194,1.315340,-0.122426,0.614776,-0.239823,1.019889,1.277549,-0.074650,0.292154,1.819594,1.720763,1.246042,1.466119,-0.131462,-0.239637,1.407898,1.346083,0.194522,-0.036865,-0.503679,0.571925,-0.684451,-0.339723,0.184753,0.050579,0.456170,1.908989,-0.421651,-0.370129,-0.515617,-0.330846,0.865456,-0.072307,-0.262966,0.080572,0.591886,0.885073,0.211549,-0.017602,-0.238330,-0.543818,-0.314918,-0.254162,-0.727184,-0.295839,-0.096642,0.020250,-0.404724,-0.478946,0.087786,0.062898,-0.376507,0.267333,-0.652400,-0.275487,0.969247,0.974268,-0.076443,-0.245181,-0.802930,-0.205403,-0.984300,-0.852918,-0.025483,-0.645210,0.049213,1.597901,-0.614493,-0.521326,-0.305695,-0.328785,0.522769,0.108401,-0.407158,-0.429762,0.203056,0.353642,0.115372,-0.316225,-0.235389,-0.559354,0.569057,-0.252539,-0.060332,-0.282704,0.601501,0.819829,-0.270157,-0.478865,1.186803,1.070352,0.492474,1.123152,-0.489526,-0.262494,1.293265,1.240364,0.115970,-0.140888,-0.658285,0.215573,-0.849928,-0.668247,0.167915,-0.494448,0.245966,1.886524,-0.611905,-0.459633,-0.392363,-0.305423,0.745339,0.146695,-0.357166,-0.176467,0.434393,0.659537,0.264065,-0.161704,0.113689,-0.391969,-0.454838,0.610766,-0.732729,-0.657467,-1.021705,-0.707924,-0.724052,1.225460,-0.481362,-1.085882,-0.510323,-0.522470,-1.013738,-0.231259,-1.794821,-1.944270,0.812647,-0.136728,-0.839965,-0.716654,-0.646092,-0.673471,0.789557,-0.081766,-0.710926,-1.963454,-0.990920,-0.200033,-0.085933,-0.198342,1.058984,0.704681,-0.13741,-0.139778,0.844631,0.400298,1.042337,-0.162790,0.0,0.119016,-0.310823,0.0,-0.622196,0.0,-0.814318,-0.391819,-0.1662,-0.267616,-0.429493,-0.811896,-0.419848,-0.407061,-0.311850,0.0,-1.099322,-1.121714,-0.07608,-0.423031,-0.245430,-0.419084,-0.243990,-0.504067,-0.074274,-0.367815,0.0,-1.201065,-0.276411,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,-0.846703,-0.246099,-0.496817,-0.336559,-0.259433,-0.269395,-0.331564,-0.068217,-0.491223,-0.395850,-0.492215,-0.145394,-0.432735,-0.318823,-0.264181,-0.586660,-0.124576,-0.219946,-0.282657,-0.099290,-0.304237,-0.545284,-0.397458,-0.424705,-0.245233,-0.074296,-0.651846,-0.495859,-0.159080,-0.335487,-0.521326,-0.305695,-0.328785,0.522769,0.108401,-0.407158,-0.165043,0.203056,0.501601,0.115372,-0.454730,19993501.0,29469659.0
8111,-0.011302,0.100432,0.192881,-0.204949,0.700255,1.626436,-0.160395,-0.160686,1.018736,-0.469111,0.262700,0.304695,-0.706860,0.355395,-0.042461,0.161505,0.385785,0.306239,0.064119,-0.038955,-0.225031,-0.004553,-0.210820,1.153596,0.068338,-0.135615,0.059355,0.512356,0.300445,0.111235,0.498587,-0.166323,-0.319211,0.337115,-0.262966,0.530430,-0.161047,0.395291,0.211549,-0.472103,-0.232714,-0.201142,-0.284238,-0.270807,0.478664,1.140664,-0.410959,-0.608824,0.496368,-0.316005,0.070524,-0.257559,-0.562471,-0.207848,-0.281119,-0.254487,0.325983,0.279394,-0.341033,-0.385351,-0.353314,-0.259405,-0.327303,0.642308,-0.362766,0.326417,-0.127185,0.560086,0.008301,-0.167051,0.128607,-0.328785,-0.472906,-0.119761,-0.407158,-0.008234,-0.409309,-0.115735,-0.142444,-0.316225,-0.195408,-0.070749,-0.120178,-0.283568,0.772469,1.407845,-0.417968,-0.461405,0.774104,-0.674400,0.190750,0.079196,-0.863219,0.056382,-0.193152,-0.068409,0.404576,0.331240,-0.187760,-0.219398,-0.287980,-0.118995,-0.273697,1.031432,-0.161566,0.380653,-0.042092,0.591003,0.112814,-0.018927,0.328426,-0.253038,-0.410474,0.124495,-0.357166,0.288898,-0.305017,0.148892,0.049708,-0.375880,-0.012000,0.282994,-0.454838,-0.348683,-0.404650,2.063262,0.108230,-0.565609,-0.058977,-0.841741,-0.377914,-0.685385,1.013044,-0.522470,-0.131865,-0.231259,-0.739860,-0.471850,-0.533057,0.028660,-0.318158,0.219775,-0.051004,-0.084548,-0.504798,0.016730,-0.146596,-0.346625,-0.301939,-0.200033,0.034869,0.008017,-0.366293,0.228242,-0.13741,-0.139778,-0.183291,0.400298,0.276428,-0.441057,0.0,-0.299986,-0.310823,0.0,-0.572967,0.0,0.075127,-0.391819,-0.1662,0.163353,-0.429493,-0.471640,0.464697,-0.407061,-0.311850,0.0,-0.355081,-0.311876,-0.07608,-0.444272,-0.141262,-0.220300,-0.130254,-0.340754,-0.074274,-0.094484,0.0,-0.357887,-0.223913,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,0.665103,-0.226083,-0.346099,-0.336559,-0.266554,0.222763,-0.082195,-0.068217,-0.399368,0.444724,-0.305286,-0.006984,-0.320220,-0.263850,-0.264181,-0.386580,-0.124576,-0.219946,-0.198382,-0.366026,-0.304237,-0.029144,0.231776,-0.218327,0.190255,-0.416060,0.380392,-0.183140,0.395486,-0.070943,-0.167051,0.128607,-0.328785,-0.472906,-0.119761,-0.407158,-0.165043,-0.409309,0.313155,-0.142444,-0.255083,19993967.0,21550111.0
8112,-0.251052,2.063411,-0.347562,-0.297787,1.754491,-0.559843,0.075662,-0.810212,0.071135,-0.335693,0.651923,0.518441,0.304884,-0.385087,0.091039,-0.440209,1.490997,1.069318,-0.370556,0.520229,-1.520371,-1.136159,-1.115024,1.435019,-0.354989,0.114121,-0.032218,2.237287,-0.546150,-0.370129,0.371811,-0.166323,-0.319211,0.200641,-0.262966,0.305501,-0.243185,0.131562,0.211549,-0.472103,-0.295613,0.908046,-0.621719,-0.295308,2.364734,-0.688095,-0.348096,-1.673412,-0.234706,-0.452665,-0.257453,-0.131318,1.173196,-0.029655,-0.258617,-0.590487,1.811216,1.213880,-0.632083,0.086899,-1.702161,-1.516880,-1.258048,0.769086,-0.678022,-0.719531,-0.146785,2.841916,-0.500123,-0.521326,-0.197119,-0.328785,-0.472906,-0.347924,-0.407158,-0.218998,-0.504991,-0.400714,-0.400259,-0.662059,-0.318753,1.483883,-0.474486,-0.333238,2.387304,-0.635621,-0.287372,-1.498730,-0.126919,-0.783972,0.207243,0.283135,0.761372,-0.206827,-0.153479,-0.615375,1.659138,1.161872,-0.677891,0.319773,-1.630281,-1.425816,-1.172933,1.216178,-0.651063,-0.536226,-0.063479,2.580331,-0.523563,-0.459633,0.081298,-0.253038,-0.410474,-0.075311,-0.357166,0.056216,-0.404434,-0.146076,-0.111060,-0.590056,-1.143197,2.971404,-0.454838,-1.280188,1.339346,-0.751286,-1.021705,-0.707924,-0.724052,-1.184833,-0.481362,-1.085882,1.136560,-0.522470,-0.274738,-0.231259,-1.794821,-1.944270,-1.672741,-1.955992,1.769069,-0.716654,-0.646092,-0.673471,-1.645585,-1.123835,-0.710926,-1.963454,-0.990920,-0.200033,-0.146334,0.008017,-0.366293,0.228242,-0.13741,-0.139778,-0.183291,0.400298,0.276428,-0.719324,0.0,-0.299986,-0.310823,0.0,-0.622196,0.0,-0.814318,-0.391819,-0.1662,-0.267616,-0.429493,-0.811896,-0.419848,-0.407061,-0.311850,0.0,-1.099322,-1.121714,-0.07608,-1.407184,0.796250,-0.419084,-0.243990,-0.504067,-0.074274,-0.404260,0.0,-1.201065,-0.276411,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.099777,0.0,0.665103,-0.294589,0.517683,-0.336559,-0.288668,2.683550,-0.491606,-0.068217,-0.491223,-0.395850,-0.465763,-0.145394,-0.432735,0.230909,-0.264181,-0.524135,-0.124576,-0.219946,-0.282657,-0.659436,-0.304237,-0.545284,-0.397458,-0.424705,-0.245233,-0.654174,-0.720212,-0.495859,-0.159080,-0.335487,-0.521326,-0.197119,-0.328785,-0.472906,-0.347924,-0.407158,-0.165043,-0.504991,0.313155,-0.400259,-0.554553,19995127.0,21801907.0


## Check for Multicollinearity

In [None]:
from statsmodels.stats.outliers_influence import variance_inflation_factor
from statsmodels.tools.tools import add_constant

In [None]:
%%time

labs_scaled_features = labs_scaled.loc[:, ('min', 50868) : ('above_max', 51484)]
add_constant(labs_scaled_features)

high_vif = pd.Series([variance_inflation_factor(labs_scaled_features.values, i) 
               for i in range(labs_scaled_features.shape[1])], 
              index=labs_scaled_features.columns).sort_values(ascending = False)

high_vif.head(20)


In [None]:
labs_scaled_features_limited = labs_scaled_features.copy()
labs_scaled_features_limited.drop([('above_max', 51484),
                                  ('above_max', 51478),
                                  ('max', 51237),
                                  ('mean', 51248)], axis = 1, inplace = True)


In [None]:
%%time

high_vif = pd.Series([variance_inflation_factor(labs_scaled_features_limited.values, i) 
               for i in range(labs_scaled_features_limited.shape[1])], 
              index=labs_scaled_features_limited.columns).sort_values(ascending = False)

high_vif.head(20)


## Save Lab Results for Models

In [1346]:
AKF_final_test = labs_scaled.merge(admissions_sample, how='left', left_on='hadm_id', right_on='hadm_id')
AKF_KNN_final_test = labs_scaled_KNN.merge(admissions_sample, how='left', left_on='hadm_id', right_on='hadm_id')




In [1347]:
# admissions_sample.to_pickle("admissions_sample.pkl")
# admissions_sample.to_pickle("admissions_sample.pkl")
AKF_final_test.to_csv('AKF_final_test.csv.gz', compression="gzip")
AKF_KNN_final_test.to_csv('AKF_KNN_final_test.csv.gz', compression="gzip")
