# Introduction

Exploration of structured data and labels

**Authors**
- Eric Carlson

In [1]:
# Timestamp suffix of the exported CSV snapshot to load; it is substituted into
# the data file names (e.g. combined_label_data_<timestamp>.csv) further down.
structured_collection_date = '2016-10-24-16-35'

In [2]:
from datetime import datetime
import configparser
import hashlib
from importlib import reload
import logging
import numpy as np
import os
import pandas as pd
import pathlib as pl
import sys
import yaml

from IPython import display

import etc_utils as eu
import mimic_extraction_utils as meu
import structured_data_utils as sdu

In [3]:
import sqlalchemy as sa
from sqlalchemy.engine import reflection
from sqlalchemy.ext.declarative import declarative_base
from sqlalchemy import create_engine, MetaData, inspect
from sqlalchemy.orm import sessionmaker
from sqlalchemy.ext.automap import automap_base, name_for_scalar_relationship, generate_relationship

In [4]:
# Re-import the local helper modules so that edits made to them on disk take
# effect without restarting the kernel.
reload(eu)
reload(meu)
reload(sdu)

<module 'structured_data_utils' from '/mnt/cbds_homes/ecarlson/Notebooks/mit_frequent_fliers/mit-team-code/software/notebooks/structured_data_utils.py'>

In [5]:
# Make the sibling ../icd9 directory importable, then load its ICD9 class.
# NOTE(review): the relative paths here depend on the notebook's working
# directory — confirm before running from another location.
sys.path.append('../icd9')
from icd9 import ICD9

# feel free to replace with your path to the json file
# `tree` is used further down to look up code descriptions via tree.find(...).
tree = ICD9('../icd9/codes.json')

## Configure pandas and matplotlib for nice web printing

In [6]:
# Raise the pandas display limits so that long/wide frames and long text
# cells are rendered in full in the notebook output.
pd.set_option('display.max_rows', 1000)
pd.set_option('display.max_columns', 50)
pd.set_option('display.max_colwidth', 100)

In [7]:
# Render matplotlib figures inline in the notebook output.
%matplotlib inline

## Load config files, configure logging

In [8]:
# Short label for this job; it is passed to eu.configure_logging below.
work_desc = "gather_structured_data"

In [9]:
# Load the run timestamp, the path settings and the credentials through the
# project's config helper, then echo the timestamp and paths for the record.
# `creds` is not printed here.
time_str, path_config, creds = eu.load_config_v2()
print('Time string: {}'.format(time_str))

print('Paths:')
for k, item in path_config.items():
    print('{}: {}'.format(k, item))

Time string: 2016-10-24-16-45
Paths:
repo_data_dir: ../../data
results_dir: /mnt/cbds_homes/ecarlson/results/mit_frequent_fliers
log_dir: /mnt/cbds_homes/ecarlson/logs/mit_frequent_fliers
input_dir: /mnt/cbds_homes/ecarlson/data/mit_frequent_fliers


In [10]:
# Fetch the root logger and hand it to the project's logging helper together
# with the job label, the configured log directory and the run timestamp.
logger = logging.getLogger()

eu.configure_logging(logger, work_desc=work_desc, log_directory=path_config['log_dir'], time_str=time_str)

Logging to /mnt/cbds_homes/ecarlson/logs/mit_frequent_fliers/2016-10-24-16-45_gather_structured_data.log


In [11]:
# Show which credential sections are available (names only, no values).
list(creds.keys())

['mimic2_v2_6', 'postgres', 'mimic3_v1_4']

# Connect to database

In [12]:
# Build the SQLAlchemy connection URL from the 'mimic3_v1_4' credentials.
# NOTE(review): username and password are interpolated verbatim — if either can
# contain URL-reserved characters (e.g. '@' or '/') it must be escaped; confirm.
db_path = '{sa_driver}://{username}:{password}@{hostname}/{dbname}'.format(**creds['mimic3_v1_4'])
engine = create_engine(db_path)
# Open a session on that engine and obtain its connection.
# NOTE(review): neither `s` nor `conn` is closed in the cells shown here.
sm = sessionmaker(bind=engine)
s = sm()
conn = s.connection()

# Reflect the table definitions of the "mimiciii" schema into `meta`.
meta = MetaData(schema="mimiciii", bind=engine)
meta.reflect(bind=engine)

In [13]:
# Generate mapped classes from the reflected metadata; they are reachable by
# table name through base.classes (used in the following cells).
base = automap_base(metadata=meta)
base.prepare(engine, reflect=True)

In [14]:
# List the names of the mapped classes in alphabetical order.
for cls_name in sorted(base.classes.keys()):
    print(cls_name)

admissions
callout
caregivers
chartevents
cptevents
d_cpt
d_icd_diagnoses
d_icd_procedures
d_items
d_labitems
datetimeevents
diagnoses_icd
drgcodes
icustays
inputevents_cv
inputevents_mv
labevents
microbiologyevents
noteevents
outputevents
patients
prescriptions
procedureevents_mv
procedures_icd
services
transfers


In [15]:
# Mapped class for the noteevents table.
note_tb = base.classes['noteevents']

In [16]:
# Number of rows returned when selecting the category column of noteevents.
s.query(note_tb.category).count()

2083180

# Load labeled notes

In [17]:
# Names of the per-note label columns; each one is used below to select the
# rows of the labelled data where that column equals 1.
categories = [
    'Advanced.Cancer',
    'Advanced.Heart.Disease',
    'Advanced.Lung.Disease',
    'Alcohol.Abuse',
    'Chronic.Neurological.Dystrophies',
    'Chronic.Pain.Fibromyalgia',
    'Dementia',
    'Depression',
    'Developmental.Delay.Retardation',
    'Non.Adherence',
    'None',
    'Obesity',
    'Other.Substance.Abuse',
    'Schizophrenia.and.other.Psychiatric.Disorders',
    'Unsure',
]

In [18]:
# Directory holding the exported CSV files, taken from the 'repo_data_dir' path setting.
data_path = pl.Path(path_config['repo_data_dir'])

In [19]:
# CSV files in the data directory whose name contains the chosen snapshot timestamp.
list(data_path.glob('*{}*csv'.format(structured_collection_date)))

[PosixPath('../../data/mimic3_note_metadata_2016-10-24-16-35.csv'),
 PosixPath('../../data/notes_icd9_codes_2016-10-24-16-35.csv'),
 PosixPath('../../data/combined_label_data_2016-10-24-16-35.csv')]

In [21]:
# Locations of the three CSV exports belonging to the chosen snapshot:
# annotator labels, note metadata, and ICD-9 codes per note.
labels_path = data_path / 'combined_label_data_{}.csv'.format(structured_collection_date)
note_meta_path = data_path / 'mimic3_note_metadata_{}.csv'.format(structured_collection_date)
note_icd9_path = data_path / 'notes_icd9_codes_{}.csv'.format(structured_collection_date)

In [22]:
# Load the three CSV exports into data frames.
#
# Identifier-like columns are read explicitly as strings instead of relying on
# type inference:
#   * `code`  - ICD-9 codes can carry leading zeros (e.g. "042") and ranges
#               (e.g. "390-459"), so they must never be parsed as numbers;
#   * `level` - compared against string literals ("source", "0", "1", ...) in
#               the queries below;
#   * `md5`   - the note hash used as a join key between the frames.
# With inference, pandas may produce mixed or numeric dtypes for such columns
# (see the `low_memory` note in the read_csv documentation), which would
# silently break those string comparisons and joins.
labels_df = pd.read_csv(labels_path.as_posix(), dtype={'md5': str})
note_meta_df = pd.read_csv(note_meta_path.as_posix(), dtype={'md5': str})
note_icd9_df = pd.read_csv(
    note_icd9_path.as_posix(),
    dtype={'code': str, 'level': str, 'md5': str},
)

In [23]:
# Preview the label table: note identifiers, the labelling operator and one 0/1 column per category.
labels_df.head()

Unnamed: 0,subject_id,category,md5,operator,Advanced.Cancer,Advanced.Heart.Disease,Advanced.Lung.Disease,Alcohol.Abuse,Chronic.Neurological.Dystrophies,Chronic.Pain.Fibromyalgia,Dementia,Depression,Developmental.Delay.Retardation,Non.Adherence,None,Obesity,Other.Substance.Abuse,Schizophrenia.and.other.Psychiatric.Disorders,Unsure,row_id_m3,total_m3_distance
0,9973,Discharge,56f2598342cce321539d8975809d487c,JTW,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,,
1,9973,Discharge,56f2598342cce321539d8975809d487c,ETM,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,,
2,3365,Discharge,eaea5c3c7577135a83f1f0fb583e0d53,JTW,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,17170.0,0.000884
3,3365,Discharge,eaea5c3c7577135a83f1f0fb583e0d53,ETM,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,17170.0,0.000884
4,27290,Discharge,e7433c0b75ea00346390f029bb830774,JW,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,50828.0,0.001554


In [24]:
# Preview the note metadata table.
note_meta_df.head()

Unnamed: 0,cgid,chartdate,charttime,hadm_id,md5,note_row_id,storetime,subject_id
0,17770.0,2154-06-03 00:00:00,2154-06-03 17:30:00,172993.0,be74552c73a0f9895c4f372763054d26,1414073.0,2154-06-03 17:51:00,11590
1,17698.0,2183-07-28 00:00:00,2183-07-28 05:41:00,116105.0,2bd0c96855c6107be79d0150e1f121e7,1449706.0,2183-07-28 05:53:00,14342
2,,2170-02-13 00:00:00,,122710.0,bd4bf8040238e3e2cdd7466692defe73,47105.0,,8217
3,18469.0,2175-06-07 00:00:00,2175-06-07 05:39:00,196691.0,6d20d9b6d3cfdc3fc9e8a72fbab0f697,1573953.0,2175-06-07 06:27:00,23829
4,17079.0,2125-04-27 00:00:00,2125-04-27 20:51:00,133059.0,d35003faa86241e60396014264b14a4d,1264491.0,2125-04-27 21:03:00,305


In [25]:
# Preview the ICD-9 table: one row per note, code and level ("source" or a numeric level).
note_icd9_df.head()

Unnamed: 0,code,level,md5,note_row_id,subject_id
0,41071,source,be74552c73a0f9895c4f372763054d26,1414073.0,11590
1,39891,source,be74552c73a0f9895c4f372763054d26,1414073.0,11590
2,390-459,0,be74552c73a0f9895c4f372763054d26,1414073.0,11590
3,393-398,1,be74552c73a0f9895c4f372763054d26,1414073.0,11590
4,398,2,be74552c73a0f9895c4f372763054d26,1414073.0,11590


In [179]:
# Look up the description of a single ICD-9 code.
tree.find('398.91').description

'Rheumatic heart failure (congestive)'

In [180]:
# Print where the same code sits in the ICD-9 hierarchy, using the project helper.
sdu.print_icd9_tree('398.91')

Parents:
- ROOT: ROOT
- 390-459: DISEASES OF THE CIRCULATORY SYSTEM 
- 393-398: CHRONIC RHEUMATIC HEART DISEASE 
- 398: Other rheumatic heart disease
- 398.9: Other and unspecified rheumatic heart diseases
- 398.91: Rheumatic heart failure (congestive)

-> 398.91: Rheumatic heart failure (congestive)

Children:


# Inspect data

In [27]:
# Size of the full ICD-9 table (all levels together).
note_icd9_df.shape

(89273, 5)

In [26]:
# Size of the subset holding only the rows at the "source" level.
note_icd9_df.query('level == "source"').shape

(21044, 5)

In [35]:
# Per-code count of non-null md5 values among the "source"-level rows,
# ordered from most to least frequent.
grouped = (
    note_icd9_df
    .query('level == "source"')
    .groupby('code')
    .count()
    .sort_values('md5', ascending=False)['md5']
)
# Show the five most frequent codes and the number of distinct codes.
display.display(grouped.head())
print(grouped.shape)

code
4280     690
4019     570
42731    499
5849     386
41401    347
Name: md5, dtype: int64

(1852,)


In [37]:
# Per-code count of non-null md5 values among the level "0" rows,
# ordered from most to least frequent.
grouped = (
    note_icd9_df
    .query('level == "0"')
    .groupby('code')
    .count()
    .sort_values('md5', ascending=False)['md5']
)
# Show the five most frequent codes and the number of distinct codes.
display.display(grouped.head())
print(grouped.shape)

code
390-459    4213
460-519    1825
240-279    1801
580-629    1349
520-579    1223
Name: md5, dtype: int64

(41,)


In [38]:
# Per-code count of non-null md5 values among the level "1" rows,
# ordered from most to least frequent.
grouped = (
    note_icd9_df
    .query('level == "1"')
    .groupby('code')
    .count()
    .sort_values('md5', ascending=False)['md5']
)
# Show the five most frequent codes and the number of distinct codes.
display.display(grouped.head())
print(grouped.shape)

code
420-429    2085
270-279    1320
510-519     937
580-589     833
996-999     699
Name: md5, dtype: int64

(181,)


In [39]:
# Per-code count of non-null md5 values among the level "2" rows,
# ordered from most to least frequent.
grouped = (
    note_icd9_df
    .query('level == "2"')
    .groupby('code')
    .count()
    .sort_values('md5', ascending=False)['md5']
)
# Show the five most frequent codes and the number of distinct codes.
display.display(grouped.head())
print(grouped.shape)

code
428    992
276    788
427    755
518    618
401    583
Name: md5, dtype: int64

(632,)


In [40]:
# Per-code count of non-null md5 values among the level "3" rows,
# ordered from most to least frequent.
grouped = (
    note_icd9_df
    .query('level == "3"')
    .groupby('code')
    .count()
    .sort_values('md5', ascending=False)['md5']
)
# Show the five most frequent codes and the number of distinct codes.
display.display(grouped.head())
print(grouped.shape)

code
428.0    690
401.9    570
427.3    546
518.8    505
414.0    408
Name: md5, dtype: int64

(1017,)


In [41]:
# Per-code count of non-null md5 values among the level "4" rows,
# ordered from most to least frequent.
grouped = (
    note_icd9_df
    .query('level == "4"')
    .groupby('code')
    .count()
    .sort_values('md5', ascending=False)['md5']
)
# Show the five most frequent codes and the number of distinct codes.
display.display(grouped.head())
print(grouped.shape)

Series([], Name: md5, dtype: int64)

(0,)


From the above, we see that there are no "level 4" codes.  As we move from level 0 to level 3 the codes become more specific, with a corresponding increase in the number of distinct codes and a decrease in the maximum frequency of occurrence.

# Assemble data for classification

## As a first pass, start with a single diagnosis level, combine with labels, inspect

In [43]:
# Keep only the rows at hierarchy level "1" and preview them.
icd9_1lev = note_icd9_df.query('level == "1"')
icd9_1lev.head()

Unnamed: 0,code,level,md5,note_row_id,subject_id
3,393-398,1,be74552c73a0f9895c4f372763054d26,1414073.0,11590
8,393-398,1,be74552c73a0f9895c4f372763054d26,1414073.0,11590
13,393-398,1,be74552c73a0f9895c4f372763054d26,1414073.0,11590
18,042,1,be74552c73a0f9895c4f372763054d26,1414073.0,11590
22,510-519,1,be74552c73a0f9895c4f372763054d26,1414073.0,11590


In [44]:
# Preview the label table again before combining it with the level-1 codes.
labels_df.head()

Unnamed: 0,subject_id,category,md5,operator,Advanced.Cancer,Advanced.Heart.Disease,Advanced.Lung.Disease,Alcohol.Abuse,Chronic.Neurological.Dystrophies,Chronic.Pain.Fibromyalgia,Dementia,Depression,Developmental.Delay.Retardation,Non.Adherence,None,Obesity,Other.Substance.Abuse,Schizophrenia.and.other.Psychiatric.Disorders,Unsure,row_id_m3,total_m3_distance
0,9973,Discharge,56f2598342cce321539d8975809d487c,JTW,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,,
1,9973,Discharge,56f2598342cce321539d8975809d487c,ETM,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,,
2,3365,Discharge,eaea5c3c7577135a83f1f0fb583e0d53,JTW,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,17170.0,0.000884
3,3365,Discharge,eaea5c3c7577135a83f1f0fb583e0d53,ETM,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,17170.0,0.000884
4,27290,Discharge,e7433c0b75ea00346390f029bb830774,JW,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,50828.0,0.001554


In [96]:
# Turn the level-1 rows into an indicator matrix with one row per
# (subject_id, md5) and one column per code.
# Step 1: one row per (subject_id, md5, code) holding the constant 1, so that
# repeated rows for the same note and code collapse into a single flag.  The
# value column is renamed from 'level' to 'code'.
tmp_df = (
    icd9_1lev
    .groupby(['subject_id', 'md5', 'code'])
    .agg({'level': lambda _rows: 1})
    .rename(columns={'level': 'code'})
)
# Step 2: move the innermost index level (the code) into the columns, filling
# absent combinations with 0.  The resulting columns are two-level,
# ('code', <icd9 code>); a later cell relies on these labels being tuples.
icd9_vec_df = tmp_df.unstack(fill_value=0)

In [97]:
# Preview the indicator matrix (rows: subject_id/md5, columns: level-1 codes).
icd9_vec_df.head()

Unnamed: 0_level_0,Unnamed: 1_level_0,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code,code
Unnamed: 0_level_1,code,001-009,030-041,042,047,050-059,062,070-079,110-118,120-129,130-136,137-139,140-149,150-159,160-165,170-176,179-189,190-199,210-229,235-238,239,240-246,249-259,260-269,270-279,290-299,...,V18,V26,V42,V43,V44,V45,V46,V49,V50,V53,V54,V55,V58,V59,V60,V62,V63,V64,V65,V66,V69,V70,V85,V87,V88
subject_id,md5,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2,Unnamed: 22_level_2,Unnamed: 23_level_2,Unnamed: 24_level_2,Unnamed: 25_level_2,Unnamed: 26_level_2,Unnamed: 27_level_2,Unnamed: 28_level_2,Unnamed: 29_level_2,Unnamed: 30_level_2,Unnamed: 31_level_2,Unnamed: 32_level_2,Unnamed: 33_level_2,Unnamed: 34_level_2,Unnamed: 35_level_2,Unnamed: 36_level_2,Unnamed: 37_level_2,Unnamed: 38_level_2,Unnamed: 39_level_2,Unnamed: 40_level_2,Unnamed: 41_level_2,Unnamed: 42_level_2,Unnamed: 43_level_2,Unnamed: 44_level_2,Unnamed: 45_level_2,Unnamed: 46_level_2,Unnamed: 47_level_2,Unnamed: 48_level_2,Unnamed: 49_level_2,Unnamed: 50_level_2,Unnamed: 51_level_2,Unnamed: 52_level_2
68,27572b36bd4c26c322f50cf65d095d16,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,...,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
109,27d1f5907fa14b6702837a845f84c54e,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0
109,3e0fff775cfb678fdfa06ece68ebfab5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
109,8efc0a2ff698b75ce183e3183c1bf204,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
109,f5f69772c32f1b0ac05b7cf408f7a6db,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [98]:
# Attach the ICD-9 indicator columns to every label row, matching on the
# (subject_id, md5) index.
#
# icd9_vec_df has two-level columns ('code', <icd9 code>) while the label frame
# has ordinary one-level columns.  Recent pandas versions refuse to join frames
# whose column indexes have a different number of levels, whereas older versions
# implicitly flattened the two-level labels to tuples.  Flatten them explicitly
# so the join works on both and the resulting labels stay tuples, which the
# feature-column selection further down relies on.
icd9_flat_df = icd9_vec_df.copy()
icd9_flat_df.columns = pd.Index(list(icd9_vec_df.columns), tupleize_cols=False)

# Left join: label rows without any matching code row get NaN in the code columns.
feat_vecs = labels_df.set_index(['subject_id', 'md5']).join(icd9_flat_df)



In [99]:
# Preview the combined frame: label columns followed by the ICD-9 indicator columns.
feat_vecs.head()

Unnamed: 0_level_0,Unnamed: 1_level_0,category,operator,Advanced.Cancer,Advanced.Heart.Disease,Advanced.Lung.Disease,Alcohol.Abuse,Chronic.Neurological.Dystrophies,Chronic.Pain.Fibromyalgia,Dementia,Depression,Developmental.Delay.Retardation,Non.Adherence,None,Obesity,Other.Substance.Abuse,Schizophrenia.and.other.Psychiatric.Disorders,Unsure,row_id_m3,total_m3_distance,"(code, 001-009)","(code, 030-041)","(code, 042)","(code, 047)","(code, 050-059)","(code, 062)",...,"(code, V18)","(code, V26)","(code, V42)","(code, V43)","(code, V44)","(code, V45)","(code, V46)","(code, V49)","(code, V50)","(code, V53)","(code, V54)","(code, V55)","(code, V58)","(code, V59)","(code, V60)","(code, V62)","(code, V63)","(code, V64)","(code, V65)","(code, V66)","(code, V69)","(code, V70)","(code, V85)","(code, V87)","(code, V88)"
subject_id,md5,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1
68,27572b36bd4c26c322f50cf65d095d16,Nursing/Other,JW,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1261174.0,0.0012,0.0,0.0,1.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
68,27572b36bd4c26c322f50cf65d095d16,Nursing/Other,JF,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1261174.0,0.0012,0.0,0.0,1.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
68,27572b36bd4c26c322f50cf65d095d16,Nursing/Other,JF,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1261174.0,0.0012,0.0,0.0,1.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
109,27d1f5907fa14b6702837a845f84c54e,Nursing/Other,JF,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1261605.0,0.111799,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
109,27d1f5907fa14b6702837a845f84c54e,Nursing/Other,JW,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,1261605.0,0.111799,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [113]:
# Select the columns whose label is a tuple; in the preview above these are the
# ('code', <icd9 code>) indicator columns, while the label columns have string names.
feature_cols = [c for c in feat_vecs.columns if isinstance(c, tuple)]

In [164]:
# For every feature column, pair the column label with the description that the
# ICD-9 tree returns for the second element of the label (the code itself).
code_lookup = [{'icd9':icd, 'descr': tree.find(icd[1]).description} for icd in feature_cols]

In [165]:
# Description lookup table indexed by the feature column label ('icd9').
code_lookup_df = pd.DataFrame(code_lookup).set_index('icd9')

Note: the "OR" computed below is not really an odds ratio. We divide by the mean over the whole labelled population rather than by the mean over the non-flagged population, because the latter would produce many divisions by zero.

In [175]:
# Mean of every ICD-9 indicator column over all label rows.
all_vecs = feat_vecs[feature_cols].mean()

# For each category: ratio of the indicator mean among rows flagged with that
# category to the overall mean, joined with the code descriptions and sorted
# from highest to lowest ratio.  The ratio is stored under the name 'OR'; the
# denominator is the overall mean rather than the mean of the unflagged rows.
likely_concepts = {}
for cat in categories:
    flagged_rows = feat_vecs[cat] == 1
    flagged_mean = feat_vecs.loc[flagged_rows, feature_cols].mean()
    ratio = (flagged_mean / all_vecs).rename('OR')
    described = code_lookup_df.join(ratio.to_frame())
    likely_concepts[cat] = described.sort_values('OR', ascending=False)

In [177]:
# For each of the first 15 categories, print its name and show the 20 codes
# with the highest ratio.
for cat in categories[:15]:
    print(cat)
    top_codes = likely_concepts[cat].head(20)
    display.display(top_codes)

Advanced.Cancer


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, 190-199)",MALIGNANT NEOPLASM OF OTHER AND UNSPECIFIED SITES,15.293118
"(code, 140-149)","MALIGNANT NEOPLASM OF LIP, ORAL CAVITY, AND PHARYNX",10.408451
"(code, E933)",Primarily systemic agents,9.050827
"(code, V87)",OTHER SPECIFIED PERSONAL EXPOSURES AND HISTORY PRESENTING HAZARDS TO HEALTH,8.673709
"(code, 150-159)",MALIGNANT NEOPLASM OF DIGESTIVE ORGANS AND PERITONEUM,8.673709
"(code, E936)",Anticonvulsants and anti-Parkinsonism drugs,7.806338
"(code, E870)","Accidental cut, puncture, perforation, or hemorrhage during medical care",6.505282
"(code, 795)","Other and nonspecific abnormal cytological, histological, immunological and DNA test findings",5.204225
"(code, E853)",Accidental poisoning by tranquilizers,4.336854
"(code, 781)",Symptoms involving nervous and musculoskeletal systems,4.336854


Advanced.Heart.Disease


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, E980)","Poisoning by solid or liquid substances, undetermined whether accidentally or purposely inflicted",11.334356
"(code, E941)",Drugs primarily affecting the autonomic nervous system,11.334356
"(code, 799.1)",Respiratory arrest,11.334356
"(code, E937)",Sedatives and hypnotics,11.334356
"(code, 958-959)",CERTAIN TRAUMATIC COMPLICATIONS AND UNSPECIFIED INJURIES,4.533742
"(code, 137-139)",LATE EFFECTS OF INFECTIOUS AND PARASITIC DISEASES,3.778119
"(code, V53)",Fitting and adjustment of other device,3.022495
"(code, E858)",Accidental poisoning by other drugs,2.833589
"(code, 791)",Nonspecific findings on examination of urine,2.833589
"(code, 393-398)",CHRONIC RHEUMATIC HEART DISEASE,2.198178


Advanced.Lung.Disease


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, E869)",Accidental poisoning by other gases and vapors,19.244792
"(code, 980-989)",TOXIC EFFECTS OF SUBSTANCES CHIEFLY NONMEDICINAL AS TO SOURCE,19.244792
"(code, 799.1)",Respiratory arrest,19.244792
"(code, 791)",Nonspecific findings on examination of urine,9.622396
"(code, V46)",Other dependence on machines and devices,7.765442
"(code, 958-959)",CERTAIN TRAUMATIC COMPLICATIONS AND UNSPECIFIED INJURIES,7.697917
"(code, 460-466)",ACUTE RESPIRATORY INFECTIONS,4.557977
"(code, V13)",Personal history of other diseases,4.373816
"(code, 730-739)","OSTEOPATHIES, CHONDROPATHIES, AND ACQUIRED MUSCULOSKELETAL DEFORMITIES",4.166398
"(code, V02)",Carrier or suspected carrier of infectious diseases,4.123884


Alcohol.Abuse


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, 840-848)",SPRAINS AND STRAINS OF JOINTS AND ADJACENT MUSCLES,13.943396
"(code, V65)",Other persons seeking consultation,13.943396
"(code, E901)",Excessive cold,13.943396
"(code, E960)","Fight, brawl, rape",13.943396
"(code, E967)",Perpetrator of child and adult abuse,13.943396
"(code, E980)","Poisoning by solid or liquid substances, undetermined whether accidentally or purposely inflicted",13.943396
"(code, V69)",Problems related to lifestyle,13.943396
"(code, V60)","Housing, household, and economic circumstances",12.842602
"(code, V62)",Other psychosocial circumstances,12.200472
"(code, V11)",Personal history of mental disorder,10.457547


Chronic.Neurological.Dystrophies


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, E936)",Anticonvulsants and anti-Parkinsonism drugs,6.040872
"(code, 617-629)",OTHER DISORDERS OF FEMALE GENITAL TRACT,5.828912
"(code, V88)",ACQUIRED ABSENCE OF OTHER ORGANS AND TISSUE,5.03406
"(code, 791)",Nonspecific findings on examination of urine,5.03406
"(code, 047)",Meningitis due to enterovirus,5.03406
"(code, E901)",Excessive cold,5.03406
"(code, E945)",Agents primarily acting on the smooth and skeletal muscles and respiratory system,5.03406
"(code, 958-959)",CERTAIN TRAUMATIC COMPLICATIONS AND UNSPECIFIED INJURIES,4.027248
"(code, E929)",LATE EFFECTS OF ACCIDENTAL INJURY,3.775545
"(code, V11)",Personal history of mental disorder,3.775545


Chronic.Pain.Fibromyalgia


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, V26)",Procreative management,12.316667
"(code, 338)",PAIN,6.632051
"(code, 614-616)",INFLAMMATORY DISEASE OF FEMALE PELVIC ORGANS,6.158333
"(code, E935)","Analgesics, antipyretics, and antirheumatics",5.278571
"(code, E929)",LATE EFFECTS OF ACCIDENTAL INJURY,4.61875
"(code, V13)",Personal history of other diseases,4.478788
"(code, 520-529)","DISEASES OF ORAL CAVITY, SALIVARY GLANDS, AND JAWS",4.105556
"(code, 796)",Other nonspecific abnormal findings,4.105556
"(code, 725-729)","RHEUMATISM, EXCLUDING THE BACK",3.766253
"(code, 905-909)","LATE EFFECTS OF INJURIES, POISONINGS, TOXIC EFFECTS, AND OTHER EXTERNAL CAUSES",3.649383


Dementia


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, 980-989)",TOXIC EFFECTS OF SUBSTANCES CHIEFLY NONMEDICINAL AS TO SOURCE,30.53719
"(code, E869)",Accidental poisoning by other gases and vapors,30.53719
"(code, V11)",Personal history of mental disorder,7.634298
"(code, 290-299)",PSYCHOSES,6.506504
"(code, 783)","Symptoms concerning nutrition, metabolism, and development",5.816608
"(code, V53)",Fitting and adjustment of other device,4.071625
"(code, 330-337)",HEREDITARY AND DEGENERATIVE DISEASES OF THE CENTRAL NERVOUS SYSTEM,4.035752
"(code, 860-869)","INTERNAL INJURY OF THORAX, ABDOMEN, AND PELVIS",3.940283
"(code, 380-389)",DISEASES OF THE EAR AND MASTOID PROCESS,3.393021
"(code, 617-629)",OTHER DISORDERS OF FEMALE GENITAL TRACT,3.214441


Depression


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, E953.8)",Other specified means,6.779817
"(code, E960)","Fight, brawl, rape",6.779817
"(code, V65)",Other persons seeking consultation,6.779817
"(code, E980)","Poisoning by solid or liquid substances, undetermined whether accidentally or purposely inflicted",6.779817
"(code, V69)",Problems related to lifestyle,6.779817
"(code, E967)",Perpetrator of child and adult abuse,6.779817
"(code, E931)",Other anti-infectives,5.932339
"(code, V62)",Other psychosocial circumstances,4.237385
"(code, 540-543)",APPENDICITIS,4.237385
"(code, V60)","Housing, household, and economic circumstances",3.925157


Developmental.Delay.Retardation


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, 317-319)",MENTAL RETARDATION,48.123728
"(code, 787)",Symptoms involving digestive system,8.238573
"(code, 327)",ORGANIC SLEEP DISORDERS,5.698863
"(code, 690-698)",OTHER INFLAMMATORY CONDITIONS OF SKIN AND SUBCUTANEOUS TISSUE,5.492382
"(code, 320-326)",INFLAMMATORY DISEASES OF THE CENTRAL NERVOUS SYSTEM,5.121275
"(code, E939)",Psychotropic agents,4.737179
"(code, 780)",General symptoms,3.694131
"(code, 393-398)",CHRONIC RHEUMATIC HEART DISEASE,3.445221
"(code, 240-246)",DISORDERS OF THYROID GLAND,3.069447
"(code, 555-558)",NONINFECTIOUS ENTERITIS AND COLITIS,3.056245


Non.Adherence


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, 047)",Meningitis due to enterovirus,19.447368
"(code, E980)","Poisoning by solid or liquid substances, undetermined whether accidentally or purposely inflicted",19.447368
"(code, E858)",Accidental poisoning by other drugs,9.723684
"(code, E967)",Perpetrator of child and adult abuse,9.723684
"(code, 614-616)",INFLAMMATORY DISEASE OF FEMALE PELVIC ORGANS,9.723684
"(code, E950.0)","Analgesics, antipyretics, and antirheumatics",9.723684
"(code, E901)",Excessive cold,9.723684
"(code, E960)","Fight, brawl, rape",7.778947
"(code, V62)",Other psychosocial circumstances,4.861842
"(code, 960-979)","POISONING BY DRUGS, MEDICINAL AND BIOLOGICAL SUBSTANCES",4.714514


None


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, 793)",Nonspecific abnormal findings on radiological and other examination of body structure,1.916494
"(code, V07)",Need for isolation and other prophylactic measures,1.916494
"(code, 900-904)",INJURY TO BLOOD VESSELS,1.916494
"(code, E957.1)",Other man-made structures,1.916494
"(code, E944)","Water, mineral, and uric acid metabolism drugs",1.916494
"(code, E940)",Central nervous system stimulants,1.916494
"(code, E938)",Other central nervous system depressants and anesthetics,1.916494
"(code, E950.2)",Other sedatives and hypnotics,1.916494
"(code, E950.3)",Tranquilizers and other psychotropic agents,1.916494
"(code, 239)",NEOPLASMS OF UNSPECIFIED NATURE,1.916494


Obesity


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, E950.0)","Analgesics, antipyretics, and antirheumatics",12.91958
"(code, V18)",Family history of certain other specific conditions,6.45979
"(code, E917)",Striking against or struck accidentally by objects or persons,5.167832
"(code, 327)",ORGANIC SLEEP DISORDERS,4.468426
"(code, E929)",LATE EFFECTS OF ACCIDENTAL INJURY,4.306527
"(code, 905-909)","LATE EFFECTS OF INJURIES, POISONINGS, TOXIC EFFECTS, AND OTHER EXTERNAL CAUSES",3.828024
"(code, V64)","Persons encountering health services for specific procedures, not carried out",3.691309
"(code, 130-136)",OTHER INFECTIOUS AND PARASITIC DISEASES,3.605464
"(code, 720-724)",DORSOPATHIES,3.412719
"(code, V17)",Family history of certain chronic disabling diseases,3.334085


Other.Substance.Abuse


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, 840-848)",SPRAINS AND STRAINS OF JOINTS AND ADJACENT MUSCLES,22.393939
"(code, E960)","Fight, brawl, rape",22.393939
"(code, V69)",Problems related to lifestyle,22.393939
"(code, E967)",Perpetrator of child and adult abuse,22.393939
"(code, E980)","Poisoning by solid or liquid substances, undetermined whether accidentally or purposely inflicted",22.393939
"(code, V60)","Housing, household, and economic circumstances",14.732855
"(code, E854)",Accidental poisoning by other psychotropic agents,13.436364
"(code, 062)",Mosquito-borne viral encephalitis,11.19697
"(code, E950.0)","Analgesics, antipyretics, and antirheumatics",11.19697
"(code, E850)","Accidental poisoning by analgesics, antipyretics, and antirheumatics",9.797348


Schizophrenia.and.other.Psychiatric.Disorders


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, V69)",Problems related to lifestyle,11.096096
"(code, E958.9)",Unspecified means,11.096096
"(code, E901)",Excessive cold,11.096096
"(code, V85)",BODY MASS INDEX,8.322072
"(code, E960)","Fight, brawl, rape",6.657658
"(code, V60)","Housing, household, and economic circumstances",6.424056
"(code, E853)",Accidental poisoning by tranquilizers,5.548048
"(code, 850-854)","INTRACRANIAL INJURY, EXCLUDING THOSE WITH SKULL FRACTURE",5.548048
"(code, V13)",Personal history of other diseases,5.04368
"(code, E939)",Psychotropic agents,4.993243


Unsure


Unnamed: 0_level_0,descr,OR
icd9,Unnamed: 1_level_1,Unnamed: 2_level_1
"(code, E937)",Sedatives and hypnotics,9.523196
"(code, E945)",Agents primarily acting on the smooth and skeletal muscles and respiratory system,4.761598
"(code, E936)",Anticonvulsants and anti-Parkinsonism drugs,4.761598
"(code, E858)",Accidental poisoning by other drugs,3.571198
"(code, 830-839)",DISLOCATION,3.174399
"(code, 137-139)",LATE EFFECTS OF INFECTIOUS AND PARASITIC DISEASES,3.174399
"(code, E939)",Psychotropic agents,2.856959
"(code, E934)",Agents primarily affecting blood constituents,2.555004
"(code, 617-629)",OTHER DISORDERS OF FEMALE GENITAL TRACT,2.506104
"(code, V16)",Family history of malignant neoplasm,2.380799
