In [None]:
import pandas as pd 
import numpy as np

# call the 00-load-raw-data notebook to bring the pecarn_tbi dataframe into the environment
# `%run` is an IPython magic, so this cell only works inside a Jupyter/IPython session.
# NOTE(review): the notebook path is relative - presumably it is resolved against the
# current working directory, so run this from the folder containing both notebooks; confirm.
%run 00-load-raw-data.ipynb

# progress marker printed once the raw-data notebook above has finished running
print("START: 01-data-labelling.ipynb")

# Data Labelling
The majority of the TBI data is encoded with numeric categories.

It is helpful to convert these numeric categories into descriptive string labels, both for use in visualisations and to make the data more human-readable.

This does mean that the final cleaned dataset will need to be converted back into numeric data in a later step; however, this is straightforward to do using scikit-learn tools.

In [None]:
# Shared label sets for the plain yes/no columns and for the yes/no columns
# that also carry a "not applicable" category.
pecarn_tbi_yesno = ['No', 'Yes']
pecarn_tbi_yesnona = ['No', 'Yes', 'NA']

# Human-readable labels for every categorical column of `pecarn_tbi`.
# Each list is applied positionally: its first label replaces the column's
# first existing category, its second label the second category, and so on,
# so a list must contain exactly as many labels as the column has categories.
pecarn_tbi_labels = {
    'Certification': ['Emergency Medicine', 'Pediatrics', 'Pediatrics Emergency Medicine',
                      'Emergency Medicine and Pediatrics', 'Other'],

    # injury type
    'High_impact_InjSev': ['Low', 'Moderate', 'High'],
    'InjuryMech': ['Occupant Vehicle', 'Pedestrian Vehicle', 'Bike Vehicle', 'Bike', 'Other Transport',
                   'Fall to Ground', 'Stationary Object', 'Fall Elevation', 'Fall Stairs', 'Sports',
                   'Assault', 'Object Struck Head', 'Other'],

    # amnesia and loss of consciousness
    'Amnesia_verb': ['No', 'Yes', 'Pre/Non Verbal'],
    'LOCSeparate': ['No', 'Yes', 'Suspected'],
    'LocLen': ['<5sec', '5sec-<1min', '1-5min', '>5min', 'NA'],

    # seizure
    'Seiz': pecarn_tbi_yesno,
    'SeizOccur': ['Immediate', 'Within 30min', 'After 30min', 'NA'],
    'SeizLen': ['<1min', '1-<5min', '5-15min', '>15min', 'NA'],

    'ActNorm': pecarn_tbi_yesno,

    # headache
    'HA_verb': ['No', 'Yes', 'Pre/Non Verbal'],
    'HASeverity': ['Mild', 'Moderate', 'Severe', 'NA'],
    'HAStart': ['Before', 'Within 1hr', '1-4hr', '>4hrs', 'NA'],

    # vomit
    'Vomit': pecarn_tbi_yesno,
    # 'Twice' previously carried a stray leading space (' Twice'), which would
    # have leaked into plots and any later filtering or encoding on the label.
    'VomitNbr': ['Once', 'Twice', '>2 times', 'NA'],
    'VomitStart': ['Before', 'Within 1hr', '1-4hr', '>4hrs', 'NA'],
    'VomitLast': ['<1hr', '1-4hrs', '>4hrs', 'NA'],

    # other
    'Dizzy': pecarn_tbi_yesno,
    'Intubated': pecarn_tbi_yesno,
    'Paralyzed': pecarn_tbi_yesno,
    'Sedated': pecarn_tbi_yesno,

    # altered mental state
    'AMS': pecarn_tbi_yesno,
    'AMSAgitated': pecarn_tbi_yesnona,
    'AMSSleep': pecarn_tbi_yesnona,
    'AMSSlow': pecarn_tbi_yesnona,
    'AMSRepeat': pecarn_tbi_yesnona,
    'AMSOth': pecarn_tbi_yesnona,

    # skull fractures
    'SFxPalp': ['No', 'Yes', 'Unclear'],
    'SFxPalpDepress': pecarn_tbi_yesnona,
    'FontBulg': pecarn_tbi_yesno,
    'SFxBas': pecarn_tbi_yesno,
    'SFxBasHem': pecarn_tbi_yesnona,
    'SFxBasOto': pecarn_tbi_yesnona,
    'SFxBasPer': pecarn_tbi_yesnona,
    'SFxBasRet': pecarn_tbi_yesnona,
    'SFxBasRhi': pecarn_tbi_yesnona,

    # hematoma
    'Hema': pecarn_tbi_yesno,
    'HemaLoc': ['Frontal', 'Occipital', 'Parietal/Temporal', 'NA'],
    'HemaSize': ['Small', 'Medium', 'Large', 'NA'],

    # Trauma above clavicle
    'Clav': pecarn_tbi_yesno,
    'ClavFace': pecarn_tbi_yesnona,
    'ClavNeck': pecarn_tbi_yesnona,
    'ClavFro': pecarn_tbi_yesnona,
    'ClavOcc': pecarn_tbi_yesnona,
    'ClavPar': pecarn_tbi_yesnona,
    'ClavTem': pecarn_tbi_yesnona,

    # Neurological Deficit
    'NeuroD': pecarn_tbi_yesno,
    'NeuroDMotor': pecarn_tbi_yesnona,
    'NeuroDSensory': pecarn_tbi_yesnona,
    'NeuroDCranial': pecarn_tbi_yesnona,
    'NeuroDReflex': pecarn_tbi_yesnona,
    'NeuroDOth': pecarn_tbi_yesnona,

    # Other Substantial Injury
    'OSI': pecarn_tbi_yesno,
    'OSIExtremity': pecarn_tbi_yesnona,
    'OSICut': pecarn_tbi_yesnona,
    'OSICspine': pecarn_tbi_yesnona,
    'OSIFlank': pecarn_tbi_yesnona,
    'OSIAbdomen': pecarn_tbi_yesnona,
    'OSIPelvis': pecarn_tbi_yesnona,
    'OSIOth': pecarn_tbi_yesnona,

    'Drugs': pecarn_tbi_yesno,

    # CT sedation
    'CTSed': pecarn_tbi_yesnona,
    'CTSedAgitate': pecarn_tbi_yesnona,
    'CTSedAge': pecarn_tbi_yesnona,
    'CTSedRqst': pecarn_tbi_yesnona,
    'CTSedOth': pecarn_tbi_yesnona,

    # demographics
    'Gender': ['Male', 'Female'],
    'Ethnicity': ['Hispanic', 'Non-Hispanic'],
    'Race': ['White', 'Black', 'Asian', 'Native', 'Pacific', 'Other'],

    # ED data
    'Observed': pecarn_tbi_yesno,
    'EDDisposition': ['Home', 'OR', 'Admit', 'Admit Short', 'ICU', 'Transfer', 'AMA',
                      'Death in ED', 'Other'],

    # CT scan data
    'CTDone': pecarn_tbi_yesno,
    'EDCT': pecarn_tbi_yesnona,

    # outcome variables
    'PosCT': pecarn_tbi_yesnona,
    'DeathTBI': pecarn_tbi_yesno,
    'HospHead': pecarn_tbi_yesno,
    'HospHeadPosCT': pecarn_tbi_yesno,
    'Intub24Head': pecarn_tbi_yesno,
    'Neurosurgery': pecarn_tbi_yesno,
    'PosIntFinal': pecarn_tbi_yesno,
}

# Relabel through the public `rename_categories` API and assign the result
# back to the column. Assigning to `.cat.categories` directly is deprecated and
# no longer supported by recent pandas releases, and it relied on mutating a
# Series pulled out of the frame, which is not guaranteed to update the frame.
for _col, _labels in pecarn_tbi_labels.items():
    try:
        _renamed = pecarn_tbi[_col].cat.rename_categories(_labels)
    except ValueError as err:
        # pandas reports a label-count mismatch without saying which column
        # was involved; add that context so the failing mapping is easy to find.
        raise ValueError(f"could not relabel column {_col!r}: {err}") from err
    pecarn_tbi[_col] = _renamed

# Drop the loop temporaries and the mapping so they do not linger in the
# notebook namespace; the two shared label lists are deliberately kept.
del pecarn_tbi_labels, _col, _labels, _renamed

In [None]:
# cleanup: remove the two shared label lists from the notebook namespace
del pecarn_tbi_yesno, pecarn_tbi_yesnona