

References:
- [GeeksforGeeks - How to Check Column Type in SQLite](https://www.geeksforgeeks.org/how-to-check-column-type-in-sqlite/)

In [None]:
import sqlite3
# Open the SQLite database file (path is relative to the working directory)
# whose table schemas are inspected in the following cells.
conn = sqlite3.connect('sql_db/emergency_department_database.db')

In [None]:
# Tables whose column metadata is collected from the database.
table_names = ['diagnosis', 'edstays', 'medrecon', 'pyxis', 'triage', 'vitalsign']

# Maps each table name to the rows returned by `PRAGMA table_info` for it.
tables_data_types = {}

try:
    for table_name in table_names:
        # The table names come from the fixed list above, so interpolating
        # them into the statement does not expose it to untrusted input.
        tables_data_types[table_name] = conn.execute(f'PRAGMA table_info({table_name});').fetchall()
finally:
    # Release the connection even when one of the schema queries fails.
    conn.close()

In [15]:
# Show every column of the 'diagnosis' table together with its declared type.
diagnosis = tables_data_types['diagnosis']
print('DIAGNOSIS datatable:\n')
for column_info in diagnosis:
    # Index 1 is printed as the column name, index 2 as its type.
    column_name, column_type = column_info[1], column_info[2]
    print(f"Column: {column_name}, Type: {column_type}")

DIAGNOSIS datatable:

Column: subject_id, Type: INTEGER
Column: stay_id, Type: INTEGER
Column: seq_num, Type: INTEGER
Column: icd_code, Type: TEXT
Column: icd_version, Type: INTEGER
Column: icd_title, Type: TEXT


In [16]:
# Data dictionary text for the 'diagnosis' table, stored under a single key.
# The text is assembled line by line so its whitespace is explicit.
diagnosis = {
    "diagnosis_mapping": (
        "\n"
        "    Data Dictionary for the 'diagnosis' table in the MIMIC-IV-ED dataset\n"
        "    \n"
        "    Table Description:\n"
        "    This table provides coded diagnoses associated with each ED visit, based on the International Classification of Diseases (ICD) ontology.\n"
        "    \n"
        "    Columns:\n"
        "    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.\n"
        "    - stay_id: (INTEGER) A unique identifier for the ED visit.\n"
        "    - seq_num: (INTEGER) A pseudo-order representing the relevance of the diagnosis, with 1 being the most relevant.\n"
        "    - icd_code: (TEXT) The coded representation of the diagnosis using the ICD ontology.\n"
        "    - icd_version: (INTEGER) The version of the ICD ontology used (9 or 10).\n"
        "    - icd_title: (TEXT) The textual description of the ICD code.\n"
        "    "
    ),
}

In [4]:
# Show every column of the 'edstays' table together with its declared type.
edstays = tables_data_types['edstays']
print('EDSTAYS datatable:\n')
for column_info in edstays:
    # Index 1 is printed as the column name, index 2 as its type.
    column_name, column_type = column_info[1], column_info[2]
    print(f"Column: {column_name}, Type: {column_type}")

EDSTAYS datatable:

Column: subject_id, Type: INTEGER
Column: hadm_id, Type: REAL
Column: stay_id, Type: INTEGER
Column: intime, Type: TEXT
Column: outtime, Type: TEXT
Column: gender, Type: TEXT
Column: race, Type: TEXT
Column: arrival_transport, Type: TEXT
Column: disposition, Type: TEXT


In [5]:
# Data dictionary text for the 'edstays' table, stored under a single key.
# The text is assembled line by line so its whitespace is explicit.
edstays = {
    "edstays_mapping": (
        "\n"
        "    Data Dictionary for the 'edstays' table in the MIMIC-IV-ED dataset\n"
        "    \n"
        "    Table Description:\n"
        "    This table tracks patient stays in the emergency department (ED). Each row represents a unique ED visit.\n"
        "    \n"
        "    Columns:\n"
        "    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.\n"
        "    - hadm_id: (REAL) An identifier representing the hospital admission, if the patient was admitted after the ED visit.\n"
        "    - stay_id: (INTEGER) A unique identifier for the ED visit.\n"
        "    - intime: (TEXT) The date and time when the patient was admitted to the ED.\n"
        "    - outtime: (TEXT) The date and time when the patient was discharged from the ED.\n"
        "    - gender: (TEXT) The patient's gender.\n"
        "    - race: (TEXT) The patient's race.\n"
        "    - arrival_transport: (TEXT) The mode of transportation used by the patient to arrive at the ED (e.g., ambulance, walk-in).\n"
        "    - disposition: (TEXT) The discharge location or status of the patient after the ED visit (e.g., admitted, discharged home).\n"
        "    "
    ),
}

In [6]:
# Show every column of the 'medrecon' table together with its declared type.
# The rows are kept in their own `medrecon` name so the `edstays` data
# dictionary defined earlier is not overwritten.
medrecon = tables_data_types['medrecon']
print('MEDRECON datatable:\n')
for column_info in medrecon:
    # Index 1 is printed as the column name, index 2 as its type.
    print(f"Column: {column_info[1]}, Type: {column_info[2]}")

MEDRECON datatable:

Column: subject_id, Type: INTEGER
Column: stay_id, Type: INTEGER
Column: charttime, Type: TEXT
Column: name, Type: TEXT
Column: gsn, Type: INTEGER
Column: ndc, Type: INTEGER
Column: etc_rn, Type: INTEGER
Column: etccode, Type: REAL
Column: etcdescription, Type: TEXT


In [7]:
# Data dictionary text for the 'medrecon' table, stored under a single key.
# The type shown for each column mirrors the type reported by
# `PRAGMA table_info`, so `etccode` is listed as REAL.
medrecon = {
    "medrecon_mapping": """
    Data Dictionary for the 'medrecon' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table provides information about the medications the patient was taking prior to their ED visit (medication reconciliation).
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - charttime: (TEXT) The date and time when the medication reconciliation was documented.
    - name: (TEXT) The textual description of the medication.
    - gsn: (INTEGER) The Generic Sequence Number (GSN) for the medication, if available.
    - ndc: (INTEGER) The National Drug Code (NDC) for the medication, if available.
    - etc_rn: (INTEGER) A sequential number for grouping medications into classes based on an ontology.
    - etccode: (REAL) The coded representation of the medication class based on an ontology.
    - etcdescription: (TEXT) The textual description of the medication class based on an ontology.
    """
}

In [8]:
# Show every column of the 'pyxis' table together with its declared type.
pyxis = tables_data_types['pyxis']
print('PYXIS datatable:\n')
for column_info in pyxis:
    # Index 1 is printed as the column name, index 2 as its type.
    column_name, column_type = column_info[1], column_info[2]
    print(f"Column: {column_name}, Type: {column_type}")

PYXIS datatable:

Column: subject_id, Type: INTEGER
Column: stay_id, Type: INTEGER
Column: charttime, Type: TEXT
Column: med_rn, Type: INTEGER
Column: name, Type: TEXT
Column: gsn_rn, Type: INTEGER
Column: gsn, Type: REAL


In [9]:
# Data dictionary text for the 'pyxis' table, stored under a single key.
# The text is assembled line by line so its whitespace is explicit.
pyxis = {
    "pyxis_mapping": (
        "\n"
        "    Data Dictionary for the 'pyxis' table in the MIMIC-IV-ED dataset\n"
        "    \n"
        "    Table Description:\n"
        "    This table contains information about medications dispensed from the automated Pyxis MedStation system during the ED visit.\n"
        "    \n"
        "    Columns:\n"
        "    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.\n"
        "    - stay_id: (INTEGER) A unique identifier for the ED visit.\n"
        "    - charttime: (TEXT) The date and time when the medication was dispensed.\n"
        "    - med_rn: (INTEGER) A sequential number for delineating multiple medications dispensed at the same time.\n"
        "    - name: (TEXT) The textual description of the dispensed medication.\n"
        "    - gsn_rn: (INTEGER) A sequential number for delineating multiple GSN values associated with the same medication.\n"
        "    - gsn: (REAL) The Generic Sequence Number (GSN) for the medication, if available.\n"
        "    "
    ),
}

In [10]:
# Show every column of the 'triage' table together with its declared type.
triage = tables_data_types['triage']
print('TRIAGE datatable:\n')
for column_info in triage:
    # Index 1 is printed as the column name, index 2 as its type.
    column_name, column_type = column_info[1], column_info[2]
    print(f"Column: {column_name}, Type: {column_type}")

TRIAGE datatable:

Column: subject_id, Type: INTEGER
Column: stay_id, Type: INTEGER
Column: temperature, Type: REAL
Column: heartrate, Type: REAL
Column: resprate, Type: REAL
Column: o2sat, Type: REAL
Column: sbp, Type: REAL
Column: dbp, Type: REAL
Column: pain, Type: TEXT
Column: acuity, Type: REAL
Column: chiefcomplaint, Type: TEXT


In [11]:
# Data dictionary text for the 'triage' table, stored under a single key.
# The type shown for each column mirrors the type reported by
# `PRAGMA table_info`, so `acuity` is listed as REAL.
triage = {
    "triage_mapping": """
    Data Dictionary for the 'triage' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table contains information collected during the triage process, including vital signs, pain level, and the chief complaint reported by the patient.
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - temperature: (REAL) The patient's body temperature recorded at triage.
    - heartrate: (REAL) The patient's heart rate recorded at triage.
    - resprate: (REAL) The patient's respiratory rate recorded at triage.
    - o2sat: (REAL) The patient's oxygen saturation level recorded at triage.
    - sbp: (REAL) The patient's systolic blood pressure recorded at triage.
    - dbp: (REAL) The patient's diastolic blood pressure recorded at triage.
    - pain: (TEXT) The patient's reported pain level at triage.
    - acuity: (REAL) The level of severity assigned by the care provider based on the triage assessment.
    - chiefcomplaint: (TEXT) The patient's reported reason for presenting to the ED, often a comma-separated list of entries.
    """
}

In [12]:
# Show every column of the 'vitalsign' table together with its declared type.
vitalsign = tables_data_types['vitalsign']
print('VITALSIGN datatable:\n')
for column_info in vitalsign:
    # Index 1 is printed as the column name, index 2 as its type.
    column_name, column_type = column_info[1], column_info[2]
    print(f"Column: {column_name}, Type: {column_type}")

VITALSIGN datatable:

Column: subject_id, Type: INTEGER
Column: stay_id, Type: INTEGER
Column: charttime, Type: TEXT
Column: temperature, Type: REAL
Column: heartrate, Type: REAL
Column: resprate, Type: REAL
Column: o2sat, Type: REAL
Column: sbp, Type: REAL
Column: dbp, Type: REAL
Column: rhythm, Type: TEXT
Column: pain, Type: TEXT


In [13]:
# Data dictionary text for the 'vitalsign' table, stored under a single key.
# The text is assembled line by line so its whitespace is explicit.
vitalsign = {
    "vitalsign_mapping": (
        "\n"
        "    Data Dictionary for the 'vitalsign' table in the MIMIC-IV-ED dataset\n"
        "    \n"
        "    Table Description:\n"
        "    This table contains aperiodic vital sign measurements documented for patients during their ED stay.\n"
        "    \n"
        "    Columns:\n"
        "    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.\n"
        "    - stay_id: (INTEGER) A unique identifier for the ED visit.\n"
        "    - charttime: (TEXT) The date and time when the vital signs were recorded.\n"
        "    - temperature: (REAL) The patient's body temperature.\n"
        "    - heartrate: (REAL) The patient's heart rate.\n"
        "    - resprate: (REAL) The patient's respiratory rate.\n"
        "    - o2sat: (REAL) The patient's oxygen saturation level.\n"
        "    - sbp: (REAL) The patient's systolic blood pressure.\n"
        "    - dbp: (REAL) The patient's diastolic blood pressure.\n"
        "    - rhythm: (TEXT) The patient's heart rhythm.\n"
        "    - pain: (TEXT) The patient's reported pain level.\n"
        "    "
    ),
}

In [14]:
# NOTE(review): the connection is already closed right after the schema rows
# are collected, so this second close looks redundant — confirm and drop it.
conn.close()

In [28]:
# Combined data dictionary: one descriptive text per table, keyed by
# "<table>_mapping". The type shown for each column mirrors the type reported
# by `PRAGMA table_info` (so medrecon.etccode and triage.acuity are REAL).
data_dictionary = {
    "diagnosis_mapping": """
    Data Dictionary for the 'diagnosis' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table provides coded diagnoses associated with each ED visit, based on the International Classification of Diseases (ICD) ontology.
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - seq_num: (INTEGER) A pseudo-order representing the relevance of the diagnosis, with 1 being the most relevant.
    - icd_code: (TEXT) The coded representation of the diagnosis using the ICD ontology.
    - icd_version: (INTEGER) The version of the ICD ontology used (9 or 10).
    - icd_title: (TEXT) The textual description of the ICD code.
    """,
    "edstays_mapping":"""
    Data Dictionary for the 'edstays' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table tracks patient stays in the emergency department (ED). Each row represents a unique ED visit.
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - hadm_id: (REAL) An identifier representing the hospital admission, if the patient was admitted after the ED visit.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - intime: (TEXT) The date and time when the patient was admitted to the ED.
    - outtime: (TEXT) The date and time when the patient was discharged from the ED.
    - gender: (TEXT) The patient's gender.
    - race: (TEXT) The patient's race.
    - arrival_transport: (TEXT) The mode of transportation used by the patient to arrive at the ED (e.g., ambulance, walk-in).
    - disposition: (TEXT) The discharge location or status of the patient after the ED visit (e.g., admitted, discharged home).
    """,
    "medrecon_mapping":"""
    Data Dictionary for the 'medrecon' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table provides information about the medications the patient was taking prior to their ED visit (medication reconciliation).
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - charttime: (TEXT) The date and time when the medication reconciliation was documented.
    - name: (TEXT) The textual description of the medication.
    - gsn: (INTEGER) The Generic Sequence Number (GSN) for the medication, if available.
    - ndc: (INTEGER) The National Drug Code (NDC) for the medication, if available.
    - etc_rn: (INTEGER) A sequential number for grouping medications into classes based on an ontology.
    - etccode: (REAL) The coded representation of the medication class based on an ontology.
    - etcdescription: (TEXT) The textual description of the medication class based on an ontology.
    """,
    "pyxis_mapping": """
    Data Dictionary for the 'pyxis' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table contains information about medications dispensed from the automated Pyxis MedStation system during the ED visit.
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - charttime: (TEXT) The date and time when the medication was dispensed.
    - med_rn: (INTEGER) A sequential number for delineating multiple medications dispensed at the same time.
    - name: (TEXT) The textual description of the dispensed medication.
    - gsn_rn: (INTEGER) A sequential number for delineating multiple GSN values associated with the same medication.
    - gsn: (REAL) The Generic Sequence Number (GSN) for the medication, if available.
    """,
    "triage_mapping": """
    Data Dictionary for the 'triage' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table contains information collected during the triage process, including vital signs, pain level, and the chief complaint reported by the patient.
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - temperature: (REAL) The patient's body temperature recorded at triage.
    - heartrate: (REAL) The patient's heart rate recorded at triage.
    - resprate: (REAL) The patient's respiratory rate recorded at triage.
    - o2sat: (REAL) The patient's oxygen saturation level recorded at triage.
    - sbp: (REAL) The patient's systolic blood pressure recorded at triage.
    - dbp: (REAL) The patient's diastolic blood pressure recorded at triage.
    - pain: (TEXT) The patient's reported pain level at triage.
    - acuity: (REAL) The level of severity assigned by the care provider based on the triage assessment.
    - chiefcomplaint: (TEXT) The patient's reported reason for presenting to the ED, often a comma-separated list of entries.
    """,
    "vitalsign_mapping": """
    Data Dictionary for the 'vitalsign' table in the MIMIC-IV-ED dataset
    
    Table Description:
    This table contains aperiodic vital sign measurements documented for patients during their ED stay.
    
    Columns:
    - subject_id: (INTEGER) A unique identifier assigned to each individual patient.
    - stay_id: (INTEGER) A unique identifier for the ED visit.
    - charttime: (TEXT) The date and time when the vital signs were recorded.
    - temperature: (REAL) The patient's body temperature.
    - heartrate: (REAL) The patient's heart rate.
    - resprate: (REAL) The patient's respiratory rate.
    - o2sat: (REAL) The patient's oxygen saturation level.
    - sbp: (REAL) The patient's systolic blood pressure.
    - dbp: (REAL) The patient's diastolic blood pressure.
    - rhythm: (TEXT) The patient's heart rhythm.
    - pain: (TEXT) The patient's reported pain level.
    """
}