# Relevant Data Elements

In [1]:
import csv
import pandas

### MUHC Dataset

In [2]:
# Load the original MUHC export and preview its first row.
muhc = pandas.read_csv(
    '00 MUHC Original.csv',
    delimiter=',',
    encoding='latin-1',
)
muhc.head(1)

Unnamed: 0,incident_id,investigation_complete,event_type,incident_description,descriptor,coordinator_comments,investigation_narrative,acute_medical_harm,dosimetric_impact,latent_medical_harm,...,number_fractions_prescribed,number_fractions_incorrect,hardware_manufacturer_model,software_manufacturer_model,body_region_treated,treatment_intent,ameliorating_actions,safety_barriers_failed,safety_barriers_prevented,actions_reduce_risk
0,2511,True,Actual incident,Bolus was not prescribed by MD. Pt received 2 ...,Non prescribed bolus,,,,Minor,No,...,25.0,2.0,,,Thorax,,Other,Verification of treatment accessories,,


In [3]:
# Reduce the MUHC data to the relevant columns, renamed to the column names
# that this notebook also uses for the CIHI subset.
muhc_renames = {
    'incident_id': 'ID',
    'process_step_occurred': 'Process Step',
    'problem_type': 'Problem Type',
    'contributing_factors': 'Contributing Factors',
    'acute_medical_harm': 'Overall Severity',
}

# The incident description is the short descriptor followed by the full
# free-text description, joined by ' . '.
# In pandas, adding a string to a missing value gives a missing value, so a row
# lacking only one of the two parts would lose the part that is present.
# Fall back to whichever part exists; the result is missing only if both are.
descriptor = muhc['descriptor']
narrative = muhc['incident_description']
incident_description = (
    (descriptor + ' . ' + narrative)
    .fillna(narrative)
    .fillna(descriptor)
)

muhc_relevant = muhc[list(muhc_renames)].rename(columns=muhc_renames)
muhc_relevant['Incident Description'] = incident_description

# Fix the column order explicitly so the saved file has a stable layout.
muhc = muhc_relevant[['ID', 'Process Step', 'Problem Type', 'Contributing Factors', 'Overall Severity', 'Incident Description']]
muhc.head(1)

Unnamed: 0,ID,Process Step,Problem Type,Contributing Factors,Overall Severity,Incident Description
0,2511,Treatment delivery,Wrong treatment accessories,Loss of attention,,Non prescribed bolus . Bolus was not prescribe...


In [4]:
# Save the reduced MUHC dataset as '01 MUHC Relevant.csv'.
# Its columns are a renamed subset of the original MUHC columns.
# The row index is not written, and every non-numeric field is quoted.
muhc.to_csv(
    '01 MUHC Relevant.csv',
    index=False,
    encoding='latin-1',
    quoting=csv.QUOTE_NONNUMERIC,
)

### CIHI Dataset

In [5]:
# Load the original CIHI export and preview its first row.
cihi = pandas.read_csv(
    '00 CIHI Original.csv',
    delimiter=',',
    encoding='latin-1',
)
cihi.head(1)

Unnamed: 0,RT NSIR Case ID,Detected Date,Overall Severity,Process Step Where Incident Occurred,Process Step Where Incident Detected,Problem Type - Primary,Contributing Factor List,Incident Description,Frequency
0,100124165,8/10/2016,,Imaging for treatment planning,Treatment delivery,Other,Policies and/or procedures non-existent or ina...,Laser origin tattooed instead of isocentre. R...,1


In [6]:
# Reduce the CIHI data to the relevant columns, using the same column names
# as the MUHC subset. 'Overall Severity' and 'Incident Description' already
# carry the target names, so only the remaining four need renaming.
cihi_renames = {
    'RT NSIR Case ID': 'ID',
    'Process Step Where Incident Occurred': 'Process Step',
    'Problem Type - Primary': 'Problem Type',
    'Contributing Factor List': 'Contributing Factors',
}
cihi_columns = [
    'ID',
    'Process Step',
    'Problem Type',
    'Contributing Factors',
    'Overall Severity',
    'Incident Description',
]
cihi = cihi.rename(columns=cihi_renames)[cihi_columns]
cihi.head(1)

Unnamed: 0,ID,Process Step,Problem Type,Contributing Factors,Overall Severity,Incident Description
0,100124165,Imaging for treatment planning,Other,Policies and/or procedures non-existent or ina...,,Laser origin tattooed instead of isocentre. R...


In [7]:
# Save the reduced CIHI dataset as '01 CIHI Relevant.csv'.
# The row index is not written, and every non-numeric field is quoted.
cihi.to_csv(
    '01 CIHI Relevant.csv',
    index=False,
    encoding='latin-1',
    quoting=csv.QUOTE_NONNUMERIC,
)