In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import functools as ft # 

# Lift the column cap so wide frames are rendered without truncation.
pd.options.display.max_columns = None

In [2]:
# Read the four cleaned CSV files from the feature_engineering_data folder.
# The machine-specific root is spelled out once here, so relocating the
# project means editing a single line instead of four separate literals.
CLEAN_DATA_DIR = '/Users/danherman/Desktop/oud_treatment_outcome/data/clean_data'
FEATURE_DATA_DIR = f'{CLEAN_DATA_DIR}/feature_engineering_data'

# t1 == Medication Doses
t1 = pd.read_csv(f'{FEATURE_DATA_DIR}/medication.csv')

# t2 == Self Reported Drug Use
t2 = pd.read_csv(f'{FEATURE_DATA_DIR}/self_reported_use.csv')

# t3 == Urine Drug Screen
t3 = pd.read_csv(f'{FEATURE_DATA_DIR}/urine_drug_screen.csv')

# target == Treatment Outcome
target = pd.read_csv(f'{FEATURE_DATA_DIR}/target.csv')

In [3]:
# Fold the three feature tables and the target into one wide frame by merging
# them left to right on the shared `patdeid` key. pd.merge's default join is
# an inner join, so only ids present in every table are kept.

dfs = [t1, t2, t3, target]

t4 = dfs[0]
for right_df in dfs[1:]:
    t4 = pd.merge(t4, right_df, on='patdeid')

In [4]:
# (rows, columns) of the merged frame
t4.shape

(1305, 325)

# Feature Engineering
We must remove the last 4 weeks of opiate test results (`t_Opiate300_21` through `t_Opiate300_24`) to prevent data leakage into the model.

In [5]:
# Collect every column whose name contains one of the week 21-24 opiate test
# identifiers; these are the columns slated for removal.
leak_tags = ('t_Opiate300_21', 't_Opiate300_22', 't_Opiate300_23', 't_Opiate300_24')
opioid_cols = [col for col in t4.columns if any(tag in col for tag in leak_tags)]

In [6]:
# peek at the matched column names (at most the first five)
opioid_cols[:5]

['t_Opiate300_21', 't_Opiate300_22', 't_Opiate300_23', 't_Opiate300_24']

In [7]:
# remove the collected opiate test columns, rebinding t4 to the trimmed frame
t4 = t4.drop(columns=opioid_cols)

In [8]:
# the merge key has served its purpose; remove it from the frame
t4 = t4.drop(columns='patdeid')

In [9]:
# Count columns per dtype to confirm every remaining column is numeric
# (i.e. there are no object/string columns).
t4.dtypes.value_counts()

float64    318
int64        2
Name: count, dtype: int64

In [10]:
# list every column name to spot stray columns (e.g. 'Unnamed: 0_x')
t4.columns.tolist()

['medication',
 'total_dose_0',
 'total_dose_1',
 'total_dose_2',
 'total_dose_3',
 'total_dose_4',
 'total_dose_5',
 'total_dose_6',
 'total_dose_7',
 'total_dose_8',
 'total_dose_9',
 'total_dose_10',
 'total_dose_11',
 'total_dose_12',
 'total_dose_13',
 'total_dose_14',
 'total_dose_15',
 'total_dose_16',
 'total_dose_17',
 'total_dose_18',
 'total_dose_19',
 'total_dose_20',
 'total_dose_21',
 'total_dose_22',
 'total_dose_23',
 'total_dose_24',
 'Unnamed: 0_x',
 'sru_alcohol_0',
 'sru_cannabis_0',
 'sru_cocaine_0',
 'sru_amphetamine_0',
 'sru_methamphetamine_0',
 'sru_opiates_0',
 'sru_benzodiazepines_0',
 'sru_methadone_0',
 'sru_oxycodone_0',
 'sru_other_0',
 'sru_alcohol_4',
 'sru_cannabis_4',
 'sru_cocaine_4',
 'sru_amphetamine_4',
 'sru_methamphetamine_4',
 'sru_opiates_4',
 'sru_benzodiazepines_4',
 'sru_methadone_4',
 'sru_oxycodone_4',
 'sru_other_4',
 'sru_alcohol_8',
 'sru_cannabis_8',
 'sru_cocaine_8',
 'sru_amphetamine_8',
 'sru_methamphetamine_8',
 'sru_opiates_8',
 

In [11]:
# Remove the two 'Unnamed: 0' columns that received _x/_y suffixes in the merge
# (presumably index columns saved into the source CSVs).
stray_cols = ['Unnamed: 0_x', 'Unnamed: 0_y']
t4 = t4.drop(columns=stray_cols)

In [13]:
# total number of missing (NaN) cells across the whole frame
t4.isna().sum().sum()

39290

In [14]:
# Replace every remaining NaN with 0 so the table has no missing values.
# NOTE(review): after this step a missing measurement is indistinguishable
# from a recorded 0 — confirm that is the intended meaning for every column.
t4 = t4.fillna(0)

### Data is cleaned properly and ready for machine learning

In [15]:
# show the final dimensions, then the first rows of the cleaned frame
display(t4.shape, t4.head())


(1305, 318)

Unnamed: 0,medication,total_dose_0,total_dose_1,total_dose_2,total_dose_3,total_dose_4,total_dose_5,total_dose_6,total_dose_7,total_dose_8,total_dose_9,total_dose_10,total_dose_11,total_dose_12,total_dose_13,total_dose_14,total_dose_15,total_dose_16,total_dose_17,total_dose_18,total_dose_19,total_dose_20,total_dose_21,total_dose_22,total_dose_23,total_dose_24,sru_alcohol_0,sru_cannabis_0,sru_cocaine_0,sru_amphetamine_0,sru_methamphetamine_0,sru_opiates_0,sru_benzodiazepines_0,sru_methadone_0,sru_oxycodone_0,sru_other_0,sru_alcohol_4,sru_cannabis_4,sru_cocaine_4,sru_amphetamine_4,sru_methamphetamine_4,sru_opiates_4,sru_benzodiazepines_4,sru_methadone_4,sru_oxycodone_4,sru_other_4,sru_alcohol_8,sru_cannabis_8,sru_cocaine_8,sru_amphetamine_8,sru_methamphetamine_8,sru_opiates_8,sru_benzodiazepines_8,sru_methadone_8,sru_oxycodone_8,sru_other_8,sru_alcohol_12,sru_cannabis_12,sru_cocaine_12,sru_amphetamine_12,sru_methamphetamine_12,sru_opiates_12,sru_benzodiazepines_12,sru_methadone_12,sru_oxycodone_12,sru_other_12,sru_alcohol_16,sru_cannabis_16,sru_cocaine_16,sru_amphetamine_16,sru_methamphetamine_16,sru_opiates_16,sru_benzodiazepines_16,sru_methadone_16,sru_oxycodone_16,sru_other_16,sru_alcohol_20,sru_cannabis_20,sru_cocaine_20,sru_amphetamine_20,sru_methamphetamine_20,sru_opiates_20,sru_benzodiazepines_20,sru_methadone_20,sru_oxycodone_20,sru_other_20,sru_alcohol_24,sru_cannabis_24,sru_cocaine_24,sru_amphetamine_24,sru_methamphetamine_24,sru_opiates_24,sru_benzodiazepines_24,sru_methadone_24,sru_oxycodone_24,sru_other_24,t_Amphetamines_0,t_Benzodiazapines_0,t_Methadone_0,t_Oxycodone_0,t_Cocaine_0,t_Methamphetamine_0,t_Opiate300_0,t_Cannabinoids_0,t_Propoxyphene_0,t_Amphetamines_1,t_Benzodiazapines_1,t_Methadone_1,t_Oxycodone_1,t_Cocaine_1,t_Methamphetamine_1,t_Opiate300_1,t_Cannabinoids_1,t_Propoxyphene_1,t_Amphetamines_2,t_Benzodiazapines_2,t_Methadone_2,t_Oxycodone_2,t_Cocaine_2,t_Methamphetamine_2,t_Opiate300_2,t_Cannabinoids_2,t_Propoxyphene_2,t_Amphetamines_3,t_Ben
zodiazapines_3,t_Methadone_3,t_Oxycodone_3,t_Cocaine_3,t_Methamphetamine_3,t_Opiate300_3,t_Cannabinoids_3,t_Propoxyphene_3,t_Amphetamines_4,t_Benzodiazapines_4,t_Methadone_4,t_Oxycodone_4,t_Cocaine_4,t_Methamphetamine_4,t_Opiate300_4,t_Cannabinoids_4,t_Propoxyphene_4,t_Amphetamines_5,t_Benzodiazapines_5,t_Methadone_5,t_Oxycodone_5,t_Cocaine_5,t_Methamphetamine_5,t_Opiate300_5,t_Cannabinoids_5,t_Propoxyphene_5,t_Amphetamines_6,t_Benzodiazapines_6,t_Methadone_6,t_Oxycodone_6,t_Cocaine_6,t_Methamphetamine_6,t_Opiate300_6,t_Cannabinoids_6,t_Propoxyphene_6,t_Amphetamines_7,t_Benzodiazapines_7,t_Methadone_7,t_Oxycodone_7,t_Cocaine_7,t_Methamphetamine_7,t_Opiate300_7,t_Cannabinoids_7,t_Propoxyphene_7,t_Amphetamines_8,t_Benzodiazapines_8,t_Methadone_8,t_Oxycodone_8,t_Cocaine_8,t_Methamphetamine_8,t_Opiate300_8,t_Cannabinoids_8,t_Propoxyphene_8,t_Amphetamines_9,t_Benzodiazapines_9,t_Methadone_9,t_Oxycodone_9,t_Cocaine_9,t_Methamphetamine_9,t_Opiate300_9,t_Cannabinoids_9,t_Propoxyphene_9,t_Amphetamines_10,t_Benzodiazapines_10,t_Methadone_10,t_Oxycodone_10,t_Cocaine_10,t_Methamphetamine_10,t_Opiate300_10,t_Cannabinoids_10,t_Propoxyphene_10,t_Amphetamines_11,t_Benzodiazapines_11,t_Methadone_11,t_Oxycodone_11,t_Cocaine_11,t_Methamphetamine_11,t_Opiate300_11,t_Cannabinoids_11,t_Propoxyphene_11,t_Amphetamines_12,t_Benzodiazapines_12,t_Methadone_12,t_Oxycodone_12,t_Cocaine_12,t_Methamphetamine_12,t_Opiate300_12,t_Cannabinoids_12,t_Propoxyphene_12,t_Amphetamines_13,t_Benzodiazapines_13,t_Methadone_13,t_Oxycodone_13,t_Cocaine_13,t_Methamphetamine_13,t_Opiate300_13,t_Cannabinoids_13,t_Propoxyphene_13,t_Amphetamines_14,t_Benzodiazapines_14,t_Methadone_14,t_Oxycodone_14,t_Cocaine_14,t_Methamphetamine_14,t_Opiate300_14,t_Cannabinoids_14,t_Propoxyphene_14,t_Amphetamines_15,t_Benzodiazapines_15,t_Methadone_15,t_Oxycodone_15,t_Cocaine_15,t_Methamphetamine_15,t_Opiate300_15,t_Cannabinoids_15,t_Propoxyphene_15,t_Amphetamines_16,t_Benzodiazapines_16,t_Methadone_16,t_Oxycodone_16,t_Cocaine_16,t
_Methamphetamine_16,t_Opiate300_16,t_Cannabinoids_16,t_Propoxyphene_16,t_Amphetamines_17,t_Benzodiazapines_17,t_Methadone_17,t_Oxycodone_17,t_Cocaine_17,t_Methamphetamine_17,t_Opiate300_17,t_Cannabinoids_17,t_Propoxyphene_17,t_Amphetamines_18,t_Benzodiazapines_18,t_Methadone_18,t_Oxycodone_18,t_Cocaine_18,t_Methamphetamine_18,t_Opiate300_18,t_Cannabinoids_18,t_Propoxyphene_18,t_Amphetamines_19,t_Benzodiazapines_19,t_Methadone_19,t_Oxycodone_19,t_Cocaine_19,t_Methamphetamine_19,t_Opiate300_19,t_Cannabinoids_19,t_Propoxyphene_19,t_Amphetamines_20,t_Benzodiazapines_20,t_Methadone_20,t_Oxycodone_20,t_Cocaine_20,t_Methamphetamine_20,t_Opiate300_20,t_Cannabinoids_20,t_Propoxyphene_20,t_Amphetamines_21,t_Benzodiazapines_21,t_Methadone_21,t_Oxycodone_21,t_Cocaine_21,t_Methamphetamine_21,t_Cannabinoids_21,t_Propoxyphene_21,t_Amphetamines_22,t_Benzodiazapines_22,t_Methadone_22,t_Oxycodone_22,t_Cocaine_22,t_Methamphetamine_22,t_Cannabinoids_22,t_Propoxyphene_22,t_Amphetamines_23,t_Benzodiazapines_23,t_Methadone_23,t_Oxycodone_23,t_Cocaine_23,t_Methamphetamine_23,t_Cannabinoids_23,t_Propoxyphene_23,t_Amphetamines_24,t_Benzodiazapines_24,t_Methadone_24,t_Oxycodone_24,t_Cocaine_24,t_Methamphetamine_24,t_Cannabinoids_24,t_Propoxyphene_24,outcome
0,2.0,8.0,160.0,320.0,192.0,384.0,96.0,96.0,352.0,128.0,256.0,256.0,224.0,448.0,32.0,224.0,224.0,240.0,182.0,182.0,240.0,210.0,180.0,246.0,128.0,188.0,0.0,0.0,0.0,0.0,0.0,30.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
1,2.0,8.0,64.0,68.0,84.0,60.0,108.0,84.0,96.0,36.0,96.0,88.0,112.0,104.0,56.0,88.0,160.0,80.0,72.0,56.0,56.0,56.0,80.0,84.0,84.0,68.0,0.0,0.0,0.0,0.0,0.0,30.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,3.0,1.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0
2,1.0,30.0,170.0,350.0,420.0,420.0,540.0,310.0,455.0,455.0,480.0,600.0,455.0,560.0,800.0,600.0,360.0,640.0,700.0,700.0,800.0,600.0,765.0,630.0,510.0,715.0,0.0,0.0,23.0,0.0,0.0,30.0,0.0,0.0,0.0,0.0,18.0,0.0,9.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,2.0,0.0,1.0,0.0,0.0,28.0,0.0,0.0,0.0,0.0,3.0,0.0,3.0,0.0,0.0,28.0,0.0,0.0,0.0,0.0,4.0,0.0,8.0,0.0,0.0,28.0,1.0,0.0,0.0,0.0,4.0,0.0,5.0,0.0,1.0,26.0,0.0,0.0,0.0,0.0,4.0,0.0,4.0,0.0,0.0,28.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0
3,2.0,16.0,248.0,256.0,160.0,96.0,416.0,256.0,224.0,224.0,224.0,224.0,224.0,320.0,160.0,256.0,160.0,320.0,128.0,256.0,192.0,448.0,64.0,160.0,192.0,96.0,0.0,1.0,2.0,0.0,0.0,30.0,1.0,0.0,1.0,0.0,1.0,2.0,1.0,0.0,0.0,6.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,14.0,0.0,0.0,0.0,0.0,1.0,1.0,2.0,0.0,0.0,8.0,1.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0
4,2.0,16.0,16.0,16.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,25.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [16]:
# final column listing, for a last visual check before export
t4.columns.tolist()

['medication',
 'total_dose_0',
 'total_dose_1',
 'total_dose_2',
 'total_dose_3',
 'total_dose_4',
 'total_dose_5',
 'total_dose_6',
 'total_dose_7',
 'total_dose_8',
 'total_dose_9',
 'total_dose_10',
 'total_dose_11',
 'total_dose_12',
 'total_dose_13',
 'total_dose_14',
 'total_dose_15',
 'total_dose_16',
 'total_dose_17',
 'total_dose_18',
 'total_dose_19',
 'total_dose_20',
 'total_dose_21',
 'total_dose_22',
 'total_dose_23',
 'total_dose_24',
 'sru_alcohol_0',
 'sru_cannabis_0',
 'sru_cocaine_0',
 'sru_amphetamine_0',
 'sru_methamphetamine_0',
 'sru_opiates_0',
 'sru_benzodiazepines_0',
 'sru_methadone_0',
 'sru_oxycodone_0',
 'sru_other_0',
 'sru_alcohol_4',
 'sru_cannabis_4',
 'sru_cocaine_4',
 'sru_amphetamine_4',
 'sru_methamphetamine_4',
 'sru_opiates_4',
 'sru_benzodiazepines_4',
 'sru_methadone_4',
 'sru_oxycodone_4',
 'sru_other_4',
 'sru_alcohol_8',
 'sru_cannabis_8',
 'sru_cocaine_8',
 'sru_amphetamine_8',
 'sru_methamphetamine_8',
 'sru_opiates_8',
 'sru_benzodiazepi

In [17]:
# Write the model-ready table to disk; index=False leaves the row index out
# of the file.
final_csv_path = '/Users/danherman/Desktop/oud_treatment_outcome/data/clean_data/machine_learning_data/final.csv'

t4.to_csv(final_csv_path, index=False)