# Drug Overdose Modeling

In [36]:
import numpy as np
import pandas as pd
import scipy as sp
import datetime
import matplotlib.pyplot as plt
import seaborn as sns
import statsmodels.api as sm
import patsy 
import math

pd.set_option('display.max_columns', 100)
%matplotlib inline

## Import the feature DataFrame

In [37]:
# Read the DF created from the feature_selection notebook
counties = pd.read_pickle('counties_df.pkl')

In [38]:
# Make the column names standardized for use in patsy formulas
counties.columns = [x.replace(' ', '_').replace('-', '_').replace('%', 'Percent').replace('.', '_').replace('(', '').replace(')', '').replace('<','lt') for x in list(counties.columns)]
# Patsy also doesn't like column names begining with a number
counties = counties.rename(columns={'20th_Percentile_Income': 'Percentile_Income_20th', '80th_Percentile_Income': 'Percentile_Income_80th'})

## Train a model on the appropriate features

In [39]:
counties

Unnamed: 0_level_0,State,County,Age_Adjusted_Mortality,Age_Adjusted_Mortality_Black,Age_Adjusted_Mortality_Hispanic,Age_Adjusted_Mortality_White,Child_Mortality_Rate,Child_Mortality_Rate_Black,Child_Mortality_Rate_White,Infant_Mortality_Rate,Percent_Frequent_Physical_Distress,Percent_Frequent_Mental_Distress,Percent_Diabetic,HIV_Prevalence_Rate,Percent_Food_Insecure,Percent_Limited_Access,Drug_Overdose_Mortality_Rate,MV_Mortality_Rate,Percent_Insufficient_Sleep,Percent_Uninsured,Percent_Uninsured_1,Costs,Other_PCP_Rate,Percent_Disconnected_Youth,Household_Income,Household_income_Black,Household_income_Hispanic,Household_income_White,Percent_Free_or_Reduced_Lunch,Segregation_index,Segregation_Index,Homicide_Rate,Firearm_Fatalities_Rate,Population,Percent_lt_18,Percent_65_and_over,Percent_African_American,Percent_American_Indian/Alaskan_Native,Percent_Asian,Percent_Native_Hawaiian/Other_Pacific_Islander,Percent_Hispanic,Percent_Non_Hispanic_White,Percent_Not_Proficient_in_English,Percent_Female,Percent_Rural,State_ranked,County_ranked,Years_of_Potential_Life_Lost_Rate,Years_of_Potential_Life_Lost_Rate_Black,Years_of_Potential_Life_Lost_Rate_Hispanic,...,Percent_LBW_Hispanic,Percent_LBW_White,Percent_Smokers,Percent_Obese,Food_Environment_Index,Percent_Physically_Inactive,Percent_With_Access,Percent_Excessive_Drinking,Percent_Alcohol_Impaired,Chlamydia_Rate,Teen_Birth_Rate,Teen_Birth_Rate_Black,Teen_Birth_Rate_Hispanic,Teen_Birth_Rate_White,Percent_Uninsured_ranked,PCP_Rate,Dentist_Rate,MHP_Rate,Preventable_Hosp__Rate,Percent_Receiving_HbA1c,Percent_Receiving_HbA1c_Black,Percent_Receiving_HbA1c_White,Percent_Mammography,Percent_Mammography_Black,Percent_Mammography_White,Cohort_Size,Graduation_Rate,Population_ranked,Percent_Some_College,Percent_Unemployed,Percent_Children_in_Poverty,Percent_Children_in_Poverty_Black,Percent_Children_in_Poverty_Hispanic,Percent_Children_in_Poverty_White,Percentile_Income_80th,Percentile_Income_20th,Income_Ratio,Percent_Single_Parent_Households,Association_Rate,Violent_Crime_Rate,Injury_Death_Rate,Average_Daily_PM2_5,Presence_of_violation,Percent_Severe_Housing_Problems,Percent_Drive_Alone,Percent_Drive_Alone_Black,Percent_Drive_Alone_Hispanic,Percent_Drive_Alone_White,Percent_Long_Commute___Drives_Alone,Urban
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1
1001,Alabama,Autauga,449.6,531.700000,292.315327,444.900000,56.186903,95.921022,48.240956,7.718502,12.824434,12.638357,12.4,225.500000,13.9,11.991125,10.231226,20.167754,35.905406,12.193092,2.595313,10674.34,28.87253,14.570000,54487.0,32173.000000,72411.000000,58556.000000,48.475388,26.347048,24.000912,3.619853,16.972533,55416,24.408113,14.728598,19.048650,0.485419,1.140465,0.101054,2.688754,75.000000,0.832739,51.288437,42.002162,Alabama,Autauga,9409.294766,11806.223285,5968.227286,...,7.260143,7.415319,19.124658,36.4,7.1,30.9,71.120192,16.878015,26.785714,341.2,27.996758,31.533043,38.461538,27.153838,9.387712,45.16957,32.48159,12.63173,81.85,83.966245,74.107143,85.809683,62.693157,58.333333,63.209877,706.0,90.000000,14315,61.942019,5.271161,19.3,28.072153,16.699411,14.400244,101520.0,23134.0,4.388346,24.471409,13.912226,265.699747,72.584664,10.8,0.0,15.217927,86.750062,82.494851,83.676458,82.539683,40.8,True
1003,Alabama,Baldwin,351.3,517.800000,111.100000,349.300000,47.688777,87.008289,44.472180,5.545407,12.622002,12.822558,11.1,163.900000,13.0,5.424427,18.452504,15.281185,33.305868,14.719861,3.273439,9537.12,43.63190,15.410000,56460.0,26818.000000,41908.000000,54184.000000,45.795480,43.969941,30.674915,2.705282,14.718943,208563,21.734440,19.708194,9.042831,0.770990,1.074975,0.059454,4.416411,83.202198,0.818809,51.457833,42.279099,Alabama,Baldwin,7467.596664,10335.702691,2827.348216,...,4.672131,8.019411,16.795485,29.3,7.9,24.5,68.518915,16.714969,30.379747,338.8,31.965138,38.553804,57.609217,29.475711,11.524397,72.65266,49.38556,89.18169,46.30,83.212237,82.432432,83.259019,65.965233,65.753425,65.972551,2236.0,85.000000,47361,63.757100,5.415263,17.6,41.332247,10.290898,15.098892,102624.0,22306.0,4.600735,25.811441,11.045167,216.773078,71.492010,9.6,0.0,14.310156,84.646043,85.567010,68.864800,84.646255,40.1,True
1007,Alabama,Bibb,529.1,630.400000,379.530215,526.600000,116.315956,159.427910,102.321969,14.775414,13.162968,12.854036,14.6,191.900000,16.1,2.601627,22.146105,27.125572,38.148865,15.070569,3.141252,10755.78,75.07839,25.130000,43079.0,28256.000000,45909.000000,42020.000000,61.318483,43.487328,42.168010,8.200754,21.268865,22643,20.752550,15.430817,21.618160,0.379808,0.198737,0.119242,2.499669,74.415934,0.448137,46.363114,68.352607,Alabama,Bibb,11741.938889,11297.166352,8455.256165,...,7.695099,9.215263,19.916404,38.4,7.6,37.5,48.592625,15.925151,27.586207,302.1,47.260274,35.416667,58.653674,51.005101,11.855881,53.13732,22.08188,8.83275,92.87,81.981982,73.469388,83.450704,61.306533,45.161290,64.285714,262.0,85.000000,6158,49.821371,6.637117,27.5,47.923681,30.199112,20.249307,79882.0,18893.0,4.228127,31.427964,10.627463,147.290900,95.709893,10.5,0.0,12.358757,85.072464,82.516757,67.704607,79.254609,48.8,False
1009,Alabama,Blount,480.2,557.111669,264.584515,426.990614,55.375074,123.473245,47.882557,5.294367,13.720057,13.827943,14.4,95.400000,11.3,2.880150,21.375422,22.536300,35.945010,17.699115,4.489532,10326.33,12.13087,15.350000,47213.0,37647.000000,34375.000000,48045.000000,54.520167,39.938703,24.226299,6.191291,19.044717,57704,23.190767,17.986621,1.434909,0.627340,0.265146,0.112644,9.068695,87.467073,1.878506,50.613476,89.951502,Alabama,Blount,9359.122343,11192.898535,5133.144570,...,7.079646,7.745780,19.652158,35.8,8.5,29.0,32.272077,15.378722,20.000000,114.3,39.624778,46.875000,37.237644,40.335654,13.963659,20.80696,19.06280,8.66491,57.82,87.659574,84.296780,86.661374,59.584296,65.935647,65.331969,720.0,91.206250,14018,53.866457,5.520897,19.4,15.068493,57.107356,20.936920,83944.0,20634.0,4.068237,27.294239,8.842959,211.598836,104.572810,11.3,0.0,11.058037,86.107728,83.107590,79.539642,81.580997,60.2,False
1015,Alabama,Calhoun,564.3,627.700000,288.500000,566.300000,77.289582,130.528256,61.332671,8.759748,13.020953,13.806568,16.3,211.200000,17.4,9.178567,15.600309,17.022882,41.314344,14.514503,2.891841,10901.19,50.60596,19.070000,41778.0,26523.000000,31331.000000,47514.000000,58.868341,46.984796,41.778342,9.185008,22.234517,114611,21.830365,16.880579,20.734484,0.520020,0.919632,0.098594,3.577318,72.623919,0.709622,51.891180,33.696826,Alabama,Calhoun,11527.781204,13353.368133,5819.327989,...,5.152672,7.486210,20.462232,36.1,6.8,32.5,48.217117,15.431677,22.857143,587.5,39.711728,44.082354,39.513678,38.125317,11.396868,64.86767,60.20365,94.23179,72.80,81.270096,78.787879,81.787275,56.895446,59.793814,56.483516,1316.0,92.163374,28798,56.743524,6.697384,25.7,59.831267,29.846583,17.536471,82414.0,16952.0,4.861609,38.380573,14.011417,574.323556,74.115058,11.6,0.0,15.292172,84.985916,85.871991,83.291457,87.574201,29.4,True
1019,Alabama,Cherokee,546.0,922.900000,345.082993,533.000000,75.307062,157.686979,106.401193,11.202051,13.009557,13.643444,12.9,90.100000,13.9,0.221112,15.459734,32.986789,35.355071,14.645020,3.130789,11470.43,46.64723,25.163920,41456.0,33934.000000,35911.813661,39764.000000,63.186541,25.589739,19.715164,7.696917,21.564173,25725,19.825073,22.017493,4.291545,0.629738,0.256560,0.031098,1.605442,91.692906,0.060901,50.363460,85.736273,Alabama,Cherokee,11683.171114,15481.101545,9409.319587,...,8.465103,8.349515,19.144853,35.5,8.2,35.9,36.030628,15.232731,18.181818,169.0,45.303652,40.576455,65.726508,38.960083,11.682127,38.67126,15.54908,19.43635,76.63,88.628159,73.913043,89.265537,63.366337,61.390463,61.611978,280.0,88.000000,5516,55.565627,5.213652,27.5,37.931034,37.726231,21.099912,79412.0,17112.0,4.640720,32.235966,10.054526,383.600749,112.441757,10.8,0.0,15.778252,84.596061,75.903008,74.257848,81.779403,45.9,False
1021,Alabama,Chilton,516.3,615.200000,256.348989,522.100000,56.483879,105.666951,61.207661,6.894791,14.445380,14.260704,14.1,99.500000,13.5,1.460531,12.138224,22.140966,35.174569,19.470843,4.762770,10515.38,9.10312,19.580000,44188.0,27375.000000,28081.000000,45494.000000,61.087434,36.022367,30.416380,6.512049,15.939158,43941,24.039052,16.055620,9.929223,0.514326,0.475638,0.175235,7.603377,80.560297,2.446886,50.831797,86.744724,Alabama,Chilton,11099.683529,16051.458138,5249.976050,...,6.290672,8.253752,19.673275,36.0,8.2,29.8,46.044039,15.064313,20.253165,307.3,51.259961,41.629761,65.128901,51.742919,15.232994,18.20540,25.03357,38.68824,65.11,89.059081,88.888889,89.073634,64.000000,60.869565,64.259928,517.0,86.000000,11708,39.118551,5.617919,26.3,49.869452,56.843680,25.272703,84217.0,17180.0,4.902037,32.023821,16.612430,345.839685,90.625498,10.5,0.0,14.527027,82.865233,86.703601,79.046534,82.431522,47.6,False
1029,Alabama,Cleburne,591.9,626.433594,572.569693,498.369462,101.463752,160.595988,96.987752,15.119347,13.279598,13.661562,12.7,111.300000,13.5,2.071716,22.211363,25.799054,33.504785,15.475092,3.725327,11134.31,20.10185,26.267392,43483.0,41124.331337,18992.000000,38288.000000,57.772710,49.889622,36.826565,10.333679,22.712698,14924,23.090324,18.815331,3.088984,0.435540,0.180917,0.080407,2.452426,92.749933,0.816761,50.274725,100.000000,Alabama,Cleburne,11380.483302,12205.306120,11640.656213,...,10.710847,9.478716,19.710512,34.6,8.1,32.2,45.858937,15.970047,25.000000,252.0,44.540674,75.294594,89.515596,42.552257,12.120460,26.63471,6.70062,40.20370,67.61,82.972136,94.444444,82.295082,49.450549,55.140029,59.263472,201.0,98.000000,3563,46.674151,6.088150,24.5,33.434369,89.928058,24.128686,73032.0,15020.0,4.862317,22.142240,9.988014,149.925037,97.530996,10.3,0.0,13.386525,82.134529,81.470694,74.915551,76.930587,50.4,False
1031,Alabama,Coffee,409.2,559.800000,226.303544,391.500000,55.752870,113.601157,37.279816,6.991479,13.593147,13.445273,15.5,143.300000,15.1,5.981203,7.825441,16.853459,37.304732,15.281598,3.629893,9855.89,56.61188,16.890000,48632.0,28352.000000,40648.000000,53528.000000,46.965995,35.490598,26.341150,2.808910,14.870703,51226,23.745754,16.415492,17.227580,1.405536,1.526569,0.421661,6.969117,70.653574,1.497188,50.573927,47.195083,Alabama,Coffee,7295.411499,10559.281482,13654.156601,...,8.239700,6.369210,18.201221,34.2,7.5,29.8,44.630416,15.528420,31.914894,467.5,30.630003,37.379719,72.538860,25.298204,11.933247,56.62846,33.18627,54.65974,52.76,88.153998,89.940828,87.796209,63.099042,66.666667,62.523191,752.0,96.229388,13294,61.433730,6.053328,21.3,39.420423,36.694915,19.212395,98372.0,19622.0,5.013352,38.324789,16.012185,321.157993,62.222153,9.6,0.0,14.016243,85.725330,80.437873,84.768212,85.531749,23.3,True
1033,Alabama,Colbert,504.3,591.300000,248.537984,499.700000,78.919864,112.318201,57.839474,9.363745,13.113404,13.365516,17.4,93.300000,16.6,6.551705,8.583007,19.946512,36.950783,13.356842,3.055692,10879.20,121.73528,17.810000,46572.0,31813.000000,38750.000000,46991.000000,49.747878,26.561564,21.412017,3.674357,15.436693,54216,21.196695,19.215730,15.906743,0.649255,0.558876,0.051645,2.473440,78.784861,0.202753,51.752250,43.894687,Alabama,Colbert,10566.513329,11719.391858,5283.836689,...,7.692308,9.554326,18.371146,34.6,7.2,30.9,64.503564,15.822773,8.695652,473.0,38.705198,34.815436,31.948882,40.571692,10.602745,62.55289,42.42290,25.82264,74.59,87.413074,89.552239,86.923077,68.104575,78.571429,66.566717,627.0,88.850877,13031,54.063387,7.010588,25.1,34.537493,7.664234,20.964923,85487.0,17063.0,5.010080,35.244289,18.213931,449.589200,67.994957,10.2,0.0,15.708556,89.532088,89.024390,74.484314,91.570722,26.1,True


In [40]:
formula = "Drug_Overdose_Mortality_Rate ~ 1 + Percent_Unemployed + Household_Income + Graduation_Rate + Percent_Rural + HIV_Prevalence_Rate + Percent_Frequent_Mental_Distress + Percent_Excessive_Drinking"
y, X = patsy.dmatrices(formula, counties, return_type='matrix') 
model = sm.OLS(y, X)

In [41]:
results = model.fit()

In [42]:
results.summary()

0,1,2,3
Dep. Variable:,Drug_Overdose_Mortality_Rate,R-squared:,0.169
Model:,OLS,Adj. R-squared:,0.166
Method:,Least Squares,F-statistic:,47.91
Date:,"Wed, 12 Dec 2018",Prob (F-statistic):,3.67e-62
Time:,00:21:14,Log-Likelihood:,-6081.7
No. Observations:,1655,AIC:,12180.0
Df Residuals:,1647,BIC:,12220.0
Df Model:,7,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5,6
,coef,std err,t,P>|t|,[0.025,0.975]
Intercept,-19.2633,6.156,-3.129,0.002,-31.337,-7.189
Percent_Unemployed,0.8768,0.174,5.036,0.000,0.535,1.218
Household_Income,0.0001,2.9e-05,3.467,0.001,4.37e-05,0.000
Graduation_Rate,0.0669,0.035,1.924,0.055,-0.001,0.135
Percent_Rural,0.0172,0.011,1.597,0.110,-0.004,0.038
HIV_Prevalence_Rate,-0.0027,0.001,-2.109,0.035,-0.005,-0.000
Percent_Frequent_Mental_Distress,2.2124,0.274,8.084,0.000,1.676,2.749
Percent_Excessive_Drinking,-0.2322,0.099,-2.347,0.019,-0.426,-0.038

0,1,2,3
Omnibus:,535.045,Durbin-Watson:,1.631
Prob(Omnibus):,0.0,Jarque-Bera (JB):,2169.778
Skew:,1.518,Prob(JB):,0.0
Kurtosis:,7.717,Cond. No.,1420000.0


## See what SciKitLearn thinks are the best features to use

In [43]:
from sklearn.feature_selection import SelectKBest, f_regression
X = counties.copy().drop(columns=['Drug_Overdose_Mortality_Rate'])
X = X.select_dtypes(exclude='object')
y = counties['Drug_Overdose_Mortality_Rate']
kbest = SelectKBest(f_regression, k=20).fit(X, y)

In [44]:
new_features = []
mask = kbest.get_support()

for boolean, feature in zip(mask, list(counties.columns.values)):
    if boolean:
        new_features.append(feature)

In [45]:
new_features

['State',
 'Age_Adjusted_Mortality',
 'Age_Adjusted_Mortality_Black',
 'Child_Mortality_Rate',
 'Child_Mortality_Rate_Black',
 'Child_Mortality_Rate_White',
 'Infant_Mortality_Rate',
 'Percent_Frequent_Physical_Distress',
 'Percent_Uninsured_1',
 'Segregation_index',
 'Percent_Not_Proficient_in_English',
 'State_ranked',
 'Years_of_Potential_Life_Lost_Rate',
 'Years_of_Potential_Life_Lost_Rate_Black',
 'Physically_Unhealthy_Days',
 'Mentally_Unhealthy_Days',
 'Percent_Smokers',
 'Teen_Birth_Rate_White',
 'Percent_Some_College',
 'Percentile_Income_20th']

## Compare our intuitive features choices against the K-best

In [46]:
formula = "Drug_Overdose_Mortality_Rate ~ 1"
for feature in new_features:
    formula += ' + ' + feature
formula

'Drug_Overdose_Mortality_Rate ~ 1 + State + Age_Adjusted_Mortality + Age_Adjusted_Mortality_Black + Child_Mortality_Rate + Child_Mortality_Rate_Black + Child_Mortality_Rate_White + Infant_Mortality_Rate + Percent_Frequent_Physical_Distress + Percent_Uninsured_1 + Segregation_index + Percent_Not_Proficient_in_English + State_ranked + Years_of_Potential_Life_Lost_Rate + Years_of_Potential_Life_Lost_Rate_Black + Physically_Unhealthy_Days + Mentally_Unhealthy_Days + Percent_Smokers + Teen_Birth_Rate_White + Percent_Some_College + Percentile_Income_20th'

In [47]:
y, X = patsy.dmatrices(formula, counties, return_type='matrix') 
model = sm.OLS(y, X)

In [48]:
results = model.fit()

In [49]:
results.summary()

0,1,2,3
Dep. Variable:,Drug_Overdose_Mortality_Rate,R-squared:,0.574
Model:,OLS,Adj. R-squared:,0.556
Method:,Least Squares,F-statistic:,31.47
Date:,"Wed, 12 Dec 2018",Prob (F-statistic):,9.44e-244
Time:,00:21:15,Log-Likelihood:,-5528.4
No. Observations:,1655,AIC:,11190.0
Df Residuals:,1586,BIC:,11570.0
Df Model:,68,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5,6
,coef,std err,t,P>|t|,[0.025,0.975]
Intercept,-19.2794,6.375,-3.024,0.003,-31.783,-6.776
State[T.Alaska],4.8945,1.924,2.543,0.011,1.120,8.669
State[T.Arizona],4.4482,1.278,3.481,0.001,1.942,6.955
State[T.Arkansas],-0.6883,0.892,-0.772,0.440,-2.438,1.061
State[T.California],4.1262,0.864,4.776,0.000,2.432,5.821
State[T.Colorado],5.6241,0.992,5.672,0.000,3.679,7.569
State[T.Connecticut],7.7483,1.421,5.453,0.000,4.961,10.535
State[T.Delaware],7.0096,2.131,3.290,0.001,2.830,11.189
State[T.District of Columbia],3.2218,3.595,0.896,0.370,-3.830,10.273

0,1,2,3
Omnibus:,247.84,Durbin-Watson:,2.088
Prob(Omnibus):,0.0,Jarque-Bera (JB):,702.704
Skew:,0.782,Prob(JB):,2.57e-153
Kurtosis:,5.783,Cond. No.,1.02e+16


## Building a Logistic Regression model to predict Drug Overdose Mortality Rate Percentile

#### In this section, we will break counties into top 25% and bottom 25% of Drug Overdose Mortality Rate and build a logistic regression model to predict which group a county might be in.



In [50]:
counties

Unnamed: 0_level_0,State,County,Age_Adjusted_Mortality,Age_Adjusted_Mortality_Black,Age_Adjusted_Mortality_Hispanic,Age_Adjusted_Mortality_White,Child_Mortality_Rate,Child_Mortality_Rate_Black,Child_Mortality_Rate_White,Infant_Mortality_Rate,Percent_Frequent_Physical_Distress,Percent_Frequent_Mental_Distress,Percent_Diabetic,HIV_Prevalence_Rate,Percent_Food_Insecure,Percent_Limited_Access,Drug_Overdose_Mortality_Rate,MV_Mortality_Rate,Percent_Insufficient_Sleep,Percent_Uninsured,Percent_Uninsured_1,Costs,Other_PCP_Rate,Percent_Disconnected_Youth,Household_Income,Household_income_Black,Household_income_Hispanic,Household_income_White,Percent_Free_or_Reduced_Lunch,Segregation_index,Segregation_Index,Homicide_Rate,Firearm_Fatalities_Rate,Population,Percent_lt_18,Percent_65_and_over,Percent_African_American,Percent_American_Indian/Alaskan_Native,Percent_Asian,Percent_Native_Hawaiian/Other_Pacific_Islander,Percent_Hispanic,Percent_Non_Hispanic_White,Percent_Not_Proficient_in_English,Percent_Female,Percent_Rural,State_ranked,County_ranked,Years_of_Potential_Life_Lost_Rate,Years_of_Potential_Life_Lost_Rate_Black,Years_of_Potential_Life_Lost_Rate_Hispanic,...,Percent_LBW_Hispanic,Percent_LBW_White,Percent_Smokers,Percent_Obese,Food_Environment_Index,Percent_Physically_Inactive,Percent_With_Access,Percent_Excessive_Drinking,Percent_Alcohol_Impaired,Chlamydia_Rate,Teen_Birth_Rate,Teen_Birth_Rate_Black,Teen_Birth_Rate_Hispanic,Teen_Birth_Rate_White,Percent_Uninsured_ranked,PCP_Rate,Dentist_Rate,MHP_Rate,Preventable_Hosp__Rate,Percent_Receiving_HbA1c,Percent_Receiving_HbA1c_Black,Percent_Receiving_HbA1c_White,Percent_Mammography,Percent_Mammography_Black,Percent_Mammography_White,Cohort_Size,Graduation_Rate,Population_ranked,Percent_Some_College,Percent_Unemployed,Percent_Children_in_Poverty,Percent_Children_in_Poverty_Black,Percent_Children_in_Poverty_Hispanic,Percent_Children_in_Poverty_White,Percentile_Income_80th,Percentile_Income_20th,Income_Ratio,Percent_Single_Parent_Households,Association_Rate,Violent_Crime_Rate,Injury_Death_Rate,Average_Daily_PM2_5,Presence_of_violation,Percent_Severe_Housing_Problems,Percent_Drive_Alone,Percent_Drive_Alone_Black,Percent_Drive_Alone_Hispanic,Percent_Drive_Alone_White,Percent_Long_Commute___Drives_Alone,Urban
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1
1001,Alabama,Autauga,449.6,531.700000,292.315327,444.900000,56.186903,95.921022,48.240956,7.718502,12.824434,12.638357,12.4,225.500000,13.9,11.991125,10.231226,20.167754,35.905406,12.193092,2.595313,10674.34,28.87253,14.570000,54487.0,32173.000000,72411.000000,58556.000000,48.475388,26.347048,24.000912,3.619853,16.972533,55416,24.408113,14.728598,19.048650,0.485419,1.140465,0.101054,2.688754,75.000000,0.832739,51.288437,42.002162,Alabama,Autauga,9409.294766,11806.223285,5968.227286,...,7.260143,7.415319,19.124658,36.4,7.1,30.9,71.120192,16.878015,26.785714,341.2,27.996758,31.533043,38.461538,27.153838,9.387712,45.16957,32.48159,12.63173,81.85,83.966245,74.107143,85.809683,62.693157,58.333333,63.209877,706.0,90.000000,14315,61.942019,5.271161,19.3,28.072153,16.699411,14.400244,101520.0,23134.0,4.388346,24.471409,13.912226,265.699747,72.584664,10.8,0.0,15.217927,86.750062,82.494851,83.676458,82.539683,40.8,True
1003,Alabama,Baldwin,351.3,517.800000,111.100000,349.300000,47.688777,87.008289,44.472180,5.545407,12.622002,12.822558,11.1,163.900000,13.0,5.424427,18.452504,15.281185,33.305868,14.719861,3.273439,9537.12,43.63190,15.410000,56460.0,26818.000000,41908.000000,54184.000000,45.795480,43.969941,30.674915,2.705282,14.718943,208563,21.734440,19.708194,9.042831,0.770990,1.074975,0.059454,4.416411,83.202198,0.818809,51.457833,42.279099,Alabama,Baldwin,7467.596664,10335.702691,2827.348216,...,4.672131,8.019411,16.795485,29.3,7.9,24.5,68.518915,16.714969,30.379747,338.8,31.965138,38.553804,57.609217,29.475711,11.524397,72.65266,49.38556,89.18169,46.30,83.212237,82.432432,83.259019,65.965233,65.753425,65.972551,2236.0,85.000000,47361,63.757100,5.415263,17.6,41.332247,10.290898,15.098892,102624.0,22306.0,4.600735,25.811441,11.045167,216.773078,71.492010,9.6,0.0,14.310156,84.646043,85.567010,68.864800,84.646255,40.1,True
1007,Alabama,Bibb,529.1,630.400000,379.530215,526.600000,116.315956,159.427910,102.321969,14.775414,13.162968,12.854036,14.6,191.900000,16.1,2.601627,22.146105,27.125572,38.148865,15.070569,3.141252,10755.78,75.07839,25.130000,43079.0,28256.000000,45909.000000,42020.000000,61.318483,43.487328,42.168010,8.200754,21.268865,22643,20.752550,15.430817,21.618160,0.379808,0.198737,0.119242,2.499669,74.415934,0.448137,46.363114,68.352607,Alabama,Bibb,11741.938889,11297.166352,8455.256165,...,7.695099,9.215263,19.916404,38.4,7.6,37.5,48.592625,15.925151,27.586207,302.1,47.260274,35.416667,58.653674,51.005101,11.855881,53.13732,22.08188,8.83275,92.87,81.981982,73.469388,83.450704,61.306533,45.161290,64.285714,262.0,85.000000,6158,49.821371,6.637117,27.5,47.923681,30.199112,20.249307,79882.0,18893.0,4.228127,31.427964,10.627463,147.290900,95.709893,10.5,0.0,12.358757,85.072464,82.516757,67.704607,79.254609,48.8,False
1009,Alabama,Blount,480.2,557.111669,264.584515,426.990614,55.375074,123.473245,47.882557,5.294367,13.720057,13.827943,14.4,95.400000,11.3,2.880150,21.375422,22.536300,35.945010,17.699115,4.489532,10326.33,12.13087,15.350000,47213.0,37647.000000,34375.000000,48045.000000,54.520167,39.938703,24.226299,6.191291,19.044717,57704,23.190767,17.986621,1.434909,0.627340,0.265146,0.112644,9.068695,87.467073,1.878506,50.613476,89.951502,Alabama,Blount,9359.122343,11192.898535,5133.144570,...,7.079646,7.745780,19.652158,35.8,8.5,29.0,32.272077,15.378722,20.000000,114.3,39.624778,46.875000,37.237644,40.335654,13.963659,20.80696,19.06280,8.66491,57.82,87.659574,84.296780,86.661374,59.584296,65.935647,65.331969,720.0,91.206250,14018,53.866457,5.520897,19.4,15.068493,57.107356,20.936920,83944.0,20634.0,4.068237,27.294239,8.842959,211.598836,104.572810,11.3,0.0,11.058037,86.107728,83.107590,79.539642,81.580997,60.2,False
1015,Alabama,Calhoun,564.3,627.700000,288.500000,566.300000,77.289582,130.528256,61.332671,8.759748,13.020953,13.806568,16.3,211.200000,17.4,9.178567,15.600309,17.022882,41.314344,14.514503,2.891841,10901.19,50.60596,19.070000,41778.0,26523.000000,31331.000000,47514.000000,58.868341,46.984796,41.778342,9.185008,22.234517,114611,21.830365,16.880579,20.734484,0.520020,0.919632,0.098594,3.577318,72.623919,0.709622,51.891180,33.696826,Alabama,Calhoun,11527.781204,13353.368133,5819.327989,...,5.152672,7.486210,20.462232,36.1,6.8,32.5,48.217117,15.431677,22.857143,587.5,39.711728,44.082354,39.513678,38.125317,11.396868,64.86767,60.20365,94.23179,72.80,81.270096,78.787879,81.787275,56.895446,59.793814,56.483516,1316.0,92.163374,28798,56.743524,6.697384,25.7,59.831267,29.846583,17.536471,82414.0,16952.0,4.861609,38.380573,14.011417,574.323556,74.115058,11.6,0.0,15.292172,84.985916,85.871991,83.291457,87.574201,29.4,True
1019,Alabama,Cherokee,546.0,922.900000,345.082993,533.000000,75.307062,157.686979,106.401193,11.202051,13.009557,13.643444,12.9,90.100000,13.9,0.221112,15.459734,32.986789,35.355071,14.645020,3.130789,11470.43,46.64723,25.163920,41456.0,33934.000000,35911.813661,39764.000000,63.186541,25.589739,19.715164,7.696917,21.564173,25725,19.825073,22.017493,4.291545,0.629738,0.256560,0.031098,1.605442,91.692906,0.060901,50.363460,85.736273,Alabama,Cherokee,11683.171114,15481.101545,9409.319587,...,8.465103,8.349515,19.144853,35.5,8.2,35.9,36.030628,15.232731,18.181818,169.0,45.303652,40.576455,65.726508,38.960083,11.682127,38.67126,15.54908,19.43635,76.63,88.628159,73.913043,89.265537,63.366337,61.390463,61.611978,280.0,88.000000,5516,55.565627,5.213652,27.5,37.931034,37.726231,21.099912,79412.0,17112.0,4.640720,32.235966,10.054526,383.600749,112.441757,10.8,0.0,15.778252,84.596061,75.903008,74.257848,81.779403,45.9,False
1021,Alabama,Chilton,516.3,615.200000,256.348989,522.100000,56.483879,105.666951,61.207661,6.894791,14.445380,14.260704,14.1,99.500000,13.5,1.460531,12.138224,22.140966,35.174569,19.470843,4.762770,10515.38,9.10312,19.580000,44188.0,27375.000000,28081.000000,45494.000000,61.087434,36.022367,30.416380,6.512049,15.939158,43941,24.039052,16.055620,9.929223,0.514326,0.475638,0.175235,7.603377,80.560297,2.446886,50.831797,86.744724,Alabama,Chilton,11099.683529,16051.458138,5249.976050,...,6.290672,8.253752,19.673275,36.0,8.2,29.8,46.044039,15.064313,20.253165,307.3,51.259961,41.629761,65.128901,51.742919,15.232994,18.20540,25.03357,38.68824,65.11,89.059081,88.888889,89.073634,64.000000,60.869565,64.259928,517.0,86.000000,11708,39.118551,5.617919,26.3,49.869452,56.843680,25.272703,84217.0,17180.0,4.902037,32.023821,16.612430,345.839685,90.625498,10.5,0.0,14.527027,82.865233,86.703601,79.046534,82.431522,47.6,False
1029,Alabama,Cleburne,591.9,626.433594,572.569693,498.369462,101.463752,160.595988,96.987752,15.119347,13.279598,13.661562,12.7,111.300000,13.5,2.071716,22.211363,25.799054,33.504785,15.475092,3.725327,11134.31,20.10185,26.267392,43483.0,41124.331337,18992.000000,38288.000000,57.772710,49.889622,36.826565,10.333679,22.712698,14924,23.090324,18.815331,3.088984,0.435540,0.180917,0.080407,2.452426,92.749933,0.816761,50.274725,100.000000,Alabama,Cleburne,11380.483302,12205.306120,11640.656213,...,10.710847,9.478716,19.710512,34.6,8.1,32.2,45.858937,15.970047,25.000000,252.0,44.540674,75.294594,89.515596,42.552257,12.120460,26.63471,6.70062,40.20370,67.61,82.972136,94.444444,82.295082,49.450549,55.140029,59.263472,201.0,98.000000,3563,46.674151,6.088150,24.5,33.434369,89.928058,24.128686,73032.0,15020.0,4.862317,22.142240,9.988014,149.925037,97.530996,10.3,0.0,13.386525,82.134529,81.470694,74.915551,76.930587,50.4,False
1031,Alabama,Coffee,409.2,559.800000,226.303544,391.500000,55.752870,113.601157,37.279816,6.991479,13.593147,13.445273,15.5,143.300000,15.1,5.981203,7.825441,16.853459,37.304732,15.281598,3.629893,9855.89,56.61188,16.890000,48632.0,28352.000000,40648.000000,53528.000000,46.965995,35.490598,26.341150,2.808910,14.870703,51226,23.745754,16.415492,17.227580,1.405536,1.526569,0.421661,6.969117,70.653574,1.497188,50.573927,47.195083,Alabama,Coffee,7295.411499,10559.281482,13654.156601,...,8.239700,6.369210,18.201221,34.2,7.5,29.8,44.630416,15.528420,31.914894,467.5,30.630003,37.379719,72.538860,25.298204,11.933247,56.62846,33.18627,54.65974,52.76,88.153998,89.940828,87.796209,63.099042,66.666667,62.523191,752.0,96.229388,13294,61.433730,6.053328,21.3,39.420423,36.694915,19.212395,98372.0,19622.0,5.013352,38.324789,16.012185,321.157993,62.222153,9.6,0.0,14.016243,85.725330,80.437873,84.768212,85.531749,23.3,True
1033,Alabama,Colbert,504.3,591.300000,248.537984,499.700000,78.919864,112.318201,57.839474,9.363745,13.113404,13.365516,17.4,93.300000,16.6,6.551705,8.583007,19.946512,36.950783,13.356842,3.055692,10879.20,121.73528,17.810000,46572.0,31813.000000,38750.000000,46991.000000,49.747878,26.561564,21.412017,3.674357,15.436693,54216,21.196695,19.215730,15.906743,0.649255,0.558876,0.051645,2.473440,78.784861,0.202753,51.752250,43.894687,Alabama,Colbert,10566.513329,11719.391858,5283.836689,...,7.692308,9.554326,18.371146,34.6,7.2,30.9,64.503564,15.822773,8.695652,473.0,38.705198,34.815436,31.948882,40.571692,10.602745,62.55289,42.42290,25.82264,74.59,87.413074,89.552239,86.923077,68.104575,78.571429,66.566717,627.0,88.850877,13031,54.063387,7.010588,25.1,34.537493,7.664234,20.964923,85487.0,17063.0,5.010080,35.244289,18.213931,449.589200,67.994957,10.2,0.0,15.708556,89.532088,89.024390,74.484314,91.570722,26.1,True


In [51]:
#Calulte cutoffs for top and bottom percentiles
top_25_cutoff =  float(pd.DataFrame(counties['Drug_Overdose_Mortality_Rate']).quantile(q=0.75, axis=0, numeric_only=True, interpolation='linear'))
bottom_25_cutoff = float(pd.DataFrame(counties['Drug_Overdose_Mortality_Rate']).quantile(q=0.25, axis=0, numeric_only=True, interpolation='linear'))


In [82]:
#Drop anything in middle 50%
counties = counties.drop(counties[(counties['Drug_Overdose_Mortality_Rate'] < top_25_cutoff) &  (counties['Drug_Overdose_Mortality_Rate'] > bottom_25_cutoff)].index)
counties.head()


Unnamed: 0_level_0,State,County,Age_Adjusted_Mortality,Age_Adjusted_Mortality_Black,Age_Adjusted_Mortality_Hispanic,Age_Adjusted_Mortality_White,Child_Mortality_Rate,Child_Mortality_Rate_Black,Child_Mortality_Rate_White,Infant_Mortality_Rate,Percent_Frequent_Physical_Distress,Percent_Frequent_Mental_Distress,Percent_Diabetic,HIV_Prevalence_Rate,Percent_Food_Insecure,Percent_Limited_Access,Drug_Overdose_Mortality_Rate,MV_Mortality_Rate,Percent_Insufficient_Sleep,Percent_Uninsured,Percent_Uninsured_1,Costs,Other_PCP_Rate,Percent_Disconnected_Youth,Household_Income,Household_income_Black,Household_income_Hispanic,Household_income_White,Percent_Free_or_Reduced_Lunch,Segregation_index,Segregation_Index,Homicide_Rate,Firearm_Fatalities_Rate,Population,Percent_lt_18,Percent_65_and_over,Percent_African_American,Percent_American_Indian/Alaskan_Native,Percent_Asian,Percent_Native_Hawaiian/Other_Pacific_Islander,Percent_Hispanic,Percent_Non_Hispanic_White,Percent_Not_Proficient_in_English,Percent_Female,Percent_Rural,State_ranked,County_ranked,Years_of_Potential_Life_Lost_Rate,Years_of_Potential_Life_Lost_Rate_Black,Years_of_Potential_Life_Lost_Rate_Hispanic,...,Percent_LBW_White,Percent_Smokers,Percent_Obese,Food_Environment_Index,Percent_Physically_Inactive,Percent_With_Access,Percent_Excessive_Drinking,Percent_Alcohol_Impaired,Chlamydia_Rate,Teen_Birth_Rate,Teen_Birth_Rate_Black,Teen_Birth_Rate_Hispanic,Teen_Birth_Rate_White,Percent_Uninsured_ranked,PCP_Rate,Dentist_Rate,MHP_Rate,Preventable_Hosp__Rate,Percent_Receiving_HbA1c,Percent_Receiving_HbA1c_Black,Percent_Receiving_HbA1c_White,Percent_Mammography,Percent_Mammography_Black,Percent_Mammography_White,Cohort_Size,Graduation_Rate,Population_ranked,Percent_Some_College,Percent_Unemployed,Percent_Children_in_Poverty,Percent_Children_in_Poverty_Black,Percent_Children_in_Poverty_Hispanic,Percent_Children_in_Poverty_White,Percentile_Income_80th,Percentile_Income_20th,Income_Ratio,Percent_Single_Parent_Households,Association_Rate,Violent_Crime_Rate,Injury_Death_Rate,Average_Daily_PM2_5,Presence_of_violation,Percent_Severe_Housing_Problems,Percent_Drive_Alone,Percent_Drive_Alone_Black,Percent_Drive_Alone_Hispanic,Percent_Drive_Alone_White,Percent_Long_Commute___Drives_Alone,Urban,top_25
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1
1001,Alabama,Autauga,449.6,531.7,292.315327,444.9,56.186903,95.921022,48.240956,7.718502,12.824434,12.638357,12.4,225.5,13.9,11.991125,10.231226,20.167754,35.905406,12.193092,2.595313,10674.34,28.87253,14.57,54487.0,32173.0,72411.0,58556.0,48.475388,26.347048,24.000912,3.619853,16.972533,55416,24.408113,14.728598,19.04865,0.485419,1.140465,0.101054,2.688754,75.0,0.832739,51.288437,42.002162,Alabama,Autauga,9409.294766,11806.223285,5968.227286,...,7.415319,19.124658,36.4,7.1,30.9,71.120192,16.878015,26.785714,341.2,27.996758,31.533043,38.461538,27.153838,9.387712,45.16957,32.48159,12.63173,81.85,83.966245,74.107143,85.809683,62.693157,58.333333,63.209877,706.0,90.0,14315,61.942019,5.271161,19.3,28.072153,16.699411,14.400244,101520.0,23134.0,4.388346,24.471409,13.912226,265.699747,72.584664,10.8,0.0,15.217927,86.750062,82.494851,83.676458,82.539683,40.8,True,0
1021,Alabama,Chilton,516.3,615.2,256.348989,522.1,56.483879,105.666951,61.207661,6.894791,14.44538,14.260704,14.1,99.5,13.5,1.460531,12.138224,22.140966,35.174569,19.470843,4.76277,10515.38,9.10312,19.58,44188.0,27375.0,28081.0,45494.0,61.087434,36.022367,30.41638,6.512049,15.939158,43941,24.039052,16.05562,9.929223,0.514326,0.475638,0.175235,7.603377,80.560297,2.446886,50.831797,86.744724,Alabama,Chilton,11099.683529,16051.458138,5249.97605,...,8.253752,19.673275,36.0,8.2,29.8,46.044039,15.064313,20.253165,307.3,51.259961,41.629761,65.128901,51.742919,15.232994,18.2054,25.03357,38.68824,65.11,89.059081,88.888889,89.073634,64.0,60.869565,64.259928,517.0,86.0,11708,39.118551,5.617919,26.3,49.869452,56.84368,25.272703,84217.0,17180.0,4.902037,32.023821,16.61243,345.839685,90.625498,10.5,0.0,14.527027,82.865233,86.703601,79.046534,82.431522,47.6,False,0
1031,Alabama,Coffee,409.2,559.8,226.303544,391.5,55.75287,113.601157,37.279816,6.991479,13.593147,13.445273,15.5,143.3,15.1,5.981203,7.825441,16.853459,37.304732,15.281598,3.629893,9855.89,56.61188,16.89,48632.0,28352.0,40648.0,53528.0,46.965995,35.490598,26.34115,2.80891,14.870703,51226,23.745754,16.415492,17.22758,1.405536,1.526569,0.421661,6.969117,70.653574,1.497188,50.573927,47.195083,Alabama,Coffee,7295.411499,10559.281482,13654.156601,...,6.36921,18.201221,34.2,7.5,29.8,44.630416,15.52842,31.914894,467.5,30.630003,37.379719,72.53886,25.298204,11.933247,56.62846,33.18627,54.65974,52.76,88.153998,89.940828,87.796209,63.099042,66.666667,62.523191,752.0,96.229388,13294,61.43373,6.053328,21.3,39.420423,36.694915,19.212395,98372.0,19622.0,5.013352,38.324789,16.012185,321.157993,62.222153,9.6,0.0,14.016243,85.72533,80.437873,84.768212,85.531749,23.3,True,0
1033,Alabama,Colbert,504.3,591.3,248.537984,499.7,78.919864,112.318201,57.839474,9.363745,13.113404,13.365516,17.4,93.3,16.6,6.551705,8.583007,19.946512,36.950783,13.356842,3.055692,10879.2,121.73528,17.81,46572.0,31813.0,38750.0,46991.0,49.747878,26.561564,21.412017,3.674357,15.436693,54216,21.196695,19.21573,15.906743,0.649255,0.558876,0.051645,2.47344,78.784861,0.202753,51.75225,43.894687,Alabama,Colbert,10566.513329,11719.391858,5283.836689,...,9.554326,18.371146,34.6,7.2,30.9,64.503564,15.822773,8.695652,473.0,38.705198,34.815436,31.948882,40.571692,10.602745,62.55289,42.4229,25.82264,74.59,87.413074,89.552239,86.923077,68.104575,78.571429,66.566717,627.0,88.850877,13031,54.063387,7.010588,25.1,34.537493,7.664234,20.964923,85487.0,17063.0,5.01008,35.244289,18.213931,449.5892,67.994957,10.2,0.0,15.708556,89.532088,89.02439,74.484314,91.570722,26.1,True,0
1039,Alabama,Covington,529.5,737.6,357.444648,508.3,69.062847,123.305788,75.786874,7.997441,14.474782,14.119544,14.1,169.9,16.3,4.370327,9.716714,20.387283,35.912449,15.755214,3.133673,10886.93,64.07176,23.55,35010.0,21728.0,33750.0,41071.0,56.050955,43.61879,39.411511,9.362151,11.10829,37458,21.968605,20.361472,12.67553,0.670084,0.493886,0.008009,1.63116,83.223877,0.593814,51.751295,69.651794,Alabama,Covington,10307.0633,13065.928954,9381.973601,...,8.934708,20.939811,33.8,7.4,30.9,62.025685,15.401891,23.076923,448.4,55.795678,48.128342,55.558274,58.933108,12.263051,50.21805,34.70554,53.39313,93.51,80.564263,71.428571,81.949458,59.621993,65.909091,59.107807,453.0,95.275938,8500,54.011765,6.997141,28.1,53.835022,16.86747,24.684741,76541.0,16243.0,4.712245,35.160379,13.215277,273.129856,63.475943,9.2,0.0,15.186916,85.151302,79.541735,64.21376,88.248317,27.0,False,0


In [83]:
# Create binary feature for top 25% vs bottom 25%

counties['top_25'] = counties['Drug_Overdose_Mortality_Rate'] >= top_25_cutoff
counties['top_25'] = counties['top_25']*1

In [84]:
counties[['top_25','Drug_Overdose_Mortality_Rate']].head()

Unnamed: 0_level_0,top_25,Drug_Overdose_Mortality_Rate
FIPS,Unnamed: 1_level_1,Unnamed: 2_level_1
1001,0,10.231226
1021,0,12.138224
1031,0,7.825441
1033,0,8.583007
1039,0,9.716714


In [85]:
#Use formula from previous model and add in our original features of interest
formula_logit = 'top_25 ~ 1 + Age_Adjusted_Mortality + Age_Adjusted_Mortality_Black + Child_Mortality_Rate + Child_Mortality_Rate_Black + Child_Mortality_Rate_White + Infant_Mortality_Rate + Percent_Frequent_Physical_Distress + Percent_Uninsured_1 + Segregation_index + Percent_Not_Proficient_in_English + Years_of_Potential_Life_Lost_Rate + Years_of_Potential_Life_Lost_Rate_Black + Physically_Unhealthy_Days + Mentally_Unhealthy_Days + Percent_Smokers + Teen_Birth_Rate_White + Percent_Some_College + Percentile_Income_20th + Percent_Unemployed + Household_Income + Graduation_Rate + Percent_Rural + HIV_Prevalence_Rate + Percent_Frequent_Mental_Distress + Percent_Excessive_Drinking'
y, X = patsy.dmatrices(formula_logit, counties, return_type='matrix') 
model_logit = sm.Logit(y,X)
results_logit = model_logit.fit()

Optimization terminated successfully.
         Current function value: 0.373546
         Iterations 7


In [86]:
results_logit.summary()

0,1,2,3
Dep. Variable:,top_25,No. Observations:,828.0
Model:,Logit,Df Residuals:,802.0
Method:,MLE,Df Model:,25.0
Date:,"Wed, 12 Dec 2018",Pseudo R-squ.:,0.4611
Time:,00:42:18,Log-Likelihood:,-309.3
converged:,True,LL-Null:,-573.93
,,LLR p-value:,6.545e-96

0,1,2,3,4,5,6
,coef,std err,z,P>|z|,[0.025,0.975]
Intercept,-14.5474,3.563,-4.083,0.000,-21.531,-7.564
Age_Adjusted_Mortality,0.0135,0.005,2.490,0.013,0.003,0.024
Age_Adjusted_Mortality_Black,0.0015,0.002,0.966,0.334,-0.002,0.005
Child_Mortality_Rate,-0.0443,0.011,-4.018,0.000,-0.066,-0.023
Child_Mortality_Rate_Black,0.0262,0.006,4.077,0.000,0.014,0.039
Child_Mortality_Rate_White,0.0485,0.011,4.217,0.000,0.026,0.071
Infant_Mortality_Rate,0.2121,0.088,2.411,0.016,0.040,0.385
Percent_Frequent_Physical_Distress,-1.3801,0.501,-2.753,0.006,-2.363,-0.398
Percent_Uninsured_1,-0.1084,0.055,-1.985,0.047,-0.215,-0.001


### Looking at Logistic Regression Coefficients


In [87]:
# Convert from log odds to odds ratios
for ix,x in enumerate(np.exp(results_logit.params)): 
    print (x,X.design_info.column_names[ix])

4.809944668826064e-07 Intercept
1.013624135385344 Age_Adjusted_Mortality
1.0015422954903095 Age_Adjusted_Mortality_Black
0.956624762690044 Child_Mortality_Rate
1.026524256528914 Child_Mortality_Rate_Black
1.049683256656971 Child_Mortality_Rate_White
1.236273999101653 Infant_Mortality_Rate
0.2515625417886249 Percent_Frequent_Physical_Distress
0.8973127695914501 Percent_Uninsured_1
1.0326258334807938 Segregation_index
0.991812776874542 Percent_Not_Proficient_in_English
1.0007719570211537 Years_of_Potential_Life_Lost_Rate
0.999805539997919 Years_of_Potential_Life_Lost_Rate_Black
13.848668305761125 Physically_Unhealthy_Days
92.78408136692597 Mentally_Unhealthy_Days
1.0023662706717684 Percent_Smokers
0.9184914048974326 Teen_Birth_Rate_White
0.9457353095837092 Percent_Some_College
0.9999306250772376 Percentile_Income_20th
1.0458985252896376 Percent_Unemployed
1.0000833202543888 Household_Income
1.0094045018217432 Graduation_Rate
0.9698157087129744 Percent_Rural
0.9986174267410463 HIV_Prevale

In [88]:
# Convert confidence intervals to odds ratios as well
for ix,x in enumerate(np.exp(results_logit.conf_int())): 
    print (x,X.design_info.column_names[ix])

[4.46035079e-10 5.18693905e-04] Intercept
[1.00288315 1.02448016] Age_Adjusted_Mortality
[0.99841425 1.00468014] Age_Adjusted_Mortality_Black
[0.9361549  0.97754222] Child_Mortality_Rate
[1.01368755 1.03952352] Child_Mortality_Rate_Black
[1.02628968 1.07361008] Child_Mortality_Rate_White
[1.04046951 1.46892665] Infant_Mortality_Rate
[0.09418079 0.67193862] Percent_Frequent_Physical_Distress
[0.80625607 0.9986532 ] Percent_Uninsured_1
[1.01617702 1.04934091] Segregation_index
[0.8514144  1.15536287] Percent_Not_Proficient_in_English
[1.00032927 1.00121484] Years_of_Potential_Life_Lost_Rate
[0.99966076 0.99995035] Years_of_Potential_Life_Lost_Rate_Black
[  0.93235757 205.69963659] Physically_Unhealthy_Days
[ 12.28112827 700.9849231 ] Mentally_Unhealthy_Days
[0.88763276 1.13192998] Percent_Smokers
[0.89000481 0.94788978] Teen_Birth_Rate_White
[0.90713805 0.98597482] Percent_Some_College
[0.99981519 1.00004607] Percentile_Income_20th
[0.86133974 1.27000262] Percent_Unemployed
[1.00002623 1