## Import Statistical Module

In [1]:
import xlrd
import pandas as pd
import numpy as np
import sys
from scipy import stats
from statsmodels.formula.api import ols
import matplotlib.pyplot as plt
%matplotlib inline

## Load the File

In [2]:
#Load the File
filename='.\\BK for Wei 5.xlsx'
book=xlrd.open_workbook(filename)
print('Source file: '+sys.path[0]+filename+' loaded!')

Source file: .\BK for Wei 5.xlsx loaded!


In [3]:
nrows_bmi = book.sheet_by_name('target-BMI').nrows
nrows_crp = book.sheet_by_name('target-CRP').nrows
nrows_hba1c = book.sheet_by_name('target-HbA1C').nrows
nrows_lipid = book.sheet_by_name('target-lipid').nrows

In [4]:
header_bmi = book.sheet_by_name('target-BMI').row_values(0)
header_crp = book.sheet_by_name('target-CRP').row_values(0)
header_hba1c = book.sheet_by_name('target-HbA1C').row_values(0)
header_lipid = book.sheet_by_name('target-lipid').row_values(0)

In [5]:
data_bmi = [book.sheet_by_name('target-BMI').row_values(i) for i in range(1, nrows_bmi)]
data_crp = [book.sheet_by_name('target-CRP').row_values(i) for i in range(1, nrows_crp)]
data_hba1c = [book.sheet_by_name('target-HbA1C').row_values(i) for i in range(1, nrows_hba1c)]
data_lipid = [book.sheet_by_name('target-lipid').row_values(i) for i in range(1, nrows_lipid)]

In [6]:
df_bmi = pd.DataFrame(data_bmi, columns = header_bmi)
df_crp = pd.DataFrame(data_crp, columns = header_crp)
df_hba1c = pd.DataFrame(data_hba1c, columns = header_hba1c)
df_lipid = pd.DataFrame(data_lipid, columns = header_lipid)

## Extract Raw DataFrame

In [7]:
df_bmi

Unnamed: 0,StudyID,ACE_Inhibitor,BKHypBK,HypBKBK,Age,BMI
0,DM001,0,0.057791,17.582649,46,29.80
1,DM003,0,0.132757,7.533061,40,33.30
2,DM004,0,0.269416,3.712065,50,19.60
3,DM005,0,0.169639,5.897226,37,33.00
4,DM006,0,0.348889,2.866964,53,41.50
5,DM007,0,0.707396,1.413821,46,23.00
6,DM008,0,0.204086,4.901285,37,43.60
7,DM009,1,0.042670,23.515039,32,33.60
8,DM010,0,0.493274,2.027968,73,32.80
9,DM012,1,0.554848,1.802519,55,23.20


# BMI

## Combined

In [8]:
parameters_bmi = header_bmi[2:]
data_bmi = df_bmi[parameters_bmi]
data_bmi = data_bmi.astype(float)

#### BK/HypBK vs Other Parameters

In [9]:
model = ols('BKHypBK~Age+BMI', 
            data_bmi).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.167
Model:,OLS,Adj. R-squared:,0.152
Method:,Least Squares,F-statistic:,11.61
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,2.54e-05
Time:,00:26:05,Log-Likelihood:,-42.481
No. Observations:,119,AIC:,90.96
Df Residuals:,116,BIC:,99.3
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,1.1480,0.177,6.476,0.000,0.797 1.499
Age,-0.0043,0.002,-2.103,0.038,-0.008 -0.000
BMI,-0.0198,0.004,-4.429,0.000,-0.029 -0.011

0,1,2,3
Omnibus:,69.362,Durbin-Watson:,1.846
Prob(Omnibus):,0.0,Jarque-Bera (JB):,270.238
Skew:,2.134,Prob(JB):,2.0800000000000002e-59
Kurtosis:,9.024,Cond. No.,336.0


### HypBK/BK vs Other Parameters

In [10]:
model = ols('HypBKBK~Age+BMI', 
            data_bmi).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.102
Model:,OLS,Adj. R-squared:,0.087
Method:,Least Squares,F-statistic:,6.59
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.00195
Time:,00:26:05,Log-Likelihood:,-393.14
No. Observations:,119,AIC:,792.3
Df Residuals:,116,BIC:,800.6
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,-1.0793,3.376,-0.320,0.750,-7.766 5.607
Age,-0.0099,0.039,-0.256,0.798,-0.086 0.066
BMI,0.3073,0.085,3.605,0.000,0.138 0.476

0,1,2,3
Omnibus:,41.917,Durbin-Watson:,1.748
Prob(Omnibus):,0.0,Jarque-Bera (JB):,79.241
Skew:,1.544,Prob(JB):,6.21e-18
Kurtosis:,5.539,Cond. No.,336.0


=========================

## Without ACEI

In [11]:
df_bmi_withoutACEI = df_bmi[df_bmi['ACE_Inhibitor'] != 1]
parameters_bmi = header_bmi[2:]
data_bmi_withoutACEI = df_bmi_withoutACEI[parameters_bmi]
data_bmi_withoutACEI = data_bmi_withoutACEI.astype(float)

### BK/HypBK vs Other Parameters

In [12]:
model = ols('BKHypBK~Age+BMI', 
            data_bmi_withoutACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.115
Model:,OLS,Adj. R-squared:,0.095
Method:,Least Squares,F-statistic:,5.614
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.00511
Time:,00:26:05,Log-Likelihood:,-31.083
No. Observations:,89,AIC:,68.17
Df Residuals:,86,BIC:,75.63
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.9664,0.195,4.954,0.000,0.579 1.354
Age,-0.0028,0.002,-1.232,0.221,-0.007 0.002
BMI,-0.0160,0.005,-3.174,0.002,-0.026 -0.006

0,1,2,3
Omnibus:,56.641,Durbin-Watson:,1.974
Prob(Omnibus):,0.0,Jarque-Bera (JB):,212.057
Skew:,2.141,Prob(JB):,8.96e-47
Kurtosis:,9.233,Cond. No.,315.0


### HypBK/BK vs Other Parameters

In [13]:
model = ols('HypBKBK~Age+BMI', 
            data_bmi_withoutACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.077
Model:,OLS,Adj. R-squared:,0.056
Method:,Least Squares,F-statistic:,3.586
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.0319
Time:,00:26:05,Log-Likelihood:,-294.05
No. Observations:,89,AIC:,594.1
Df Residuals:,86,BIC:,601.6
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,-0.4262,3.744,-0.114,0.910,-7.870 7.018
Age,-0.0052,0.043,-0.122,0.903,-0.091 0.080
BMI,0.2577,0.097,2.666,0.009,0.066 0.450

0,1,2,3
Omnibus:,46.091,Durbin-Watson:,1.587
Prob(Omnibus):,0.0,Jarque-Bera (JB):,113.947
Skew:,1.911,Prob(JB):,1.81e-25
Kurtosis:,7.015,Cond. No.,315.0


=================

## Take ACEI

In [14]:
df_bmi_withACEI = df_bmi[df_bmi['ACE_Inhibitor'] == 1]

parameters_bmi = header_bmi[2:]
data_bmi_withACEI = df_bmi_withACEI[parameters_bmi]
data_bmi_withACEI = data_bmi_withACEI.astype(float)

### BK/HypBK vs Other Parameters

In [15]:
model = ols('BKHypBK~Age+BMI', 
            data_bmi_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.378
Model:,OLS,Adj. R-squared:,0.332
Method:,Least Squares,F-statistic:,8.216
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.00163
Time:,00:26:05,Log-Likelihood:,-8.7419
No. Observations:,30,AIC:,23.48
Df Residuals:,27,BIC:,27.69
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,1.9915,0.437,4.555,0.000,1.094 2.889
Age,-0.0114,0.005,-2.328,0.028,-0.021 -0.001
BMI,-0.0348,0.010,-3.580,0.001,-0.055 -0.015

0,1,2,3
Omnibus:,12.565,Durbin-Watson:,2.164
Prob(Omnibus):,0.002,Jarque-Bera (JB):,12.594
Skew:,1.195,Prob(JB):,0.00184
Kurtosis:,5.088,Cond. No.,453.0


### HypBK/BK vs Other Parameters

In [16]:
model = ols('HypBKBK~Age+BMI', 
            data_bmi_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.198
Model:,OLS,Adj. R-squared:,0.139
Method:,Least Squares,F-statistic:,3.338
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.0507
Time:,00:26:05,Log-Likelihood:,-96.685
No. Observations:,30,AIC:,199.4
Df Residuals:,27,BIC:,203.6
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,2.1335,8.200,0.260,0.797,-14.691 18.958
Age,-0.0928,0.092,-1.013,0.320,-0.281 0.095
BMI,0.4069,0.182,2.234,0.034,0.033 0.781

0,1,2,3
Omnibus:,3.745,Durbin-Watson:,2.112
Prob(Omnibus):,0.154,Jarque-Bera (JB):,3.376
Skew:,0.783,Prob(JB):,0.185
Kurtosis:,2.499,Cond. No.,453.0


# CRP

## Combined

In [17]:
parameters_crp = header_crp[2:]
data_crp = df_crp[parameters_crp]
data_crp = data_crp.astype(float)

#### BK/HypBK vs Other Parameters

In [18]:
model = ols('BKHypBK~Age+hsCRP', 
            data_crp).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.085
Model:,OLS,Adj. R-squared:,0.07
Method:,Least Squares,F-statistic:,5.685
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.00435
Time:,00:26:05,Log-Likelihood:,-49.276
No. Observations:,126,AIC:,104.6
Df Residuals:,123,BIC:,113.1
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.4974,0.107,4.651,0.000,0.286 0.709
Age,-0.0041,0.002,-2.053,0.042,-0.008 -0.000
hsCRP,0.0056,0.002,2.635,0.010,0.001 0.010

0,1,2,3
Omnibus:,69.853,Durbin-Watson:,1.826
Prob(Omnibus):,0.0,Jarque-Bera (JB):,250.24
Skew:,2.096,Prob(JB):,4.58e-55
Kurtosis:,8.486,Cond. No.,179.0


#### HypBK/BK vs Other Parameters

In [19]:
model = ols('HypBKBK~Age+hsCRP', 
            data_crp).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.023
Model:,OLS,Adj. R-squared:,0.007
Method:,Least Squares,F-statistic:,1.435
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.242
Time:,00:26:06,Log-Likelihood:,-419.67
No. Observations:,126,AIC:,845.3
Df Residuals:,123,BIC:,853.8
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,8.6680,2.022,4.287,0.000,4.666 12.670
Age,-0.0124,0.037,-0.331,0.741,-0.086 0.062
hsCRP,-0.0676,0.041,-1.668,0.098,-0.148 0.013

0,1,2,3
Omnibus:,38.345,Durbin-Watson:,1.859
Prob(Omnibus):,0.0,Jarque-Bera (JB):,64.131
Skew:,1.441,Prob(JB):,1.19e-14
Kurtosis:,4.977,Cond. No.,179.0


## Without ACEI

In [20]:
df_crp_withoutACEI = df_crp[df_crp['ACE_inhibitor'] != 1]
parameters_crp = header_crp[2:]
data_crp_withoutACEI = df_crp_withoutACEI[parameters_crp]
data_crp_withoutACEI = data_crp_withoutACEI.astype(float)

#### BK/HypBK vs Other Parameters

In [21]:
model = ols('BKHypBK~Age+hsCRP', 
            data_crp_withoutACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.119
Model:,OLS,Adj. R-squared:,0.1
Method:,Least Squares,F-statistic:,6.152
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.00312
Time:,00:26:06,Log-Likelihood:,-31.631
No. Observations:,94,AIC:,69.26
Df Residuals:,91,BIC:,76.89
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.4310,0.110,3.922,0.000,0.213 0.649
Age,-0.0026,0.002,-1.283,0.203,-0.007 0.001
hsCRP,0.0069,0.002,3.229,0.002,0.003 0.011

0,1,2,3
Omnibus:,48.484,Durbin-Watson:,2.23
Prob(Omnibus):,0.0,Jarque-Bera (JB):,136.519
Skew:,1.85,Prob(JB):,2.27e-30
Kurtosis:,7.601,Cond. No.,164.0


#### HypBK/BK vs Other Parameters

In [22]:
model = ols('HypBKBK~Age+hsCRP', 
            data_crp_withoutACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.048
Model:,OLS,Adj. R-squared:,0.027
Method:,Least Squares,F-statistic:,2.297
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.106
Time:,00:26:06,Log-Likelihood:,-307.31
No. Observations:,94,AIC:,620.6
Df Residuals:,91,BIC:,628.3
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,8.1320,2.064,3.941,0.000,4.033 12.231
Age,-0.0154,0.039,-0.397,0.693,-0.092 0.062
hsCRP,-0.0853,0.040,-2.116,0.037,-0.165 -0.005

0,1,2,3
Omnibus:,48.239,Durbin-Watson:,1.749
Prob(Omnibus):,0.0,Jarque-Bera (JB):,126.632
Skew:,1.889,Prob(JB):,3.18e-28
Kurtosis:,7.25,Cond. No.,164.0


## Take ACEI

In [23]:
df_crp_withACEI = df_crp[df_crp['ACE_inhibitor'] == 1]

parameters_crp = header_crp[2:]
data_crp_withACEI = df_crp_withACEI[parameters_crp]
data_crp_withACEI = data_crp_withACEI.astype(float)

#### BK/HypBK vs Other Parameters

In [24]:
model = ols('BKHypBK~Age+hsCRP', 
            data_crp_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.116
Model:,OLS,Adj. R-squared:,0.055
Method:,Least Squares,F-statistic:,1.904
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.167
Time:,00:26:06,Log-Likelihood:,-14.238
No. Observations:,32,AIC:,34.48
Df Residuals:,29,BIC:,38.87
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.7927,0.314,2.521,0.017,0.150 1.436
Age,-0.0089,0.006,-1.577,0.126,-0.020 0.003
hsCRP,-0.0072,0.008,-0.914,0.368,-0.023 0.009

0,1,2,3
Omnibus:,30.432,Durbin-Watson:,2.019
Prob(Omnibus):,0.0,Jarque-Bera (JB):,65.478
Skew:,2.197,Prob(JB):,6.05e-15
Kurtosis:,8.459,Cond. No.,254.0


#### HypBK/BK vs Other Parameters

In [25]:
model = ols('HypBKBK~Age+hsCRP', 
            data_crp_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.099
Model:,OLS,Adj. R-squared:,0.036
Method:,Least Squares,F-statistic:,1.586
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.222
Time:,00:26:06,Log-Likelihood:,-106.59
No. Observations:,32,AIC:,219.2
Df Residuals:,29,BIC:,223.6
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,15.0857,5.635,2.677,0.012,3.560 26.611
Age,-0.1129,0.101,-1.118,0.273,-0.320 0.094
hsCRP,0.2151,0.140,1.531,0.137,-0.072 0.502

0,1,2,3
Omnibus:,1.975,Durbin-Watson:,1.688
Prob(Omnibus):,0.373,Jarque-Bera (JB):,1.738
Skew:,0.459,Prob(JB):,0.419
Kurtosis:,2.32,Cond. No.,254.0


# HbA1c

## Combined

In [26]:
parameters_hba1c = header_hba1c[2:]
data_hba1c = df_hba1c[parameters_hba1c]
data_hba1c = data_hba1c.astype(float)

#### BK/HypBK vs Other Parameters

In [27]:
model = ols('BKHypBK~Age+HbA1c', 
            data_hba1c).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.188
Model:,OLS,Adj. R-squared:,0.175
Method:,Least Squares,F-statistic:,14.66
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,1.86e-06
Time:,00:26:06,Log-Likelihood:,-41.954
No. Observations:,130,AIC:,89.91
Df Residuals:,127,BIC:,98.51
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,-0.0280,0.153,-0.183,0.855,-0.331 0.275
Age,-0.0049,0.002,-2.661,0.009,-0.008 -0.001
HbA1c,0.0939,0.019,4.887,0.000,0.056 0.132

0,1,2,3
Omnibus:,43.235,Durbin-Watson:,1.875
Prob(Omnibus):,0.0,Jarque-Bera (JB):,92.209
Skew:,1.402,Prob(JB):,9.49e-21
Kurtosis:,6.027,Cond. No.,278.0


#### HypBK/BK vs Other Parameters

In [28]:
model = ols('HypBKBK~Age+HbA1c', 
            data_hba1c).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.008
Model:,OLS,Adj. R-squared:,-0.008
Method:,Least Squares,F-statistic:,0.4916
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.613
Time:,00:26:06,Log-Likelihood:,-433.07
No. Observations:,130,AIC:,872.1
Df Residuals:,127,BIC:,880.7
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,10.1030,3.106,3.253,0.001,3.956 16.250
Age,-0.0046,0.037,-0.126,0.900,-0.078 0.068
HbA1c,-0.3788,0.389,-0.973,0.333,-1.149 0.392

0,1,2,3
Omnibus:,41.76,Durbin-Watson:,1.869
Prob(Omnibus):,0.0,Jarque-Bera (JB):,73.273
Skew:,1.502,Prob(JB):,1.23e-16
Kurtosis:,5.123,Cond. No.,278.0


## Without ACEI

In [29]:
df_hba1c_withoutACEI = df_hba1c[df_hba1c['ACE_inhibitor'] != 1]
parameters_hba1c = header_hba1c[2:]
data_hba1c_withoutACEI = df_hba1c_withoutACEI[parameters_hba1c]
data_hba1c_withoutACEI = data_hba1c_withoutACEI.astype(float)

#### BK/HypBK vs Other Parameters

In [30]:
model = ols('BKHypBK~Age+HbA1c', 
            data_hba1c_withoutACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.086
Model:,OLS,Adj. R-squared:,0.067
Method:,Least Squares,F-statistic:,4.444
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.0143
Time:,00:26:07,Log-Likelihood:,-33.662
No. Observations:,97,AIC:,73.32
Df Residuals:,94,BIC:,81.05
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.0502,0.206,0.244,0.808,-0.359 0.459
Age,-0.0034,0.002,-1.653,0.102,-0.008 0.001
HbA1c,0.0759,0.029,2.603,0.011,0.018 0.134

0,1,2,3
Omnibus:,39.324,Durbin-Watson:,2.058
Prob(Omnibus):,0.0,Jarque-Bera (JB):,83.12
Skew:,1.582,Prob(JB):,8.93e-19
Kurtosis:,6.248,Cond. No.,307.0


#### HypBK/BK vs Other Parameters

In [31]:
model = ols('HypBKBK~Age+HbA1c', 
            data_hba1c).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.008
Model:,OLS,Adj. R-squared:,-0.008
Method:,Least Squares,F-statistic:,0.4916
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.613
Time:,00:26:07,Log-Likelihood:,-433.07
No. Observations:,130,AIC:,872.1
Df Residuals:,127,BIC:,880.7
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,10.1030,3.106,3.253,0.001,3.956 16.250
Age,-0.0046,0.037,-0.126,0.900,-0.078 0.068
HbA1c,-0.3788,0.389,-0.973,0.333,-1.149 0.392

0,1,2,3
Omnibus:,41.76,Durbin-Watson:,1.869
Prob(Omnibus):,0.0,Jarque-Bera (JB):,73.273
Skew:,1.502,Prob(JB):,1.23e-16
Kurtosis:,5.123,Cond. No.,278.0


## Take ACEI

In [32]:
df_hba1c_withACEI = df_hba1c[df_hba1c['ACE_inhibitor'] == 1]

parameters_hba1c = header_hba1c[2:]
data_hba1c_withACEI = df_hba1c_withACEI[parameters_hba1c]
data_hba1c_withACEI = data_hba1c_withACEI.astype(float)

#### BK/HypBK vs Other Parameters

In [33]:
model = ols('BKHypBK~Age+HbA1c', 
            data_hba1c_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.552
Model:,OLS,Adj. R-squared:,0.522
Method:,Least Squares,F-statistic:,18.5
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,5.84e-06
Time:,00:26:07,Log-Likelihood:,-3.1623
No. Observations:,33,AIC:,12.32
Df Residuals:,30,BIC:,16.81
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,-0.1936,0.284,-0.682,0.500,-0.773 0.386
Age,-0.0081,0.004,-2.047,0.050,-0.016 -1.84e-05
HbA1c,0.1273,0.023,5.579,0.000,0.081 0.174

0,1,2,3
Omnibus:,4.275,Durbin-Watson:,1.857
Prob(Omnibus):,0.118,Jarque-Bera (JB):,3.697
Skew:,-0.191,Prob(JB):,0.157
Kurtosis:,4.594,Cond. No.,332.0


#### HypBK/BK vs Other Parameters

In [34]:
model = ols('HypBKBK~Age+HbA1c', 
            data_hba1c_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.052
Model:,OLS,Adj. R-squared:,-0.011
Method:,Least Squares,F-statistic:,0.8251
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.448
Time:,00:26:07,Log-Likelihood:,-110.88
No. Observations:,33,AIC:,227.8
Df Residuals:,30,BIC:,232.3
Df Model:,2,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,19.1777,7.422,2.584,0.015,4.020 34.335
Age,-0.1003,0.103,-0.974,0.338,-0.311 0.110
HbA1c,-0.5376,0.597,-0.900,0.375,-1.757 0.682

0,1,2,3
Omnibus:,3.079,Durbin-Watson:,1.59
Prob(Omnibus):,0.214,Jarque-Bera (JB):,2.793
Skew:,0.675,Prob(JB):,0.247
Kurtosis:,2.544,Cond. No.,332.0


# Lipid

## Combined

In [35]:
parameters_lipid = header_lipid[2:]
data_lipid = df_lipid[parameters_lipid]
data_lipid = data_lipid.astype(float)

#### BK/HypBK vs Other Parameters

In [36]:
model = ols('BKHypBK~Age+Totoal_Cholesterol+HDL+Triglycerides+LDL', 
            data_lipid).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.094
Model:,OLS,Adj. R-squared:,0.057
Method:,Least Squares,F-statistic:,2.504
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.034
Time:,00:26:07,Log-Likelihood:,-48.588
No. Observations:,126,AIC:,109.2
Df Residuals:,120,BIC:,126.2
Df Model:,5,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.7918,0.189,4.182,0.000,0.417 1.167
Age,-0.0042,0.002,-2.057,0.042,-0.008 -0.000
Totoal_Cholesterol,-0.0050,0.077,-0.065,0.948,-0.157 0.147
HDL,0.0053,0.077,0.069,0.945,-0.146 0.157
Triglycerides,0.0003,0.015,0.021,0.983,-0.030 0.031
LDL,0.0031,0.077,0.041,0.968,-0.149 0.155

0,1,2,3
Omnibus:,71.208,Durbin-Watson:,1.934
Prob(Omnibus):,0.0,Jarque-Bera (JB):,252.51
Skew:,2.155,Prob(JB):,1.47e-55
Kurtosis:,8.433,Cond. No.,1510.0


#### HypBK/BK vs Other Parameters

In [37]:
model = ols('HypBKBK~Age+Totoal_Cholesterol+HDL+Triglycerides+LDL', 
            data_lipid).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.203
Model:,OLS,Adj. R-squared:,0.17
Method:,Least Squares,F-statistic:,6.104
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,4.51e-05
Time:,00:26:07,Log-Likelihood:,-406.84
No. Observations:,126,AIC:,825.7
Df Residuals:,120,BIC:,842.7
Df Model:,5,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,-0.5852,3.252,-0.180,0.857,-7.024 5.853
Age,-0.0167,0.035,-0.480,0.632,-0.085 0.052
Totoal_Cholesterol,-0.3136,1.319,-0.238,0.812,-2.925 2.298
HDL,0.3309,1.314,0.252,0.802,-2.272 2.934
Triglycerides,0.0910,0.264,0.345,0.731,-0.432 0.614
LDL,0.3600,1.320,0.273,0.786,-2.254 2.974

0,1,2,3
Omnibus:,39.513,Durbin-Watson:,2.036
Prob(Omnibus):,0.0,Jarque-Bera (JB):,79.126
Skew:,1.339,Prob(JB):,6.58e-18
Kurtosis:,5.81,Cond. No.,1510.0


## Without ACEI

In [38]:
df_lipid_withoutACEI = df_lipid[df_lipid['ACE_inhibitor'] != 1]
parameters_lipid = header_lipid[2:]
data_lipid_withoutACEI = df_lipid_withoutACEI[parameters_lipid]
data_lipid_withoutACEI = data_lipid_withoutACEI.astype(float)

#### BK/HypBK vs Other Parameters

In [39]:
model = ols('BKHypBK~Age+Totoal_Cholesterol+HDL+Triglycerides+LDL', 
            data_lipid_withoutACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.059
Model:,OLS,Adj. R-squared:,0.006
Method:,Least Squares,F-statistic:,1.11
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.361
Time:,00:26:08,Log-Likelihood:,-34.705
No. Observations:,94,AIC:,81.41
Df Residuals:,88,BIC:,96.67
Df Model:,5,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.8245,0.225,3.660,0.000,0.377 1.272
Age,-0.0025,0.002,-1.143,0.256,-0.007 0.002
Totoal_Cholesterol,0.0480,0.088,0.546,0.587,-0.127 0.223
HDL,-0.0501,0.088,-0.571,0.570,-0.224 0.124
Triglycerides,-0.0105,0.018,-0.594,0.554,-0.046 0.025
LDL,-0.0494,0.088,-0.561,0.576,-0.224 0.126

0,1,2,3
Omnibus:,49.808,Durbin-Watson:,2.047
Prob(Omnibus):,0.0,Jarque-Bera (JB):,139.131
Skew:,1.919,Prob(JB):,6.14e-31
Kurtosis:,7.56,Cond. No.,1490.0


#### HypBK/BK vs Other Parameters

In [40]:
model = ols('HypBKBK~Age+Totoal_Cholesterol+HDL+Triglycerides+LDL', 
            data_lipid_withoutACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.095
Model:,OLS,Adj. R-squared:,0.044
Method:,Least Squares,F-statistic:,1.852
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.111
Time:,00:26:08,Log-Likelihood:,-304.92
No. Observations:,94,AIC:,621.8
Df Residuals:,88,BIC:,637.1
Df Model:,5,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,-1.3905,3.992,-0.348,0.728,-9.324 6.543
Age,-0.0164,0.039,-0.421,0.675,-0.094 0.061
Totoal_Cholesterol,0.0990,1.559,0.063,0.950,-3.000 3.197
HDL,-0.0606,1.555,-0.039,0.969,-3.151 3.029
Triglycerides,0.0037,0.313,0.012,0.991,-0.618 0.625
LDL,-0.0559,1.560,-0.036,0.971,-3.157 3.045

0,1,2,3
Omnibus:,43.387,Durbin-Watson:,1.83
Prob(Omnibus):,0.0,Jarque-Bera (JB):,104.574
Skew:,1.717,Prob(JB):,1.9599999999999997e-23
Kurtosis:,6.86,Cond. No.,1490.0


## Take ACEI

In [41]:
df_lipid_withACEI = df_lipid[df_lipid['ACE_inhibitor'] == 1]

parameters_lipid = header_lipid[2:]
data_lipid_withACEI = df_lipid_withACEI[parameters_lipid]
data_lipid_withACEI = data_lipid_withACEI.astype(float)

#### BK/HypBK vs Other Parameters

In [42]:
model = ols('BKHypBK~Age+Totoal_Cholesterol+HDL+Triglycerides+LDL', 
            data_lipid_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,BKHypBK,R-squared:,0.525
Model:,OLS,Adj. R-squared:,0.433
Method:,Least Squares,F-statistic:,5.74
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.00107
Time:,00:26:08,Log-Likelihood:,-4.316
No. Observations:,32,AIC:,20.63
Df Residuals:,26,BIC:,29.43
Df Model:,5,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,0.8639,0.385,2.243,0.034,0.072 1.656
Age,-0.0111,0.005,-2.403,0.024,-0.021 -0.002
Totoal_Cholesterol,-0.1148,0.135,-0.851,0.402,-0.392 0.162
HDL,0.1246,0.134,0.928,0.362,-0.151 0.401
Triglycerides,0.0229,0.027,0.848,0.404,-0.033 0.078
LDL,0.1095,0.135,0.810,0.425,-0.168 0.388

0,1,2,3
Omnibus:,11.768,Durbin-Watson:,1.991
Prob(Omnibus):,0.003,Jarque-Bera (JB):,11.824
Skew:,1.091,Prob(JB):,0.00271
Kurtosis:,5.027,Cond. No.,2060.0


#### HypBK/BK vs Other Parameters

In [43]:
model = ols('HypBKBK~Age+Totoal_Cholesterol+HDL+Triglycerides+LDL', 
            data_lipid_withACEI).fit()
model.summary()

0,1,2,3
Dep. Variable:,HypBKBK,R-squared:,0.538
Model:,OLS,Adj. R-squared:,0.45
Method:,Least Squares,F-statistic:,6.066
Date:,"Sat, 08 Oct 2016",Prob (F-statistic):,0.000755
Time:,00:26:08,Log-Likelihood:,-95.878
No. Observations:,32,AIC:,203.8
Df Residuals:,26,BIC:,212.6
Df Model:,5,,
Covariance Type:,nonrobust,,

0,1,2,3,4,5
,coef,std err,t,P>|t|,[95.0% Conf. Int.]
Intercept,9.7353,6.734,1.446,0.160,-4.107 23.577
Age,-0.0788,0.081,-0.975,0.338,-0.245 0.087
Totoal_Cholesterol,-0.5847,2.358,-0.248,0.806,-5.432 4.263
HDL,0.4881,2.349,0.208,0.837,-4.340 5.316
Triglycerides,0.1405,0.471,0.298,0.768,-0.829 1.110
LDL,0.6489,2.364,0.274,0.786,-4.211 5.509

0,1,2,3
Omnibus:,0.03,Durbin-Watson:,2.043
Prob(Omnibus):,0.985,Jarque-Bera (JB):,0.146
Skew:,0.063,Prob(JB):,0.929
Kurtosis:,2.694,Cond. No.,2060.0
