In [72]:
from sklearn.datasets import load_diabetes
from sklearn.model_selection import train_test_split

# Load scikit-learn's bundled diabetes dataset. The returned object carries
# the feature matrix, the target vector, the feature names and a text
# description; later cells read all of these from `diabetes_data`.
diabetes_data = load_diabetes()

# Print the dataset's own description so the reader knows what each column is
# before any modelling happens.
print(diabetes_data["DESCR"])


.. _diabetes_dataset:

Diabetes dataset
----------------

Ten baseline variables, age, sex, body mass index, average blood
pressure, and six blood serum measurements were obtained for each of n =
442 diabetes patients, as well as the response of interest, a
quantitative measure of disease progression one year after baseline.

**Data Set Characteristics:**

:Number of Instances: 442

:Number of Attributes: First 10 columns are numeric predictive values

:Target: Column 11 is a quantitative measure of disease progression one year after baseline

:Attribute Information:
    - age     age in years
    - sex
    - bmi     body mass index
    - bp      average blood pressure
    - s1      tc, total serum cholesterol
    - s2      ldl, low-density lipoproteins
    - s3      hdl, high-density lipoproteins
    - s4      tch, total cholesterol / HDL
    - s5      ltg, possibly log of serum triglycerides level
    - s6      glu, blood sugar level

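Note: Each of these 10 feature variables have been mean centered and scaled by the standard deviation times the square root of `n_samples` (i.e. the sum of squares of each column totals 1).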

In [73]:
# Split configuration, named so a reader can tune it in one place instead of
# hunting for bare numbers inside the call below.
TEST_SIZE = 0.2      # fraction of the samples held out for evaluation
RANDOM_STATE = 32    # fixed seed so the split is reproducible across runs

# Feature matrix and regression target from the loaded dataset.
X, y = diabetes_data.data, diabetes_data.target

# Hold out TEST_SIZE of the rows for testing; the rest is used for fitting.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=TEST_SIZE,
    random_state=RANDOM_STATE,
)

In [74]:
from sklearn.linear_model import LinearRegression

# Fit an ordinary least-squares linear model on the training split.
# `fit` returns the estimator itself, so construction and fitting can be
# chained while `model` still ends up bound to the fitted estimator.
model = LinearRegression().fit(X_train, y_train)

# Predictions on the held-out rows; scored in the next cell.
y_pred = model.predict(X_test)

In [75]:
from sklearn.metrics import mean_squared_error, r2_score

# Score the held-out predictions. Both metric functions take the true values
# first and the predicted values second.
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

# Report both metrics, one per line.
print(f"MSE of the model is {mse}")
print(f"R2 Score of the model is {r2}")

MSE of the model is 2787.643402443914
R2 Score of the model is 0.4522338796354569


In [76]:
# Report the fitted weight of every input feature. `feature_names` and
# `model.coef_` are walked in parallel, so each name is paired with the
# coefficient at the same position.
for feature, coef in zip(diabetes_data.feature_names, model.coef_):
    # Message wording corrected: the original read "a has coefficient of".
    print(f"Feature \"{feature}\" has a coefficient of {coef}")

Feature "age" a has coefficient of 32.500000778508856
Feature "sex" a has coefficient of -274.20835690275203
Feature "bmi" a has coefficient of 501.5274406922501
Feature "bp" a has coefficient of 368.7931960971641
Feature "s1" a has coefficient of -822.3112098781187
Feature "s2" a has coefficient of 504.23867319220295
Feature "s3" a has coefficient of 101.57697154691736
Feature "s4" a has coefficient of 158.16545686716256
Feature "s5" a has coefficient of 744.9154171205339
Feature "s6" a has coefficient of 78.40553631547385
