In [2]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np

In [3]:
X , y = load_diabetes(return_X_y=True)

In [4]:
X

array([[ 0.03807591,  0.05068012,  0.06169621, ..., -0.00259226,
         0.01990749, -0.01764613],
       [-0.00188202, -0.04464164, -0.05147406, ..., -0.03949338,
        -0.06833155, -0.09220405],
       [ 0.08529891,  0.05068012,  0.04445121, ..., -0.00259226,
         0.00286131, -0.02593034],
       ...,
       [ 0.04170844,  0.05068012, -0.01590626, ..., -0.01107952,
        -0.04688253,  0.01549073],
       [-0.04547248, -0.04464164,  0.03906215, ...,  0.02655962,
         0.04452873, -0.02593034],
       [-0.04547248, -0.04464164, -0.0730303 , ..., -0.03949338,
        -0.00422151,  0.00306441]])

In [5]:
y

array([151.,  75., 141., 206., 135.,  97., 138.,  63., 110., 310., 101.,
        69., 179., 185., 118., 171., 166., 144.,  97., 168.,  68.,  49.,
        68., 245., 184., 202., 137.,  85., 131., 283., 129.,  59., 341.,
        87.,  65., 102., 265., 276., 252.,  90., 100.,  55.,  61.,  92.,
       259.,  53., 190., 142.,  75., 142., 155., 225.,  59., 104., 182.,
       128.,  52.,  37., 170., 170.,  61., 144.,  52., 128.,  71., 163.,
       150.,  97., 160., 178.,  48., 270., 202., 111.,  85.,  42., 170.,
       200., 252., 113., 143.,  51.,  52., 210.,  65., 141.,  55., 134.,
        42., 111.,  98., 164.,  48.,  96.,  90., 162., 150., 279.,  92.,
        83., 128., 102., 302., 198.,  95.,  53., 134., 144., 232.,  81.,
       104.,  59., 246., 297., 258., 229., 275., 281., 179., 200., 200.,
       173., 180.,  84., 121., 161.,  99., 109., 115., 268., 274., 158.,
       107.,  83., 103., 272.,  85., 280., 336., 281., 118., 317., 235.,
        60., 174., 259., 178., 128.,  96., 126., 28

In [6]:
from sklearn.model_selection import train_test_split
X_train , X_test , y_train , y_test = train_test_split(X,y,test_size=0.2,random_state=2)

In [8]:
from sklearn.linear_model import SGDRegressor

reg = SGDRegressor(penalty = "l2",max_iter=500,eta0=0.1,learning_rate="constant",alpha=0.001) # where l2 = Ridge Regression
reg.fit(X_train,y_train)
y_pred = reg.predict(X_test)
r2_score(y_test,y_pred)

0.4394883483508436

In [10]:
print(reg.coef_)
print(reg.intercept_)

[  36.91916906  -97.48581509  368.97025677  252.43965458   -1.9676989
  -54.31662651 -169.59332361  113.34076473  335.40840169  111.58975161]
[157.69666971]


In [12]:
from sklearn.linear_model import Ridge

reg = Ridge(alpha=0.001,max_iter=500,solver="sparse_cg")
reg.fit(X_train,y_train)
y_pred = reg.predict(X_test)
print("R2 Score : ",r2_score(y_test,y_pred))
print("Intercept : ",reg.intercept_)
print("Coef : ",reg.coef_)

R2 Score :  0.44086171110501016
Intercept :  151.88534078043028
Coef :  [  -8.76148626 -204.3134038   518.38060964  339.96792698 -787.70050902
  475.28218248  106.79525197  114.62926652  819.74572421   52.87335061]


# **Custom Code for Ridge Regression with Gradient Descent**

In [14]:
class MeraRidgeGD:
  def __init__(self,epochs,learning_rate,alpha):
    self.epochs = epochs
    self.learning_rate = learning_rate
    self.alpha = alpha
    self.coef_ = None
    self.intercept_ = None

  def fit(self,X_train,y_train):
    self.coef_ = np.ones(X_train.shape[1])
    self.intercept_ = 0
    theta = np.insert(self.coef_,0,self.intercept_)

    X_train = np.insert(X_train,0,1,axis = 1)

    for i in range(self.epochs):
      theta_der = np.dot(X_train.T,X_train).dot(theta) - np.dot(X_train.T,y_train) + self.alpha*theta
      theta = theta - self.learning_rate * theta_der


    self.coef_ = theta[1:]
    self.intercept_ = theta[0]

  def predict(self,X_test):

    return np.dot(X_test,self.coef_) + self.intercept_


In [15]:
reg = MeraRidgeGD(epochs = 500 , alpha = 0.001 , learning_rate= 0.005)
reg.fit(X_train,y_train)
y_pred = reg.predict(X_test)
print("R2 Score: ",r2_score(y_test,y_pred))
print("Intercept : ",reg.intercept_)
print("Coef : ",reg.coef_)

R2 Score:  0.45395431712097367
Intercept :  152.03121813717044
Coef :  [  19.50919039 -162.92602513  478.95477998  317.86376108  -34.07709121
 -108.63608801 -193.66871805  106.94769192  437.10746813  103.57606041]
