In [52]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np

In [53]:
X,y = load_diabetes(return_X_y=True)

In [54]:
from sklearn.model_selection import train_test_split

In [55]:
X_train,X_test,y_train,y_test = train_test_split(X,y,test_size=0.2,random_state=4)

### Ridge Regularization using Gradient Descent (using SGDRegressor from sklearn library)

In [56]:
from sklearn.linear_model import SGDRegressor

In [57]:
reg = SGDRegressor(penalty='l2',max_iter=500,eta0=0.1,learning_rate='constant',alpha=0.001)

In [58]:
reg.fit(X_train,y_train)
y_pred = reg.predict(X_test)

In [59]:
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.44445197497435585
[  53.10145859 -147.02000736  363.23838464  268.44980801   -1.87301106
  -54.78697733 -165.38581941  139.5303517   324.66226131  100.65977654]
[147.57755254]


### Ridge Regression using Gradient Descent (using Ridge Class from sklearn library)

solver : {‘auto’, ‘dense_cholesky’, ‘sparse_cg’}

Solver to use in the computational routines. ‘delse_cholesky’ will use the standard scipy.linalg.solve function, ‘sparse_cg’ will use the a conjugate gradient solver as found in scipy.sparse.linalg.cg while ‘auto’ will chose the most appropiate depending on the matrix X.

In [60]:
from sklearn.linear_model import Ridge

reg = Ridge(alpha=0.001, max_iter=500,solver='sparse_cg')

In [61]:
reg.fit(X_train,y_train)
y_pred = reg.predict(X_test)

In [62]:
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.46250101619914563
[  34.52192544 -290.84084076  482.40181344  368.0678662  -852.44873179
  501.59160336  180.11115788  270.76333979  759.73534372   37.4913546 ]
151.10198517439466


### Implementing Ridge Regression via Gradient Descent with a Custom Ridge Class

In [63]:
class CustomRidgeGD:

  def __init__(self,epochs,learning_rate,alpha):

    self.learning_rate = learning_rate
    self.epochs = epochs
    self.alpha = alpha
    self.coef_ = None
    self.intercept_ = None

  def fit(self,X_train,y_train):

    self.coef_ = np.ones(X_train.shape[1])
    self.intercept_ = 0
    thetha = np.insert(self.coef_,0,self.intercept_)

    X_train = np.insert(X_train,0,1,axis=1)

    for i in range(self.epochs):
      thetha_der = np.dot(X_train.T,X_train).dot(thetha) - np.dot(X_train.T,y_train) + self.alpha*thetha
      thetha = thetha - self.learning_rate*thetha_der

    self.coef_ = thetha[1:]
    self.intercept_ = thetha[0]

  def predict(self,X_test):

    return np.dot(X_test,self.coef_) + self.intercept_

In [64]:
reg = CustomRidgeGD(epochs=500,alpha=0.001,learning_rate=0.005)

In [65]:
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

In [66]:
print("R2 Score ", r2_score(y_test, y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 Score  0.4738018280260913
[  46.65050914 -221.3750037   452.12080647  325.54248128  -29.09464178
  -96.47517735 -190.90017011  146.32900372  400.80267299   95.09048094]
150.86975316713472
