## Using the SGDRegressor (stochastic gradient descent) class

In [1]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np

In [2]:
# Fetch the diabetes regression data directly as a (features, target) tuple.
X, y = load_diabetes(return_X_y=True)

In [3]:
from sklearn.model_selection import train_test_split


In [4]:
# Hold out 20% of the samples for evaluation; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=4,
)

In [5]:
from sklearn.linear_model import SGDRegressor

In [9]:
# Constant-step SGD with an L2 (ridge) penalty.
# random_state pins the per-epoch shuffling of the training data, so a
# Restart & Run All reproduces the same coefficients and score.
reg = SGDRegressor(
    penalty='l2',
    alpha=0.001,
    learning_rate='constant',
    eta0=0.1,
    max_iter=500,
    random_state=4,
)

In [10]:
# Train on the training split, then predict the held-out split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

# Report the test-set fit quality and the learned parameters.
print("R2-score : ", r2_score(y_test, y_pred))
print("Coefficient : ", reg.coef_)
print("Intercepts \n : ", reg.intercept_)

R2-score :  0.46006212496547294
Coefficient :  [  53.58141071 -155.10830845  364.72783385  267.29770077   -3.95912164
  -59.12339113 -166.35301446  137.68236977  334.99810623  103.55981003]
Intercepts 
 :  [156.03545296]


## Using the Ridge class with an iterative solver (`sparse_cg`, conjugate gradient)

In [11]:
from sklearn.linear_model import Ridge
# 'sparse_cg' solves the ridge problem iteratively with conjugate gradient;
# max_iter caps the number of solver iterations.
reg = Ridge(
    alpha=0.001,
    solver='sparse_cg',
    max_iter=500,
)

In [12]:
# Fit the Ridge model on the training split and predict the held-out split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

In [13]:
# Report the test-set fit quality and the learned parameters.
print("R2-score : ", r2_score(y_test, y_pred))
print("Coefficient : ", reg.coef_)
print("Intercepts \n : ", reg.intercept_)

R2-score :  0.46250101619914563
Coefficient :  [  34.52192544 -290.84084076  482.40181344  368.0678662  -852.44873179
  501.59160336  180.11115788  270.76333979  759.73534372   37.4913546 ]
Intercepts 
 :  151.10198517439466


## Coding a Ridge regressor that uses gradient descent under the hood, using NumPy

In [17]:
class RidgeReg:
    """Ridge (L2-regularised) linear regression fitted by batch gradient descent.

    Parameters
    ----------
    alpha : float
        Strength of the L2 penalty on the feature weights. The intercept is
        not penalised.
    learning_rate : float
        Step size used for every gradient-descent update.
    epochs : int
        Number of full-batch gradient steps performed by ``fit``.

    Attributes
    ----------
    coef_ : numpy.ndarray or None
        Learned feature weights; ``None`` until ``fit`` has been called.
    intercept_ : float or None
        Learned bias term; ``None`` until ``fit`` has been called.
    """

    def __init__(self,alpha,learning_rate,epochs):
        self.alpha = alpha
        self.learning_rate = learning_rate
        self.epochs = epochs
        self.coef_ = None
        self.intercept_ = None

    def fit(self,X_train,y_train):
        """Estimate ``coef_`` and ``intercept_`` from the training data.

        Parameters
        ----------
        X_train : array-like, indexed as (samples, features)
            Training inputs.
        y_train : array-like with one target per sample
            Training targets.
        """
        X_train = np.asarray(X_train, dtype=float)
        y_train = np.asarray(y_train, dtype=float)

        # Starting point: every weight at 1, intercept at 0, packed into a
        # single vector whose first entry is the intercept.
        theta = np.insert(np.ones(X_train.shape[1]), 0, 0.0)

        # A leading column of ones lets the intercept be learned as theta[0].
        X_aug = np.insert(X_train, 0, 1, axis=1)

        # These products do not depend on theta, so compute them once
        # instead of on every epoch.
        gram = np.dot(X_aug.T, X_aug)
        moment = np.dot(X_aug.T, y_train)

        # Ridge shrinks the feature weights only; a zero in the intercept
        # slot keeps the bias term out of the penalty.
        penalty_mask = np.ones_like(theta)
        penalty_mask[0] = 0.0

        for _ in range(self.epochs):
            theta_der = gram.dot(theta) - moment + self.alpha * penalty_mask * theta
            theta = theta - self.learning_rate * theta_der

        self.coef_ = theta[1:]
        self.intercept_ = theta[0]

    def predict(self,X_test):
        """Return ``X_test @ coef_ + intercept_`` for the given inputs."""
        return np.dot(X_test,self.coef_) + self.intercept_

In [18]:
# Same penalty strength as the sklearn models above, trained with 500 full-batch steps.
reg = RidgeReg(
    alpha=0.001,
    learning_rate=0.005,
    epochs=500,
)

In [19]:
# Fit the hand-written ridge model and predict the held-out split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)


In [20]:
# Report the test-set fit quality and the learned parameters.
print("R2-score : ", r2_score(y_test, y_pred))
print("Coefficient : ", reg.coef_)
print("Intercepts \n : ", reg.intercept_)

R2-score :  0.4738018280260913
Coefficient :  [  46.65050914 -221.3750037   452.12080647  325.54248128  -29.09464178
  -96.47517735 -190.90017011  146.32900372  400.80267299   95.09048094]
Intercepts 
 :  150.86975316713472
