In [1]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np

In [2]:
# Load the diabetes regression data directly as a (features, target) pair.
X, y = load_diabetes(return_X_y=True)

In [3]:
from sklearn.model_selection import train_test_split

In [4]:
# Hold out 20% of the rows for evaluation; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=4
)

In [5]:
from sklearn.linear_model import SGDRegressor

# SGD Ridge Regression using sklearn SGDRegressor

In [7]:
# penalty      - regularization term: 'l2', 'l1' or 'elasticnet'
# alpha        - regularization strength (the lambda of ridge regression)
# eta0         - step size; it stays fixed because learning_rate='constant'
# random_state - seeds the per-epoch shuffling of the training rows, so the
#                fitted coefficients and the R2 score are reproducible

reg = SGDRegressor(
    penalty='l2',
    alpha=0.001,
    max_iter=500,
    learning_rate='constant',
    eta0=0.1,
    random_state=4,
)

In [7]:
# Train on the training split, then score the predictions on the held-out split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

print("R2 score", r2_score(y_test, y_pred))

# Learned weights followed by the intercept, one per line.
print(reg.coef_, reg.intercept_, sep="\n")

R2 score 0.46236761393945147
[  47.76825752 -160.50379552  375.01333397  273.48207921   -8.19803343
  -61.48174855 -169.27405666  137.02466186  337.65133708   94.16006728]
[154.51322724]


# Ridge Regression using sklearn Ridge (iterative solver)

In [8]:
from sklearn.linear_model import Ridge

# alpha    - regularization hyperparameter (strength of the L2 penalty)
# solver   - one of {'auto', 'svd', 'cholesky', 'lsqr', 'sparse_cg', 'sag', 'saga', 'lbfgs'}
#   svd, cholesky              -> direct (closed-form) solution
#   lsqr, sparse_cg, sag, saga -> iterative solvers: sparse_cg is conjugate
#                                 gradient, sag/saga are stochastic average
#                                 gradient descent
# max_iter - iteration cap used by the iterative solvers

reg = Ridge(
    alpha=0.001,
    max_iter=500,
    solver='sparse_cg',
)

In [107]:
# Fit the Ridge model and measure R2 on the test split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

print("R2 score", r2_score(y_test, y_pred))

# Coefficient vector first, intercept on the following line.
print(reg.coef_, reg.intercept_, sep="\n")

R2 score 0.46238922017853457
[  34.62617431 -290.42643559  483.96594581  367.96559729 -852.21640464
  498.74459944  183.78210203  276.57704126  757.34559544   36.95860457]
151.1041692189411


In [108]:
class MeraRidgeGD:
    """Ridge (L2-penalised) linear regression trained by batch gradient descent.

    The model minimises

        0.5 * ||y - (X w + b)||^2 + 0.5 * alpha * ||w||^2

    over the feature weights ``w`` and the intercept ``b``. Only the weights
    are penalised; the intercept is left free so that it can absorb the mean
    of the target regardless of ``alpha``.

    Parameters
    ----------
    epochs : int
        Number of full-batch gradient steps performed by ``fit``.
    learning_rate : float
        Step size of each update. The gradient is summed over the samples
        (it is not averaged), so the largest stable step shrinks as the
        number of training rows grows.
    alpha : float
        Strength of the L2 penalty on the weights.

    Attributes
    ----------
    coef_ : ndarray of shape (n_features,)
        Learned feature weights; ``None`` until ``fit`` has been called.
    intercept_ : float
        Learned bias term; ``None`` until ``fit`` has been called.
    """

    def __init__(self,epochs,learning_rate,alpha):

        self.learning_rate = learning_rate
        self.epochs = epochs
        self.alpha = alpha
        self.coef_ = None
        self.intercept_ = None

    def fit(self,X_train,y_train):
        """Estimate ``coef_`` and ``intercept_`` from the training data.

        Parameters
        ----------
        X_train : array-like of shape (n_samples, n_features)
        y_train : array-like of shape (n_samples,) or (n_samples, 1)

        Returns
        -------
        self : MeraRidgeGD
            The fitted estimator, so calls can be chained.
        """
        # Prepend a column of ones so the intercept is learned as theta[0].
        design = np.insert(np.asarray(X_train, dtype=float), 0, 1, axis=1)
        # Flatten the target: a column vector would otherwise broadcast the
        # parameter vector into a matrix during the update.
        target = np.asarray(y_train, dtype=float).reshape(-1)

        # Start from intercept 0 and every weight at 1.
        theta = np.ones(design.shape[1])
        theta[0] = 0.0

        # These products do not depend on theta, so compute them once.
        gram = design.T @ design
        moment = design.T @ target

        # Per-parameter penalty strength: alpha for the weights, 0 for the
        # intercept slot.
        l2_strength = np.full(design.shape[1], float(self.alpha))
        l2_strength[0] = 0.0

        for _ in range(self.epochs):
            gradient = gram @ theta - moment + l2_strength * theta
            theta = theta - self.learning_rate * gradient

        self.coef_ = theta[1:]
        self.intercept_ = theta[0]
        return self

    def predict(self,X_test):
        """Return the predictions ``X_test @ coef_ + intercept_``."""
        return np.dot(X_test,self.coef_) + self.intercept_

In [109]:
# Hand-written gradient-descent ridge model: 500 epochs, alpha of 0.001.
reg = MeraRidgeGD(
    epochs=500,
    learning_rate=0.005,
    alpha=0.001,
)

In [110]:
# Run gradient descent on the training split and evaluate on the test split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

print("R2 score", r2_score(y_test, y_pred))

# Fitted weights, then the intercept on its own line.
print(reg.coef_, reg.intercept_, sep="\n")

R2 score 0.47379622696725354
[  46.65040212 -221.37723801  452.11770407  325.54645024  -29.09573382
  -96.47613436 -190.90029664  146.3286965   400.80754967   95.08979987]
150.86972442733904
