In [1]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np

In [2]:
X,y = load_diabetes(return_X_y=True)

In [3]:
from sklearn.model_selection import train_test_split

In [4]:
X_train,X_test,y_train,y_test = train_test_split(X,y,test_size=0.2,random_state=4)

In [5]:
from sklearn.linear_model import SGDRegressor

In [6]:
reg = SGDRegressor(penalty='l2',max_iter=500,eta0=0.1,learning_rate='constant',alpha=0.001)

In [7]:
reg.fit(X_train,y_train)

y_pred = reg.predict(X_test)
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.44370882858575644
[  49.52649741 -149.14235548  363.57502226  264.12720616   -2.47073754
  -54.96041589 -165.93320431  135.42104017  323.90876143  104.87089839]
[147.05636936]


In [8]:
from sklearn.linear_model import Ridge

reg = Ridge(alpha=0.001, max_iter=500,solver='sparse_cg')

In [9]:
reg.fit(X_train,y_train)

y_pred = reg.predict(X_test)
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.46250101621910966
[  34.52193893 -290.84082896  482.4018325   368.0678841  -852.44871106
  501.59162397  180.11113982  270.76336652  759.73536846   37.49137396]
151.10198522135005


In [106]:
class MeraRidgeGD:
    
    def __init__(self,epochs,learning_rate,alpha):
        
        self.learning_rate = learning_rate
        self.epochs = epochs
        self.alpha = alpha
        self.coef_ = None
        self.intercept_ = None
        
    def fit(self,X_train,y_train):
        
        # np.ones(size) create the float value array of 1 of the given size np.ones(3) return [1.0,1.0,1.0]
        self.coef_ = np.ones(X_train.shape[1])
        self.intercept_ = 0
        # insert self.intercept_ at 0th index of array self.coef_
        thetha = np.insert(self.coef_,0,self.intercept_)

        # axis=1: This specifies that you want to insert the values along the columns (axis 1), not along the rows (axis 0)
        # if axis=0: this will add a row of 1.0 at the 0th index in row count
        X_train = np.insert(X_train,0,1,axis=1)
        
        for i in range(self.epochs):
            # calculate the formula update the Thetha-derivative = X_trainT*X_train*0-X_trainT*y_train + alpha*0 , where the T is transpose of prev element
            thetha_der = np.dot(X_train.T,X_train).dot(thetha) - np.dot(X_train.T,y_train) + self.alpha*thetha
            # update the new Thetha 0new = 0old -learning_rate*thetha_derivative
            thetha = thetha - self.learning_rate*thetha_der

        # thetha is the array in which 0th element is intercept and rest is coefficient, so filter it
        self.coef_ = thetha[1:]
        self.intercept_ = thetha[0]
    
    def predict(self,X_test):

        return np.dot(X_test,self.coef_) + self.intercept_

        # you can return it like this also where you physically create a identity matrix and dot with self.intercept_ to make it a matrix
        # self.intercept_ is having only a single value in it then in order to add with a matrix I converted it into matrix just for understanding, you can ignore also
        # I = np.ones(X_test.shape[0])
        # return np.dot(X_test,self.coef_) + np.dot(self.intercept_,I)

In [107]:
reg = MeraRidgeGD(epochs=500,alpha=0.001,learning_rate=0.005)

In [108]:
reg.fit(X_train,y_train)

y_pred = reg.predict(X_test)
print("R2 score",r2_score(y_test,y_pred))
# print(reg.coef_)
print(reg.intercept_)

R2 score 0.4738018280260914
150.86975316713472
