In [1]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.linear_model import SGDRegressor

In [2]:
# Load the diabetes dataset directly as a (features, target) pair
# rather than as a Bunch object.
X, y = load_diabetes(return_X_y=True)

In [4]:
# Hold out 20% of the rows for evaluation; the fixed random_state keeps the
# split identical on every run.
X_train, X_test, Y_train, Y_test = train_test_split(X,y,test_size=0.2,random_state=4)

In [6]:
# L2-penalised linear model trained with constant-step SGD.
# random_state pins the per-epoch sample shuffling; without it every run
# yields a different score and different coefficients.
reg = SGDRegressor(
    penalty='l2',
    alpha=0.001,
    learning_rate='constant',
    eta0=0.1,
    max_iter=500,
    random_state=4,
)

In [7]:
# Train the SGD regressor on the training split.
reg.fit(X_train, Y_train)

In [10]:
# Score the SGD model on the held-out split, then show the learned
# weights and bias, one item per line.
y_pred = reg.predict(X_test)
print(r2_score(Y_test, y_pred), reg.coef_, reg.intercept_, sep="\n")


0.4586751356557408
[  51.18778602 -150.31274792  365.66517915  266.76494721   -0.7403347
  -56.59524575 -166.5490185   138.40820775  330.0925699   103.47299008]
[158.92170049]


### Alternate Method using Ridge

In [11]:
from sklearn.linear_model import Ridge

# Reference model: scikit-learn's Ridge with the same penalty strength,
# solved with the sparse conjugate-gradient solver.
reg = Ridge(
    alpha=0.001,
    solver='sparse_cg',
    max_iter=500,
)

In [12]:
# Train the Ridge model on the same training split.
reg.fit(X_train, Y_train)

In [13]:
# Predict on the held-out split; the bare last expression is shown as the
# cell's output (the R^2 score).
y_pred = reg.predict(X_test)
r2_score(Y_test, y_pred)

0.46250101620710193

### Custom Ridge Regression

In [34]:
class RidgeGD:
    """Ridge (L2-regularised) linear regression fitted by batch gradient descent.

    Parameters
    ----------
    epochs : int
        Number of full-batch gradient steps performed by ``fit``.
    learning_rate : float
        Step size applied to the summed (not averaged) gradient.
    alpha : float
        Strength of the L2 penalty on the feature weights. The intercept is
        never penalised.

    Attributes
    ----------
    coef_ : ndarray of shape (n_features,) or None
        Learned feature weights; ``None`` until ``fit`` has been called.
    intercept_ : float or None
        Learned bias term; ``None`` until ``fit`` has been called.
    """

    def __init__(self, epochs, learning_rate, alpha):
        self.learning_rate = learning_rate
        self.epochs = epochs
        self.alpha = alpha
        self.coef_ = None
        self.intercept_ = None

    def fit(self, X_train, Y_train):
        """Fit the model by running ``epochs`` gradient-descent updates.

        Parameters
        ----------
        X_train : array-like of shape (n_samples, n_features)
        Y_train : array-like of shape (n_samples,)

        Returns
        -------
        self : RidgeGD
            The fitted estimator, so calls can be chained.
        """
        features = np.asarray(X_train, dtype=float)
        targets = np.asarray(Y_train, dtype=float)

        # Prepend a column of ones so the intercept is learned as theta[0].
        design = np.insert(features, 0, 1, axis=1)

        # Start from unit weights and a zero intercept.
        theta = np.insert(np.ones(features.shape[1]), 0, 0.0)

        # Both products are loop-invariant, so compute them once up front.
        gram = np.dot(design.T, design)
        xty = np.dot(design.T, targets)

        # Penalise only the feature weights. Shrinking the intercept would
        # bias predictions toward zero and would not match standard ridge.
        penalty_mask = np.ones_like(theta)
        penalty_mask[0] = 0.0

        for _ in range(self.epochs):
            # Gradient of the ridge loss with respect to theta.
            gradient = gram.dot(theta) - xty + self.alpha * penalty_mask * theta
            theta = theta - self.learning_rate * gradient

        self.coef_ = theta[1:]
        self.intercept_ = theta[0]
        return self

    def predict(self, X_test):
        """Return predictions ``X_test @ coef_ + intercept_``."""
        return np.dot(X_test, self.coef_) + self.intercept_


In [35]:
# Hyperparameters for the hand-written gradient-descent ridge model.
RidgeGD_inst = RidgeGD(
    epochs=500,
    learning_rate=0.005,
    alpha=0.001,
)

In [36]:
# Train the custom model, predict on the held-out split, and display the
# R^2 score as the cell's output.
RidgeGD_inst.fit(X_train, Y_train)
y_pred = RidgeGD_inst.predict(X_test)
r2_score(Y_test, y_pred)

0.4738018280260913