In [24]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np

In [25]:
# Load the diabetes regression dataset directly as a (features, target) pair.
X, y = load_diabetes(return_X_y=True)

In [26]:
from sklearn.model_selection import train_test_split

In [27]:
# Hold out 20% of the rows for evaluation; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=4
)


In [28]:
from sklearn.linear_model import SGDRegressor

In [29]:
# penalty='l2'             -> adds an L2 (squared-norm) penalty on the weights, i.e. ridge-style regularization
# alpha                    -> regularization strength (the "lambda" that multiplies the penalty term)
# learning_rate='constant' -> the step size stays fixed at eta0 for every update
# eta0                     -> the (constant) learning rate
# random_state             -> pins the per-epoch shuffling of the training rows, so re-running
#                             the notebook on a fresh kernel reproduces the same fit
reg = SGDRegressor(
    penalty='l2',
    alpha=0.001,
    learning_rate='constant',
    eta0=0.1,
    max_iter=500,
    random_state=42,
)

In [30]:
# Train on the training split, then evaluate on the held-out split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

# Report the test-set R^2 followed by the learned weights and bias.
print("R2 score", r2_score(y_true=y_test, y_pred=y_pred))
print(reg.coef_, reg.intercept_, sep="\n")

R2 score 0.4493801300144994
[  53.16367605 -155.63683043  366.63206791  269.2204234    -4.68395373
  -58.14799995 -164.07062932  135.95096832  329.25350055   94.41349827]
[149.24485632]


In [36]:
from sklearn.linear_model import Ridge

# solver='sag' -> Stochastic Average Gradient descent.
# The solver picks training rows at random, so random_state is fixed to make
# the fitted coefficients (and the reported R2) identical on every re-run.
reg = Ridge(alpha=0.001, max_iter=500, solver='sag', random_state=42)

In [35]:
# Fit whichever estimator is currently bound to `reg` and score it on the test split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

# Same three-line report as the other model cells: R^2, coefficients, intercept.
print("R2 score", r2_score(y_true=y_test, y_pred=y_pred))
print(reg.coef_, reg.intercept_, sep="\n")

R2 score 0.4625079299554483
[  34.53451854 -290.83365228  482.40884358  368.06390807 -851.82437608
  501.10213649  179.81595706  270.66159869  759.50119819   37.48676349]
151.10171965027192


In [46]:
class myGDRidge:
    """Ridge regression fitted with full-batch gradient descent.

    Minimises ``0.5 * ||y - Xw||^2 + 0.5 * alpha * ||w||^2`` by repeatedly
    stepping against its gradient ``X^T X w - X^T y + alpha * w``, where ``X``
    carries a leading column of ones so that ``w[0]`` is the intercept.

    Parameters
    ----------
    alpha : float
        L2 regularization strength.
    epochs : int
        Number of gradient-descent updates to perform.
    learning_rate : float
        Step size applied to the (un-normalised) gradient.
    penalize_intercept : bool, default True
        When True (the historical behaviour of this class) the L2 term also
        shrinks the intercept. Pass False to leave the intercept unpenalised,
        which is the convention scikit-learn's ``Ridge`` follows.

    Attributes
    ----------
    intercept_ : float or None
        Learned bias term; ``None`` until ``fit`` has been called.
    coef_ : numpy.ndarray or None
        Learned feature weights; ``None`` until ``fit`` has been called.
    """

    def __init__(self,alpha,epochs,learning_rate,penalize_intercept=True):
        self.alpha = alpha
        self.intercept_ = None
        self.coef_ = None
        self.epochs = epochs
        self.learning_rate = learning_rate
        self.penalize_intercept = penalize_intercept

    def fit(self, X_train,y_train):
        """Learn the intercept and coefficients from the training data.

        Weights start at 0 for the intercept and 1 for every feature. After
        training, the learned intercept and coefficients are printed (kept
        for parity with the notebook's recorded output). Returns ``None``.

        Parameters
        ----------
        X_train : array-like, 2-D (samples x features)
        y_train : array-like, 1-D (one target per sample)
        """
        features = np.asarray(X_train, dtype=float)
        targets = np.asarray(y_train, dtype=float)

        # Prepend a column of ones so the intercept is learned as w[0].
        design = np.insert(features, 0, 1, axis=1)
        w = np.insert(np.ones(features.shape[1]), 0, 0.0)

        # Neither X^T X nor X^T y depends on w, so compute them once
        # instead of once per epoch.
        gram = np.dot(design.T, design)
        xty = np.dot(design.T, targets)

        # Per-weight penalty strength; optionally exempt the intercept slot.
        penalty = self.alpha * np.ones(design.shape[1])
        if not self.penalize_intercept:
            penalty[0] = 0.0

        for _ in range(self.epochs):
            w_der = gram.dot(w) - xty + penalty * w
            w = w - self.learning_rate * w_der

        self.intercept_ = w[0]
        self.coef_ = w[1:]

        print(self.intercept_)
        print(self.coef_)

    def predict(self, X_test):
        """Return predictions ``X_test @ coef_ + intercept_``.

        Parameters
        ----------
        X_test : array-like, 2-D (samples x features)

        Returns
        -------
        numpy.ndarray
            One predicted target per row of ``X_test``.

        Raises
        ------
        RuntimeError
            If called before ``fit``.
        """
        if self.coef_ is None or self.intercept_ is None:
            raise RuntimeError("myGDRidge is not fitted yet; call fit() before predict()")
        return np.dot(np.asarray(X_test, dtype=float), self.coef_) + self.intercept_

In [60]:
# Hand-written gradient-descent ridge model: same alpha and iteration budget
# as the scikit-learn estimators in this notebook, with a smaller step size.
rgd = myGDRidge(
    alpha=0.001,
    epochs=500,
    learning_rate=0.005,
)

In [61]:
# Run gradient descent on the training split; fit() prints the learned
# intercept followed by the coefficient vector.
rgd.fit(X_train, y_train)

150.86975316713466
[  46.65050914 -221.3750037   452.12080647  325.54248128  -29.09464178
  -96.47517735 -190.90017011  146.32900372  400.80267299   95.09048094]


In [51]:
# Fit and score `reg` once more on the same train/test split.
reg.fit(X_train, y_train)
y_pred = reg.predict(X_test)

# Report the test-set R^2, then the coefficients and the intercept.
print("R2 score", r2_score(y_true=y_test, y_pred=y_pred))
print(reg.coef_, reg.intercept_, sep="\n")

R2 score 0.46250747373452117
[  34.52607513 -290.83722477  482.40353483  368.06055556 -851.85126856
  501.12313261  179.83582934  270.66424674  759.52377144   37.49002552]
151.1017427834707
