In [1]:
import numpy as np
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score

In [2]:
x,y = load_diabetes(return_X_y=True)

In [3]:
from sklearn.model_selection import train_test_split

In [4]:
x_train , x_test , y_train , y_test = train_test_split(x,y,test_size=0.2,random_state=4)

## Using SGD

In [5]:
from sklearn.linear_model import SGDRegressor

In [7]:
reg = SGDRegressor(penalty='l2',max_iter=500,eta0=0.1,learning_rate='constant',alpha=0.001)

In [9]:
reg.fit(x_train,y_train)
y_pred = reg.predict(x_test)
print('r2 score ', r2_score(y_test,y_pred))
print('coef',reg.coef_)
print('intercept',reg.intercept_)

r2 score  0.3853540809158349
coef [  48.81307382 -145.42454343  358.15695972  265.16810652   -1.06330143
  -53.17258849 -166.57420646  137.73235593  322.36808094  105.32723792]
intercept [136.31879423]


## Using Ridge

In [10]:
from sklearn.linear_model import Ridge

reg = Ridge(alpha=0.001, max_iter=500,solver='sparse_cg')

In [11]:
reg.fit(x_train,y_train)

y_pred = reg.predict(x_test)
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.4625010162060629
[  34.52192993 -290.84083684  482.40181978  368.06787216 -852.44872489
  501.59161022  180.11115187  270.76334868  759.73535195   37.49136104]
151.10198519001634


In [21]:
class MeraRidgeGD:
    
    def __init__(self,epochs,learning_rate,alpha):
        
        self.learning_rate = learning_rate
        self.epochs = epochs
        self.alpha = alpha
        self.coef_ = None
        self.intercept_ = None
        
    def fit(self,x_train,y_train):
        
        self.coef_ = np.ones(x_train.shape[1])
        self.intercept_ = 0
        thetha = np.insert(self.coef_,0,self.intercept_)
        
        x_train = np.insert(x_train,0,1,axis=1)
        
        for i in range(self.epochs):
            thetha_der = np.dot(x_train.T,x_train).dot(thetha) - np.dot(x_train.T,y_train) + self.alpha*thetha
            thetha = thetha - self.learning_rate*thetha_der
        
        self.coef_ = thetha[1:]
        self.intercept_ = thetha[0]
    
    def predict(self,x_test):
        
        return np.dot(x_test,self.coef_) + self.intercept_

In [22]:
reg = MeraRidgeGD(epochs=500,alpha=0.001,learning_rate=0.005)

In [23]:
reg.fit(x_train,y_train)

y_pred = reg.predict(x_test)
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.47380182802609105
[  46.65050914 -221.3750037   452.12080647  325.54248128  -29.09464178
  -96.47517735 -190.90017011  146.32900372  400.80267299   95.09048094]
150.86975316713463


In [25]:
alphas = [0,0.0001,0.0005,0.001,0.005,0.1,0.5,1,5,10]

coefs = []

for i in alphas:
    reg = Ridge(alpha=i)
    reg.fit(X_train,y_train)
    
    coefs.append(reg.coef_.tolist())

NameError: name 'X_train' is not defined