In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

from sklearn.linear_model import SGDRegressor,Ridge
from sklearn.metrics import r2_score,mean_squared_error
from sklearn.model_selection import train_test_split

from sklearn.datasets import load_diabetes

X,y = load_diabetes(return_X_y=True)

In [2]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=4)

In [3]:
reg = Ridge(alpha=0.001,max_iter=500,solver='sparse_cg')
reg.fit(X_train,y_train)
y_pred = reg.predict(X_test)

print('r2_score: ',r2_score(y_test,y_pred))
print('RMSE: ',np.sqrt(mean_squared_error(y_test,y_pred)))

print('\n')

print(reg.coef_)
print(reg.intercept_)

r2_score:  0.4623892201785529
RMSE:  54.15090321973907


[  34.62617432 -290.42643558  483.96594583  367.96559731 -852.21640462
  498.74459947  183.78210201  276.57704129  757.34559547   36.95860459]
151.10416921898823


In [5]:
sgd = SGDRegressor(penalty='l2',max_iter=500,eta0=0.1,learning_rate='constant',alpha=0.001)
sgd.fit(X_train,y_train)
y_pred1 = sgd.predict(X_test)

print('r2_score: ',r2_score(y_test,y_pred1))
print('RMSE: ',np.sqrt(mean_squared_error(y_test,y_pred1)))

print('\n')

print(sgd.coef_)
print(sgd.intercept_)

r2_score:  0.45405294221128456
RMSE:  54.56912444947945


[  51.51440332 -140.39488311  356.73422149  265.55422419   -0.59046942
  -53.11492404 -167.85315936  139.48876701  323.31742488  101.34043088]
[151.8708251]


In [20]:
class SGDRidgeRegression:
    
    def __init__(self,epochs,learning_rate,alpha=0.1):
        
        self.alpha = alpha
        self.epochs = epochs
        self.learning_rate = learning_rate
        self.coef_ = None
        self.intercept_ = None
        
    def fit(self,X_train,y_train):
        self.coef_ = np.ones(X_train.shape[1])
        self.intercept_ = 0
        
        thetha = np.insert(self.coef_,0,self.intercept_)
        
        X_train = np.insert(X_train,0,1,axis=1)
        
        for i in range(self.epochs):
            thetha_der =np.dot(X_train.T,X_train).dot(thetha) - np.dot(X_train.T,y_train) + self.alpha * thetha
            thetha -= self.learning_rate * thetha_der
        
        self.intercept_ = thetha[0]
        self.coef_ = thetha[1:]
        
    
    def predict(self,X_test):
        return np.dot(X_test,self.coef_) + self.intercept_

In [21]:
sgd = SGDRidgeRegression(epochs=500,learning_rate=0.005,alpha=0.001)
sgd.fit(X_train,y_train)
y_pred1 = sgd.predict(X_test)

print('r2_score: ',r2_score(y_test,y_pred1))
print('RMSE: ',np.sqrt(mean_squared_error(y_test,y_pred1)))

print('\n')

print(sgd.coef_)
print(sgd.intercept_)

r2_score:  0.47379622696725365
RMSE:  53.573337110687554


[  46.65040212 -221.37723801  452.11770407  325.54645024  -29.09573382
  -96.47613436 -190.90029664  146.3286965   400.80754967   95.08979987]
150.86972442733904
