# **Ridge Regularization Non-Closed Form**
`Gradient Descent`

In [15]:
from sklearn.datasets import load_diabetes
from sklearn.metrics import r2_score
import numpy as np
X,y = load_diabetes(return_X_y=True)
from sklearn.model_selection import train_test_split
X_train,X_test,y_train,y_test = train_test_split(X,y,test_size=0.2,random_state=4)

In [16]:
from sklearn.linear_model import SGDRegressor
sgd = SGDRegressor(penalty='l2',alpha=0.001,eta0=0.1,learning_rate='constant',max_iter=500)

In [17]:
sgd.fit(X_train,y_train)

y_pred = sgd.predict(X_test)
print("R2 score",r2_score(y_test,y_pred))
print(sgd.coef_)
print(sgd.intercept_)

R2 score 0.44070301942751033
[  49.08657453 -154.96434494  372.81786322  271.69083344   -9.75688997
  -60.37756143 -168.5398897   136.56372306  332.51550855   93.76950073]
[167.19130262]


In [18]:
from sklearn.linear_model import Ridge

reg = Ridge(alpha=0.001, max_iter=500,solver='sparse_cg')
reg.fit(X_train,y_train)

y_pred = reg.predict(X_test)
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.46250101621236117
[  34.52193418 -290.84083311  482.40182579  368.0678778  -852.44871836
  501.59161672  180.11114618  270.76335711  759.73535975   37.49136714]
151.1019852048177


In [19]:
class MeraRidgeGD:

    def __init__(self,epochs,learning_rate=0.001,alpha=0.1):

        self.epochs = epochs
        self.learning_rate = learning_rate
        self.alpha = alpha
        self.coef_ = None
        self.intercept_ = None

    def fit(self,X_train,y_train):
        self.intercept_= 0
        self.coef_ = np.ones(X_train.shape[1])
        theta = np.insert(self.coef_,0,self.intercept_)
        X_train = np.insert(X_train,0,1,axis=1)

        for i in range(self.epochs):
            theta_der = (np.dot(X_train.T,X_train).dot(theta)) - np.dot(X_train.T,y_train) + self.alpha*theta
            theta = theta - (self.learning_rate * theta_der)
            
        self.intercept_ = theta[0]
        self.coef_ = theta[1:]

    def predict(self,X_test):
        return np.dot(X_test,self.coef_) + self.intercept_



In [20]:
reg = MeraRidgeGD(epochs=500,alpha=0.001,learning_rate=0.005)

In [21]:
reg.fit(X_train,y_train)

y_pred = reg.predict(X_test)
print("R2 score",r2_score(y_test,y_pred))
print(reg.coef_)
print(reg.intercept_)

R2 score 0.4738018280260913
[  46.65050914 -221.3750037   452.12080647  325.54248128  -29.09464178
  -96.47517735 -190.90017011  146.32900372  400.80267299   95.09048094]
150.86975316713472
