## Rigid Regression

In [1]:
from sklearn.datasets import load_diabetes

In [2]:
X,y = load_diabetes(return_X_y = True)

In [7]:
print(X.shape)
print(y.shape)

(442, 10)
(442,)


In [19]:
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(X,y, test_size=0.2, random_state=42)

print(X_train.shape)
print(X_test.shape)

(353, 10)
(89, 10)


In [15]:
from sklearn.linear_model import SGDRegressor

In [84]:
sgd = SGDRegressor(max_iter=1000, eta0=0.1, learning_rate='constant', alpha=0.001)

In [85]:
sgd.fit(X_train,y_train)

In [86]:
y_pred_sgd = sgd.predict(X_test)

In [87]:
from sklearn.metrics import r2_score

In [88]:
r2_score(y_test,y_pred_sgd)

0.3993384035404369

## Rigid Regulirization

In [41]:
from sklearn.linear_model import Ridge


### Solvers for Ridge 

### use OLS to solve
‘svd’, ‘cholesky’, ‘lsqr’

#### Uses Gradiend Descent to solve
‘sparse_cg’, ‘sag’, ‘saga’

In [101]:
rg = Ridge(alpha=0.1, max_iter=100, solver='sparse_cg')


In [102]:
rg.fit(X_train,y_train)

In [103]:
y_pred_rg = rg.predict(X_test)

In [104]:
r2_score(y_test,y_pred_rg)

0.46082620941433683

## SGDR with Rigid

In [64]:
sgdr = SGDRegressor(max_iter=1000, eta0=0.1, learning_rate='constant', alpha=0.001)

In [65]:
sgdr.fit(X_train,y_train)

In [66]:
y_pred = sgdr.predict(X_test)

In [67]:
r2_score(y_test,y_pred)

0.453457673737065

## From scratch


In [110]:
import numpy as np

In [135]:
class RigidGD:
    def __init__(self,epoch,learning_rate,alpha):
        self.epoch = epoch
        self.learning_rate = learning_rate
        self.alpha = alpha
        self.coef_ = None
        self.intercept_ = None

    def fit(self,X_train,y_train):
        self.coef_ = np.ones(X_train.shape[1])
        self.intercept_ = 0

        theta = np.insert(self.coef_,0,self.intercept_)

        X_train = np.insert(X_train,0,1,axis=1)

        for i in range(self.epoch):
            theta_der = np.dot(X_train.T, X_train).dot(theta) - np.dot(X_train.T, y_train) + self.alpha * theta
            theta = theta - (self.learning_rate * theta_der)
            
        self.coef_ = theta[1:]
        self.intercept_ = theta[0]
        
    def predict(self,X_test):
        return np.dot(X_train,self.coef_) + self.intercept_
    

In [136]:
rgd = RigidGD(epoch=1000, learning_rate=0.1, alpha=0.1)

In [137]:
rgd.fit(X_train,y_train)

  theta = theta - self.learning_rate * theta_der


In [138]:
y_pred_rgd = rgd.predict(X_test)


In [139]:
r2_score(y_test,y_pred_rgd)

ValueError: Found input variables with inconsistent numbers of samples: [89, 353]