# Logistic Regression From Scratch

#### Testing the sklearn Baseline Model

In [1]:
import numpy as np
import pandas as pd
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score, confusion_matrix, classification_report


# Load the breast-cancer dataset that ships with scikit-learn.
data = load_breast_cancer()
X = data.data
y = data.target 

# Hold out 20% of the rows as a test set; random_state=42 pins the shuffle
# so the split is the same on every run.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42
)


# Fit the scaler on the training rows only, then apply that same fitted
# transform to the test rows. X_train / X_test are rebound to the scaled
# arrays here, so any later cell that reads them gets scaled features.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)


# Baseline estimator; max_iter=1000 is passed explicitly to the constructor.
log_reg = LogisticRegression(max_iter=1000)
log_reg.fit(X_train, y_train)


# Score the baseline on the held-out rows.
y_pred = log_reg.predict(X_test)

acc = accuracy_score(y_test, y_pred)

print("Accuracy of Baseline Model:",acc)

Accuracy of Baseline Model: 0.9736842105263158


## Custom Model

In [2]:
def sigmoid(x):
    """Numerically stable logistic function ``1 / (1 + exp(-x))``.

    The direct formula evaluates ``np.exp(-x)``, which overflows for large
    negative ``x`` and makes NumPy emit an overflow RuntimeWarning. This
    version only ever exponentiates a non-positive number, so the
    exponential cannot overflow.

    Parameters
    ----------
    x : scalar or array-like
        Input value(s); converted with ``np.asarray``.

    Returns
    -------
    A NumPy scalar for scalar input, otherwise an ndarray with the same
    shape as ``x``. Values lie between 0 and 1 (NaN inputs stay NaN).
    """
    x = np.asarray(x)
    # exp(-|x|) is in (0, 1] for every finite x, so it never overflows.
    z = np.exp(-np.abs(x))
    # x >= 0:  1 / (1 + e^-x)
    # x <  0:  e^x / (1 + e^x)   (the same value, rewritten to avoid e^-x)
    out = np.where(x >= 0, 1 / (1 + z), z / (1 + z))
    # Indexing with () unwraps a 0-d result to a scalar and returns n-d
    # arrays unchanged, so scalar callers still get a scalar back.
    return out[()]

class LogisticRegression:
    """Binary logistic-regression classifier trained by batch gradient descent.

    NOTE: this class has the same name as the ``LogisticRegression`` imported
    from ``sklearn.linear_model`` at the top of the notebook. After this cell
    runs, the name refers to this class until that import is executed again.

    Parameters
    ----------
    lr : float, default 0.01
        Step size applied to each gradient update.
    n_iters : int, default 1000
        Number of full-batch gradient steps performed by ``fit``.

    Attributes
    ----------
    weights : ndarray of shape (n_features,), or None before ``fit``
    bias : float, or None before ``fit``
    """

    def __init__(self, lr=0.01, n_iters=1000):
        self.lr = lr
        self.n_iters = n_iters
        self.weights = None
        self.bias = None

    def fit(self, X, y):
        """Learn ``weights`` and ``bias`` from the training data.

        Parameters
        ----------
        X : array-like of shape (n_samples, n_features)
        y : array-like with n_samples entries
            Labels; flattened to 1-D, so a column vector (n, 1) is accepted.

        Raises
        ------
        ValueError
            If ``X`` is not 2-D, has no rows, or ``y`` does not have one
            entry per row of ``X``.
        """
        X = np.asarray(X, dtype=float)
        # Flatten so (n, 1) labels cannot broadcast against the (n,)
        # prediction vector into an (n, n) residual matrix.
        y = np.asarray(y, dtype=float).ravel()

        if X.ndim != 2:
            raise ValueError(f"X must be 2-D, got {X.ndim}-D input")
        n_samples, n_features = X.shape
        if n_samples == 0:
            raise ValueError("X must contain at least one sample")
        if y.shape[0] != n_samples:
            raise ValueError(
                f"X has {n_samples} samples but y has {y.shape[0]} labels"
            )

        self.weights = np.zeros(n_features)
        self.bias = 0.0

        # Loop-invariant averaging factor for the gradients.
        inv_n = 1 / n_samples

        for _ in range(self.n_iters):
            pred = sigmoid(np.dot(X, self.weights) + self.bias)
            # Shared by both gradients, so compute it once per step.
            residual = pred - y

            dw = inv_n * np.dot(X.T, residual)
            db = inv_n * np.sum(residual)

            self.weights -= self.lr * dw
            self.bias -= self.lr * db

    def predict(self, X):
        """Return a list of 0/1 labels, one per row of ``X``.

        A row is labelled 1 when its sigmoid output is strictly greater
        than 0.5, and 0 otherwise.
        """
        X = np.asarray(X, dtype=float)
        proba = sigmoid(np.dot(X, self.weights) + self.bias)
        # Vectorised threshold; tolist() keeps the list-of-int return type.
        return (proba > 0.5).astype(int).tolist()


In [3]:
# Instantiate with default arguments.
# NOTE(review): `LogisticRegression` resolves to whichever definition ran
# most recently in the kernel -- the sklearn import or the custom class --
# so this cell assumes the custom-class cell was executed after the imports.
clf = LogisticRegression()

# Train on the X_train / y_train produced by the baseline cell.
clf.fit(X_train,y_train)

# Predict labels for the held-out test rows.
custom_pred = clf.predict(X_test)

def accuracy(y_true, y_pred):
    """Return the fraction of predictions that equal the true labels.

    Both inputs are converted to flat NumPy arrays before comparing, so any
    mix of lists and arrays is compared element by element. (Comparing two
    plain Python lists with ``==`` yields a single bool, not one result per
    element.)

    Parameters
    ----------
    y_true : array-like
        Ground-truth labels.
    y_pred : array-like
        Predicted labels, one per entry of ``y_true``.

    Returns
    -------
    numpy.float64
        Number of matching positions divided by the number of labels.

    Raises
    ------
    ValueError
        If the two inputs do not contain the same number of labels.
    """
    y_true = np.asarray(y_true).ravel()
    y_pred = np.asarray(y_pred).ravel()
    if y_true.shape != y_pred.shape:
        raise ValueError(
            f"y_true has {y_true.size} labels but y_pred has {y_pred.size}"
        )
    acc = np.sum(y_pred == y_true) / y_true.size
    return acc

# Report the share of test-set predictions that match y_test.
print("Custom Model Accuracy: ",accuracy(y_test,custom_pred))

Custom Model Accuracy:  0.9824561403508771
