In [23]:
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn import datasets

import matplotlib.pyplot as plt


    

In [40]:
class LogisticRegression:
    """Binary logistic regression trained with batch gradient descent.

    Parameters
    ----------
    lr : float
        Step size applied to every gradient update.
    n_iters : int
        Number of full-batch gradient descent iterations run by ``fit``.

    Attributes
    ----------
    weights : numpy.ndarray or None
        Per-feature coefficients of shape ``(n_features,)``; ``None`` until
        ``fit`` has been called.
    bias : float or None
        Intercept term; ``None`` until ``fit`` has been called.
    """

    def __init__(self, lr=0.001, n_iters=1000):
        self.lr = lr
        self.n_iters = n_iters
        self.weights = None
        self.bias = None

    def fit(self, X, y):
        """Learn ``weights`` and ``bias`` from the training data.

        Parameters
        ----------
        X : array-like of shape (n_samples, n_features)
            Training samples, one row per sample.
        y : array-like with n_samples elements
            Target values, one per row of ``X``. A column vector of shape
            ``(n_samples, 1)`` is flattened before use.

        Raises
        ------
        ValueError
            If ``X`` is not two-dimensional or ``y`` does not hold exactly
            one target per row of ``X``.
        """
        X = np.asarray(X, dtype=float)
        # Flatten so an (n_samples, 1) target cannot broadcast the residual
        # to an (n_samples, n_samples) matrix.
        y = np.asarray(y, dtype=float).reshape(-1)

        n_samples, n_features = X.shape
        if y.shape[0] != n_samples:
            raise ValueError(
                "X and y have inconsistent numbers of samples: "
                f"{n_samples} != {y.shape[0]}"
            )

        # Initialise the parameters.
        self.weights = np.zeros(n_features)
        self.bias = 0.0

        # Gradient descent.
        scale = 1 / n_samples
        for _ in range(self.n_iters):
            linear_model = np.dot(X, self.weights) + self.bias
            y_predict = self._sigmoid(linear_model)

            # The residual is shared by both gradients; compute it once.
            error = y_predict - y
            dw = scale * np.dot(X.T, error)
            db = scale * np.sum(error)

            self.weights -= self.lr * dw
            self.bias -= self.lr * db

    def predict(self, X):
        """Return the predicted class label (0 or 1) for each row of ``X``.

        A sample is labelled 1 when its sigmoid output is strictly greater
        than 0.5, otherwise 0. The labels are returned as a plain list of
        Python ints.
        """
        linear_model = np.dot(X, self.weights) + self.bias
        y_predicted = self._sigmoid(linear_model)
        return (np.asarray(y_predicted) > 0.5).astype(int).tolist()

    def _sigmoid(self, x):
        """Numerically stable logistic function ``1 / (1 + exp(-x))``.

        Only ``exp`` of non-positive values is ever evaluated, so large
        magnitude inputs cannot overflow.
        """
        x = np.asarray(x, dtype=float)
        z = np.exp(-np.abs(x))
        # x >= 0: 1 / (1 + exp(-x));  x < 0: exp(x) / (1 + exp(x)).
        return np.where(x >= 0, 1 / (1 + z), z / (1 + z))

In [41]:
# Load the breast cancer dataset bundled with scikit-learn and pull out
# the feature matrix and the target vector.
tumor = datasets.load_breast_cancer()
X = tumor.data
y = tumor.target

In [42]:
# Hold out 20% of the samples for evaluation; the fixed seed keeps the
# split reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=1234,
)




In [43]:
def accuracy(y_true, y_pred):
    """Return the fraction of predictions that equal the true labels.

    Parameters
    ----------
    y_true : array-like
        Ground-truth labels.
    y_pred : array-like
        Predicted labels, one per entry of ``y_true``.

    Returns
    -------
    numpy.float64
        Number of matching positions divided by ``len(y_true)``.

    Raises
    ------
    ValueError
        If the two inputs do not have the same shape.
    """
    # Convert first: comparing two plain Python lists with == yields a single
    # bool rather than an element-wise result.
    y_true = np.asarray(y_true)
    y_pred = np.asarray(y_pred)
    if y_true.shape != y_pred.shape:
        raise ValueError(
            f"shape mismatch: y_true {y_true.shape} vs y_pred {y_pred.shape}"
        )
    matches = y_true == y_pred
    return np.sum(matches) / len(y_true)



In [46]:
# Fit the from-scratch classifier on the training split, then label the
# held-out split.
regressor = LogisticRegression(lr=0.0001, n_iters=1000)
regressor.fit(X_train, y_train)
prediction = regressor.predict(X_test)

# Report the share of held-out samples that were labelled correctly.
print("LR classification accuracy is: ", accuracy(y_test, prediction))

LR classification accuracy is:  0.9298245614035088
