In [25]:
class LogisticRegression:
    """Binary logistic regression trained with full-batch gradient descent.

    Parameters
    ----------
    lr : float
        Step size applied to every gradient update.
    num_iter : int
        Number of gradient-descent iterations performed by ``fit``.
    fit_intercept : bool
        When true, a column of ones is prepended to ``X`` so that the first
        entry of ``theta`` acts as the bias term.
    verbose : bool
        When true, ``fit`` prints the training loss every 10000 iterations.

    Attributes
    ----------
    theta : numpy.ndarray
        Learned weight vector; created by ``fit``.
    """

    # Probabilities are clipped to [_EPS, 1 - _EPS] before taking logarithms
    # so that a saturated prediction cannot produce log(0).
    _EPS = 1e-15

    def __init__(self, lr=0.01, num_iter=100000, fit_intercept=True, verbose=False):
        self.lr = lr
        self.num_iter = num_iter
        self.fit_intercept = fit_intercept
        self.verbose = verbose

    def __add_intercept(self, X):
        """Return ``X`` with a leading column of ones (the bias feature)."""
        intercept = np.ones((X.shape[0], 1))
        return np.concatenate((intercept, X), axis=1)

    def __sigmoid(self, z):
        """Numerically stable logistic function 1 / (1 + exp(-z)).

        Only exp(-|z|) is ever evaluated, so the exponential cannot overflow
        for inputs of large magnitude.
        """
        z = np.asarray(z, dtype=float)
        decay = np.exp(-np.abs(z))
        # z >= 0: 1 / (1 + e^-z);  z < 0: e^z / (1 + e^z) -- the same value.
        return np.where(z >= 0, 1.0 / (1.0 + decay), decay / (1.0 + decay))

    def __loss(self, h, y):
        """Mean binary cross-entropy of probabilities ``h`` against labels ``y``."""
        h = np.clip(h, self._EPS, 1.0 - self._EPS)
        return (-y * np.log(h) - (1 - y) * np.log(1 - h)).mean()

    def fit(self, X, y):
        """Learn ``theta`` from training data by gradient descent.

        Parameters
        ----------
        X : array-like, 2-D
            One row per sample, one column per feature.
        y : array-like
            One 0/1 label per sample; flattened to 1-D.

        Raises
        ------
        ValueError
            If ``X`` is not 2-D, is empty, or its row count differs from the
            number of labels.
        """
        # Convert once to plain float arrays: this keeps pandas index
        # alignment out of the training loop and makes a column-vector ``y``
        # behave like a flat label vector instead of broadcasting to a matrix.
        X = np.asarray(X, dtype=float)
        y = np.asarray(y, dtype=float).ravel()

        if X.ndim != 2:
            raise ValueError("X must be a 2-D array of shape (n_samples, n_features)")
        if X.shape[0] == 0:
            raise ValueError("cannot fit on an empty data set")
        if X.shape[0] != y.size:
            raise ValueError("X and y must contain the same number of samples")

        if self.fit_intercept:
            X = self.__add_intercept(X)

        # weights initialization
        self.theta = np.zeros(X.shape[1])

        for i in range(self.num_iter):
            h = self.__sigmoid(np.dot(X, self.theta))
            gradient = np.dot(X.T, (h - y)) / y.size
            self.theta -= self.lr * gradient

            if self.verbose and i % 10000 == 0:
                # Report the loss of the weights just produced by this step.
                h = self.__sigmoid(np.dot(X, self.theta))
                print(f'loss: {self.__loss(h, y)} \t')

    def predict_prob(self, X):
        """Return the predicted probability of the positive class per row of ``X``."""
        X = np.asarray(X, dtype=float)
        if self.fit_intercept:
            X = self.__add_intercept(X)

        return self.__sigmoid(np.dot(X, self.theta))

    def predict(self, X, threshold=0.5):
        """Return a boolean array: True where the probability is >= ``threshold``."""
        return self.predict_prob(X) >= threshold

In [26]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.datasets import load_breast_cancer

In [27]:
from sklearn.model_selection import train_test_split

# Load scikit-learn's bundled breast-cancer dataset.
cancer = load_breast_cancer()

# One table: every feature column followed by a trailing 'target' column.
df = pd.DataFrame(
    np.column_stack((cancer['data'], cancer['target'])),
    columns=[*cancer['feature_names'], 'target'],
)

In [28]:
# Use five of the available measurements as model inputs.
x = df[['mean radius', 'mean texture', 'mean smoothness', 'worst texture', 'worst smoothness']]
y = df['target']

# Hold out 30% of the rows for testing. The fixed random_state makes the
# shuffle repeatable, so a Restart & Run All reproduces the same split and
# therefore the same training results.
x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.3, random_state=42)

In [29]:
# Build the classifier with its default hyperparameters; verbose=True makes
# fit() print the training loss periodically.
log = LogisticRegression(verbose=True)

In [30]:
# Train on the training split; because the model was created with
# verbose=True, the loss is printed every 10000 iterations.
log.fit(x_train, y_train)

loss: 0.7365450340689542 	
loss: 0.5364357649783162 	
loss: 0.32889171800905653 	
loss: 0.30201870896259675 	
loss: 0.28590877610662313 	
loss: 0.2751477675701624 	
loss: 0.26742386508404076 	
loss: 0.26158553929948264 	
loss: 0.25699503396670403 	
loss: 0.2532707750967094 	
