# Logistic Regression

In [1]:
import warnings
warnings.filterwarnings("ignore")
%matplotlib inline
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn import datasets

In [2]:
# Load the Iris dataset bundled with scikit-learn; later cells read its
# `.data` (features) and `.target` (labels) arrays.
iris = datasets.load_iris()

In [3]:
# Keep only the first 100 samples together with their labels.
# NOTE(review): presumably this isolates two of the three Iris classes so the
# task is binary -- confirm against the dataset's row ordering.
X, y = iris.data[:100], iris.target[:100]

## Logistic Regression from Scratch

In [4]:
class LogisticRegression:
    """Binary logistic regression fitted by batch gradient descent.

    Parameters
    ----------
    lr : float
        Step size applied to the gradient at every iteration.
    num_iter : int
        Number of gradient-descent iterations run by ``fit``.
    fit_intercept : bool
        When true, a column of ones is prepended to ``X`` in both ``fit`` and
        ``predict_prob`` so that ``theta[0]`` acts as the bias term. When
        false (the default), ``theta`` has exactly one entry per feature.
    verbose : bool
        When true, the training loss is printed every 10000 iterations.

    Attributes
    ----------
    theta : numpy.ndarray
        Weight vector created by ``fit``; it does not exist before ``fit``
        has been called.
    """

    def __init__(self, lr=0.01, num_iter=100000, fit_intercept=False, verbose=False):
        self.lr = lr
        self.num_iter = num_iter
        self.fit_intercept = fit_intercept
        self.verbose = verbose

    def __add_intercept(self, X):
        """Return ``X`` with a leading column of ones."""
        intercept = np.ones((X.shape[0], 1))
        return np.concatenate((intercept, X), axis=1)

    def __design_matrix(self, X):
        """Convert ``X`` to an array and add the intercept column if enabled."""
        X = np.asarray(X)
        if self.fit_intercept:
            X = self.__add_intercept(X)
        return X

    def __sigmoid(self, z):
        """Element-wise logistic function ``1 / (1 + exp(-z))``."""
        # For very negative z, exp(-z) overflows to inf; 1 / (1 + inf) is
        # still the correct limit 0.0 (NumPy only emits a RuntimeWarning).
        return 1 / (1 + np.exp(-z))

    def __loss(self, h, y):
        """Mean binary cross-entropy between probabilities ``h`` and labels ``y``."""
        # Keep probabilities strictly inside (0, 1): a saturated sigmoid would
        # otherwise produce 0 * log(0) = nan and poison the reported loss.
        eps = np.finfo(float).eps
        h = np.clip(h, eps, 1 - eps)
        return (-y * np.log(h) - (1 - y) * np.log(1 - h)).mean()

    def fit(self, X, y):
        """Learn ``self.theta`` from features ``X`` and 0/1 labels ``y``.

        Parameters
        ----------
        X : array-like, two-dimensional (samples x features)
        y : array-like, one-dimensional, one label per row of ``X``

        Raises
        ------
        ValueError
            If ``y`` is not one-dimensional or its length differs from the
            number of rows in ``X``.
        """
        X = self.__design_matrix(X)
        y = np.asarray(y)
        if y.ndim != 1 or y.shape[0] != X.shape[0]:
            raise ValueError(
                f"y must be 1-D with one label per row of X; "
                f"got X with {X.shape[0]} rows and y with shape {y.shape}"
            )

        self.theta = np.zeros(X.shape[1])

        for i in range(self.num_iter):
            h = self.__sigmoid(np.dot(X, self.theta))
            gradient = np.dot(X.T, (h - y)) / y.size
            self.theta -= self.lr * gradient

            # The loss is only needed for progress output, so the extra
            # forward pass is skipped on iterations that print nothing.
            if self.verbose and i % 10000 == 0:
                h = self.__sigmoid(np.dot(X, self.theta))
                loss = self.__loss(h, y)
                print(f'loss: {loss} \t')

    def predict_prob(self, X):
        """Return the predicted probability of class 1 for each row of ``X``."""
        return self.__sigmoid(np.dot(self.__design_matrix(X), self.theta))

    def predict(self, X):
        """Return predicted labels (0.0 or 1.0) by rounding ``predict_prob``."""
        return self.predict_prob(X).round()

In [5]:
# Instantiate the from-scratch model: learning rate 0.1, 300,000 gradient steps.
# fit_intercept is left at its default (False), so no bias term is learned.
model = LogisticRegression(lr=0.1, num_iter=300000)

In [6]:
%%time
# Train the from-scratch model on X, y; the %%time cell magic above reports
# how long the whole cell takes.
model.fit(X, y)

CPU times: user 10.3 s, sys: 96 µs, total: 10.3 s
Wall time: 10.3 s


In [7]:
# Weights learned by the from-scratch model (one per column of X).
model.theta

array([-1.48245771, -4.68218469,  7.32016169,  3.50845414])

## Logistic Regression using sklearn

In [8]:
# NOTE(review): this import rebinds the name `LogisticRegression`, shadowing
# the from-scratch class defined earlier in this notebook. Re-running the
# `model = LogisticRegression(lr=..., num_iter=...)` cell after this one would
# call the sklearn class instead; consider importing it under an alias.
from sklearn.linear_model import LogisticRegression

In [9]:
# sklearn estimator with a very large C (in sklearn, C is the inverse of the
# regularization strength, so this makes the penalty negligible).
# NOTE(review): fit_intercept=True here, whereas the from-scratch `model` was
# created with its default fit_intercept=False, so the two weight vectors
# compared below come from differently specified models -- confirm intent.
mod = LogisticRegression(C=1e20,fit_intercept=True)

In [10]:
%%time
# Fit the sklearn model on the same X, y so its runtime can be compared with
# the from-scratch training cell.
mod.fit(X, y)

CPU times: user 3.83 ms, sys: 0 ns, total: 3.83 ms
Wall time: 3.86 ms


LogisticRegression(C=1e+20, class_weight=None, dual=False, fit_intercept=True,
                   intercept_scaling=1, l1_ratio=None, max_iter=100,
                   multi_class='warn', n_jobs=None, penalty='l2',
                   random_state=None, solver='warn', tol=0.0001, verbose=0,
                   warm_start=False)

In [11]:
# Feature coefficients fitted by sklearn; the intercept is stored separately
# in `mod.intercept_` and is not part of this array.
mod.coef_

array([[-1.4200051 , -4.86036867,  7.6614612 ,  3.65208339]])

## Weights:

### Weights using sklearn implementation

In [12]:
# sklearn coefficients, repeated here for side-by-side comparison with the
# from-scratch weights shown in the next section.
mod.coef_

array([[-1.4200051 , -4.86036867,  7.6614612 ,  3.65208339]])

### Weights using the from-scratch implementation

In [13]:
# From-scratch weights, repeated here for comparison with the sklearn
# coefficients shown in the previous section.
model.theta

array([-1.48245771, -4.68218469,  7.32016169,  3.50845414])