In [74]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split

In [75]:
# Read the insurance dataset from the CSV file in the working directory.
df = pd.read_csv(filepath_or_buffer='insurance.csv')

In [76]:
class LogisticRegression:
    """Binary logistic-regression classifier trained with batch gradient descent.

    Parameters
    ----------
    learning_rate : float, default=0.001
        Step size applied to every gradient update.
    n_iters : int, default=1000
        Number of full-batch gradient-descent iterations run by ``fit``.

    Attributes
    ----------
    weights : numpy.ndarray or None
        Per-feature coefficients of shape ``(n_features,)``; ``None`` until
        ``fit`` has been called.
    bias : float or None
        Intercept term; ``None`` until ``fit`` has been called.
    """

    def __init__(self, learning_rate=0.001, n_iters=1000):
        self.lr = learning_rate
        self.n_iters = n_iters
        self.weights = None
        self.bias = None

    def fit(self, X, y):
        """Learn ``weights`` and ``bias`` from the training data.

        Parameters
        ----------
        X : array-like of shape (n_samples, n_features)
            Training features (lists are accepted and converted).
        y : array-like of length n_samples
            Target values, one per row of ``X``.

        Raises
        ------
        ValueError
            If ``X`` is not 2-D or ``y`` does not hold one value per sample.
        """
        X = np.asarray(X, dtype=float)
        y = np.asarray(y, dtype=float).reshape(-1)
        if X.ndim != 2:
            raise ValueError(
                f"X must be 2-D (n_samples, n_features); got shape {X.shape}"
            )
        n_samples, n_features = X.shape
        if y.shape[0] != n_samples:
            raise ValueError(
                f"y has {y.shape[0]} values but X has {n_samples} samples"
            )

        # Start from the all-zero model on every call so refitting is repeatable.
        self.weights = np.zeros(n_features)
        self.bias = 0.0

        for _ in range(self.n_iters):
            linear_model = np.dot(X, self.weights) + self.bias
            # Residual between predicted probability and target drives both gradients.
            error = self._sigmoid(linear_model) - y

            dw = np.dot(X.T, error) / n_samples
            db = np.sum(error) / n_samples

            self.weights -= self.lr * dw
            self.bias -= self.lr * db

    def predict(self, X):
        """Return 0/1 class labels for ``X``.

        Parameters
        ----------
        X : array-like
            One sample or a 2-D batch of samples; anything ``np.dot`` can
            multiply with ``weights`` is accepted.

        Returns
        -------
        numpy.ndarray
            Integer array of labels; 1 where the predicted probability is
            strictly greater than 0.5, else 0. A single sample yields a
            length-1 array.
        """
        linear_model = np.dot(np.asarray(X, dtype=float), self.weights) + self.bias
        # atleast_1d keeps the "array of labels" contract when the dot product
        # collapses to a scalar (one 1-D sample of a multi-feature model).
        probabilities = np.atleast_1d(self._sigmoid(linear_model))
        return (probabilities > 0.5).astype(int)

    def _sigmoid(self, X):
        """Element-wise logistic function 1 / (1 + exp(-X)), overflow-safe.

        Only ``exp(-|X|)`` is evaluated, so the exponent is never positive and
        large-magnitude inputs cannot overflow.
        """
        z = np.asarray(X, dtype=float)
        decay = np.exp(-np.abs(z))
        # For z >= 0: 1 / (1 + e^-z).  For z < 0: e^z / (1 + e^z) (same value).
        return np.where(z >= 0, 1.0 / (1.0 + decay), decay / (1.0 + decay))

In [77]:
# Feature matrix (the list selector keeps the single 'age' column 2-D)
# and the matching target vector, both as plain NumPy arrays.
X = df.loc[:, ['age']].values
y = df.loc[:, 'bought_insurance'].values
print(X.shape, y.shape, sep='\n')

(27, 1)
(27,)


In [78]:
def accuracy(y_true, y_pred):
    """Return the fraction of entries in ``y_pred`` that equal ``y_true``.

    Parameters
    ----------
    y_true : array-like
        Reference labels.
    y_pred : array-like
        Predicted labels, expected to have the same length as ``y_true``.

    Returns
    -------
    numpy.float64
        Number of matching positions divided by ``len(y_true)``.

    Notes
    -----
    Inputs are converted to arrays first so plain Python lists are compared
    element-wise (``list == list`` would yield a single bool). The comparison
    follows NumPy broadcasting, so a ``y_pred`` of a different length is not
    rejected here; callers should pass one prediction per true label.
    """
    y_true = np.asarray(y_true)
    y_pred = np.asarray(y_pred)
    n_correct = np.sum(y_true == y_pred)
    return n_correct / len(y_true)

In [79]:
# Hold out 20% of the rows for evaluation; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=1234,
)

In [86]:
# Train on the training split only.
regressor = LogisticRegression(learning_rate=0.1, n_iters=1000)
regressor.fit(X_train, y_train)

# `predictions` must hold one label per held-out row, because the accuracy
# cell compares it element-wise against y_test.
predictions = regressor.predict(X_test)

# Spot check: predicted class for a single 24-year-old (one row, one feature).
print(regressor.predict(np.array([[24]])))

[0]


In [81]:
# Report how many held-out labels the model predicted correctly, as a fraction.
print(
    "LR classification accuracy:",
    accuracy(y_test, predictions),
)

LR classification accuracy: 0.6666666666666666
