# CREATING LOGISTIC REGRESSION FROM SCRATCH

In [1]:
import numpy as np

## Create a Model Class called LogisticRegression

In [2]:
class LogisticRegression:
    """Binary logistic regression trained with full-batch gradient descent.

    Parameters
    ----------
    learning_rate : float, default=0.001
        Step size applied to every gradient update.
    n_iters : int, default=1000
        Number of gradient descent iterations performed by ``fit``.

    Attributes
    ----------
    lr : float
        The learning rate passed to the constructor.
    n_iters : int
        The iteration count passed to the constructor.
    weights : numpy.ndarray or None
        One coefficient per feature; ``None`` until ``fit`` has been called.
    bias : float or None
        Intercept term; ``None`` until ``fit`` has been called.
    """

    def __init__(self, learning_rate=0.001, n_iters=1000):
        self.lr = learning_rate
        self.n_iters = n_iters
        # Learned parameters; populated by fit().
        self.weights = None
        self.bias = None

    def _sigmoid(self, x):
        """Return the logistic function ``1 / (1 + exp(-x))`` element-wise.

        The naive formula overflows in ``exp(-x)`` for large negative ``x``.
        ``exp(-|x|)`` always lies in (0, 1], so it cannot overflow, and the
        two algebraically equivalent branches below are selected by sign.
        """
        x = np.asarray(x, dtype=float)
        decay = np.exp(-np.abs(x))
        return np.where(x >= 0, 1.0 / (1.0 + decay), decay / (1.0 + decay))

    def predict(self, X):
        """Predict a 0/1 class label for each row of ``X``.

        Parameters
        ----------
        X : array-like of shape (n_samples, n_features)
            Samples to classify.

        Returns
        -------
        numpy.ndarray
            Integer array holding 1 where the predicted probability is
            strictly greater than 0.5 and 0 otherwise.
        """
        X = np.asarray(X, dtype=float)
        # Linear model passed through the sigmoid gives class-1 probabilities.
        linear_model = np.dot(X, self.weights) + self.bias
        probabilities = self._sigmoid(linear_model)

        # Vectorised threshold instead of a Python-level loop.
        return np.where(probabilities > 0.5, 1, 0)

    def fit(self, X, y):
        """Learn ``weights`` and ``bias`` from training data.

        Parameters
        ----------
        X : array-like of shape (n_samples, n_features)
            Training samples.
        y : array-like of shape (n_samples,)
            Target labels (0 or 1) for each sample.

        Raises
        ------
        ValueError
            If ``X`` is not two-dimensional or ``y`` does not hold exactly
            one label per row of ``X``.
        """
        X = np.asarray(X, dtype=float)
        y = np.asarray(y, dtype=float)
        if X.ndim != 2:
            raise ValueError(
                f"X must be 2-dimensional (n_samples, n_features), got shape {X.shape}"
            )
        n_samples, n_features = X.shape
        if y.shape != (n_samples,):
            raise ValueError(
                f"y must have shape ({n_samples},) to match X, got {y.shape}"
            )

        # Start from an all-zero model.
        self.weights = np.zeros(n_features)
        self.bias = 0.0

        for _ in range(self.n_iters):
            # Current predicted probabilities under the logistic model.
            linear_model = np.dot(X, self.weights) + self.bias
            y_predicted = self._sigmoid(linear_model)

            # The residual is shared by both gradients, so compute it once.
            error = y_predicted - y
            dw = (1 / n_samples) * np.dot(X.T, error)
            db = (1 / n_samples) * np.sum(error)

            # Step against the gradient.
            self.weights -= self.lr * dw
            self.bias -= self.lr * db

    
    

## Validation Score: Accuracy Score

In [3]:
def accuracy(y_true, y_pred):
    """Return the fraction of predictions that equal the true labels.

    Parameters
    ----------
    y_true : array-like
        Ground-truth labels.
    y_pred : array-like
        Predicted labels; must have the same shape as ``y_true``.

    Returns
    -------
    float
        Share of element-wise matches, in [0, 1]. ``nan`` when the inputs
        are empty, since the ratio is undefined.

    Raises
    ------
    ValueError
        If ``y_true`` and ``y_pred`` have different shapes.
    """
    # Coerce to arrays so `==` compares element-wise; on plain lists it would
    # yield a single bool and silently produce a wrong score.
    y_true = np.asarray(y_true)
    y_pred = np.asarray(y_pred)
    if y_true.shape != y_pred.shape:
        raise ValueError(
            f"shape mismatch: y_true {y_true.shape} vs y_pred {y_pred.shape}"
        )
    if y_true.size == 0:
        return np.nan
    return np.mean(y_true == y_pred)

## TEST OUR MODEL

In [4]:
# Import the breast cancer dataset loader and the train/test split helper from scikit-learn
from sklearn.model_selection import train_test_split
from sklearn.datasets import load_breast_cancer

In [5]:
# Load the breast cancer dataset through scikit-learn's load_breast_cancer.
data = load_breast_cancer()

In [6]:
# Split the loaded dataset into the feature matrix X (independent variables)
# and the target vector y (dependent variable).
X, y = data.data, data.target

In [7]:
# Hold out 30% of the samples for testing (test_size=0.3); random_state=1
# fixes the seed so the same split is produced on every run.
X_train, X_test, y_train, y_test =  train_test_split(X,y, random_state=1, test_size=0.3)

In [8]:
# Instantiate the from-scratch model with its default hyperparameters
# (learning_rate=0.001, n_iters=1000).
regressor_clf = LogisticRegression()

In [9]:
# Train on the training split; fit() stores the learned weights and bias on the model.
regressor_clf.fit(X_train,y_train)

In [10]:
# Predict 0/1 class labels for the held-out test samples.
y_pred = regressor_clf.predict(X_test)

In [11]:
# Fraction of test-set predictions that match the true labels.
accuracy(y_test, y_pred)

0.935672514619883