In [None]:
import numpy as np
from numpy import log,dot,exp,shape
import matplotlib.pyplot as plt
from sklearn.datasets import make_classification

In [None]:
# generate a synthetic two-class dataset: 1000 samples with 10 features each
X, y = make_classification(
    n_samples=1000,
    n_features=10,
    n_classes=2,
    random_state=42,
)

In [None]:
# hold out 20% of the samples as the test split (fixed seed for repeatability)
from sklearn.model_selection import train_test_split
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

In [None]:
# standardizing the dataset for logistic regression
def standardize(X_tr):
    """Standardize every column of ``X_tr`` in place (zero mean, unit variance).

    Parameters
    ----------
    X_tr : numpy.ndarray
        2-D array whose columns are standardized independently. The array is
        overwritten in place; nothing is returned.

    Notes
    -----
    A column whose standard deviation is zero is only centered (it becomes
    all zeros) instead of being divided by zero, which would fill the column
    with NaN.
    """
    col_mean = np.mean(X_tr, axis=0)
    col_std = np.std(X_tr, axis=0)
    # Constant columns have std == 0; dividing by 1 leaves them at exactly 0
    # after centering rather than producing 0/0 = NaN.
    safe_std = np.where(col_std == 0, 1.0, col_std)
    # Slice assignment keeps the caller's array object, matching the original
    # in-place contract.
    X_tr[:] = (X_tr - col_mean) / safe_std

In [None]:
# F1 score (harmonic mean of precision and recall) for binary predictions
def F1_score(y,y_hat):
    """Return the F1 score of binary predictions, treating label 1 as positive.

    Parameters
    ----------
    y : sequence
        True labels (0 or 1).
    y_hat : sequence
        Predicted labels (0 or 1), aligned element-wise with ``y``.

    Returns
    -------
    float
        ``2*tp / (2*tp + fp + fn)``, which equals the harmonic mean of
        precision and recall. Returns 0.0 when there are no true positives,
        false positives or false negatives to count, instead of dividing by
        zero.

    Raises
    ------
    ValueError
        If ``y`` and ``y_hat`` have different lengths.
    """
    if len(y) != len(y_hat):
        raise ValueError("y and y_hat must have the same length")
    tp = fp = fn = 0
    for actual, predicted in zip(y, y_hat):
        if actual == 1 and predicted == 1:
            tp += 1
        elif actual == 1 and predicted == 0:
            fn += 1
        elif actual == 0 and predicted == 1:
            fp += 1
        # true negatives do not enter the F1 formula, so they are not counted
    denominator = 2*tp + fp + fn
    if denominator == 0:
        # neither positives in the labels nor in the predictions
        return 0.0
    return 2*tp/denominator

In [None]:
# logistic regression classifier trained with batch gradient descent
class LogisticRegression:
    """Binary logistic regression fitted with full-batch gradient descent.

    After ``fit`` the learned parameters are stored in ``self.weights`` as a
    column vector of shape ``(n_features + 1, 1)``; row 0 is the intercept,
    because a column of ones is prepended to the feature matrix.
    """

    def sigmoid(self,z):
        """Return the logistic function ``1 / (1 + exp(-z))`` element-wise.

        Evaluated as ``exp(-log(1 + exp(-z)))`` through ``np.logaddexp`` so a
        large negative ``z`` does not overflow inside ``exp``.
        """
        return exp(-np.logaddexp(0, -z))

    def initialize(self,X):
        """Return zero-initialized weights and ``X`` with a leading ones column.

        Returns
        -------
        tuple
            ``(weights, X_aug)`` where ``weights`` is a zero array of shape
            ``(n_features + 1, 1)`` and ``X_aug`` is ``X`` with a column of
            ones prepended.
        """
        n_samples, n_features = shape(X)[0], shape(X)[1]
        weights = np.zeros((n_features + 1, 1))
        X = np.c_[np.ones((n_samples, 1)), X]
        return weights,X

    def fit(self,X,y,alpha=0.001,iter=400):
        """Fit the weights by gradient descent and return the cost history.

        Parameters
        ----------
        X : array-like, 2-D
            Feature matrix (one row per sample).
        y : array-like
            Binary labels (0/1), one per row of ``X``.
        alpha : float
            Step size. The gradient is summed over the samples (not
            averaged), so the effective step grows with the sample count.
        iter : int
            Number of gradient-descent iterations.

        Returns
        -------
        numpy.ndarray
            Array of length ``iter`` holding the mean log-loss after each
            update.
        """
        weights,X = self.initialize(X)
        n_samples = len(y)
        # Column vector, so it lines up with the (n_samples, 1) predictions.
        y_col = np.reshape(np.asarray(y, dtype=float), (n_samples, 1))

        def cost(theta):
            z = dot(X,theta)
            # -log(sigmoid(z)) == logaddexp(0, -z) and
            # -log(1 - sigmoid(z)) == logaddexp(0, z); these forms stay finite
            # where log(sigmoid(z)) would hit log(0).
            per_sample = y_col*np.logaddexp(0, -z) + (1 - y_col)*np.logaddexp(0, z)
            # Plain float so it can be stored in a scalar slot of cost_list.
            return float(np.sum(per_sample)/n_samples)

        cost_list = np.zeros(iter,)
        for i in range(iter):
            residual = self.sigmoid(dot(X,weights)) - y_col
            weights = weights - alpha*dot(X.T,residual)
            cost_list[i] = cost(weights)
        self.weights = weights
        return cost_list

    def predict(self,X):
        """Return a list of 0/1 predictions for the rows of ``X``.

        A row is labeled 1 when its predicted probability is strictly greater
        than 0.5. Requires ``fit`` to have been called, because it reads
        ``self.weights``.
        """
        z = dot(self.initialize(X)[1],self.weights)
        return [1 if p > 0.5 else 0 for p in np.ravel(self.sigmoid(z))]



In [None]:
# standardizing both splits with the statistics of the training split
# (the test split must go through the same transformation the model was
# trained on, so it is not scaled with its own mean/std)
train_mean = np.mean(X_train, axis=0)
train_std = np.std(X_train, axis=0)
train_std[train_std == 0] = 1.0  # constant feature: only center the test column
standardize(X_train)
X_test = (X_test - train_mean)/train_std

In [None]:
# create the (still untrained) logistic regression model
object1 = LogisticRegression()

In [None]:
# fit on the training split; `fit` returns the per-iteration cost values,
# so `model` holds that cost history while the trained weights live on `object1`
model= object1.fit(X_train,y_train)

In [None]:
# training and predicting
y_pred = object1.predict(X_test)
y_train = object1.predict(X_train)

In [None]:
# checking the accuracy using the f1score of the splitted dataset
f1_score_train = F1_score(y_train,y_train)
f1_score_test = F1_score(y_test,y_pred)

print("Accuracy of the Training Data : ", f1_score_train)
print("Accuracy of the Testing Data : ",f1_score_test)

Accuracy of the Training Data :  1.0
Accuracy of the Testing Data :  0.8349514563106797


In [None]:
import numpy as np
from sklearn.datasets import make_classification
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import f1_score
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

# NOTE: the import above rebinds the name LogisticRegression to the
# scikit-learn estimator, replacing the class defined earlier in this notebook.

# same synthetic two-class dataset as before: 1000 samples, 10 features
X, y = make_classification(
    n_samples=1000,
    n_features=10,
    n_classes=2,
    random_state=42,
)

# 80/20 train/test split with a fixed seed
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# scale features: statistics are learned on the training split only and then
# reused for the test split
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_test = scaler.transform(X_test)

# train the scikit-learn logistic regression
clf = LogisticRegression(random_state=42)
clf.fit(X_train, y_train)

# predictions for both splits
y_pred_train = clf.predict(X_train)
y_pred_test = clf.predict(X_test)

# F1 score per split (true labels first, predictions second)
f1_score_train = f1_score(y_train, y_pred_train)
f1_score_test = f1_score(y_test, y_pred_test)

print("Accuracy of the Training Data : ", f1_score_train)
print("Accuracy of the Testing Data : ",f1_score_test)


Accuracy of the Training Data :  0.8642297650130549
Accuracy of the Testing Data :  0.8425925925925926
