In [20]:
# Importing necessary libraries
# NumPy provides support for large, multi-dimensional arrays and matrices.
import numpy as np
# Pandas provides support for data manipulation and analysis.
import pandas as pd
# Matplotlib.pyplot is a plotting library in Python that provides a MATLAB-like interface for creating visualizations.
import matplotlib.pyplot as plt

In [21]:
# Read CKD.csv (resolved relative to the current working directory) into a DataFrame.
data = pd.read_csv(filepath_or_buffer="CKD.csv")

In [22]:
# One-hot encode the categorical columns. drop_first=True omits the first level
# of each variable, so a variable with k categories yields k-1 indicator columns.
data = pd.get_dummies(data=data, drop_first=True)

In [23]:
# Target (dependent variable): the "classification_yes" indicator column.
# Selecting with a one-element list keeps it a one-column DataFrame, not a Series.
dependent = data.loc[:, ["classification_yes"]]

In [35]:
# Features (independent variables). The column order fixed here is the order the
# scaler and the model see, so any manually built sample must follow it.
independent = data.loc[
    :,
    [
        # Plain measurement columns.
        "age", "bp", "al", "su", "bgr", "bu", "sc",
        "sod", "pot", "hrmo", "pcv", "wc", "rc",
        # Indicator columns (name_value pattern; presumably created by get_dummies).
        "sg_b", "sg_c", "sg_d", "sg_e",
        "rbc_normal", "pc_normal",
        "pcc_present", "ba_present",
        "htn_yes", "dm_yes", "cad_yes",
        "appet_yes", "pe_yes", "ane_yes",
    ],
]


In [27]:
# Import train_test_split from sklearn.model_selection
# This function is used for splitting the data into training and testing sets
from sklearn.model_selection import train_test_split

In [28]:
# Hold out 30% of the rows for testing and keep 70% for training.
# random_state=0 fixes the shuffle so the split is the same on every run.
X_train, X_test, y_train, y_test = train_test_split(
    independent,
    dependent,
    test_size=0.3,
    random_state=0,
)

In [29]:
# Standardize the features: learn the scaling statistics from the training
# split only, then apply that same fitted scaler to both splits.
from sklearn.preprocessing import StandardScaler

# NOTE: X_train is overwritten below, so re-running this cell without first
# re-running the train/test split would refit the scaler on already-scaled data.
sc = StandardScaler().fit(X_train)
X_train = sc.transform(X_train)
X_test = sc.transform(X_test)

In [36]:
# One sample to classify, keyed by feature name so every value is visibly tied
# to its column instead of depending on its position in a bare list.
patient_record = {
    "age": 25.0, "bp": 80.0, "al": 0.0, "su": 0.0, "bgr": 121.0,
    "bu": 19.0, "sc": 1.2, "sod": 142.0, "pot": 4.9, "hrmo": 15.0,
    "pcv": 48.0, "wc": 6900.0, "rc": 5.3,
    "sg_b": 1.0, "sg_c": 0.0, "sg_d": 0.0, "sg_e": 0.0,
    "rbc_normal": 1.0, "pc_normal": 1.0,
    "pcc_present": 0.0, "ba_present": 0.0,
    "htn_yes": 0.0, "dm_yes": 0.0, "cad_yes": 0.0,
    "appet_yes": 1.0, "pe_yes": 0.0, "ane_yes": 0.0,
}

# Arrange the columns exactly as in `independent` (the frame the scaler was
# fitted from). Selecting by name raises KeyError if a feature is missing, and
# passing a DataFrame avoids scikit-learn's "X does not have valid feature
# names" warning that a plain list triggers on a scaler fitted with names.
patient_frame = pd.DataFrame([patient_record])[list(independent.columns)]

# Apply the training-set scaling; the result is a one-row array of scaled features.
pre_inputs = sc.transform(patient_frame)
pre_inputs



array([[-1.66716664,  0.26534721, -0.67367325, -0.36578176, -0.37689758,
        -0.78894921, -0.34458897,  0.42822683,  0.14656163,  0.93792653,
         1.11040228, -0.59507699,  0.76631453,  2.08935029, -0.52897686,
        -0.45584231, -0.13508581,  0.39101478,  0.50111982, -0.33399668,
        -0.22984819, -0.73582366, -0.73004591, -0.29973947,  0.50671171,
        -0.51229234, -0.43852901]])

In [37]:
# pickle serializes and deserializes Python objects.
import pickle

# Load the previously saved model. Mode "rb" means "read binary"; the `with`
# block closes the file handle as soon as loading finishes.
# NOTE: unpickling can execute arbitrary code, so only load a .sav file that
# comes from a trusted source.
with open("LogisticRegressionCDKclassification.sav", "rb") as model_file:
    loaded_model = pickle.load(model_file)





In [38]:
# Predict the class label for the standardized sample in `pre_inputs`.
# `pre_inputs` holds a single row, so the displayed result has one element.
# NOTE(review): the label presumably corresponds to the "classification_yes"
# target the model was trained on; confirm against the training notebook.
result = loaded_model.predict(pre_inputs)
result

array([0], dtype=uint8)