# Chronic Kidney Disease Prediction

In [None]:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.preprocessing import LabelEncoder
from sklearn.metrics import accuracy_score, classification_report
import pickle

In [None]:
# Build a tiny illustrative dataset: one tuple per patient, listed row-wise
# so each record can be read at a glance.
feature_names = ("age", "bp", "sg", "al", "su", "hemo", "classification")
patient_rows = [
    (48.0, 80.0, 1.02, 1.0, 0.0, 15.1, "notckd"),
    (7.0, 50.0, 1.02, 4.0, 0.0, 11.3, "ckd"),
    (62.0, 80.0, 1.01, 2.0, 0.0, 9.6, "ckd"),
    (48.0, 70.0, 1.005, 3.0, 0.0, 11.2, "ckd"),
    (51.0, 80.0, 1.01, 4.0, 0.0, 9.5, "ckd"),
]

# Transpose the records into a column-name -> list-of-values mapping, then
# hand that mapping to pandas; "classification" is the target column.
data = {
    name: list(values)
    for name, values in zip(feature_names, zip(*patient_rows))
}
df = pd.DataFrame(data)

In [None]:
# Replace the string class labels in the target column with integer codes.
# LabelEncoder numbers the labels in sorted order, so here "ckd" -> 0 and
# "notckd" -> 1; `le` is kept so the codes can be mapped back later.
le = LabelEncoder()
le.fit(df["classification"])
df["classification"] = le.transform(df["classification"])

In [None]:
# Separate the feature columns from the encoded target column.
X = df.drop("classification", axis=1)
y = df["classification"]

# Hold out 20% of the rows for evaluation; the fixed seed keeps the split
# identical across runs.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Seed the forest as well: without random_state the bootstrap samples and
# feature subsets differ on every run, so the fitted (and later pickled)
# model would not be reproducible even though the split is.
model = RandomForestClassifier(random_state=42)
model.fit(X_train, y_train)

In [None]:
# Score the fitted model on the held-out rows.
y_pred = model.predict(X_test)

# Overall fraction of held-out rows predicted correctly.
test_accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", test_accuracy)

# Per-class precision / recall / F1 summary as formatted text.
report_text = classification_report(y_test, y_pred)
print(report_text)

In [None]:
# Persist the trained classifier to disk so it can be reloaded without
# retraining. NOTE: only unpickle this file from a trusted location, since
# loading a pickle can execute arbitrary code.
with open('ckd_model.pkl', 'wb') as f:
    pickle.Pickler(f).dump(model)