### Data Analysis of NHANES for Periodontal Disease Prediction
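This analysis uses the NHANES (National Health and Nutrition Examination Survey) dataset to develop a machine learning model that predicts periodontal disease risk from routine blood test results combined with basic demographic and behavioral factors (age, education level, and smoking status).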

In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import classification_report

# Load the NHANES dataset
nhanes_data = pd.read_csv('nhanes_data.csv')  # Replace with actual data path

# Preprocessing
# Predictor columns: demographic/behavioral factors plus routine blood-test values.
features = [
    'smoking_status',
    'age',
    'education_level',
    'GGT',
    'albumin',
    'BUN',
    'glucose',
    'phosphorus',
    'creatinine',
    'basophil_count',
    'total_calcium',
]
target = 'periodontitis'  # Binary outcome

# Rows without an outcome label cannot be used for supervised training or
# scoring (scikit-learn rejects NaN in y), so exclude them before splitting.
labelled = nhanes_data.dropna(subset=[target])
X = labelled[features]
Y = labelled[target]
# NOTE(review): the feature columns are passed to the model as-is. This assumes
# they are already numerically encoded (e.g. smoking_status, education_level)
# and that any missing values are acceptable to the installed scikit-learn
# version -- confirm against the actual data file.

# Split the data: 70% train / 30% test. Stratifying on the outcome keeps the
# proportion of positive cases the same in both partitions, so the evaluation
# is not skewed by an unlucky split of an imbalanced outcome.
X_train, X_test, Y_train, Y_test = train_test_split(
    X,
    Y,
    test_size=0.3,
    random_state=42,
    stratify=Y,
)

# Train the Random Forest Classifier (fixed seed for reproducible results)
model = RandomForestClassifier(n_estimators=100, random_state=42)
model.fit(X_train, Y_train)

# Predictions on the held-out test partition
predictions = model.predict(X_test)

# Evaluation: per-class precision, recall, F1 and support on the test set
print(classification_report(Y_test, predictions))