### Detect Data Drift using Kolmogorov-Smirnov Test
**Description**: Use the two-sample Kolmogorov-Smirnov (KS) test to detect data drift between a reference dataset and a new dataset.

In [1]:
import numpy as np
from scipy.stats import ks_2samp

# Reference sample (stands in for training data): 1000 draws from N(mean=0, std=1).
# The global NumPy seed is fixed first so a fresh-kernel re-run yields the same samples.
np.random.seed(42)
data_ref = np.random.normal(loc=0, scale=1, size=1000)

# New sample (stands in for inference data) with deliberate drift: mean shifted to 0.5.
# It is drawn after data_ref from the same seeded stream, so the draw order matters.
data_new = np.random.normal(loc=0.5, scale=1, size=1000)

# Two-sample Kolmogorov-Smirnov test: compares the two samples' empirical
# distributions and returns the test statistic together with its p-value.
ks_stat, p_value = ks_2samp(data_ref, data_new)

print(f"KS Statistic: {ks_stat:.4f}")
# Scientific notation on purpose: with fixed-point ".4f" a tiny p-value is
# rendered as "0.0000", which reads as exactly zero and hides its magnitude.
print(f"P-value: {p_value:.3e}")

# Interpret results: flag drift when the p-value falls below the significance level.
alpha = 0.05  # significance level
if p_value < alpha:
    print("⚠️ Data drift detected (distributions are significantly different).")
else:
    print("✅ No data drift detected (distributions are similar).")

KS Statistic: 0.2420
P-value: 0.0000
⚠️ Data drift detected (distributions are significantly different).
