### Detect Data Drift using Kolmogorov-Smirnov Test
**Description**: Use the two-sample Kolmogorov-Smirnov (KS) test to detect data drift, i.e. a change in the distribution of a numeric feature, between two datasets.

In [1]:
import numpy as np
from scipy.stats import ks_2samp

# Configuration: draws per sample and the significance level used for the verdict.
N_SAMPLES = 1000
alpha = 0.05

# Step 1: Build a reference sample and a current sample for one numeric feature.
# The legacy global seed is fixed so both draws repeat on every run; the
# reference sample is drawn first so the random stream is consumed in a fixed order.
np.random.seed(42)
data_old = np.random.normal(0, 1, N_SAMPLES)      # reference: mean 0, std 1
data_new = np.random.normal(0.5, 1.2, N_SAMPLES)  # current: mean 0.5, std 1.2 (simulated drift)

# Step 2: Run the two-sample KS test and pull both fields off the result object.
ks_result = ks_2samp(data_old, data_new)
statistic = ks_result.statistic
p_value = ks_result.pvalue

print(f"KS Statistic: {statistic:.4f}")
print(f"P-value: {p_value:.4f}")

# Step 3: Report drift when the p-value falls below the significance level.
# Note: the 4-decimal format above shows very small p-values as 0.0000.
drift_detected = p_value < alpha
verdict = (
    "Data drift detected: The two samples come from different distributions."
    if drift_detected
    else "No data drift detected: The two samples likely come from the same distribution."
)
print(verdict)


KS Statistic: 0.2310
P-value: 0.0000
Data drift detected: The two samples come from different distributions.
