# In [None]:
import pandas as pd
import numpy as np

# -----------------------------
# 1. Create / Load Dataset
# -----------------------------

# Example dataset (can be replaced with a CSV file).
# Seeding NumPy's global RNG keeps the synthetic sample reproducible.
np.random.seed(42)

data = {
    "values": np.concatenate([
        np.random.normal(loc=50, scale=10, size=100),  # normal data
        [150, 160, -40],  # extreme outliers
    ])
}

df = pd.DataFrame(data)

# -----------------------------
# 2. Calculate Mean & Std Dev
# -----------------------------

mean = df["values"].mean()
# Series.std() uses ddof=1 by default, i.e. the sample standard deviation.
std = df["values"].std()

print(f"Mean (μ): {mean:.2f}")
print(f"Standard Deviation (σ): {std:.2f}")
print("-" * 40)

# -----------------------------
# 3. Calculate Z-Scores
# -----------------------------

# Single source of truth for the cutoff: used by both the filter and the
# printed label so the two can never disagree.
Z_THRESHOLD = 3


def compute_z_scores(values, mu, sigma):
    """Return the z-score of every element of *values*.

    Args:
        values: pandas Series of numeric observations.
        mu: Centre to subtract (normally the mean of *values*).
        sigma: Spread to divide by (normally the std dev of *values*).

    Returns:
        A Series aligned with *values* holding ``(values - mu) / sigma``.
        When *sigma* is zero or NaN (constant column, single row) the
        division is undefined, so every finite observation gets a z-score
        of 0.0 instead of NaN/inf; missing observations stay NaN.
    """
    centered = values - mu
    if pd.isna(sigma) or sigma == 0:
        # Multiplying by 0.0 zeroes finite entries while NaN stays NaN.
        return centered * 0.0
    return centered / sigma


df["z_score"] = compute_z_scores(df["values"], mean, std)

# -----------------------------
# 4. Identify Outliers
# -----------------------------

# Rows whose absolute z-score exceeds the threshold; NaN z-scores compare
# False and are therefore never flagged.
outliers = df[df["z_score"].abs() > Z_THRESHOLD]

print(f"Statistical Outliers (|Z| > {Z_THRESHOLD}):")
print(outliers)
print("-" * 40)

# -----------------------------
# 5. Summary
# -----------------------------

print(f"Total rows: {len(df)}")
print(f"Outliers detected: {len(outliers)}")
