In [2]:
import pandas as pd
import numpy as np

# --------------------------------------------------
# 1️⃣ Create a realistic dataset
# --------------------------------------------------
data = {
    "Student": ["Amit","Rahul","Sneha","Karan","Pooja","Anita","Ravi","Neha","Arjun","Meera"],
    "Score":   [65, 70, 72, 68, 75, 78, 80, 74, 69, 120]  # 120 is extreme/outlier
}

df = pd.DataFrame(data)

print("Original Dataset:")
print(df)

# --------------------------------------------------
# 2️⃣ Calculate Mean and Standard Deviation
# --------------------------------------------------
mean_val = df["Score"].mean()
std_val = df["Score"].std()

print("\nMean:", mean_val)
print("Standard Deviation:", std_val)

# --------------------------------------------------
# 3️⃣ Calculate Z-score
# --------------------------------------------------
df["z_score"] = (df["Score"] - mean_val) / std_val

print("\nDataset with Z-scores:")
print(df)

# --------------------------------------------------
# 4️⃣ Detect Outliers (|Z| > 3)
# --------------------------------------------------
outliers = df[np.abs(df["z_score"]) > 3]

print("\nOutliers detected:")
print(outliers)


Original Dataset:
  Student  Score
0    Amit     65
1   Rahul     70
2   Sneha     72
3   Karan     68
4   Pooja     75
5   Anita     78
6    Ravi     80
7    Neha     74
8   Arjun     69
9   Meera    120

Mean: 77.1
Standard Deviation: 15.758242992866375

Dataset with Z-scores:
  Student  Score   z_score
0    Amit     65 -0.767852
1   Rahul     70 -0.450558
2   Sneha     72 -0.323640
3   Karan     68 -0.577476
4   Pooja     75 -0.133264
5   Anita     78  0.057113
6    Ravi     80  0.184031
7    Neha     74 -0.196722
8   Arjun     69 -0.514017
9   Meera    120  2.722385

Outliers detected:
Empty DataFrame
Columns: [Student, Score, z_score]
Index: []
