In [1]:
import pandas as pd
from sklearn.preprocessing import LabelEncoder

# Sample dataset: two categorical columns used to demonstrate the encoders.
df = pd.DataFrame({
    'Gender': ['Male', 'Female', 'Female', 'Male', 'Female'],
    'City': ['Nairobi', 'Kisumu', 'Mombasa', 'Nairobi', 'Kisumu']
})

print("Original Data:")
print(df)

# --------------------------
# 🔠 Label Encoding (for Gender)
# --------------------------
le = LabelEncoder()
df['Gender_encoded'] = le.fit_transform(df['Gender'])

# LabelEncoder assigns integer codes following the sorted order of the
# labels (inspect le.classes_), so 'Female' becomes 0 and 'Male' becomes 1.

# --------------------------
# 🟦 One-Hot Encoding (for City)
# --------------------------
df_encoded = pd.get_dummies(df, columns=['City'], drop_first=True)

# 'drop_first=True' drops the first category level in sorted order -- here
# 'Kisumu', not 'Nairobi' -- to avoid the dummy variable trap. A row where
# both City_Mombasa and City_Nairobi are False therefore represents Kisumu.
# 'Gender' is not listed in `columns`, so the original string column is kept
# unchanged alongside 'Gender_encoded'.

# --------------------------
# 🖨️ Final Output
# --------------------------
print("\nAfter Label and One-Hot Encoding:")
print(df_encoded)


Original Data:
   Gender     City
0    Male  Nairobi
1  Female   Kisumu
2  Female  Mombasa
3    Male  Nairobi
4  Female   Kisumu

After Label and One-Hot Encoding:
   Gender  Gender_encoded  City_Mombasa  City_Nairobi
0    Male               1         False          True
1  Female               0         False         False
2  Female               0          True         False
3    Male               1         False          True
4  Female               0         False         False
