# 🧪 ETL Pipeline using Pandas & Scikit-learn
This notebook demonstrates a basic ETL (Extract, Transform, Load) process.

In [None]:
import pandas as pd
from sklearn.preprocessing import StandardScaler

## 🔍 Step 1: Extract
Load the sample dataset from `data.csv` into a pandas DataFrame.

In [None]:
# Extract: read the raw CSV into `df`, the frame the later cells work from.
df = pd.read_csv(filepath_or_buffer='data.csv')

print("Original Data:")
# A bare trailing expression is rendered as the cell's rich output.
df

## 🔧 Step 2: Transform
Drop rows that contain missing values, then standardize the numeric columns (zero mean, unit variance) with `StandardScaler`.

In [None]:
# Drop rows with missing values. The explicit .copy() makes df_clean an
# independent frame, so the column assignment below is unambiguous and does
# not emit SettingWithCopyWarning on pandas versions without copy-on-write.
df_clean = df.dropna().copy()

# Scale numeric columns
scaler = StandardScaler()
numeric_cols = df_clean.select_dtypes(include='number').columns
# Only scale when at least one numeric column exists: calling fit_transform
# on a zero-column selection raises ValueError, which would abort the
# pipeline for a dataset that simply has nothing to scale.
if len(numeric_cols) > 0:
    df_clean[numeric_cols] = scaler.fit_transform(df_clean[numeric_cols])
df_clean

## 💾 Step 3: Load
Save the cleaned and transformed data to `cleaned_data.csv`.

In [None]:
# Load: persist the transformed frame as CSV, leaving the index out of the
# file, then report completion.
df_clean.to_csv(
    path_or_buf='cleaned_data.csv',
    index=False,
)
print("ETL process complete. Cleaned data saved to cleaned_data.csv")