In [4]:
# Step 1: Import libraries
import pandas as pd
import numpy as np
from sklearn.preprocessing import StandardScaler

# Step 2: Read the customer sales records from disk
df = pd.read_csv("customer_intelligence_dataset.csv")

# Step 3: Quick look at what was loaded
print("Dataset Shape:", df.shape)
print("\nFirst 5 rows:\n", df.head())
print("\nColumn names:", df.columns.tolist())

# Parse both date columns; errors="coerce" turns unparseable values into NaT
# instead of raising.
for date_col in ("sale_date", "last_purchase_date"):
    df[date_col] = pd.to_datetime(df[date_col], errors="coerce")

# Step 4: Numeric features that get standardized
num_cols = ["price", "quantity", "total_value", "age", "tenure_months"]

# Every remaining column (IDs, categoricals, dates, ...) is carried over
# unchanged, in its original relative order.
passthrough_cols = [name for name in df.columns if name not in num_cols]

# Step 5: Fit the scaler on the numeric features and transform them
scaler = StandardScaler()
scaled_features = scaler.fit_transform(df[num_cols])

# Assemble the scaled frame: standardized numeric columns first, followed by
# the untouched passthrough columns.
df_scaled = pd.concat(
    [pd.DataFrame(scaled_features, columns=num_cols), df[passthrough_cols]],
    axis=1,
)

# Step 6: Write both versions out (no index column in either file)
df.to_csv("customer_sales_raw.csv", index=False)
df_scaled.to_csv("customer_sales_scaled.csv", index=False)

print("\n✅ Data saved: customer_sales_raw.csv (original) & customer_sales_scaled.csv (standardized)")


Dataset Shape: (8000, 18)

First 5 rows:
    sale_id customer_id product_id product_name     category  price  quantity  \
0  S000001   CUST01553       P004         Desk    Furniture  12000         2   
1  S000002   CUST00161       P010    Projector  Electronics  45000         2   
2  S000003   CUST00627       P010    Projector  Electronics  45000         4   
3  S000004   CUST01291       P009      Monitor  Electronics  12000         1   
4  S000005   CUST01456       P004         Desk    Furniture  12000         4   

    sale_date  total_value  age  gender region         segment  churn  \
0  2020-01-07        24000   40  Female   West  Small Business      1   
1  2023-11-10        90000   50  Female   West       Corporate      0   
2  2022-07-04       180000   33    Male  South       Corporate      0   
3  2023-10-18        12000   41    Male   West        Consumer      0   
4  2023-09-13        48000   60  Female   West        Consumer      0   

   tenure_months last_purchase_date   