In [2]:
import pandas as pd
import os

# 1. Load data
# Ensure 'customer_churn_segmented.csv' is in the same folder as this notebook
try:
    df = pd.read_csv('customer_churn_segmented.csv')
except FileNotFoundError:
    print(" Error: 'customer_churn_segmented.csv' not found in the current directory.")
    # Re-raise instead of continuing: every later step needs `df`, so carrying
    # on would only fail further down with a confusing NameError.
    raise
else:
    # Only the read itself sits inside `try`; the success message runs solely
    # when the file was actually loaded.
    print(" Input file loaded successfully!")

# 2. Create Power BI friendly dataset
# Work on a copy so the loaded `df` is left unmodified.
powerbi_df = df.copy()

# 3. Identify and handle the Churn column
# Some datasets use 'Exited', others use 'Churn'
churn_col = 'Exited' if 'Exited' in powerbi_df.columns else 'Churn'

if churn_col in powerbi_df.columns:
    # Branch on "numeric vs. not" rather than `dtype == 'object'`: text columns
    # are not always object dtype (e.g. pandas' dedicated string dtype), and
    # such a column would otherwise be sent through the 1/0 mapping below and
    # come out as all-NaN.
    if pd.api.types.is_numeric_dtype(powerbi_df[churn_col]):
        # Numeric flag: derive a readable label, keep the flag as-is.
        powerbi_df['Churn_Status'] = powerbi_df[churn_col].map({1: 'Churned', 0: 'Retained'})
        powerbi_df['Churn_Binary'] = powerbi_df[churn_col]
    else:
        # Text labels: keep them as the status and derive the 1/0 flag.
        # Values not listed in the mapping become NaN.
        powerbi_df['Churn_Status'] = powerbi_df[churn_col]
        powerbi_df['Churn_Binary'] = powerbi_df[churn_col].map({'Yes': 1, 'No': 0, 1: 1, 0: 0})
else:
    # Make the omission visible instead of silently exporting a file without
    # the churn columns.
    print(" Warning: no 'Exited' or 'Churn' column found; Churn_Status and Churn_Binary were not added.")

# 4. Add useful calculated columns for Power BI Analysis
if 'Balance' in powerbi_df.columns and 'EstimatedSalary' in powerbi_df.columns:
    # Handling potential division by zero: the ratio is undefined when the
    # salary is 0, so mask those salaries to NaN. The result is then NaN
    # (written as an empty CSV field) rather than inf, and rather than the raw
    # Balance that substituting a salary of 1 would report as the "ratio".
    powerbi_df['Balance_to_Salary_Ratio'] = (
        powerbi_df['Balance'] / powerbi_df['EstimatedSalary'].replace(0, float('nan'))
    )

# 5. Save for Power BI
# Write the prepared frame next to the notebook, without the index column.
output_filename = 'churn_powerbi_data.csv'
powerbi_df.to_csv(path_or_buf=output_filename, index=False)

# Report where the export landed and what to do next (one line per message).
print(
    " SUCCESS: Power BI data ready!",
    f" File saved as: {output_filename}",
    f" Location: {os.getcwd()}",
    "\n Open Power BI Desktop and import this CSV file.",
    sep="\n",
)

 Input file loaded successfully!
 SUCCESS: Power BI data ready!
 File saved as: churn_powerbi_data.csv
 Location: C:\Users\91950\project-customer-churn-prediction

 Open Power BI Desktop and import this CSV file.
