# EDA - Customer Churn

This notebook provides a quick-start template for exploring the churn dataset.

## Steps
- Load the dataset from `../data/your_file.csv` (edit `DATA_PATH` in the first code cell to point at your file)
- Inspect schema and missingness
- Visualize distributions and target balance
- Explore correlations and feature importance




In [None]:
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt

# Show every column when rendering wide frames.
pd.set_option('display.max_columns', None)

# Update this path
DATA_PATH = '../data/your_file.csv'
# Name of the label column; the target-balance cell looks it up in `df`.
TARGET = 'churn'

# Load the dataset. When the file is missing, `df` is deliberately left
# undefined so that the later cells, which guard on `df` existing, skip
# themselves instead of failing.
try:
    df = pd.read_csv(DATA_PATH)
except FileNotFoundError:
    # Drop any frame kept from an earlier successful run of this cell;
    # otherwise the cells below would silently analyze stale data that no
    # longer corresponds to DATA_PATH.
    globals().pop('df', None)
    print(f"CSV not found at {DATA_PATH}. Place your dataset and rerun.")
else:
    # Only reached after a successful read: quick sanity check of the load.
    print(df.shape)
    display(df.head())



In [None]:
# Basic info
# Schema/dtype overview followed by per-column summary statistics.
# The explicit check replaces a blanket `except NameError: pass`, which would
# also have hidden unrelated NameErrors (e.g. a typo inside this cell).
if 'df' in globals():
    # DataFrame.info() prints its report and returns None, so call it
    # directly; wrapping it in display() renders a stray "None" underneath.
    df.info()
    # Transposed so each original column becomes one row of statistics.
    display(df.describe(include='all').T)
else:
    print("DataFrame 'df' is not defined. Run the data-loading cell first.")



In [None]:
# Missingness heatmap
# Draws the boolean `df.isna()` mask as a heatmap: one row per record, one
# column per feature, colored by whether the value is missing.
# The explicit check replaces a blanket `except NameError: pass`, which would
# also have hidden unrelated NameErrors (e.g. a typo inside this cell).
if 'df' in globals():
    plt.figure(figsize=(10, 5))
    # cbar=False: the mask only has two states, so a color bar adds nothing.
    sns.heatmap(df.isna(), cbar=False)
    plt.title('Missingness')
    plt.show()
else:
    print("DataFrame 'df' is not defined. Run the data-loading cell first.")



In [None]:
# Target balance
# Bar chart of the share (in percent) of each TARGET class.
# The explicit check replaces a blanket `except NameError: pass`, which would
# also have hidden unrelated NameErrors (e.g. a typo inside this cell).
if 'df' not in globals() or 'TARGET' not in globals():
    print("'df' / 'TARGET' are not defined. Run the data-loading cell first.")
elif TARGET in df.columns:
    # value_counts() skips NaN by default, so the percentages are relative to
    # the rows that actually have a target value.
    class_share_pct = df[TARGET].value_counts(normalize=True).mul(100)
    ax = class_share_pct.plot(kind='bar')
    plt.title('Target Balance (%)')
    for bar in ax.patches:
        # Anchor the label at the top-center of its bar and nudge it up by a
        # few points, so placement does not depend on bar width or y-scale.
        ax.annotate(
            f"{bar.get_height():.1f}%",
            (bar.get_x() + bar.get_width() / 2, bar.get_height()),
            xytext=(0, 3),
            textcoords='offset points',
            ha='center',
            va='bottom',
        )
    plt.show()
else:
    print(f"Target column '{TARGET}' not in dataframe")

