In [None]:
# Credit Risk Analysis – Exploratory Analysis

## Context
This notebook explores customer credit behavior to identify outstanding debt
and payment delays.

## Objective
Identify customers with high outstanding debt and significant days past due
to support credit risk decisions.

In [None]:
import pandas as pd

# Read the raw credit transactions from disk and preview the first rows.
transactions_csv = "../data/credit_transactions.csv"
df = pd.read_csv(transactions_csv)
df.head()

In [None]:
# Column dtypes and non-null counts are printed by info(); the per-column
# count of missing values is the cell's displayed result.
df.info()
df.isna().sum()

In [None]:
# Per-row outstanding balance: total_amount minus paid_amount.
df["outstanding_debt"] = df["total_amount"].sub(df["paid_amount"])

# Collapse to one row per customer_id: the monetary columns are summed,
# while days_past_due is averaged.
aggregations = {
    "total_amount": "sum",
    "paid_amount": "sum",
    "outstanding_debt": "sum",
    "days_past_due": "mean",
}
per_customer = df.groupby("customer_id")
customer_summary = per_customer.agg(aggregations).reset_index()

customer_summary

In [None]:
import matplotlib.pyplot as plt

# Rank customers from largest to smallest outstanding debt so the bars
# appear in descending order.
debt_ranked = customer_summary.sort_values("outstanding_debt", ascending=False)

ax = debt_ranked.plot.bar(
    x="customer_id",
    y="outstanding_debt",
    legend=False,
    title="Outstanding Debt by Customer",
)

# Replace the default axis labels with reader-friendly ones.
ax.set_ylabel("Outstanding Debt")
ax.set_xlabel("Customer")
plt.tight_layout()
plt.show()


In [None]:
## Key Insights

- Customers **C003** and **C008** present high outstanding debt.
- These customers also show higher average days past due.
- This pattern indicates elevated credit risk; these customers should be
  prioritized for monitoring or collection strategies.