# Data Processing Notebook

This notebook demonstrates a pipeline for processing and analyzing customer sales data.

In [None]:
import pandas as pd
import numpy as np

## Data Loading

In [None]:
# Small in-memory sample of customer sales: one tuple per customer,
# laid out as (customer_id, sales, region).
data = pd.DataFrame(
    [
        (101, 250.0, 'North'),
        (102, 130.0, 'East'),
        (103, 400.0, 'West'),
    ],
    columns=['customer_id', 'sales', 'region'],
)
data.head()

## Data Processing

In [None]:
def process_data(df, region_filter=None):
    """
    Process customer sales data.

    Optionally restricts the rows to a single region, then adds a
    'cumulative_sales' column holding the running total of 'sales' in
    row order. The input DataFrame is never modified; a new DataFrame
    is returned, so the function can be re-run safely on the same input.

    Args:
        df (pd.DataFrame): The input DataFrame containing customer data.
            Must have a 'sales' column, and a 'region' column when
            region_filter is used.
        region_filter (str, optional): A region to filter data. Falsy
            values (None, '') disable filtering. Defaults to None.

    Returns:
        pd.DataFrame: A new DataFrame with the (optionally filtered) rows
        and an added 'cumulative_sales' column.
    """
    if region_filter:
        df = df[df['region'] == region_filter]

    # assign() builds a new frame instead of writing into `df`, so neither
    # the caller's DataFrame nor a filtered slice is modified in place
    # (which would leak state between cells or raise SettingWithCopyWarning).
    return df.assign(cumulative_sales=df['sales'].cumsum())

In [None]:
# Run the pipeline over every row (no region filter applied)
all_data = process_data(df=data)
all_data

In [None]:
# Run the pipeline on the 'North' region rows only
north_data = process_data(data, 'North')
north_data