# Insurance Risk Analytics Notebook

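This notebook demonstrates the end-to-end workflow for insurance risk analysis — data processing, exploratory data analysis, modeling, and visualization — using the project's custom modules under `src` (`data_processing`, `eda_utils`, `modeling`, and `visualization`).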

In [None]:
# Import necessary modules
from src.data_processing import DataProcessor
from src.eda_utils import EDAAnalyzer
from src.modeling import InsuranceModeler
from src.visualization import InsuranceVisualizer
import pandas as pd
import numpy as np

## 1. Data Processing

In [None]:
# One DataProcessor instance drives the whole load -> clean -> feature sequence.
# NOTE(review): clean_data() and create_insurance_features() receive no frame
# argument, so they presumably operate on state kept by `processor` — confirm.
processor = DataProcessor()

# Read the insurance dataset from disk
df = processor.load_data('data/insurance_data.csv')

# Cleaning configuration, forwarded to clean_data() as keyword arguments
cleaning_options = {
    'remove_duplicates': True,
    'handle_missing': 'auto',
    'outlier_method': 'iqr',
}
cleaned_df = processor.clean_data(**cleaning_options)

# Derive the feature set that the EDA, modeling and visualization cells consume
feature_df = processor.create_insurance_features()

## 2. Exploratory Data Analysis

In [None]:
# Initialize EDA analyzer on the feature set built in the data processing cell
eda = EDAAnalyzer(feature_df)

# Generate statistical profiles
# NOTE(review): the return value is discarded here; if this method returns a
# report rather than printing/plotting it, assign or display the result — confirm.
eda.generate_statistical_profile()

# Plot distributions: numerical columns first, then categorical ones
# (as a cell's final expression, only the last call's return value would be
# rendered by the notebook)
eda.plot_numerical_distributions()
eda.plot_categorical_distributions()

## 3. Modeling

In [None]:
# Build the modeler on the engineered features, with 'claim_amount' as the target
modeler = InsuranceModeler(feature_df, target='claim_amount')

# prepare_data() yields four pieces; name them in the order it returns them
splits = modeler.prepare_data()
X_train, X_test, y_train, y_test = splits

# Fit both candidate models: linear regression first, then XGBoost
modeler.train_linear_regression()
modeler.train_xgboost()

# Keep the comparison as the cell's final expression so that any value it
# returns is rendered by the notebook
modeler.compare_models()

## 4. Visualization

In [None]:
# Initialize visualizer on the same feature set used for EDA and modeling
visualizer = InsuranceVisualizer(feature_df)

# Create visualizations, in order: loss ratio distribution, claim severity,
# and risk heatmap (descriptions taken from the method names).
# NOTE(review): the columns each plot requires in feature_df are not visible
# from this notebook — confirm against src/visualization.
visualizer.plot_loss_ratio_distribution()
visualizer.plot_claim_severity()
visualizer.plot_risk_heatmap()