# Exploratory Data Analysis - ACIS

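This notebook performs exploratory data analysis (EDA) on the insurance claims data: it loads the raw pipe-delimited file, reports missing values and descriptive statistics, and plots the distribution of total claims and the relationship between total premium and total claims.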

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import sys
import os

# Add src to path
# Put the parent of the current working directory on sys.path so that the
# `src` package imported below can be resolved (assumes the notebook is run
# from a directory directly under the project root -- TODO confirm).
# The membership check keeps the cell idempotent: re-running it no longer
# appends a duplicate entry each time.
_project_root = os.path.abspath(os.path.join(os.getcwd(), '../'))
if _project_root not in sys.path:
    sys.path.append(_project_root)

from src.loader import load_data
from src.eda import check_missing_values, get_descriptive_stats

# Load Data
# The raw dataset is read as pipe-delimited text. The path is relative, so it
# resolves against the notebook's current working directory.
filepath = '../data/raw/MachineLearningRating_v3.txt'
df = load_data(filepath, delimiter='|')

# NOTE(review): presumably load_data returns None when loading fails -- confirm
# in src/loader.py. Every later cell uses df unconditionally, so stop here with
# a clear message instead of failing later with an unrelated error.
if df is None:
    raise RuntimeError(f"Failed to load data from {filepath!r}")

print("Data Loaded. Shape:", df.shape)

In [None]:
# Missing Values
# Build the missing-value summary once, then display only the entries whose
# value is greater than zero (presumably per-column missing counts -- confirm
# in src/eda.py).
missing = check_missing_values(df)
has_missing = missing > 0
missing[has_missing]

In [None]:
# Descriptive Statistics
# Pass the loaded DataFrame to the project helper. As the last expression in
# the cell, its return value is what the notebook displays.
# NOTE(review): presumably a describe()-style summary -- confirm in src/eda.py.
get_descriptive_stats(df)

In [None]:
# Visualizations
# Histogram of the TotalClaims column (50 bins) with a KDE curve overlaid,
# drawn on an explicitly created 10x6 figure/axes pair.
fig, ax = plt.subplots(figsize=(10, 6))
sns.histplot(df['TotalClaims'], bins=50, kde=True, ax=ax)
ax.set_title('Distribution of Total Claims')
plt.show()

In [None]:
# Scatter plot of TotalClaims (y) against TotalPremium (x), one point per row
# of df, drawn on an explicitly created 10x6 figure/axes pair.
fig, ax = plt.subplots(figsize=(10, 6))
sns.scatterplot(data=df, x='TotalPremium', y='TotalClaims', ax=ax)
ax.set_title('Total Premium vs Total Claims')
plt.show()