# CSV Processor Pro: Data Analysis Dashboard
This notebook provides an interactive interface to analyze and visualize your CSV data.

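**IMPORTANT**: Run the first code cell below before any other cell. It adds the project root to `sys.path`, imports the project modules, and loads the dataset into `df`, all of which the later cells depend on.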

In [None]:
import os
import sys
from pathlib import Path

# ---------------------------------------------------------------------------
# PATH SETUP: Ensure the project root is in the Python path
# This prevents "ModuleNotFoundError: No module named 'scripts'" and keeps
# working whether Jupyter was started from the project root itself or from a
# sub-directory of it.
# ---------------------------------------------------------------------------
def find_project_root(start, marker='scripts'):
    """Return the directory that contains the ``marker`` sub-directory.

    The parent of ``start`` is checked first (the layout this notebook was
    originally written for), then ``start`` itself, then the remaining
    ancestors. If no candidate contains ``marker``, the parent of ``start``
    is returned, which is the value the notebook used before this lookup
    existed.
    """
    start = Path(start)
    fallback = start.parent
    for candidate in (fallback, start, *fallback.parents):
        if (candidate / marker).is_dir():
            return candidate
    return fallback


# Kept as a plain string because later cells pass it to os.path.join
project_root = str(find_project_root(os.getcwd()))
if project_root not in sys.path:
    sys.path.insert(0, project_root)

import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

from scripts.kpi_analyzer import calculate_kpis
from scripts.visualizer import generate_visualizations

# Locate the sample CSV under <project_root>/data and read it into a DataFrame
csv_name = 'large_sample.csv'
data_path = os.path.join(project_root, 'data', csv_name)
df = pd.read_csv(data_path)
n_rows = df.shape[0]
print(f"Success! Loaded {n_rows} rows from {data_path}")
# Last expression of the cell, so the notebook renders the first rows as a preview
df.head()

## Key Performance Indicators (KPIs)

In [None]:
# Compute the KPI mapping once, then print one "Label: value" line per entry
kpis = calculate_kpis(df)
print("--- Summary KPIs ---")
for key, value in kpis.items():
    # snake_case key -> "Title Case" label
    label = key.replace('_', ' ').title()
    if isinstance(value, float):
        # Floats get thousands separators and two decimals
        print(f"{label}: {value:,.2f}")
    else:
        # Everything else is printed with its default formatting
        print(f"{label}: {value}")

## Visualizations

In [None]:
# Histogram of the 'salary' column with a KDE overlay, drawn on an explicit axes
sns.set_theme(style="whitegrid")
fig, ax = plt.subplots(figsize=(10, 6))
sns.histplot(df['salary'], kde=True, color='green', ax=ax)
ax.set_title('Overall Salary Distribution')
plt.show()