# Exploratory Process Analysis: HR Case Lifecycle
**Objective:** Understand the process flow, cycle times, and department-level variations in HR Service Delivery (HRSD) processes.

---

In [None]:
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
import os

# Location of the harmonized event log, relative to this notebook.
data_path = '../data/harmonized_eventlog.csv'

# Columns referenced by the cells in this notebook. The real log may carry
# more; this list only gives the missing-file fallback a usable schema.
EXPECTED_COLUMNS = [
    'Case ID',
    'Activity',
    'Timestamp',
    'Department',
    'Priority',
    'SLA_Status',
]

if os.path.exists(data_path):
    df = pd.read_csv(data_path)
    # Parse timestamps once at load time so later cells can sort and diff them.
    df['Timestamp'] = pd.to_datetime(df['Timestamp'])
    print(f"Loaded {len(df)} records.")
else:
    print("Harmonized log not found.")
    # Fall back to an empty frame that still has the expected columns, so
    # later cells do not fail with KeyError on 'Case ID', 'Department', etc.
    df = pd.DataFrame(columns=EXPECTED_COLUMNS)
    # Keep the column dtype consistent with the loaded-file branch.
    df['Timestamp'] = pd.to_datetime(df['Timestamp'])

## 1. Case Volume by Department
Visualize which departments have the highest case volume, counting each case once.

In [None]:
# Horizontal bar chart of the number of distinct cases per department.
plt.figure(figsize=(10, 6))
# Collapse the event log to one row per case (the first row seen for each
# 'Case ID') so a case with many events is counted only once.
cases_once = df.drop_duplicates(subset='Case ID')
sns.countplot(data=cases_once, y='Department')
plt.title("HR Case Volume by Department")
plt.show()

## 2. Activity Frequency
Which activities occur most frequently? Counts are at the event level, so an activity that repeats within a case is counted each time.

In [None]:
# Horizontal bar chart of how often each activity appears in the event log.
# Every event row is counted, so repeated activities within one case add up.
plt.figure(figsize=(10, 6))
sns.countplot(
    data=df,
    y='Activity',
)
plt.title("Activity Frequency (Event Level)")
plt.show()

## 3. SLA Breach by Priority
Compare SLA status across priority levels, with each case counted once.

In [None]:
# Reduce the event log to one row per case: the chronologically latest event.
# keep='last' alone picks the last row in file order, which is only the latest
# event when the log is already sorted by time, so sort by 'Timestamp' first.
# - kind='stable' keeps file order among events with equal timestamps.
# - na_position='first' prevents a row with a missing timestamp from being
#   treated as the latest event of its case.
# - sort_index() restores the original row order afterwards, so the order in
#   which categories appear in the plot is unchanged for already-sorted logs.
df_cases = (
    df.sort_values('Timestamp', kind='stable', na_position='first')
    .drop_duplicates(subset='Case ID', keep='last')
    .sort_index()
)

# Grouped bars: one group per priority, one bar per SLA status.
plt.figure(figsize=(10, 6))
sns.countplot(x='Priority', hue='SLA_Status', data=df_cases)
plt.title("SLA Compliance by Case Priority")
plt.show()