# HR Analytics Analysis

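This notebook loads the HR Analytics workbook with pandas, inspects its structure and missing values, plots employee counts by attrition status and by department, computes the turnover rate, and exports the data to CSV for Power BI.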

In [None]:

# Import necessary libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Path of the source Excel workbook.
file_path = '/mnt/data/HR_Analytics- V5.xlsx'

# Read only the worksheet named 'HR_Analytics.csv' (a sheet inside the .xlsx
# workbook, despite the '.csv' in its name) into a DataFrame.
df_hr_analytics = pd.read_excel(io=file_path, sheet_name='HR_Analytics.csv')

# Preview the first five rows as the cell's output.
df_hr_analytics.head(n=5)
    

## Basic Data Exploration

In [None]:

# Structure of the dataset. DataFrame.info() prints its report itself, so it
# is shown regardless of where it sits in the cell.
df_hr_analytics.info()

# Missing values per column. A notebook cell only renders its *last* bare
# expression, so this mid-cell result has to be printed explicitly; otherwise
# it is computed and silently discarded.
print(df_hr_analytics.isnull().sum())

# Summary statistics; kept as the final expression so the notebook renders it
# as a rich table.
df_hr_analytics.describe()
    

## Data Visualization

In [None]:

# Number of employees in each Attrition category, drawn on an explicit
# 8x5-inch figure/axes pair instead of the implicit pyplot "current" figure.
fig, ax = plt.subplots(figsize=(8, 5))
sns.countplot(data=df_hr_analytics, x='Attrition', ax=ax)
ax.set_title('Employee Attrition Count')
plt.show()
    

In [None]:

# Number of employees in each Department, drawn on an explicit 8x5-inch
# figure/axes pair instead of the implicit pyplot "current" figure.
fig, ax = plt.subplots(figsize=(8, 5))
sns.countplot(data=df_hr_analytics, x='Department', ax=ax)
ax.set_title('Employee Distribution by Department')
plt.show()
    

## Custom Metric: Turnover Rate

In [None]:

# Turnover rate: the share of employees whose Attrition value is 'Yes'.
# value_counts(normalize=True) yields each category's fraction of the non-null
# rows. .get() falls back to 0.0 when no row is labelled 'Yes', where plain
# ['Yes'] indexing would raise KeyError.
attrition_shares = df_hr_analytics['Attrition'].value_counts(normalize=True)
turnover_rate = attrition_shares.get('Yes', 0.0)
print(f'Turnover Rate: {turnover_rate * 100:.2f}%')
    

## Export Cleaned Data for Power BI

In [None]:

# Write the DataFrame to a CSV file for import into Power BI. The path is
# relative, and index=False keeps the row index out of the file.
df_hr_analytics.to_csv(path_or_buf='cleaned_hr_analytics.csv', index=False)
    