In [1]:
# Unemployment Analysis with Python

# Importing necessary libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Load the dataset
# NOTE: despite its name, `url` holds a file path that is resolved relative
# to the current working directory, not a web address.
url = "Unemployment in India.csv"
data = pd.read_csv(filepath_or_buffer=url)

# Display dataset preview
def preview_data(data):
    """Print a "Dataset Preview:" heading followed by ``data.head()``.

    Args:
        data: Any object exposing a ``head()`` method (a pandas DataFrame in
            this notebook).

    Returns:
        None. The preview is written to standard output only.
    """
    print("Dataset Preview:")
    first_rows = data.head()
    print(first_rows)

# Show the first rows so the column layout is visible up front
preview_data(data)

# Check for missing values: count the nulls per column once, then report
# either the per-column breakdown or an all-clear message.
missing_per_column = data.isnull().sum()
if missing_per_column.sum() != 0:
    print("Missing values found:")
    print(missing_per_column)
else:
    print("No missing values detected.")

# Basic statistical summary (pandas' describe() output, printed as-is)
print("\nStatistical Summary:")
stats_summary = data.describe()
print(stats_summary)

# Column resolution shared by both plots below
def _find_column(frame, *candidates):
    """Return the label of the first column of ``frame`` matching a candidate.

    Labels are compared after stripping surrounding whitespace, so a header
    such as " Date" still matches "Date" (the spacing of the preview output
    suggests this CSV's headers are padded -- TODO confirm against the file).

    Args:
        frame: DataFrame whose columns are searched.
        *candidates: Acceptable column names, in order of preference.

    Returns:
        The original (unstripped) column label, or ``None`` if no candidate
        is present.
    """
    stripped_to_label = {str(label).strip(): label for label in frame.columns}
    for name in candidates:
        if name in stripped_to_label:
            return stripped_to_label[name]
    return None


# The dataset preview shows the rate column as
# "Estimated Unemployment Rate (%)"; the bare "Unemployment Rate" name is
# still accepted first in case the frame was renamed beforehand.
date_col = _find_column(data, "Date")
rate_col = _find_column(
    data, "Unemployment Rate", "Estimated Unemployment Rate (%)"
)
region_col = _find_column(data, "Region")

# Unemployment trends over time
if date_col is not None and rate_col is not None:
    dates = data[date_col]
    if not pd.api.types.is_datetime64_any_dtype(dates):
        # Dates are written day-first (e.g. 31-05-2019); strip padding and
        # parse explicitly so the day and month are never swapped.
        dates = pd.to_datetime(
            dates.astype("string").str.strip(), dayfirst=True
        )
    data[date_col] = dates
    plt.figure(figsize=(10, 6))
    sns.lineplot(x=date_col, y=rate_col, data=data, marker="o")
    plt.title("Unemployment Rate Over Time")
    plt.xlabel("Date")
    plt.ylabel("Unemployment Rate")
    plt.grid(True)
    plt.show()
else:
    # Make the skip visible instead of silently producing no chart.
    print("Skipping trend plot: date or unemployment-rate column not found.")

# State-wise Unemployment Rate Analysis
if region_col is not None and rate_col is not None:
    # Mean rate per region, sorted ascending so the bars read low-to-high.
    state_data = data.groupby(region_col)[rate_col].mean().sort_values()
    plt.figure(figsize=(12, 8))
    sns.barplot(x=state_data.values, y=state_data.index)
    plt.title("Average Unemployment Rate by State")
    plt.xlabel("Average Unemployment Rate")
    plt.ylabel("State")
    plt.show()
else:
    print("Skipping state-wise plot: region or unemployment-rate column not found.")


Dataset Preview:
           Region         Date  Frequency   Estimated Unemployment Rate (%)  \
0  Andhra Pradesh   31-05-2019    Monthly                              3.65   
1  Andhra Pradesh   30-06-2019    Monthly                              3.05   
2  Andhra Pradesh   31-07-2019    Monthly                              3.75   
3  Andhra Pradesh   31-08-2019    Monthly                              3.32   
4  Andhra Pradesh   30-09-2019    Monthly                              5.17   

    Estimated Employed   Estimated Labour Participation Rate (%)   Area  
0           11999139.0                                     43.24  Rural  
1           11755881.0                                     42.05  Rural  
2           12086707.0                                     43.50  Rural  
3           12285693.0                                     43.97  Rural  
4           12256762.0                                     44.68  Rural  
Missing values found:
Region                                    