# Important Libraries

In [None]:
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
import plotly.express as px
from scipy.stats import ttest_ind
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score

In [None]:
# Read the unemployment CSV into df1, the working DataFrame used by the cells below.
# NOTE(review): the path is anchored at the filesystem root; confirm it matches the runtime environment.
csv_path = '/Unemployment_Rate_upto_11_2020.csv'
df1 = pd.read_csv(csv_path)

# Exploratory Data Analysis

In [None]:
# Preview the first five rows (5 is the pandas default, spelled out here).
df1.head(n=5)

In [None]:
# Preview the last five rows (5 is the pandas default, spelled out here).
df1.tail(n=5)

In [None]:
# Print the (rows, columns) shape, then the per-column dtype / non-null summary.
frame_shape = df1.shape
print(frame_shape)
df1.info()

In [None]:
# Give the two region columns distinct, explicit names.
# NOTE(review): 'Region.1' is presumably the suffix pandas adds to a duplicated
# 'Region' header; verify against the CSV.
region_column_names = {
    'Region': 'Region1',
    'Region.1': 'Region2',
}
df1 = df1.rename(columns=region_column_names)

In [None]:
# Display the column labels of df1 (run after the region columns were renamed).
df1.columns

In [None]:
# Statistical analysis: pairwise correlation between the numeric columns.
# Restrict the frame to numeric dtypes first. df1 also carries non-numeric
# columns (the region columns are used as categories by the plots below), and
# DataFrame.corr() raises on such columns in pandas >= 2.0, where numeric_only
# defaults to False. select_dtypes also works on older pandas versions.
numeric_columns = df1.select_dtypes(include='number')
correlation_matrix = numeric_columns.corr()
print(correlation_matrix)

In [None]:
# Summary statistics of the DataFrame (count, mean, std, min, quartiles, max);
# by default describe() reports on the numeric columns of a mixed-dtype frame.
df1.describe()

# Data Visualization

# Bar plot of Estimated Unemployment Rate in States

In [None]:
# Strip stray leading/trailing whitespace from the header names, in place.
# The plotting cells reference the columns by their stripped names.
df1.columns = df1.columns.str.strip()

# Mean unemployment rate per 'Region1' value, as a two-column DataFrame.
avg_unemployment_rate = df1.groupby('Region1', as_index=False)['Estimated Unemployment Rate (%)'].mean()

# One bar per state, each coloured from the qualitative Set1 palette.
axis_labels = {
    'Estimated Unemployment Rate (%)': 'Average Unemployment Rate (%)',
    'Region1': 'Region',
}
fig = px.bar(
    avg_unemployment_rate,
    x='Region1',
    y='Estimated Unemployment Rate (%)',
    title='Average Unemployment Rate Across Different States',
    labels=axis_labels,
    color='Region1',
    color_discrete_sequence=px.colors.qualitative.Set1,
)

# Tilt the tick labels, blank the x-axis title and set the y-axis title.
layout_options = dict(
    xaxis_tickangle=-45,
    xaxis_title='',
    yaxis_title='Average Unemployment Rate (%)',
)
fig.update_layout(**layout_options)

fig.show()

# Bar plot of Estimated Unemployment Rate in Region

In [None]:
# Mean unemployment rate per 'Region2' value, as a two-column DataFrame.
avg_unemployment_rate = df1.groupby('Region2', as_index=False)['Estimated Unemployment Rate (%)'].mean()

# One bar per region, each coloured from the qualitative Set1 palette.
axis_labels = {
    'Estimated Unemployment Rate (%)': 'Average Unemployment Rate (%)',
    'Region2': 'Region',
}
fig = px.bar(
    avg_unemployment_rate,
    x='Region2',
    y='Estimated Unemployment Rate (%)',
    title='Average Unemployment Rate Across Different Regions',
    labels=axis_labels,
    color='Region2',
    color_discrete_sequence=px.colors.qualitative.Set1,
)

# Tilt the tick labels, blank the x-axis title and set the y-axis title.
layout_options = dict(
    xaxis_tickangle=-45,
    xaxis_title='',
    yaxis_title='Average Unemployment Rate (%)',
)
fig.update_layout(**layout_options)

fig.show()

# Box plot of Estimated Unemployment Rate in States

In [None]:
# Box plot: distribution of the unemployment rate within each 'Region1' value.
axis_labels = {
    'Estimated Unemployment Rate (%)': 'Unemployment Rate (%)',
    'Region1': 'Region',
}
fig = px.box(
    df1,
    x='Region1',
    y='Estimated Unemployment Rate (%)',
    title='Distribution of Unemployment Rate Across Different States',
    labels=axis_labels,
)

# Tilt the tick labels, blank the x-axis title and set the y-axis title.
layout_options = dict(
    xaxis_tickangle=-45,
    xaxis_title='',
    yaxis_title='Unemployment Rate (%)',
)
fig.update_layout(**layout_options)

fig.show()

# Box plot of Estimated Unemployment Rate in Region

In [None]:
# Box plot: distribution of the unemployment rate within each 'Region2' value.
axis_labels = {
    'Estimated Unemployment Rate (%)': 'Unemployment Rate (%)',
    'Region2': 'Region',
}
fig = px.box(
    df1,
    x='Region2',
    y='Estimated Unemployment Rate (%)',
    title='Distribution of Unemployment Rate Across Different Regions',
    labels=axis_labels,
)

# Tilt the tick labels, blank the x-axis title and set the y-axis title.
layout_options = dict(
    xaxis_tickangle=-45,
    xaxis_title='',
    yaxis_title='Unemployment Rate (%)',
)
fig.update_layout(**layout_options)

fig.show()

# Scatter plot of Estimated Unemployment Rate in States

In [None]:
# Scatter plot: one marker per row of df1, placed at its 'Region1' category.
axis_labels = {
    'Estimated Unemployment Rate (%)': 'Unemployment Rate (%)',
    'Region1': 'Region',
}
fig_region1 = px.scatter(
    df1,
    x='Region1',
    y='Estimated Unemployment Rate (%)',
    title='Unemployment Rate Across Different States',
    labels=axis_labels,
)

# Tilt the tick labels and set both axis titles explicitly.
layout_options = dict(
    xaxis_tickangle=-45,
    xaxis_title='States',
    yaxis_title='Unemployment Rate (%)',
)
fig_region1.update_layout(**layout_options)

fig_region1.show()

# Scatter plot of Estimated Unemployment Rate in Region

In [None]:
# Scatter plot: one marker per row of df1, placed at its 'Region2' category.
axis_labels = {
    'Estimated Unemployment Rate (%)': 'Unemployment Rate (%)',
    'Region2': 'Region',
}
fig_region2 = px.scatter(
    df1,
    x='Region2',
    y='Estimated Unemployment Rate (%)',
    title='Unemployment Rate Across Different Regions ',
    labels=axis_labels,
)

# Tilt the tick labels and set both axis titles explicitly.
layout_options = dict(
    xaxis_tickangle=-45,
    xaxis_title='Region',
    yaxis_title='Unemployment Rate (%)',
)
fig_region2.update_layout(**layout_options)

fig_region2.show()

# Histogram of Estimated Unemployment Rate in States

In [None]:
# Histogram with one bin per 'Region1' category, coloured by category.
# NOTE(review): with a y column and no explicit histfunc, Plotly Express
# aggregates by sum, so each bar is the summed rate, not a count or a mean.
# Confirm that this is the intended statistic.
fig = px.histogram(
    df1,
    x='Region1',
    y='Estimated Unemployment Rate (%)',
    color='Region1',
    title='Histogram of Estimated Unemployment Rate in States',
    template='plotly',
)

# Order the x-axis categories from the largest to the smallest bar total.
fig.update_layout(xaxis=dict(categoryorder='total descending'))

fig.show()