In [None]:
import warnings
# Suppress every Python warning for the rest of the session.
# NOTE(review): this blanket filter also hides pandas/matplotlib warnings
# raised by later cells; consider narrowing it to specific categories.
warnings.filterwarnings('ignore')

In [None]:
import numpy as np
import pandas as pd
import scipy.stats as stats
import matplotlib.pyplot as plt
import hvplot.pandas


In [None]:
# Read the minimum-wage records and the per-state coordinate table.
# NOTE(review): both paths are absolute locations on drive E:, so this cell
# only runs on a machine that has these files at exactly these paths.
wage_data = pd.read_csv(r"E:\Minimum Wage Data.csv", encoding="latin1")
state_data = pd.read_csv(r"E:\state_coords.csv", encoding="latin1")

# Inner-join the two tables on their shared "State" column, then drop the
# "Footnote" and "Department.Of.Labor.Uncleaned.Data" columns in one call.
merged_df = (
    wage_data
    .merge(state_data, on="State", how="inner")
    .drop(columns=["Footnote", "Department.Of.Labor.Uncleaned.Data"])
)

# `df` is the working frame used by every later cell.
df = pd.DataFrame(merged_df)
df.head()



In [None]:
# Display the last rows of the merged frame as a quick check of the end of the data.
df.tail()

In [None]:
# State minimum wage (column 'State.Minimum.Wage') for each comparison year.
minimum_wage_1968 = df.loc[df['Year'] == 1968, 'State.Minimum.Wage']
minimum_wage_1994 = df.loc[df['Year'] == 1994, 'State.Minimum.Wage']
minimum_wage_2020 = df.loc[df['Year'] == 2020, 'State.Minimum.Wage']

# One box per year, placed at x = 1, 2, 3.
plt.figure(figsize=(10, 6))
box_positions = [1, 2, 3]
plt.boxplot(
    [minimum_wage_1968, minimum_wage_1994, minimum_wage_2020],
    positions=box_positions,
)

# Name the ticks explicitly instead of passing `labels=` to boxplot: that
# keyword is deprecated in recent Matplotlib releases (renamed `tick_labels`),
# whereas plt.xticks works on old and new versions alike.
plt.xticks(box_positions, ['1968', '1994', '2020'])

# Leave half a unit of padding on either side of the outer boxes.
plt.xlim(0.5, 3.5)

plt.xlabel('Year')
plt.ylabel('Minimum Wage ($)')
plt.title('Minimum Wage Distribution in 1968, 1994, and 2020')
plt.grid(True)
# No plt.legend() here: none of the box-plot artists carries a label, so a
# legend call would only produce an empty legend (and a warning).
plt.show()

In [None]:
# State minimum wage expressed in 2020 dollars, one Series per comparison year.
minimum_wage_1968_inflation = df.loc[df['Year'] == 1968, 'State.Minimum.Wage.2020.Dollars']
minimum_wage_1994_inflation = df.loc[df['Year'] == 1994, 'State.Minimum.Wage.2020.Dollars']
minimum_wage_2020_inflation = df.loc[df['Year'] == 2020, 'State.Minimum.Wage.2020.Dollars']

In [None]:
# Mean 2020-dollar state minimum wage for 1968, 1994 and 2020, in that order.
average_state_minimum_wage_inflation = [
    yearly_wages.mean()
    for yearly_wages in (
        minimum_wage_1968_inflation,
        minimum_wage_1994_inflation,
        minimum_wage_2020_inflation,
    )
]
average_state_minimum_wage_inflation

In [None]:
# Federal minimum wage expressed in 2020 dollars, one Series per comparison year.
# Each Series has one entry per row of `df` for that year.
minimum_wage_1968_fed = df.loc[df['Year'] == 1968, 'Federal.Minimum.Wage.2020.Dollars']
minimum_wage_1994_fed = df.loc[df['Year'] == 1994, 'Federal.Minimum.Wage.2020.Dollars']
minimum_wage_2020_fed = df.loc[df['Year'] == 2020, 'Federal.Minimum.Wage.2020.Dollars']

In [None]:
# Mean 2020-dollar federal minimum wage for 1968, 1994 and 2020, in that order.
average_fed_minimum_wage_inflation = [
    yearly_wages.mean()
    for yearly_wages in (
        minimum_wage_1968_fed,
        minimum_wage_1994_fed,
        minimum_wage_2020_fed,
    )
]
average_fed_minimum_wage_inflation

In [None]:
# X-axis values for both lines. Defined here because the only other
# definition of this name sits in a later cell, which made this cell fail
# with NameError when the notebook is run top to bottom on a fresh kernel.
federal_minimum_wage_years = [1968, 1994, 2020]

# Federal minimum wage in 2020 dollars (averages computed in an earlier cell).
plt.plot(
    federal_minimum_wage_years,
    average_fed_minimum_wage_inflation,
    marker='o',
    color='r',
    label='Federal Minimum Wage (2020$)',
)

# Average state minimum wage in 2020 dollars (averages computed in an earlier cell).
plt.plot(
    federal_minimum_wage_years,
    average_state_minimum_wage_inflation,
    marker='o',
    color='b',
    label='Average State Minimum Wage (2020 $)',
)

plt.xlabel('Year')
plt.ylabel('Inflation Adjusted Minimum Wage (2020 $)')
plt.title('Inflation Adjusted Minimum Wage (2020 $)')
plt.grid(True)
# Fixed y-range; NOTE(review): values outside 4-10 would be clipped from view.
plt.ylim(4, 10)
plt.legend()
plt.show()


In [None]:
# State minimum wage (column 'State.Minimum.Wage') for each comparison year.
minimum_wage_1968 = df.loc[df['Year'] == 1968, 'State.Minimum.Wage']
minimum_wage_1994 = df.loc[df['Year'] == 1994, 'State.Minimum.Wage']
minimum_wage_2020 = df.loc[df['Year'] == 2020, 'State.Minimum.Wage']

# Mean state minimum wage per year, ordered 1968, 1994, 2020.
average_state_minimum_wage = [
    yearly_wages.mean()
    for yearly_wages in (minimum_wage_1968, minimum_wage_1994, minimum_wage_2020)
]

# Years on the x-axis and the hard-coded federal figures plotted against them.
# NOTE(review): these federal values are typed in by hand (originally marked
# as example values); the frame also has a 'Federal.Minimum.Wage' column that
# another cell reads — confirm the two agree.
federal_minimum_wage_years = [1968, 1994, 2020]
federal_minimum_wages = [1.6, 4.25, 7.25]

# Draw the federal line first (red), then the state average (blue).
line_specs = [
    (federal_minimum_wages, 'r', 'Federal Minimum Wage'),
    (average_state_minimum_wage, 'b', 'Average State Minimum Wage'),
]
for wages, line_color, line_label in line_specs:
    plt.plot(federal_minimum_wage_years, wages, marker='o', color=line_color, label=line_label)

plt.title('Minimum Wage Distribution in 1968, 1994, and 2020')
plt.xlabel('Year')
plt.ylabel('Minimum Wage ($)')
plt.grid(True)
plt.legend()
plt.show()

In [None]:
# Print the mean state minimum wage for 1968, 1994 and 2020, one value per line.
for yearly_wages in (minimum_wage_1968, minimum_wage_1994, minimum_wage_2020):
    print(yearly_wages.mean())

In [None]:
# Bare literals: the same three figures that the line-plot cell assigns to
# `federal_minimum_wages` (for 1968, 1994 and 2020). Nothing is stored, and
# only the last expression (7.25) is shown as the cell output.
1.6
4.25
7.25

In [None]:
# One-way ANOVA across the three yearly state-minimum-wage samples.
anova_groups = (minimum_wage_1968, minimum_wage_1994, minimum_wage_2020)
stats.f_oneway(*anova_groups)

In [None]:
# Keep only the rows whose Year is 1994 and display the resulting frame.
is_1994 = df["Year"] == 1994
df_1994 = df.loc[is_1994]
df_1994

In [None]:
# Display the 1994 state minimum wage column on its own.
df_1994.loc[:, "State.Minimum.Wage"]

In [None]:
# Rows for 2020 only. Take an explicit copy: a later cell adds columns to
# this frame, and writing into a filtered slice of `df` is the pattern that
# triggers pandas' SettingWithCopyWarning.
df_2020 = df[df['Year'] == 2020].copy()
df_2020.head()

In [None]:
# Look-up table: state name -> 1994 state minimum wage.
# drop_duplicates keeps the first row per state so the index is unique, which
# Series.map requires of its mapper.
state_min_1994_by_state = (
    df_1994
    .drop_duplicates(subset='State')
    .set_index('State')['State.Minimum.Wage']
)

# Build both derived columns on a new frame instead of writing into a slice.
#  - Difference_2020: state minus federal minimum wage for 2020.
#  - State.Min.1994:  the same state's 1994 minimum wage, matched by state
#    name. A direct `df_2020[...] = df_1994[...]` assignment aligns on the row
#    index, and the 1994 and 2020 rows of `df` never share an index label, so
#    that form fills the column entirely with NaN.
df_2020 = df_2020.assign(
    Difference_2020=df_2020['State.Minimum.Wage'] - df_2020['Federal.Minimum.Wage'],
    **{'State.Min.1994': df_2020['State'].map(state_min_1994_by_state)},
)
df_2020

In [None]:
# Rows of the 2020 frame where Difference_2020 is negative,
# i.e. the state minimum wage is lower than the federal one.
is_below_federal = df_2020['Difference_2020'] < 0
negative_diff_df = df_2020.loc[is_below_federal]

In [None]:
# Bar chart of Difference_2020 for every state in the 2020 frame.
fig, ax = plt.subplots(figsize=(12, 8))
ax.bar(df_2020['State'], df_2020['Difference_2020'], color='skyblue')

ax.set_title('State vs Federal Minimum Wage (2020)')
ax.set_xlabel('State')
ax.set_ylabel('Difference in Minimum Wage ($)')

# Rotate the state names vertically so they do not overlap.
ax.tick_params(axis='x', labelrotation=90)
# Horizontal grid lines only.
ax.grid(axis='y')
plt.show()


In [None]:
# Bar chart restricted to the states whose Difference_2020 is negative.
fig, ax = plt.subplots(figsize=(12, 8))
ax.bar(negative_diff_df['State'], negative_diff_df['Difference_2020'], color='salmon')

ax.set_title('States with Negative Difference in Minimum Wage (2020)')
ax.set_xlabel('State')
ax.set_ylabel('Difference in Minimum Wage ($)')

# Rotate the state names vertically so they do not overlap.
ax.tick_params(axis='x', labelrotation=90)
# Horizontal grid lines only.
ax.grid(axis='y')
plt.show()

In [None]:
# Map of the 2020 rows: one point per row at (longitude, latitude), drawn on
# a geographic plot with "OSM" background tiles, to show regionality.
# NOTE(review): the stated goal for this cell is a 1994-vs-2020 comparison
# with point colour driven by the difference in values. Neither is
# implemented yet — every point uses the default colour. TODO.
map_plot_1 = df_2020.hvplot.points(
    x="longitude",
    y="latitude",
    geo=True,
    tiles="OSM",
)
map_plot_1


In [None]:
# Map of the 1994 rows: one red point per row at (longitude, latitude),
# drawn on a geographic plot with "OSM" background tiles.
map_plot_2 = df_1994.hvplot.points(
    x="longitude",
    y="latitude",
    geo=True,
    tiles="OSM",
    color="red",
)
map_plot_2
