#### Functions for initial exploration

In [None]:
# Preview the unemployment DataFrame by displaying its first five rows
print(unemployment.head(n=5))

In [None]:
# Show a summary of non-missing values and data types in the unemployment DataFrame.
# DataFrame.info() writes the summary to stdout itself and returns None, so it is
# called directly; wrapping it in print() would emit an extra "None" line.
unemployment.info()

In [None]:
# Compute summary statistics for the numerical columns in unemployment, then display them
summary_statistics = unemployment.describe()
print(summary_statistics)

#### Counting categorical values

In [None]:
# Tally how many rows in unemployment belong to each continent, then display the tally
continent_counts = unemployment["continent"].value_counts()
print(continent_counts)

#### Global unemployment in 2021

In [None]:
# Import the required visualization libraries
import seaborn as sns
import matplotlib.pyplot as plt

# Draw a histogram of the 2021 unemployment column; binwidth=1 gives each bin a width of one full percent
sns.histplot(data=unemployment, x="2021", binwidth=1)
plt.show()

#### Detecting data types

In [None]:
# Convert the 2019 column to float and write the result back into the DataFrame
rates_2019 = unemployment["2019"]
unemployment["2019"] = rates_2019.astype(float)

# Display every column's dtype to confirm the conversion
print(unemployment.dtypes)

#### Validating continents

In [None]:
# Define a Series describing whether each continent is outside of Oceania.
# The boolean membership mask is inverted with ~ instead of being compared to False.
not_oceania = ~unemployment["continent"].isin(["Oceania"])

In [None]:
# Flag the rows whose continent is Oceania, then invert the flags
in_oceania = unemployment["continent"].isin(["Oceania"])
not_oceania = ~in_oceania

# Display only the records for countries outside Oceania
print(unemployment.loc[not_oceania])

#### Validating range

In [None]:
# Report the smallest and largest unemployment rates recorded for 2021
rates_2021 = unemployment["2021"]
print(rates_2021.min(), rates_2021.max())

# Draw one box per continent showing the spread of 2021 unemployment rates
sns.boxplot(data=unemployment, x="2021", y="continent")
plt.show()

#### Summaries with .groupby() and .agg()

In [None]:
# Print the mean and standard deviation of rates by year.
# Only numeric columns are aggregated: a text column such as 'continent' cannot be
# averaged, and pandas 2.0+ raises a TypeError instead of silently dropping it.
numeric_rates = unemployment.select_dtypes(include="number")
print(numeric_rates.agg(["mean", "std"]))

In [None]:
# Print yearly mean and standard deviation grouped by continent.
# Aggregation is restricted to the numeric columns so that any non-numeric,
# non-key column (if the DataFrame has one) cannot make 'mean'/'std' fail;
# pandas 2.0+ raises a TypeError rather than silently dropping such columns.
numeric_columns = unemployment.select_dtypes(include="number").columns.tolist()
print(unemployment.groupby("continent")[numeric_columns].agg(["mean", "std"]))

In [None]:
# Group the rows by continent, then build one named summary column per statistic
rates_by_continent = unemployment.groupby("continent")
continent_summary = rates_by_continent.agg(
    # mean_rate_2021: mean of the 2021 column within each continent
    mean_rate_2021=("2021", "mean"),
    # std_rate_2021: standard deviation of the 2021 column within each continent
    std_rate_2021=("2021", "std"),
)
print(continent_summary)

#### Visualizing categorical summaries

In [None]:
# Draw a bar for each continent showing its average 2021 unemployment
sns.barplot(data=unemployment, x="continent", y="2021")
plt.show()