In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

**Summary** - The Worldwide Pollution Trend, explored through Exploratory Data Analysis (EDA), provides a comprehensive overview of air quality patterns across different regions. This analysis involves examining various aspects such as the distribution of Air Quality Index (AQI) values, correlations between pollutant levels, identification of hazardous conditions, and exploration of pollutant relationships through scatterplot matrices.

# **Data Cleaning**

In [None]:
# Location of the AQI-by-city CSV inside the Kaggle input directory.
AQI_CSV_PATH = '/kaggle/input/world-air-quality-index-by-city-and-coordinates/AQI and Lat Long of Countries.csv'

# Read the whole file into a DataFrame and show it as the cell output.
df = pd.read_csv(filepath_or_buffer=AQI_CSV_PATH)
df

In [None]:
# Print each column's dtype and non-null count to spot missing values.
df.info()

In [None]:
# Summary statistics for every column; include='all' also covers the
# non-numeric columns (count / unique / top / freq) alongside the numeric ones.
df.describe(include= 'all')

In [None]:
# Drop rows whose 'Country' is missing; inplace=True modifies df itself,
# so re-running this cell is harmless but the raw frame is not kept.
df.dropna(subset=['Country'], inplace = True)

In [None]:
# Re-check row count and non-null counts after removing rows without a country.
df.info()

In [None]:
# Count rows that exactly repeat an earlier row (all columns are compared).
df.duplicated().sum()

In [None]:
# Keep one row per physical location. A city name alone is not a unique key:
# different places share a name (across countries, or within one country),
# and de-duplicating on 'City' only would silently delete those real
# observations. Country + City + coordinates identifies a location, so only
# genuine repeats of the same place are removed (the first occurrence is kept).
df.drop_duplicates(subset=['Country', 'City', 'lat', 'lng'], inplace=True)

# **Data Visualisation**

In [None]:
# Five countries with the largest summed 'AQI Value'.
#
# Only the 'AQI Value' column is aggregated. A blanket .agg('sum') would also
# "sum" every other column: text columns get concatenated into long strings
# (or raise on mixed/missing values) and coordinates are added together,
# none of which is meaningful. The result therefore has exactly two columns,
# 'Country' and 'AQI Value', which is all the pie chart needs.
#
# NOTE(review): a sum grows with the number of cities recorded per country,
# so this ranks countries by total rather than typical AQI - confirm that is
# the intended metric.
country = (
    df.groupby('Country', as_index=False)['AQI Value']
    .sum()
    .sort_values(by='AQI Value', ascending=False)
    .head(5)
)
country

In [None]:
# Pie chart of each top country's share of the summed AQI values in `country`.
fig, ax = plt.subplots(figsize=(10, 8))

# Pull out only the first (largest) wedge. Building the offsets from the
# number of rows keeps the call valid when fewer than five countries remain.
wedge_offsets = [0.1 if position == 0 else 0 for position in range(len(country))]

ax.pie(
    x=country['AQI Value'],
    labels=country['Country'],
    autopct='%.2f%%',  # wedge labels are percentages, so show the % sign
    shadow=True,
    explode=wedge_offsets,
    colors=['tomato', 'cornflowerblue', 'gold', 'orchid', 'green'],
)
ax.set_title('AQI Value by Country')
plt.show()

In [None]:
# Pairwise correlation between the four pollutant-specific AQI columns.
pollutant_cols = ['CO AQI Value', 'Ozone AQI Value', 'NO2 AQI Value', 'PM2.5 AQI Value']
corr_matrix = df.loc[:, pollutant_cols].corr()

# Annotated heatmap; the colour scale is pinned to [-1, 1] so the diverging
# palette spans the full possible correlation range.
fig, ax = plt.subplots(figsize=(10, 8))
sns.heatmap(corr_matrix, annot=True, cmap='RdYlGn', vmin=-1, vmax=1, ax=ax)
ax.set_title('Correlation Matrix of Pollutant AQI Values')
plt.show()

In [None]:
# Plot every row at its coordinates, coloured by overall AQI category.
fig, ax = plt.subplots(figsize=(16, 8))
sns.scatterplot(data=df, x='lng', y='lat', hue='AQI Category', ax=ax)

# Spell out the axes instead of showing the raw column names.
# Assumes 'lng'/'lat' hold longitude/latitude - confirm against the dataset.
ax.set_xlabel('Longitude')
ax.set_ylabel('Latitude')
ax.set_title('AQI Category Distribution Among Countries')
plt.show()

In [None]:
# Scatter-plot matrix of the pollutant AQI columns, coloured by AQI Category.
# pairplot is a figure-level function that creates its own figure, so no
# plt.figure() call precedes it: that would only leave an empty extra figure
# in the cell output. Panel size is controlled through `height` instead.
sns.pairplot(data=df, vars=['CO AQI Value', 'Ozone AQI Value', 'NO2 AQI Value', 'PM2.5 AQI Value'],
             hue='AQI Category', palette='viridis', height=2.5)

# Title for the whole grid; y slightly above 1 keeps it clear of the top row.
plt.suptitle('Scatter Plot Matrix of Pollutant AQI Values by AQI Category', y=1.02)

# Show the plot
plt.show()

**Conclusion** - Looking at how air quality varies between places, checking how different pollutant levels relate to each other, finding out which areas have really bad air quality, and studying the patterns of pollutants together helps us understand air quality worldwide. These insights can be used to make specific plans to improve the air and reduce the harm that pollution does to people and nature.