In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from datetime import datetime

# Apply seaborn's white-grid theme to every figure drawn below.
sns.set_theme(style="whitegrid")

In [None]:
# Read the CSV and convert its 'Date' column to pandas datetimes in one
# chained expression, then preview the first rows.
df = (
    pd.read_csv('cleaned_covid_data.csv')
    .assign(Date=lambda frame: pd.to_datetime(frame['Date']))
)
df.head()

In [None]:
# Count the missing entries in each column of the loaded frame.
df.isna().sum()

In [None]:
# Sum 'Confirmed' per WHO Region and order the regions from largest to
# smallest total.
# NOTE(review): this adds up every row for a region; if 'Confirmed' holds
# cumulative counts per date, the totals overcount -- confirm against the data.
region_summary = (
    df.groupby('WHO Region')['Confirmed']
    .sum()
    .sort_values(ascending=False)
)

# Draw on an explicit figure/axes pair instead of the implicit pyplot state.
# NOTE(review): recent seaborn releases warn when `palette` is passed without
# `hue`; check the installed version before changing this call.
fig, ax = plt.subplots(figsize=(10, 6))
sns.barplot(
    x=region_summary.index,
    y=region_summary.values,
    palette="viridis",
    ax=ax,
)
ax.set_title("Total Confirmed COVID-19 Cases by WHO Region")
ax.set_ylabel("Total Confirmed Cases")
ax.set_xlabel("WHO Region")
# Tilt the existing x tick labels by 45 degrees.
plt.setp(ax.get_xticklabels(), rotation=45)
fig.tight_layout()
plt.show()

In [None]:
# Sum 'Confirmed' over all rows sharing a date to get one value per date.
date_summary = df.groupby('Date')['Confirmed'].sum()

# Plot the per-date totals as a line on an explicit figure/axes pair.
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(x=date_summary.index, y=date_summary.values, ax=ax)
ax.set_title("Trend of Confirmed COVID-19 Cases Over Time")
ax.set_ylabel("Total Confirmed Cases")
ax.set_xlabel("Date")
# Tilt the existing x tick labels by 45 degrees.
plt.setp(ax.get_xticklabels(), rotation=45)
fig.tight_layout()
plt.show()

In [None]:
# Sum 'Confirmed' per Country/Region and keep the ten largest totals.
# NOTE(review): this adds up every row for a country; if 'Confirmed' holds
# cumulative counts per date, the totals overcount -- confirm against the data.
country_summary = (
    df.groupby('Country/Region')['Confirmed']
    .sum()
    .sort_values(ascending=False)
    .head(10)
)

# Horizontal bars: totals on the x axis, country names on the y axis.
# NOTE(review): recent seaborn releases warn when `palette` is passed without
# `hue`; check the installed version before changing this call.
fig, ax = plt.subplots(figsize=(10, 6))
sns.barplot(
    x=country_summary.values,
    y=country_summary.index,
    palette="magma",
    ax=ax,
)
ax.set_title("Top 10 Countries by Total Confirmed Cases")
ax.set_xlabel("Total Confirmed Cases")
ax.set_ylabel("Country/Region")
fig.tight_layout()
plt.show()

## Conclusion
- The analysis compared total confirmed COVID-19 cases across WHO regions and ranked the ten countries with the highest totals.
- Aggregating confirmed cases by date made the global rise in confirmed cases visible over time.
- This is a basic exploratory analysis that can be extended with additional data such as vaccination, mobility, and testing figures.