#  COVID-19 Global Data Tracker
This notebook analyzes global COVID-19 trends using real-world data.
It includes data cleaning, exploratory data analysis, and visualization of key metrics.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Apply seaborn's 'whitegrid' style to the figures drawn in this notebook.
sns.set(style='whitegrid')

# Read the raw CSV (path is relative to the working directory) into a DataFrame.
DATA_FILE = 'COVID.csv'
df = pd.read_csv(DATA_FILE)

# Show the first few rows as a quick sanity check of the loaded columns.
df.head()

## 🧹 Data Cleaning

In [None]:
# Parse the 'day' column into datetimes. With errors='coerce', values that
# cannot be parsed become NaT instead of raising.
df['day'] = pd.to_datetime(df['day'], errors='coerce')

# Replacement used for missing entries in each column: a placeholder label for
# 'continent', the column median for 'population', and zero for the counters.
fill_values = {
    'continent': 'Unknown',
    'population': df['population'].median(),
    'Recovered': 0,
    'Deaths': 0,
    'Tests': 0,
}

# Assign the filled column back instead of calling fillna(inplace=True) on
# df[column]: that form is chained assignment, which triggers a FutureWarning
# on pandas 2.x and does not modify df at all once Copy-on-Write is enabled.
for column, value in fill_values.items():
    df[column] = df[column].fillna(value)

# Count the missing values that remain in each column.
df.isnull().sum()

## 📊 Data Visualization
### Top 10 Countries by Total COVID-19 Cases

In [None]:
# Order all rows by 'Cases' (largest first) and keep the first ten.
# NOTE(review): this assumes one row per country and no aggregate rows
# (e.g. world or continent totals) in the data - confirm against COVID.csv.
ranked = df.sort_values(by='Cases', ascending=False)
top_cases = ranked.head(10)

# Horizontal bar chart of case counts, one bar per 'country' value.
fig, ax = plt.subplots(figsize=(10, 6))
sns.barplot(data=top_cases, x='Cases', y='country', palette='Reds_r', ax=ax)
ax.set_title('Top 10 Countries by Total COVID-19 Cases')
ax.set_xlabel('Total Cases')
ax.set_ylabel('Country')
fig.tight_layout()
plt.show()

### Total Deaths in Top 10 Countries by Cases

In [None]:
# Horizontal bar chart of 'Deaths' for the rows already selected in top_cases
# (the ten rows with the highest 'Cases').
fig, ax = plt.subplots(figsize=(10, 6))
sns.barplot(data=top_cases, x='Deaths', y='country', palette='Greys_r', ax=ax)
ax.set_title('Total Deaths in Top 10 Countries by Cases')
ax.set_xlabel('Total Deaths')
ax.set_ylabel('Country')
fig.tight_layout()
plt.show()

### Total Tests Conducted in Top 10 Countries by Cases

In [None]:
# Horizontal bar chart of 'Tests' for the rows in top_cases. The selection is
# still the ten rows with the highest 'Cases', not the highest 'Tests'.
fig, ax = plt.subplots(figsize=(10, 6))
sns.barplot(data=top_cases, x='Tests', y='country', palette='Blues_r', ax=ax)
ax.set_title('Total Tests in Top 10 Countries')
ax.set_xlabel('Total Tests')
ax.set_ylabel('Country')
fig.tight_layout()
plt.show()

### Death Rate in Top 10 Countries (Deaths / Cases)

In [None]:
# Death rate = 'Deaths' divided by 'Cases' for each row of top_cases.
# assign() returns a new DataFrame with the extra column, so nothing is
# written into the frame returned by .head(10); writing a column into that
# frame directly can raise SettingWithCopyWarning on pandas versions
# before 3.0.
top_cases = top_cases.assign(
    death_rate=top_cases['Deaths'] / top_cases['Cases']
)

# Horizontal bar chart of the computed death rate, one bar per 'country' value.
plt.figure(figsize=(10, 6))
sns.barplot(data=top_cases, x='death_rate', y='country', palette='Purples_r')
plt.title('Death Rate in Top 10 Countries by Cases')
plt.xlabel('Death Rate')
plt.ylabel('Country')
plt.tight_layout()
plt.show()