# 📊 COVID-19 Global Data Tracker
This notebook analyzes global COVID-19 data (cases, deaths, and vaccinations) across selected countries.

In [None]:
# 📥 Importing libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Apply seaborn's 'darkgrid' theme globally so every figure drawn later in
# the notebook shares the same look.
sns.set(style='darkgrid')

In [None]:
# 📂 Load the dataset
# The path is relative, so the CSV must be in the working directory the
# kernel was started from (normally the folder containing this notebook).
csv_path = 'owid-covid-data.csv'
df = pd.read_csv(csv_path)

# Preview the first rows to confirm the file parsed as expected.
df.head()

In [None]:
# 🧹 Data Cleaning & Preparation
# Produces `countries` (the locations analysed) and `df_filtered` (one row per
# country and date, restricted to the columns used by the plots below).

# Parse dates once so plots get a real time axis instead of string labels.
df['date'] = pd.to_datetime(df['date'])

countries = ['Kenya', 'United States', 'India']
keep_columns = ['date', 'location', 'total_cases', 'new_cases', 'total_deaths', 'total_vaccinations']

# Select rows and columns in one step, drop days with no case count, and take
# an explicit copy so the column assignment below never writes into a view of `df`.
df_filtered = (
    df.loc[df['location'].isin(countries), keep_columns]
    .dropna(subset=['total_cases'])
    .copy()
)

# Cumulative totals are not reported every day. Filling those gaps with 0 would
# make a running total appear to drop to zero between reports, so carry the last
# reported value forward within each country instead. Sorting by date happens on
# a temporary view; the result is aligned back on the index, so the row order of
# `df_filtered` is left unchanged.
carry_forward = ['total_deaths', 'total_vaccinations']
df_filtered[carry_forward] = (
    df_filtered.sort_values('date')
    .groupby('location')[carry_forward]
    .ffill()
)

# Whatever is still missing is either a day before the first report of a
# cumulative total or an unreported daily `new_cases` value; 0 is used for both.
df_filtered = df_filtered.fillna(0)
df_filtered.head()

In [None]:
# 📈 Plot: Total Cases Over Time
# Draw one line per country on a single shared axes.
fig, ax = plt.subplots(figsize=(10, 5))
for country in countries:
    country_rows = df_filtered.loc[df_filtered['location'] == country]
    ax.plot(country_rows['date'], country_rows['total_cases'], label=country)

# Title, axis labels and legend so the figure can be read on its own.
ax.set_title('Total COVID-19 Cases Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Total Cases')
ax.legend()
fig.tight_layout()
plt.show()

In [None]:
# 💉 Vaccination Analysis
# Draw one line per country showing the total_vaccinations column over time.
fig, ax = plt.subplots(figsize=(10, 5))
for country in countries:
    is_country = df_filtered['location'] == country
    country_rows = df_filtered[is_country]
    ax.plot(country_rows['date'], country_rows['total_vaccinations'], label=country)

# Set title and axis labels in one call, then add the legend.
ax.set(
    title='Total Vaccinations Over Time',
    xlabel='Date',
    ylabel='Total Vaccinations',
)
ax.legend()
fig.tight_layout()
plt.show()

## 📝 Summary of Insights
- India recorded the highest cumulative vaccination total of the three countries plotted.
- The United States showed early growth in both cases and vaccinations.
- Kenya's vaccination curve was much flatter than the other two, possibly reflecting delayed access to vaccines.
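- Death-to-case ratios varied widely by country and over time. This ratio is not plotted above; compute `total_deaths / total_cases` from `df_filtered` to verify it.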
