# COVID-19 Global Data Tracker

In this notebook, we analyze global COVID-19 trends using data from **Our World in Data**, focusing on three countries: Nigeria, the United States, and India. We'll explore metrics such as cases, deaths, recoveries, and vaccinations across these countries.

In [1]:
# 1. Import Libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import plotly.express as px

# Set visualization style
# Matplotlib 3.6 renamed its bundled seaborn styles to 'seaborn-v0_8-*' and
# later releases dropped the old names, so a hard-coded 'seaborn-darkgrid'
# raises OSError on current installs. Use whichever spelling this matplotlib
# provides, falling back to the default style if neither is present.
_darkgrid_style = next(
    (
        style_name
        for style_name in ('seaborn-v0_8-darkgrid', 'seaborn-darkgrid')
        if style_name in plt.style.available
    ),
    'default',
)
plt.style.use(_darkgrid_style)

## 2. Data Loading

In [2]:
# Read the CSV at `data_path` into the raw DataFrame used by later cells.
data_path = 'data/owid-covid-data.csv'
df = pd.read_csv(data_path)

# Report the frame's dimensions, then its column labels.
print("Data Shape:", df.shape)
print("\nColumns in the Dataset:", df.columns, sep="\n")

# Count missing entries per column, most incomplete columns first.
missing_counts = df.isna().sum().sort_values(ascending=False)
print("\nMissing Values:", missing_counts, sep="\n")

# Leave the first five rows as the cell's displayed output.
df.head(5)

## 3. Data Cleaning & Preparation

In [3]:
# Filter for selected countries
countries = ['Nigeria', 'United States', 'India']

# Build the working frame in a single chain from the untouched `df`, so that
# re-running this cell always gives the same result: keep only the selected
# countries, parse 'date' to datetime, and order rows chronologically within
# each country so the forward-fill below moves through time.
df_filtered = (
    df[df['location'].isin(countries)]
    .assign(date=lambda frame: pd.to_datetime(frame['date']))
    .sort_values(['location', 'date'])
)

# Fill missing numeric values
# Forward-fill is applied per country: a frame-wide ffill would copy the last
# values of one country into the leading gaps of the next country's rows.
# Gaps that remain (no earlier observation for that country) become 0.
# Non-numeric columns are left as they are so text fields are not set to 0.
numeric_cols = df_filtered.select_dtypes(include='number').columns.tolist()
if numeric_cols:
    df_filtered[numeric_cols] = (
        df_filtered.groupby('location')[numeric_cols].ffill().fillna(0)
    )

# Check the cleaned data
df_filtered.head()

## 4. Exploratory Data Analysis (EDA)

In [4]:
# Draw one total-cases line per selected country on a shared set of axes.
fig, ax = plt.subplots(figsize=(12, 6))
for country in countries:
    # Rows belonging to the current country only.
    country_data = df_filtered.loc[df_filtered['location'] == country]
    ax.plot(country_data['date'], country_data['total_cases'], label=country)

# Label the figure so it can be read on its own.
ax.set_title('Total COVID-19 Cases Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Total Cases')
ax.legend()
plt.show()

## 5. Key Insights

In [5]:
# Narrative takeaways, printed one per line beneath a heading.
key_insights = (
    "1. Nigeria had significantly fewer cases compared to India and the United States.",
    "2. The United States had the highest number of cases, but vaccination rollout was quicker.",
    "3. India saw a rapid increase in cases during mid-2021, particularly between April and May.",
    "4. Death rates varied significantly, with early surges in some countries.",
    "5. Vaccination coverage remains uneven across the selected countries.",
)
print("\nKey Insights:")
print(*key_insights, sep="\n")