# COVID-19 Global Data Tracker
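This notebook analyzes COVID-19 trends from the `owid-covid-data.csv` dataset, focusing on total cases and vaccination progress in Kenya, the United States, and India.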

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

## Step 1: Load the Data

In [None]:
# Read the CSV from the working directory into the notebook-wide DataFrame.
df = pd.read_csv(filepath_or_buffer='owid-covid-data.csv')
# Preview the first five rows as the cell output.
df.head(n=5)

## Step 2: Explore the Data

In [None]:
# Structural overview: the column index first, then missing values per column.
for overview in (df.columns, df.isna().sum()):
    print(overview)
# Last expression: summary statistics rendered as the cell output.
df.describe()

## Step 3: Clean the Data

In [None]:

# Step 3 cleaning: parse dates, keep the countries of interest, drop rows that
# lack the core metrics, then fill the remaining gaps in numeric columns.
countries = ['Kenya', 'United States', 'India']

df['date'] = pd.to_datetime(df['date'])
df = (
    df[df['location'].isin(countries)]
    .dropna(subset=['date', 'total_cases', 'total_deaths'])
    # Chronological order within each country is required for the forward
    # fill below to carry values in the right direction.
    .sort_values(['location', 'date'])
)

# NOTE(review): total_vaccinations is presumably a running total that is not
# reported every day -- confirm against the dataset. Filling its gaps with 0
# would draw false drops to zero in the Step 5 plot, so carry the last
# reported value forward within each country instead. Rows before a country's
# first report stay NaN here and become 0 in the numeric fill below.
if 'total_vaccinations' in df.columns:
    df['total_vaccinations'] = (
        df.groupby('location')['total_vaccinations'].ffill()
    )

# Zero-fill numeric columns only: a blanket fillna(0) would also write the
# integer 0 into text columns (for example iso_code, used by the map cell).
numeric_cols = df.select_dtypes(include='number').columns
df[numeric_cols] = df[numeric_cols].fillna(0)


## Step 4: Total COVID-19 Cases Over Time

In [None]:

# One total_cases line per selected country, drawn on a single shared axis.
fig, ax = plt.subplots()
for country in countries:
    country_rows = df.loc[df['location'] == country]
    ax.plot(country_rows['date'], country_rows['total_cases'], label=country)
ax.set_title("Total COVID-19 Cases Over Time")
ax.set_xlabel("Date")
ax.set_ylabel("Total Cases")
ax.legend()
plt.show()


## Step 5: Vaccination Progress Over Time

In [None]:

# One total_vaccinations line per selected country, drawn on a single shared axis.
fig, ax = plt.subplots()
for country in countries:
    country_rows = df.loc[df['location'] == country]
    ax.plot(country_rows['date'], country_rows['total_vaccinations'], label=country)
ax.set_title("Vaccination Progress Over Time")
ax.set_xlabel("Date")
ax.set_ylabel("Total Vaccinations")
ax.legend()
plt.show()


## Optional: Choropleth Map (requires Plotly)

In [None]:

# Imported here rather than at the top of the notebook because Plotly is only
# needed for this optional cell.
import plotly.express as px

# Use the most recent row of each location. Filtering on the single global
# latest date would drop every location whose last record is older than that
# date, leaving it blank on the map.
latest = (
    df.sort_values('date')
      .drop_duplicates(subset='location', keep='last')
)

# Colour each location (matched through its iso_code) by its latest total_cases.
fig = px.choropleth(
    latest,
    locations="iso_code",
    color="total_cases",
    hover_name="location",
    color_continuous_scale="Reds",
    title="Total COVID-19 Cases by Country",
)
fig.show()


## Summary & Insights
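- **TODO (fill in after running the notebook):** Country X had the fastest vaccine rollout (compare the curves in Step 5).
- **TODO:** Country Y experienced a significant wave in month Z (look for the steepest rise in Step 4).
- **TODO:** Death rates varied significantly by region. (Death rates are not computed in this notebook yet; derive them, e.g. `total_deaths / total_cases`, before keeping this claim.)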