In [None]:
import pandas as pd

# Load the dataset (path is relative to the working directory) into a DataFrame.
df = pd.read_csv(filepath_or_buffer='owid-covid-data.csv')

# Preview the first five rows; as the last expression of the cell this is
# what a notebook renders as the cell output.
df.head(n=5)

## Data Cleaning

In [None]:
# Parse the date strings into datetimes so the plots get a proper time axis.
df['date'] = pd.to_datetime(df['date'])

# Restrict the analysis to the countries of interest.
countries = ['Kenya', 'United States', 'India']

# Sort chronologically within each country so the forward-fill below carries
# values in date order; .copy() gives an independent frame so later column
# assignments never write into a view of `df`.
df_filtered = (
    df[df['location'].isin(countries)]
    .sort_values(['location', 'date'])
    .copy()
)

# The total_* columns are plotted as running totals. A gap in a running total
# most plausibly means "not reported that day", not "the total fell to zero",
# so carry the last known value forward per country instead of zero-filling
# (zero-filling makes the line plots drop to 0 on every unreported day).
# NOTE(review): assumes these columns are cumulative counts -- confirm against
# the dataset's codebook.
cumulative_cols = [
    col
    for col in ('total_cases', 'total_deaths', 'total_vaccinations')
    if col in df_filtered.columns
]
if cumulative_cols:
    df_filtered[cumulative_cols] = (
        df_filtered.groupby('location')[cumulative_cols].ffill()
    )

# Anything still missing (values before a country's first report, and gaps in
# every other column) is filled with 0, as before.
df_filtered = df_filtered.fillna(0)

## Exploratory Data Analysis (EDA)

In [None]:
import matplotlib.pyplot as plt
import seaborn as sns

# Total cases over time, one line per location, drawn on an explicit Axes.
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(data=df_filtered, x='date', y='total_cases', hue='location', ax=ax)
ax.set_title('Total COVID-19 Cases Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Total Cases')
ax.grid(True)
plt.show()

# Total deaths over time, one line per location, drawn on an explicit Axes.
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(data=df_filtered, x='date', y='total_deaths', hue='location', ax=ax)
ax.set_title('Total COVID-19 Deaths Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Total Deaths')
ax.grid(True)
plt.show()

# Daily new cases over time, one line per location, for side-by-side comparison.
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(data=df_filtered, x='date', y='new_cases', hue='location', ax=ax)
ax.set_title('Daily New COVID-19 Cases Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('New Cases')
ax.grid(True)
plt.show()

# Calculate death rate: total deaths as a percentage of total cases.
# Rows with no recorded cases have an undefined ratio. Masking the zero
# denominator to NaN first makes both 0/0 and n/0 come out as NaN, which the
# fillna(0) then maps to 0. Without the mask, n/0 yields +inf, which fillna
# does not touch and which would distort the death-rate plot.
reported_cases = df_filtered['total_cases'].where(df_filtered['total_cases'] > 0)
df_filtered['death_rate'] = (
    df_filtered['total_deaths'] / reported_cases * 100
).fillna(0)

# Death rate (the 'death_rate' column, in percent) over time, one line per location.
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(data=df_filtered, x='date', y='death_rate', hue='location', ax=ax)
ax.set_title('COVID-19 Death Rate Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Death Rate (%)')
ax.grid(True)
plt.show()

## Visualizing Vaccination Progress

In [None]:
# Cumulative vaccinations over time, one line per location, drawn on an explicit Axes.
fig, ax = plt.subplots(figsize=(12, 6))
sns.lineplot(data=df_filtered, x='date', y='total_vaccinations', hue='location', ax=ax)
ax.set_title('Total COVID-19 Vaccinations Over Time')
ax.set_xlabel('Date')
ax.set_ylabel('Total Vaccinations')
ax.grid(True)
plt.show()

## Insights & Reporting

### Key Insights:

*   **Insight 1:** [Summarize a key trend from total cases or deaths over time.]
*   **Insight 2:** [Compare daily new cases between countries and highlight any significant differences.]
*   **Insight 3:** [Discuss the death rate trends and any notable observations.]
*   **Insight 4:** [Analyze the vaccination progress and compare it across countries.]

### Conclusion:

This notebook provides an exploratory data analysis of COVID-19 trends (cases, deaths, and vaccination progress) in three selected countries: Kenya, the United States, and India. The visualizations highlight key patterns and differences across these countries. Further analysis could involve more detailed statistical modeling, forecasting, or exploring additional variables in the dataset.