# Covid-19 Data Analysis

Analyze real-time Covid-19 data to uncover trends and understand the impact of various factors like vaccination and lockdowns.

## 1. Import Libraries

In [ ]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

## 2. Load Data

In [ ]:
# Load the raw dataset. Update the path to your actual data file.
df = pd.read_csv('../data/covid_data.csv')

# Preview the first rows to sanity-check the parsed columns.
print(df.head())

# DataFrame.info() writes its report to stdout itself and returns None,
# so it is called directly; wrapping it in print() would add a stray "None".
df.info()

## 3. Data Cleaning
- Handle missing values
- Format columns correctly

In [ ]:
# Simple forward fill for missing data: each missing value takes the last
# valid value above it in the same column. DataFrame.ffill() replaces the
# deprecated fillna(method='ffill') spelling and behaves the same way.
# Leading missing values (with nothing above them) are left untouched.
df.ffill(inplace=True)
# Additional cleaning steps depending on your data can be added here

## 4. Exploratory Data Analysis (EDA)
- Visualize cases, deaths, recoveries
- Plot trends over time

In [ ]:
# The CSV is loaded without date parsing, so 'date' holds plain strings.
# Converting to datetimes gives matplotlib a real time axis (evenly spaced,
# sensibly thinned ticks) instead of one categorical tick per row.
# The parsed values are kept in a local variable so `df` itself is unchanged.
dates = pd.to_datetime(df['date'])

plt.figure(figsize=(12, 6))

# One line per metric, all sharing the same time axis.
for column, label in (
    ('cases', 'Cases'),
    ('deaths', 'Deaths'),
    ('recoveries', 'Recoveries'),
):
    plt.plot(dates, df[column], label=label)

plt.xlabel('Date')
plt.ylabel('Count')
plt.title('Covid-19 Cases, Deaths, and Recoveries Over Time')
plt.legend()
plt.xticks(rotation=45)  # slant the tick labels so dates do not overlap
plt.tight_layout()
plt.show()

## 5. Correlation Analysis
- Explore relationships between variables like vaccination rates and case counts

In [ ]:
# The vaccination column is optional; skip the plot entirely when the
# dataset does not provide it.
has_vaccination_data = 'vaccination_rate' in df.columns

if has_vaccination_data:
    # Scatter of case counts against vaccination rate, one point per row.
    plt.figure(figsize=(8, 6))
    sns.scatterplot(
        data=df,
        x='vaccination_rate',
        y='cases',
    )
    plt.title('Vaccination Rate vs Cases')
    plt.show()

## 6. Summary Statistics
Display basic statistics to summarize data.

In [ ]:
# Build the descriptive-statistics table for the dataset, then print it.
summary_stats = df.describe()
print(summary_stats)