# 03. Country Analysis

This notebook provides a detailed look at COVID-19 statistics by country.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import os

# Directory holding the CSV inputs, relative to this notebook's location.
data_dir = "../archive"

# Apply seaborn's "whitegrid" style to every figure drawn below.
sns.set(style="whitegrid")

## 1. Load Data

In [None]:
# Resolve both input files against the configured data directory.
country_wise_path = os.path.join(data_dir, "country_wise_latest.csv")
full_grouped_path = os.path.join(data_dir, "full_grouped.csv")

# Per-country table, used for the ranking and mortality charts.
country_wise = pd.read_csv(country_wise_path)

# Dated per-country table; 'Date' is converted to datetime so it plots as a
# time axis rather than as strings.
full_grouped = pd.read_csv(full_grouped_path).assign(
    Date=lambda frame: pd.to_datetime(frame['Date'])
)

## 2. Top 10 Countries - Total Cases

In [None]:
# Ten rows with the largest 'Confirmed' values, largest first.
# `top_countries` is reused by the trajectory and mortality cells further down.
top_countries = country_wise.nlargest(10, 'Confirmed')

fig, ax = plt.subplots(figsize=(12, 6))
# seaborn 0.13 deprecates passing `palette` without `hue` (slated for removal
# in 0.14). Mapping `hue` to the same column as `y` keeps one colour per bar;
# `dodge=False` keeps the bars full-width on releases that would otherwise
# offset them per hue level.
sns.barplot(
    x='Confirmed',
    y='Country/Region',
    hue='Country/Region',
    dodge=False,
    data=top_countries,
    palette='viridis',
    ax=ax,
)
# Older seaborn releases draw a legend for `hue`; it would only repeat the
# y-axis labels, so drop it when present.
redundant_legend = ax.get_legend()
if redundant_legend is not None:
    redundant_legend.remove()

ax.set_title('Top 10 Countries by Confirmed Cases')
ax.set_xlabel('Confirmed Cases')
ax.set_ylabel('Country')
plt.show()

## 3. Case Trajectory for Top 5 Countries

In [None]:
# Names of the first five rows of `top_countries` (already ordered by
# descending 'Confirmed').
top_5_names = top_countries['Country/Region'].iloc[:5].tolist()

# Keep only the dated rows that belong to those five countries.
in_top_5 = full_grouped['Country/Region'].isin(top_5_names)
top_5_data = full_grouped.loc[in_top_5]

# One line per country: confirmed count against date.
fig, ax = plt.subplots(figsize=(14, 7))
sns.lineplot(
    data=top_5_data,
    x='Date',
    y='Confirmed',
    hue='Country/Region',
    ax=ax,
)
ax.set_title('Trajectory of Confirmed Cases for Top 5 Countries')
plt.show()

## 4. Deaths per 100 Cases (Mortality Rate)
Compares deaths per 100 confirmed cases across the ten countries with the most confirmed cases, sorted from the highest rate to the lowest.

In [None]:
# Order the top-10 frame so the highest deaths-per-100-cases value is drawn first.
top_by_mortality = top_countries.sort_values('Deaths / 100 Cases', ascending=False)

fig, ax = plt.subplots(figsize=(12, 6))
# seaborn 0.13 deprecates passing `palette` without `hue` (slated for removal
# in 0.14). Mapping `hue` to the same column as `y` keeps one colour per bar;
# `dodge=False` keeps the bars full-width on releases that would otherwise
# offset them per hue level.
sns.barplot(
    x='Deaths / 100 Cases',
    y='Country/Region',
    hue='Country/Region',
    dodge=False,
    data=top_by_mortality,
    palette='Reds_r',
    ax=ax,
)
# Older seaborn releases draw a legend for `hue`; it would only repeat the
# y-axis labels, so drop it when present.
redundant_legend = ax.get_legend()
if redundant_legend is not None:
    redundant_legend.remove()

ax.set_title('Mortality Rate (Deaths / 100 Cases) in Top 10 Affected Countries')
plt.show()