# COVID-19 Interactive Analysis Dashboard

## What is COVID-19?
> Coronaviruses are a large family of viruses that may cause respiratory illnesses in humans ranging from common colds to more severe conditions such as Severe Acute Respiratory Syndrome (SARS) and Middle Eastern Respiratory Syndrome (MERS).1 'Novel coronavirus' is a new, previously unidentified strain of coronavirus. The novel coronavirus involved in the current outbreak has been named SARS-CoV-2 by the World Health Organization (WHO). 3The disease it causes has been named “coronavirus disease 2019” (or “COVID-19”).



<img src = "covid.jpg">

In [1]:
# IMPORTING THE DEPENDENCIES

from __future__ import print_function
from ipywidgets import interact, interactive, fixed, interact_manual
from IPython.core.display import display, HTML

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import plotly.express as px
import folium
import plotly.graph_objects as go
import seaborn as sns
import ipywidgets as widgets

In [2]:
# LOADING THE DATA 

death_df = pd.read_csv('https://raw.githubusercontent.com/CSSEGISandData/COVID-19/master/csse_covid_19_data/csse_covid_19_time_series/time_series_covid19_deaths_global.csv')
confirmed_df = pd.read_csv('https://raw.githubusercontent.com/CSSEGISandData/COVID-19/master/csse_covid_19_data/csse_covid_19_time_series/time_series_covid19_confirmed_global.csv')
recovered_df = pd.read_csv('https://raw.githubusercontent.com/CSSEGISandData/COVID-19/master/csse_covid_19_data/csse_covid_19_time_series/time_series_covid19_recovered_global.csv')
country_df = pd.read_csv('https://raw.githubusercontent.com/CSSEGISandData/COVID-19/web-data/data/cases_country.csv')

In [3]:
death_df.head() # FIRST FIVE RECORDS

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,...,2/25/22,2/26/22,2/27/22,2/28/22,3/1/22,3/2/22,3/3/22,3/4/22,3/5/22,3/6/22
0,,Afghanistan,33.93911,67.709953,0,0,0,0,0,0,...,7579,7585,7593,7598,7609,7617,7619,7619,7622,7623
1,,Albania,41.1533,20.1683,0,0,0,0,0,0,...,3458,3458,3464,3469,3472,3474,3474,3478,3478,3482
2,,Algeria,28.0339,1.6596,0,0,0,0,0,0,...,6823,6828,6831,6835,6840,6843,6848,6852,6853,6855
3,,Andorra,42.5063,1.5218,0,0,0,0,0,0,...,151,151,151,151,151,151,151,151,151,151
4,,Angola,-11.2027,17.8739,0,0,0,0,0,0,...,1899,1899,1899,1900,1900,1900,1900,1900,1900,1900


In [4]:
confirmed_df.head()

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,...,2/25/22,2/26/22,2/27/22,2/28/22,3/1/22,3/2/22,3/3/22,3/4/22,3/5/22,3/6/22
0,,Afghanistan,33.93911,67.709953,0,0,0,0,0,0,...,173084,173146,173395,173659,173879,174073,174214,174214,174331,174582
1,,Albania,41.1533,20.1683,0,0,0,0,0,0,...,271141,271141,271527,271563,271702,271825,271825,272030,272030,272210
2,,Algeria,28.0339,1.6596,0,0,0,0,0,0,...,264706,264778,264855,264936,265010,265079,265130,265186,265227,265265
3,,Andorra,42.5063,1.5218,0,0,0,0,0,0,...,37999,37999,37999,37999,38165,38249,38342,38434,38434,38434
4,,Angola,-11.2027,17.8739,0,0,0,0,0,0,...,98701,98701,98701,98741,98746,98746,98746,98796,98796,98806


In [5]:
recovered_df.head()

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,...,2/25/22,2/26/22,2/27/22,2/28/22,3/1/22,3/2/22,3/3/22,3/4/22,3/5/22,3/6/22
0,,Afghanistan,33.93911,67.709953,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
1,,Albania,41.1533,20.1683,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
2,,Algeria,28.0339,1.6596,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
3,,Andorra,42.5063,1.5218,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0
4,,Angola,-11.2027,17.8739,0,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,0


In [6]:
country_df.head()

Unnamed: 0,Country_Region,Last_Update,Lat,Long_,Confirmed,Deaths,Recovered,Active,Incident_Rate,People_Tested,People_Hospitalized,Mortality_Rate,UID,ISO3,Cases_28_Days,Deaths_28_Days
0,Afghanistan,2022-03-07 18:21:02,33.93911,67.709953,175000,7626,,,449.543945,,,4.357714,4,AFG,8391,191
1,Albania,2022-03-07 18:21:02,41.1533,20.1683,272210,3482,,,9458.961707,,,1.279159,8,ALB,7586,102
2,Algeria,2022-03-07 18:21:02,28.0339,1.6596,265265,6855,,,604.922898,,,2.584208,12,DZA,7289,209
3,Andorra,2022-03-07 18:21:02,42.5063,1.5218,38434,151,,,49743.091956,,,0.392881,20,AND,1835,4
4,Angola,2022-03-07 18:21:02,-11.2027,17.8739,98806,1900,,,300.630421,,,1.92296,24,AGO,442,4


In [7]:
# DATA CLEANING

country_df.columns = map(str.lower, country_df.columns)
print("Country Columns :",country_df.columns)

confirmed_df.columns = map(str.lower, confirmed_df.columns)
print("Confirmed Columns :",confirmed_df.columns)

recovered_df.columns = map(str.lower, recovered_df.columns)
print("Recovered Columns :",recovered_df.columns)

death_df.columns = map(str.lower, death_df.columns)
print("Death Columns :",death_df.columns)

Country Columns : Index(['country_region', 'last_update', 'lat', 'long_', 'confirmed', 'deaths',
       'recovered', 'active', 'incident_rate', 'people_tested',
       'people_hospitalized', 'mortality_rate', 'uid', 'iso3', 'cases_28_days',
       'deaths_28_days'],
      dtype='object')
Confirmed Columns : Index(['province/state', 'country/region', 'lat', 'long', '1/22/20', '1/23/20',
       '1/24/20', '1/25/20', '1/26/20', '1/27/20',
       ...
       '2/25/22', '2/26/22', '2/27/22', '2/28/22', '3/1/22', '3/2/22',
       '3/3/22', '3/4/22', '3/5/22', '3/6/22'],
      dtype='object', length=779)
Recovered Columns : Index(['province/state', 'country/region', 'lat', 'long', '1/22/20', '1/23/20',
       '1/24/20', '1/25/20', '1/26/20', '1/27/20',
       ...
       '2/25/22', '2/26/22', '2/27/22', '2/28/22', '3/1/22', '3/2/22',
       '3/3/22', '3/4/22', '3/5/22', '3/6/22'],
      dtype='object', length=779)
Death Columns : Index(['province/state', 'country/region', 'lat', 'long', '1/22/2

In [8]:
confirmed_df = confirmed_df.rename(columns = {'provision/state' : 'state', 'country/region' : 'country'})

recovered_df = confirmed_df.rename(columns={'province/state': 'state', 'country/region': 'country'})

death_df = death_df.rename(columns={'province/state': 'state', 'country/region': 'country'})

country_df = country_df.rename(columns={'country_region': 'country'})

In [9]:
# total number of confirmed, death and recovered cases

confirmed_total = int(country_df['confirmed'].sum())
deaths_total = int(country_df['deaths'].sum())
recovered_total = int(country_df['recovered'].sum())
active_total = int(country_df['active'].sum())

In [24]:
confirmed_df.dropna(inplace = True)

In [10]:
# displaying the total stats

display(HTML("<div style = 'background-color: #504e4e; padding: 30px '>" +
             "<span style='color: #fff; font-size:30px;'> Confirmed: "  + str(confirmed_total) +"</span>" +
             "<span style='color: red; font-size:30px;margin-left:20px;'> Deaths: " + str(deaths_total) + "</span>"+
             "<span style='color: lightgreen; font-size:30px; margin-left:20px;'> Recovered: " + str(recovered_total) + "</span>"+
             "</div>")
       )

# COVID-19 Confirmed/Death/Recovered Cases By Countries

## Enter number of countries you want the data for 

In [11]:
# sorting the values by confirmed descednding order
# country_df.sort_values('confirmed', ascending= False).head(10).style.background_gradient(cmap='copper')

fig = go.FigureWidget( layout=go.Layout() )
def highlight_col(x):
    r = 'background-color: red'
    y = 'background-color: purple'
    g = 'background-color: grey'
    df1 = pd.DataFrame('', index=x.index, columns=x.columns)
    df1.iloc[:, 4] = y
    df1.iloc[:, 5] = r
    df1.iloc[:, 6] = g
    
    return df1

def show_latest_cases(n):
    n = int(n)
    return country_df.sort_values('confirmed', ascending= False).head(n).style.apply(highlight_col, axis=None)

interact(show_latest_cases, n='10')

ipywLayout = widgets.Layout(border='solid 2px green')
ipywLayout.display='none' # uncomment this, run cell again - then the graph/figure disappears
widgets.VBox([fig], layout=ipywLayout)

interactive(children=(Text(value='10', description='n'), Output()), _dom_classes=('widget-interact',))

VBox(children=(FigureWidget({
    'data': [], 'layout': {'template': '...'}
}),), layout=Layout(border='solid …

In [12]:
sorted_country_df = country_df.sort_values('confirmed', ascending= False)

## Slide to check for the worst hit countries

In [13]:
# plotting the 20 worst hit countries

def bubble_chart(n):
    fig = px.scatter(sorted_country_df.head(n), x="country", y="confirmed", size="confirmed", color="country",
               hover_name="country", size_max=60)
    fig.update_layout(
    title=str(n) +" Worst hit countries",
    xaxis_title="Countries",
    yaxis_title="Confirmed Cases",
    width = 700
    )
    fig.show();

interact(bubble_chart, n=10)

ipywLayout = widgets.Layout(border='solid 2px green')
ipywLayout.display='none'
widgets.VBox([fig], layout=ipywLayout)

interactive(children=(IntSlider(value=10, description='n', max=30, min=-10), Output()), _dom_classes=('widget-…

VBox(children=(FigureWidget({
    'data': [], 'layout': {'template': '...'}
}),), layout=Layout(border='solid …

In [14]:
def plot_cases_of_a_country(country):
    labels = ['confirmed', 'deaths']
    colors = ['blue', 'red']
    mode_size = [6, 8]
    line_size = [4, 5]
    
    df_list = [confirmed_df, death_df]
    
    fig = go.Figure();
    
    for i, df in enumerate(df_list):
        if country == 'World' or country == 'world':
            x_data = np.array(list(df.iloc[:, 20:].columns))
            y_data = np.sum(np.asarray(df.iloc[:,4:]),axis = 0)
            
        else:    
            x_data = np.array(list(df.iloc[:, 20:].columns))
            y_data = np.sum(np.asarray(df[df['country'] == country].iloc[:,20:]),axis = 0)
        print(i)
        fig.add_trace(go.Scatter(x=x_data, y=y_data, mode='lines+markers',
        name=labels[i],
        line=dict(color=colors[i], width=line_size[i]),
        connectgaps=True,
        text = "Total " + str(labels[i]) +": "+ str(y_data[-1])
        ));
    
    fig.update_layout(
        title="COVID 19 cases of " + country,
        xaxis_title='Date',
        yaxis_title='No. of Confirmed Cases',
        margin=dict(l=20, r=20, t=40, b=20),
        paper_bgcolor="lightgrey",
        width = 800,
        
    );
    
    fig.update_yaxes(type="linear")
    fig.show();

## Check the details of your country or the World

- Enter the name of your country(in capitalized format(e.g. Italy)) and world for total cases.

In [15]:
interact(plot_cases_of_a_country, country='World')

ipywLayout = widgets.Layout(border='solid 2px green')
ipywLayout.display='none' # uncomment this, run cell again - then the graph/figure disappears
widgets.VBox([fig], layout=ipywLayout)

interactive(children=(Text(value='World', description='country'), Output()), _dom_classes=('widget-interact',)…

VBox(children=(FigureWidget({
    'data': [], 'layout': {'template': '...'}
}),), layout=Layout(border='solid …

## 10 worst hit countries - Confirmed Cases

In [16]:
px.bar(
    sorted_country_df.head(10),
    x = "country",
    y = "confirmed",
    title= "Top 10 worst affected countries", # the axis names
    color_discrete_sequence=["pink"], 
    height=500,
    width=800
)

## 10 worst hit countries - Death Cases

In [17]:
px.bar(
    sorted_country_df.head(10),
    x = "country",
    y = "deaths",
    title= "Top 10 worst affected countries", # the axis names
    color_discrete_sequence=["pink"], 
    height=500,
    width=800
)

# Global spread of COVID-19

In [25]:
world_map = folium.Map(location=[11,0], tiles="cartodbpositron", zoom_start=2, max_zoom = 6, min_zoom = 2)


for i in range(0,len(confirmed_df)):
    folium.Circle(
        location=[confirmed_df.iloc[i]['lat'], confirmed_df.iloc[i]['long']],
        fill=True,
        radius=(int((np.log(confirmed_df.iloc[i,-1]+1.00001)))+0.2)*50000,
        color='red',
        fill_color='indigo',
        tooltip = "<div style='margin: 0; background-color: black; color: white;'>"+
                    "<h4 style='text-align:center;font-weight: bold'>"+confirmed_df.iloc[i]['country'] + "</h4>"
                    "<hr style='margin:10px;color: white;'>"+
                    "<ul style='color: white;;list-style-type:circle;align-item:left;padding-left:20px;padding-right:20px'>"+
                        "<li>Confirmed: "+str(confirmed_df.iloc[i,-1])+"</li>"+
                        "<li>Deaths:   "+str(death_df.iloc[i,-1])+"</li>"+
                        "<li>Death Rate: "+ str(np.round(death_df.iloc[i,-1]/(confirmed_df.iloc[i,-1]+1.00001)*100,2))+ "</li>"+
                    "</ul></div>",
        ).add_to(world_map)

world_map

# STAY SAFE & HEALTHY!!