# Covid-19 Dataset Understanding

In [None]:
# !pip install folium
# !pip install plotly

In [None]:
# import
import plotly.express as px
import plotly.graph_objects as go
import plotly.figure_factory as ff
from plotly.subplots import make_subplots

import folium

import pandas as pd 
import numpy as np
import matplotlib.pyplot as plt

%matplotlib inline

import math 
import random
from datetime import timedelta

import warnings 
# Silence every warning category for the rest of the session.
# NOTE(review): this also hides deprecation/future warnings raised by the
# libraries imported above — consider narrowing the filter.
warnings.filterwarnings('ignore')

# Color palette (hex codes).
# NOTE(review): the names look like abbreviations for the confirmed, deaths,
# recovered and active series — confirm; none of them is referenced by the
# cells visible in this part of the notebook.
cnf = '#393e46'
dth = '#ff2e63'
rec = '#21bf73'
act = '#fe9801'

# Dataset Preparation

In [None]:
# Initialise plotly's offline notebook mode so figures can be shown inline.
# NOTE(review): connected=True presumably makes plotly load plotly.js from the
# CDN instead of embedding it in the notebook — confirm against plotly docs.
import plotly as py
py.offline.init_notebook_mode(connected=True)

In [None]:
import os

In [None]:
# Remove any previous checkout of the dataset repository so that a fresh
# `git clone` does not fail because the target directory already exists.
#
# The earlier shell call ("rm - rf ...") had a stray space, so rm received
# "-" and "rf" as file names and never deleted the directory; os.system()
# also reports failure through its return value rather than an exception, so
# the except branch could never run.  shutil.rmtree does the deletion
# portably and raises FileNotFoundError when there is nothing to delete.
import shutil

try:
    shutil.rmtree("Covid-19-Preprocessed-Dataset")
except FileNotFoundError:
    # First run (or already cleaned up): nothing to remove.
    print("File does not exist")

In [None]:
# Shell escape: clone the preprocessed Covid-19 dataset repository into the
# current working directory (creates ./Covid-19-Preprocessed-Dataset).
!git clone https://github.com/laxmimerit/Covid-19-Preprocessed-Dataset

In [None]:
# Read the four preprocessed CSV files shipped in the cloned repository.
# The 'Date' column is parsed to datetime for every table except
# countrywise.csv, which is read without date parsing.
df = pd.read_csv(
    'Covid-19-Preprocessed-Dataset/preprocessed/covid_19_data_cleaned.csv',
    parse_dates=['Date'],
)
country_daywise = pd.read_csv(
    'Covid-19-Preprocessed-Dataset/preprocessed/country_daywise.csv',
    parse_dates=['Date'],
)
countrywise = pd.read_csv(
    'Covid-19-Preprocessed-Dataset/preprocessed/countrywise.csv',
)
daywise = pd.read_csv(
    'Covid-19-Preprocessed-Dataset/preprocessed/daywise.csv',
    parse_dates=['Date'],
)


In [None]:
# Replace missing 'Province/State' entries with an empty string (only that
# column is touched), then preview the first rows of the table.
df.fillna({'Province/State': ""}, inplace=True)
df.head()

In [None]:
# Display the table read from country_daywise.csv.
country_daywise

In [None]:
# Display the table read from countrywise.csv.
countrywise

In [None]:
# Display the table read from daywise.csv.
daywise

In [None]:
# Display the table read from covid_19_data_cleaned.csv.
df

In [None]:
# Total confirmed cases per date, as a two-column frame (Date, Confirmed).
# The column is selected before aggregating so that only 'Confirmed' is
# summed; summing the whole frame first also aggregates every other column
# (including the text columns) only to discard the result.
confirmed = df.groupby('Date')['Confirmed'].sum().reset_index()
confirmed

In [None]:
# Total recovered cases per date, as a two-column frame (Date, Recovered).
# The column is selected before aggregating so that only 'Recovered' is
# summed; summing the whole frame first also aggregates every other column
# (including the text columns) only to discard the result.
recovered = df.groupby('Date')['Recovered'].sum().reset_index()
recovered

In [None]:
# Total deaths per date, as a two-column frame (Date, Deaths).
# The column is selected before aggregating so that only 'Deaths' is summed;
# summing the whole frame first also aggregates every other column (including
# the text columns) only to discard the result.
deaths = df.groupby('Date')['Deaths'].sum().reset_index()
deaths

In [None]:
# Count the missing values in each column of df.
df.isnull().sum()

In [None]:
# Print a summary of df's columns.
df.info()

In [None]:
# Show only the rows whose 'Country' value is "US".
df.query('Country == "US"')

# Worldwide Total Confirmed, Recovered and Deaths

In [None]:
# First rows of the per-date confirmed totals.
confirmed.head()

In [None]:
# Last rows of the per-date confirmed totals.
confirmed.tail()

In [None]:
# First rows of the per-date recovered totals.
recovered.head()

In [None]:
# Last rows of the per-date recovered totals.
recovered.tail()

In [None]:
# First rows of the per-date death totals.
deaths.head()

In [None]:
# Last rows of the per-date death totals.
deaths.tail()

# Total number of covid-19 cases in the world

In [None]:
# Line-and-marker chart of the confirmed total for each date.
fig = go.Figure(
    data=[
        go.Scatter(
            x=confirmed['Date'],
            y=confirmed['Confirmed'],
            mode='lines+markers',
            name='Confirmed',
            line=dict(color="Gray", width=4),
        )
    ]
)
fig.show()

# Total number of covid-19 recoveries in the world

In [None]:
# Line-and-marker chart of the recovered total for each date.
fig = go.Figure(
    data=[
        go.Scatter(
            x=recovered['Date'],
            y=recovered['Recovered'],
            mode='lines+markers',
            name='Recovered',
            line=dict(color="Green", width=4),
        )
    ]
)
fig.show()

# Note: the data set does not include the number of recoveries as of August 5, 2021, so recoveries appear as 0 from that date onward; this is reflected in the graphs and tables.

# Total number of covid-19 deaths in the world

In [None]:
# Line-and-marker chart of the death total for each date.
fig = go.Figure(
    data=[
        go.Scatter(
            x=deaths['Date'],
            y=deaths['Deaths'],
            mode='lines+markers',
            name='Deaths',
            line=dict(color="Red", width=4),
        )
    ]
)
fig.show()

In [None]:
# Overlay the confirmed, recovered and death totals on one chart.  Each trace
# is named after the column it plots; traces are added in the order
# confirmed, recovered, deaths.
fig = go.Figure(
    data=[
        go.Scatter(
            x=series['Date'],
            y=series[column],
            mode='lines+markers',
            name=column,
            line=dict(color=colour, width=4),
        )
        for series, column, colour in (
            (confirmed, 'Confirmed', "Gray"),
            (recovered, 'Recovered', "Green"),
            (deaths, 'Deaths', "Red"),
        )
    ]
)
fig.update_layout(
    title='Worldwide Covid-19 Cases',
    xaxis_tickfont_size=14,
    yaxis=dict(title='Number of Cases'),
)
fig.show()

# Cases Density Animation on World Map

In [None]:
# Print a summary of df's columns before building the map.
df.info()

In [None]:
# Preview the first rows of df.
df.head()

In [None]:
# Animated density map of the rows in df, one animation frame per date.
#
# The frame key used to be 'Country', which steps the slider through
# countries rather than through time and contradicts the time-lapse title.
# Frames are now keyed on the date: the rows are sorted chronologically
# (plotly builds frames in order of first appearance) and the dates are
# rendered as ISO strings so the slider labels are clean.  This is done on a
# temporary copy, so df keeps its datetime 'Date' column.
fig = px.density_mapbox(
    df.sort_values('Date').assign(
        Date=lambda frame: pd.to_datetime(frame['Date']).dt.strftime('%Y-%m-%d')
    ),
    lat='Lat',
    lon='Long',
    hover_name='Country',
    hover_data=['Confirmed', 'Recovered', 'Deaths'],
    animation_frame='Date',
    color_continuous_scale='Portland',
    radius=7,
    zoom=0,
    height=700,
)
fig.update_layout(
    title='Worldwide Covid-19 Cases with Time Laps',
    mapbox_style='open-street-map',
    mapbox_center_lon=0,
)
fig.show()