# CoronaVirus 2020

Coronaviruses (CoV) are a large family of viruses that cause illness ranging from the common cold to more severe diseases such as Middle East Respiratory Syndrome (MERS-CoV) and Severe Acute Respiratory Syndrome (SARS-CoV).

Coronavirus disease (COVID-19) is caused by a new strain of coronavirus that was discovered in 2019 and had not previously been identified in humans.

Coronaviruses are zoonotic, meaning they are transmitted between animals and people. Detailed investigations found that SARS-CoV was transmitted from civet cats to humans and MERS-CoV from dromedary camels to humans. Several known coronaviruses that have not yet infected humans are circulating in animals.

WHO link - https://www.who.int/health-topics/coronavirus

In [None]:
# This Python 3 environment comes with many helpful analytics libraries installed
# It is defined by the kaggle/python docker image: https://github.com/kaggle/docker-python
# For example, here are several helpful packages to load

import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)
import matplotlib.pyplot as plt
%matplotlib inline 

# Input data files are available in the "../input/" directory.
# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory



# Read the three time-series tables (confirmed, recovered, deaths) from the
# Kaggle input directory. `map` yields the frames in the order the paths are
# listed, so the tuple unpacking binds each file to its matching name.
confirm, recover, defeat = map(
    pd.read_csv,
    (
        "/kaggle/input/novel-corona-virus-2019-dataset/time_series_covid_19_confirmed.csv",
        "/kaggle/input/novel-corona-virus-2019-dataset/time_series_covid_19_recovered.csv",
        "/kaggle/input/novel-corona-virus-2019-dataset/time_series_covid_19_deaths.csv",
    ),
)

# Any results you write to the current directory are saved as output.

In [None]:
# Headline totals: for each table, sum every row per column (from column
# position 4 onward) and keep the largest of those per-column sums.
total = pd.DataFrame(
    {
        'confirmed': [confirm.iloc[:, 4:].sum().max()],
        'recovered': [recover.iloc[:, 4:].sum().max()],
        'death': [defeat.iloc[:, 4:].sum().max()],
    },
    # The single row is labelled with the last column name of the confirmed table.
    index=[confirm.columns.values[-1]],
)
# Last expression of the cell: render the one-row table with a colour gradient.
total.style.background_gradient(cmap='GnBu')

In [None]:
# Bar chart of the single row of `total`: one bar per column name.
plt.bar(x=total.columns.values, height=total.values[0])

In [None]:
# Per-column totals over all rows for each table, collected in one frame.
# The frame is seeded from the deaths series (so its index drives alignment),
# then the other two series are inserted at the front, which leaves the
# column order as confirmed, recovered, death.
cases_day = defeat.iloc[:, 4:].sum().to_frame('death')
cases_day.insert(0, 'recovered', recover.iloc[:, 4:].sum())
cases_day.insert(0, 'confirmed', confirm.iloc[:, 4:].sum())


In [None]:
 confirm_cases=confirm.iloc[:,4:].sum()
death_cases=defeat.iloc[:,4:].sum()

plt.figure(figsize=(20,7))
plt.scatter(confirm_cases.index,confirm_cases.values)
plt.plot(confirm_cases.index,confirm_cases.values)

plt.scatter(death_cases.index,death_cases.values)
plt.plot(death_cases.index,death_cases.values)


plt.title('Confirmed Vs Deaths' , size=25)
plt.xlabel('Date', size=20)
plt.ylabel('Cases', size=20)
plt.xticks(rotation=45, size=15)
plt.yticks(size=15)


In [None]:
# Grouped bar chart: one group per row of `cases_day`, one bar per column.
cases_day.plot.bar(figsize=(20, 10))

# Title, axis labels and tick styling for the current axes.
plt.title('Growth of cases', size=25)
plt.xlabel('Date', size=20)
plt.ylabel('Cases', size=20)
plt.xticks(rotation=45, size=15)
plt.yticks(size=15)

# Framed, shadowed two-column legend in the upper-left corner.
plt.legend(
    loc="upper left",
    frameon=True,
    fontsize=15,
    ncol=2,
    fancybox=True,
    framealpha=0.95,
    shadow=True,
    borderpad=1,
)


In [None]:
# Mortality is stored as a new column: deaths divided by confirmed cases,
# row by row (a fraction, not a percentage).
cases_day['mortality'] = cases_day['death'].div(cases_day['confirmed'])
cases_day['mortality'].plot.line(figsize=(15, 7))

# Title, axis labels and tick styling for the current axes.
plt.title('Growth of mortality rate', size=25)
plt.xlabel('Date', size=20)
plt.ylabel('Mortality Rate', size=20)
plt.xticks(rotation=45, size=15)
plt.yticks(size=15)

# Framed, shadowed two-column legend in the upper-left corner.
plt.legend(
    loc="upper left",
    frameon=True,
    fontsize=15,
    ncol=2,
    fancybox=True,
    framealpha=0.95,
    shadow=True,
    borderpad=1,
)



# Mortality among different Age Groups

Source: https://i.insider.com/5e67b19a54f25c32e320ef33?width=600&format=jpeg&auto=webp


<html><img src='https://i.insider.com/5e67b19a54f25c32e320ef33?width=600&format=jpeg&auto=webp'></html>

# Data Across Countries

In [None]:
def _peak_by_country(frame):
    """Return, per 'Country/Region', the largest per-column total in *frame*.

    The count columns are taken positionally from the raw table (position 4
    onward, the same slice the global totals use) *before* grouping. This
    way the result does not depend on which non-numeric columns a given
    pandas version keeps or drops in ``groupby(...).sum()``, and the first
    count column is no longer skipped.
    """
    counts = frame.iloc[:, 4:]
    # Group by the country column of the original frame; rows stay aligned by index.
    per_country = counts.groupby(frame['Country/Region']).sum()
    return per_country.max(axis=1)


q = _peak_by_country(defeat)
r = _peak_by_country(confirm)
t = _peak_by_country(recover)

# One row per country found in the deaths table; the other two series are
# aligned to that index (countries missing from them become NaN).
b = pd.DataFrame({'confirmed': r, 'recovered': t, 'death': q}, index=q.index)

In [None]:
# Country table ordered by death count, highest first, rendered with a
# colour gradient (last expression of the cell, so the notebook displays it).
(
    b.sort_values(by='death', ascending=False)
    .style
    .background_gradient(cmap='GnBu')
)

In [None]:
# Ten countries with the highest death counts (ties broken by confirmed
# cases), drawn as grouped bars.
(
    b.sort_values(by=['death', 'confirmed'], ascending=False)
    .head(10)
    .plot.bar(figsize=(20, 10))
)

# Title, axis labels and tick styling for the current axes.
plt.title('Top 10 affected countries', size=25)
plt.xlabel('countries', size=20)
plt.ylabel('Cases', size=20)
plt.xticks(rotation=45, size=15)
plt.yticks(size=15)

# Framed, shadowed two-column legend in the upper-right corner.
plt.legend(
    loc="upper right",
    frameon=True,
    fontsize=15,
    ncol=2,
    fancybox=True,
    framealpha=0.95,
    shadow=True,
    borderpad=1,
)


# China


In [None]:
def _china_province_peak(frame):
    """Return, per 'Province/State' of China, the largest per-column total in *frame*.

    The maximum over the count columns is used, matching how the global and
    per-country totals elsewhere in this notebook are derived. Adding the
    columns together instead would count every column's figure again and
    inflate the province totals.
    """
    rows = frame[frame['Country/Region'] == 'China']
    # Columns from position 4 onward are the count columns of the raw table.
    per_province = rows.iloc[:, 4:].groupby(rows['Province/State']).sum()
    return per_province.max(axis=1)


# Kept as a separate name because the original cell defined it: the confirmed
# series per province, before sorting and truncation.
china_data = _china_province_peak(confirm)

_china_deaths = _china_province_peak(defeat)
# One row per province found in the deaths table; the other series are aligned to it.
china = pd.DataFrame(
    {
        'confirmed': china_data,
        'recovered': _china_province_peak(recover),
        'death': _china_deaths,
    },
    index=_china_deaths.index,
)

# Ascending sort, then keep the last 20 rows: the 20 provinces with the most
# deaths (ties broken by confirmed cases), worst last.
china = china.sort_values(by=['death', 'confirmed']).tail(20)

In [None]:

# Grouped bar chart of the `china` frame: one group per row, one bar per column.
china.plot.bar(figsize=(20, 10))

# Title, axis labels and tick styling for the current axes.
plt.title('Most affected areas', size=25)
plt.xlabel('States', size=20)
plt.ylabel('Cases', size=20)
plt.xticks(rotation=45, size=15)
plt.yticks(size=15)

# Framed, shadowed two-column legend in the upper-left corner.
plt.legend(
    loc="upper left",
    frameon=True,
    fontsize=15,
    ncol=2,
    fancybox=True,
    framealpha=0.95,
    shadow=True,
    borderpad=1,
)