# Import libraries (pandas, seaborn, matplotlib)

In [13]:
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt

### Reading the data

In [14]:
# Load the dataset from a CSV file given by a relative path, so the file is
# looked up relative to the working directory.
corona = pd.read_csv("covid_19_clean_complete.csv")

In [15]:
# Preview the first 10 rows.
corona.head(10)

Unnamed: 0,Province/State,Country/Region,Lat,Long,Date,Confirmed,Deaths,Recovered,Active,WHO Region
0,,Afghanistan,33.93911,67.709953,2020-01-22,0,0,0,0,Eastern Mediterranean
1,,Albania,41.1533,20.1683,2020-01-22,0,0,0,0,Europe
2,,Algeria,28.0339,1.6596,2020-01-22,0,0,0,0,Africa
3,,Andorra,42.5063,1.5218,2020-01-22,0,0,0,0,Europe
4,,Angola,-11.2027,17.8739,2020-01-22,0,0,0,0,Africa
5,,Antigua and Barbuda,17.0608,-61.7964,2020-01-22,0,0,0,0,Americas
6,,Argentina,-38.4161,-63.6167,2020-01-22,0,0,0,0,Americas
7,,Armenia,40.0691,45.0382,2020-01-22,0,0,0,0,Europe
8,Australian Capital Territory,Australia,-35.4735,149.0124,2020-01-22,0,0,0,0,Western Pacific
9,New South Wales,Australia,-33.8688,151.2093,2020-01-22,0,0,0,0,Western Pacific


In [16]:
# Preview the last rows (tail() with no argument returns 5 rows).
corona.tail()

Unnamed: 0,Province/State,Country/Region,Lat,Long,Date,Confirmed,Deaths,Recovered,Active,WHO Region
49063,,Sao Tome and Principe,0.1864,6.6131,2020-07-27,865,14,734,117,Africa
49064,,Yemen,15.552727,48.516388,2020-07-27,1691,483,833,375,Eastern Mediterranean
49065,,Comoros,-11.6455,43.3333,2020-07-27,354,7,328,19,Africa
49066,,Tajikistan,38.861,71.2761,2020-07-27,7235,60,6028,1147,Europe
49067,,Lesotho,-29.61,28.2336,2020-07-27,505,12,128,365,Africa


## Check for null values 

In [30]:
# Count the missing values in each column.
corona.isna().sum()

Country/Region    0
Lat               0
Long              0
Date              0
Confirmed         0
Deaths            0
Recovered         0
Active            0
WHO Region        0
dtype: int64

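### Deleting the 'Province/State' column because of its high number of null values

**Note:** the cell that performs this drop (e.g. `corona = corona.drop(columns=['Province/State'])`) is not present in this notebook, even though the null-check outputs no longer list the column. Until it is restored, a fresh Restart & Run All will not reproduce the outputs shown.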

## Checking for null values again

In [32]:
# Re-count the missing values in each column.
corona.isna().sum()

Country/Region    0
Lat               0
Long              0
Date              0
Confirmed         0
Deaths            0
Recovered         0
Active            0
WHO Region        0
dtype: int64

In [33]:
# Summary statistics (count, mean, std, min, quartiles, max) for the numeric columns.
# NOTE(review): the displayed output reports a minimum Active of -14, which
# suggests some inconsistent rows — worth checking before further analysis.
corona.describe()

Unnamed: 0,Lat,Long,Confirmed,Deaths,Recovered,Active
count,49068.0,49068.0,49068.0,49068.0,49068.0,49068.0
mean,21.43373,23.528236,16884.9,884.17916,7915.713,8085.012
std,24.95032,70.44274,127300.2,6313.584411,54800.92,76258.9
min,-51.7963,-135.0,0.0,0.0,0.0,-14.0
25%,7.873054,-15.3101,4.0,0.0,0.0,0.0
50%,23.6345,21.7453,168.0,2.0,29.0,26.0
75%,41.20438,80.771797,1518.25,30.0,666.0,606.0
max,71.7069,178.065,4290259.0,148011.0,1846641.0,2816444.0


### Finding the maximum value of each column (including the maximum number of deaths)

In [34]:
# Column-wise maximum of every column, not only Deaths; for the text columns
# this is the largest value in string ordering.
corona.max()

Country/Region           Zimbabwe
Lat                       71.7069
Long                      178.065
Date                   2020-07-27
Confirmed                 4290259
Deaths                     148011
Recovered                 1846641
Active                    2816444
WHO Region        Western Pacific
dtype: object

## Find the Country/Region with the highest Deaths

In [35]:
# Select every row whose Deaths value equals the column-wide maximum.
corona.loc[corona['Deaths'].eq(corona['Deaths'].max())]

Unnamed: 0,Country/Region,Lat,Long,Date,Confirmed,Deaths,Recovered,Active,WHO Region
49030,US,40.0,-100.0,2020-07-27,4290259,148011,1325804,2816444,Americas


## Find the Country/Region with highest number of Confirmed cases

In [36]:
# Select every row whose Confirmed value equals the column-wide maximum.
corona.loc[corona['Confirmed'].eq(corona['Confirmed'].max())]

Unnamed: 0,Country/Region,Lat,Long,Date,Confirmed,Deaths,Recovered,Active,WHO Region
49030,US,40.0,-100.0,2020-07-27,4290259,148011,1325804,2816444,Americas


## Checking our data again

In [38]:
# Display the DataFrame; pandas truncates the view for a frame this large.
corona

Unnamed: 0,Country/Region,Lat,Long,Date,Confirmed,Deaths,Recovered,Active,WHO Region
0,Afghanistan,33.939110,67.709953,2020-01-22,0,0,0,0,Eastern Mediterranean
1,Albania,41.153300,20.168300,2020-01-22,0,0,0,0,Europe
2,Algeria,28.033900,1.659600,2020-01-22,0,0,0,0,Africa
3,Andorra,42.506300,1.521800,2020-01-22,0,0,0,0,Europe
4,Angola,-11.202700,17.873900,2020-01-22,0,0,0,0,Africa
...,...,...,...,...,...,...,...,...,...
49063,Sao Tome and Principe,0.186400,6.613100,2020-07-27,865,14,734,117,Africa
49064,Yemen,15.552727,48.516388,2020-07-27,1691,483,833,375,Eastern Mediterranean
49065,Comoros,-11.645500,43.333300,2020-07-27,354,7,328,19,Africa
49066,Tajikistan,38.861000,71.276100,2020-07-27,7235,60,6028,1147,Europe


In [39]:
# Number of rows per WHO region, most frequent first.
corona['WHO Region'].value_counts()

Europe                   15040
Western Pacific          10340
Africa                    9024
Americas                  8648
Eastern Mediterranean     4136
South-East Asia           1880
Name: WHO Region, dtype: int64

In [42]:
# Group the rows by WHO region. The GroupBy object is kept in `c` because the
# following get_group() cells reuse it; displaying it only shows its repr.
c = corona.groupby('WHO Region')
c

<pandas.core.groupby.generic.DataFrameGroupBy object at 0x000001EDB6034C10>

In [43]:
# Rows whose WHO Region is 'Africa'.
c.get_group('Africa')

Unnamed: 0,Country/Region,Lat,Long,Date,Confirmed,Deaths,Recovered,Active,WHO Region
2,Algeria,28.0339,1.6596,2020-01-22,0,0,0,0,Africa
4,Angola,-11.2027,17.8739,2020-01-22,0,0,0,0,Africa
24,Benin,9.3077,2.3158,2020-01-22,0,0,0,0,Africa
31,Burkina Faso,12.2383,-1.5616,2020-01-22,0,0,0,0,Africa
32,Cabo Verde,16.5388,-23.0418,2020-01-22,0,0,0,0,Africa
...,...,...,...,...,...,...,...,...,...
49061,South Sudan,6.8770,31.3070,2020-07-27,2305,46,1175,1084,Africa
49062,Western Sahara,24.2155,-12.8858,2020-07-27,10,1,8,1,Africa
49063,Sao Tome and Principe,0.1864,6.6131,2020-07-27,865,14,734,117,Africa
49065,Comoros,-11.6455,43.3333,2020-07-27,354,7,328,19,Africa


In [44]:
# Rows whose WHO Region is 'Europe'.
c.get_group('Europe')

Unnamed: 0,Country/Region,Lat,Long,Date,Confirmed,Deaths,Recovered,Active,WHO Region
1,Albania,41.1533,20.1683,2020-01-22,0,0,0,0,Europe
3,Andorra,42.5063,1.5218,2020-01-22,0,0,0,0,Europe
7,Armenia,40.0691,45.0382,2020-01-22,0,0,0,0,Europe
16,Austria,47.5162,14.5501,2020-01-22,0,0,0,0,Europe
17,Azerbaijan,40.1431,47.5769,2020-01-22,0,0,0,0,Europe
...,...,...,...,...,...,...,...,...,...
49053,United Kingdom,18.4207,-64.6400,2020-07-27,8,1,7,0,Europe
49054,United Kingdom,21.6940,-71.7979,2020-07-27,99,2,36,61,Europe
49059,United Kingdom,-51.7963,-59.5236,2020-07-27,13,0,13,0,Europe
49060,France,46.8852,-56.3159,2020-07-27,4,0,1,3,Europe


In [46]:
# Total the numeric columns for each WHO region.
# numeric_only=True is passed explicitly: pandas >= 2.0 no longer drops
# non-numeric columns automatically, so without it the text columns
# (Country/Region, Date) would be aggregated as well.
# NOTE(review): the Lat/Long sums have no meaningful interpretation, and the
# data appears to hold one row per location per date, so these totals add
# values across all dates — confirm that this is the intended figure.
corona.groupby('WHO Region').sum(numeric_only=True)

Unnamed: 0_level_0,Lat,Long,Confirmed,Deaths,Recovered,Active
WHO Region,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1
Africa,4727.39442,141787.2,21791827,439978,11193730,10158119
Americas,161412.174448,-670371.0,402261194,19359292,157069444,225832458
Eastern Mediterranean,108204.921108,169781.0,74082892,1924029,48050703,24108160
Europe,567986.485104,103258.6,248879793,19271040,123202075,106406678
South-East Asia,26161.732764,175703.4,55118365,1458134,30030327,23629904
Western Pacific,183217.578356,1234324.0,26374411,932430,18861950,6580031
