#**Pandas Part 1**

Pandas deals with the following three data structures:
* Series
* DataFrame
* Panel                                   

These data structures are built over Numpy arrays

##Series

In [1]:
import pandas as pd

In [None]:
dir(pd)

In [None]:
import numpy as np

In [None]:
x = np.arange(10,50, 10)

In [None]:
x

array([10, 20, 30, 40])

In [None]:
pd.Series(x)

0    10
1    20
2    30
3    40
dtype: int64

0 1 2 3 are index

In [None]:
index = ['a', 'b', 'c', 'd']

In [None]:
s = pd.Series(x, index)

In [None]:
s

a    10
b    20
c    30
d    40
dtype: int64

In [None]:
s[0]

10

In [None]:
s['a']

10

##Series Methods

In [None]:
s.axes

[Index(['a', 'b', 'c', 'd'], dtype='object')]

In [None]:
s.values

array([10, 20, 30, 40])

In [None]:
s.size

4

In [None]:
s.shape

(4,)

In [None]:
s.ndim

1

In [None]:
s.dtype

dtype('int64')

In [None]:
s['e'] = 50  #New row added

In [None]:
s

a    10
b    20
c    30
d    40
e    50
dtype: int64

In [None]:
data = ['Raman', 'Guido', 'Ismail', 'Apu']

In [None]:
pd.Series(data)

0     Raman
1     Guido
2    Ismail
3       Apu
dtype: object

In [None]:
pd.Series(data, index)

a     Raman
b     Guido
c    Ismail
d       Apu
dtype: object

## Data as Sacalar

In [None]:
index = ['a', 'b', 'c', 'd']

In [None]:
pd.Series(10, index, int)

a    10
b    10
c    10
d    10
dtype: int64

##Series from Dictionary

In [None]:
data = {'a':10, 'b':20, 'c':30, 'd':40}

In [None]:
pd.Series(data)

a    10
b    20
c    30
d    40
dtype: int64

In [None]:
index = ['a', 'b', 'c', 'd', 'e']

In [None]:
pd.Series(data, index)

a    10.0
b    20.0
c    30.0
d    40.0
e     NaN
dtype: float64

NaN - Not a number

##Basic Operations

In [None]:
s

a    10
b    20
c    30
d    40
e    50
dtype: int64

In [None]:
s*2

a     20
b     40
c     60
d     80
e    100
dtype: int64

In [None]:
np.sqrt(s)

a    3.162278
b    4.472136
c    5.477226
d    6.324555
e    7.071068
dtype: float64

In [None]:
np.sum(s)

150

In [None]:
np.min(s)

10

In [None]:
np.max(s)

50

In [None]:
s[1:3]

b    20
c    30
dtype: int64

In [None]:
s.sum()

150

In [None]:
s.mean()

30.0

In [None]:
s.std()  #Standard deviation

15.811388300841896

#**Pandas Part 2**

##DataFrame

In [None]:
data = [10,20,30,40]

In [None]:
pd.DataFrame(data)

Unnamed: 0,0
0,10
1,20
2,30
3,40


In [None]:
d = [[10,20,30,40],[50,60,70,80]]

In [None]:
pd.DataFrame(d)

Unnamed: 0,0,1,2,3
0,10,20,30,40
1,50,60,70,80


In [None]:
index = ['a', 'b']

In [None]:
pd.DataFrame(d, index)

Unnamed: 0,0,1,2,3
a,10,20,30,40
b,50,60,70,80


In [None]:
d = pd.DataFrame(d, index, columns = ['A', 'B', 'C', 'D'])

In [None]:
d

Unnamed: 0,A,B,C,D
a,10,20,30,40
b,50,60,70,80


In [None]:
d['A']

a    10
b    50
Name: A, dtype: int64

In [None]:
d['A']['a']

10

In [None]:
d[1:3]

Unnamed: 0,A,B,C,D
b,50,60,70,80


In [None]:
# d['a']['A'] This is error

##Methods over DataFrame

In [None]:
d.axes

[Index(['a', 'b'], dtype='object'),
 Index(['A', 'B', 'C', 'D'], dtype='object')]

In [None]:
d.size

8

In [None]:
d.ndim

2

In [None]:
d.T

Unnamed: 0,a,b
A,10,50
B,20,60
C,30,70
D,40,80


In [None]:
d.empty

False

In [None]:
d

Unnamed: 0,A,B,C,D
a,10,20,30,40
b,50,60,70,80


In [None]:
d.values

array([[10, 20, 30, 40],
       [50, 60, 70, 80]])

In [None]:
d.head()

Unnamed: 0,A,B,C,D
a,10,20,30,40
b,50,60,70,80


In [None]:
d.tail()

Unnamed: 0,A,B,C,D
a,10,20,30,40
b,50,60,70,80


In [None]:
d.sum()

A     60
B     80
C    100
D    120
dtype: int64

In [None]:
d.sum(1)  #1 here is axes

a    100
b    260
dtype: int64

In [None]:
d.mean()

A    30.0
B    40.0
C    50.0
D    60.0
dtype: float64

In [None]:
d.mean(1)

a    25.0
b    65.0
dtype: float64

In [None]:
d.mean(1)[1]

65.0

In [None]:
d.std()

A    28.284271
B    28.284271
C    28.284271
D    28.284271
dtype: float64

In [None]:
d.std(1)

a    12.909944
b    12.909944
dtype: float64

In [None]:
d.std(1)

a    12.909944
b    12.909944
dtype: float64

In [None]:
d.max()

A    50
B    60
C    70
D    80
dtype: int64

In [None]:
d.min()

A    10
B    20
C    30
D    40
dtype: int64

In [None]:
d.describe()

Unnamed: 0,A,B,C,D
count,2.0,2.0,2.0,2.0
mean,30.0,40.0,50.0,60.0
std,28.284271,28.284271,28.284271,28.284271
min,10.0,20.0,30.0,40.0
25%,20.0,30.0,40.0,50.0
50%,30.0,40.0,50.0,60.0
75%,40.0,50.0,60.0,70.0
max,50.0,60.0,70.0,80.0


##DataFrame from Dictionary

In [None]:
data = {'a':10, 'b':20, 'c':30, 'd':40}

In [None]:
index = [1,2,3,4]

In [None]:
pd.DataFrame(data, index)

Unnamed: 0,a,b,c,d
1,10,20,30,40
2,10,20,30,40
3,10,20,30,40
4,10,20,30,40


##DataFrame from Dictionary of Lists

In [None]:
data = {'a': [10,15,20,25], 'b':[30,35,40,45], 'c':[50,55,60,65],
                                 'd':[70,75,80,85]}

In [None]:
index = [1,2,3,4]

In [None]:
pd.DataFrame(data, index)

Unnamed: 0,a,b,c,d
1,10,30,50,70
2,15,35,55,75
3,20,40,60,80
4,25,45,65,85


##DataFrame from Lists of Dictionaries 

In [None]:
data = [{'x':2, 'y':10}, {'x':4, 'y':20}, {'x':6, 'y':30}, {'x':8, 'y':40}]

In [None]:
d = pd.DataFrame(data, index = ['a', 'b', 'c', 'd'])

In [None]:
d

Unnamed: 0,x,y
a,2,10
b,4,20
c,6,30
d,8,40


In [None]:
d['x']

a    2
b    4
c    6
d    8
Name: x, dtype: int64

In [None]:
d['x']['b']

4

##DataFrame from Dictionary of Series

In [None]:
index = ['a', 'b', 'c', 'd']

In [None]:
s1 = pd.Series([5,8,9,11], index)
s1

a     5
b     8
c     9
d    11
dtype: int64

In [None]:
s2 = pd.Series([7,6,4,3], index)

In [None]:
d = {'A':s1, 'B':s2}

In [None]:
D = pd.DataFrame(d)

In [None]:
d

{'A': a     5
 b     8
 c     9
 d    11
 dtype: int64, 'B': a    7
 b    6
 c    4
 d    3
 dtype: int64}

In [None]:
D

Unnamed: 0,A,B
a,5,7
b,8,6
c,9,4
d,11,3


##Add Column to DataFrame

In [None]:
D['C'] = pd.DataFrame({'C': pd.Series([10,20,30,40], index)})

In [None]:
D

Unnamed: 0,A,B,C
a,5,7,10
b,8,6,20
c,9,4,30
d,11,3,40


In [None]:
D['C'] = pd.Series([10,20,30,40], index)

In [None]:
D

Unnamed: 0,A,B,C
a,5,7,10
b,8,6,20
c,9,4,30
d,11,3,40


##Delete columns from DataFrame

In [None]:
D1 = D.copy()
D1

Unnamed: 0,A,B,C
a,5,7,10
b,8,6,20
c,9,4,30
d,11,3,40


D1 = D makes D1 refer to D. They share the same DataFrame. Any change in D1 will change D

In [None]:
del D1['A']

In [None]:
D1

Unnamed: 0,B,C
a,7,10
b,6,20
c,4,30
d,3,40


##Location, Slicing

In [None]:
D

Unnamed: 0,A,B,C
a,5,7,10
b,8,6,20
c,9,4,30
d,11,3,40


In [None]:
D.loc['b']

A     8
B     6
C    20
Name: b, dtype: int64

In [None]:
D.iloc[1]  #iloc---> index location

A     8
B     6
C    20
Name: b, dtype: int64

In [None]:
D.iloc[1][2]

20

In [None]:
D[1:3]

Unnamed: 0,A,B,C
b,8,6,20
c,9,4,30


In [None]:
D[1:3]['A']

b    8
c    9
Name: A, dtype: int64

##Append and Delete

###Add Row to DataFrame

In [None]:
D1 = pd.DataFrame([[-1,0,2]], index = ['e'], columns = ['A', 'B', 'C'])

In [None]:
D1

Unnamed: 0,A,B,C
e,-1,0,2


In [None]:
D.append(D1)   #Append DataFrame

Unnamed: 0,A,B,C
a,5,7,10
b,8,6,20
c,9,4,30
d,11,3,40
e,-1,0,2


###Delete row from DataFrame

In [None]:
D.drop('a')

Unnamed: 0,A,B,C
b,8,6,20
c,9,4,30
d,11,3,40


In [None]:
D

Unnamed: 0,A,B,C
a,5,7,10
b,8,6,20
c,9,4,30
d,11,3,40


##Re-indexing

In [None]:
index = [1,2,3,4,5]

In [None]:
data = {'x':[0.1,0.3,0.5,0.7,0.9], 'y':[0.2,0.4,0.6,0.8,1.0]}

In [None]:
D = pd.DataFrame(data, index)

In [None]:
D

Unnamed: 0,x,y
1,0.1,0.2
2,0.3,0.4
3,0.5,0.6
4,0.7,0.8
5,0.9,1.0


In [None]:
D.reindex(np.arange(2,7), ['x', 'y'])

	'.reindex(a, b)' as 
	'.reindex(index=a, columns=b)'.
Use named arguments to remove any ambiguity. In the future, using positional arguments for 'index' or 'columns' will raise  a 'TypeError'.
  """Entry point for launching an IPython kernel.


Unnamed: 0,x,y
2,0.3,0.4
3,0.5,0.6
4,0.7,0.8
5,0.9,1.0
6,,


In [None]:
D

Unnamed: 0,x,y
1,0.1,0.2
2,0.3,0.4
3,0.5,0.6
4,0.7,0.8
5,0.9,1.0


#**Pandas Part 3**

##Getting Data

In [4]:
df = pd.read_csv('/content/time_series_covid19_confirmed_global.csv')

In [None]:
#df1 = pd.read_csv('time_series_covid19_confirmed_global.csv')

Both ways possible once you upload in google drive

In [None]:
type(df)

pandas.core.frame.DataFrame

In [None]:
df.head()

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
0,,Afghanistan,33.93911,67.709953,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,...,20917,21459,22142,22890,23546,24102,24766,25527,26310,26874,27532,27878,28424,28833,29157,29481,29640,30175,30451,30616,30967,31238,31517,31836,32022,32324,32672,32951,33190,33384,33594,33908,34194,34366,34451,34455,34740,34994,35070,35229
1,,Albania,41.1533,20.1683,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,1263,1299,1341,1385,1416,1464,1521,1590,1672,1722,1788,1838,1891,1962,1995,2047,2114,2192,2269,2330,2402,2466,2535,2580,2662,2752,2819,2893,2964,3038,3106,3188,3278,3371,3454,3571,3667,3752,3851,3906
2,,Algeria,28.0339,1.6596,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,...,10265,10382,10484,10589,10698,10810,10919,11031,11147,11268,11385,11504,11631,11771,11920,12076,12248,12445,12685,12968,13273,13571,13907,14272,14657,15070,15500,15941,16404,16879,17348,17808,18242,18712,19195,19689,20216,20770,21355,21948
3,,Andorra,42.5063,1.5218,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,852,852,852,852,853,853,853,853,854,854,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,858,861,862,877,880
4,,Angola,-11.2027,17.8739,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,92,96,113,118,130,138,140,142,148,155,166,172,176,183,186,189,197,212,212,259,267,276,284,291,315,328,346,346,346,386,386,396,458,462,506,525,541,576,607,638


In [None]:
df.head(10)    #First 10 rows

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
0,,Afghanistan,33.93911,67.709953,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,...,20917,21459,22142,22890,23546,24102,24766,25527,26310,26874,27532,27878,28424,28833,29157,29481,29640,30175,30451,30616,30967,31238,31517,31836,32022,32324,32672,32951,33190,33384,33594,33908,34194,34366,34451,34455,34740,34994,35070,35229
1,,Albania,41.1533,20.1683,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,1263,1299,1341,1385,1416,1464,1521,1590,1672,1722,1788,1838,1891,1962,1995,2047,2114,2192,2269,2330,2402,2466,2535,2580,2662,2752,2819,2893,2964,3038,3106,3188,3278,3371,3454,3571,3667,3752,3851,3906
2,,Algeria,28.0339,1.6596,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,...,10265,10382,10484,10589,10698,10810,10919,11031,11147,11268,11385,11504,11631,11771,11920,12076,12248,12445,12685,12968,13273,13571,13907,14272,14657,15070,15500,15941,16404,16879,17348,17808,18242,18712,19195,19689,20216,20770,21355,21948
3,,Andorra,42.5063,1.5218,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,852,852,852,852,853,853,853,853,854,854,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,858,861,862,877,880
4,,Angola,-11.2027,17.8739,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,92,96,113,118,130,138,140,142,148,155,166,172,176,183,186,189,197,212,212,259,267,276,284,291,315,328,346,346,346,386,386,396,458,462,506,525,541,576,607,638
5,,Antigua and Barbuda,17.0608,-61.7964,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,26,26,26,26,26,26,26,26,26,26,26,26,26,26,26,26,26,65,65,65,69,69,69,69,69,68,68,68,70,70,70,73,74,74,74,74,74,74,74,76
6,,Argentina,-38.4161,-63.6167,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,23620,24761,25987,27373,28764,30295,31577,32785,34159,35552,37510,39570,41204,42785,44931,47203,49851,52457,55343,57744,59933,62268,64530,67197,69941,72786,75376,77815,80447,83426,87030,90693,94060,97509,100166,103265,106910,111146,114783,119301
7,,Armenia,40.0691,45.0382,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,13325,13675,14103,14669,15281,16004,16667,17064,17489,18033,18698,19157,19708,20268,20588,21006,21717,22488,23247,23909,24645,25127,25542,26065,26658,27320,27900,28606,28936,29285,29820,30346,30903,31392,31969,32151,32490,33005,33559,34001
8,Australian Capital Territory,Australia,-35.4735,149.0124,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,108,111,112,113,113,113,113,113,113,113,113,113
9,New South Wales,Australia,-33.8688,151.2093,0,0,0,0,3,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,4,...,3114,3117,3117,3115,3119,3128,3131,3134,3135,3137,3143,3144,3149,3151,3150,3159,3162,3168,3174,3177,3184,3189,3203,3211,3211,3405,3419,3429,3433,3440,3453,3467,3474,3478,3492,3505,3517,3527,3535,3550


In [None]:
df.tail()

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
261,,Sao Tome and Principe,0.1864,6.6131,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,513,514,611,632,639,659,661,662,671,683,688,693,698,698,702,707,710,711,712,713,713,713,714,715,717,719,719,720,721,724,724,726,727,727,729,732,732,737,740,741
262,,Yemen,15.552727,48.516388,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,496,524,560,591,632,705,728,844,885,902,909,919,922,941,967,992,1015,1076,1089,1103,1118,1128,1158,1190,1221,1240,1248,1265,1284,1297,1318,1356,1380,1389,1465,1498,1516,1526,1552,1576
263,,Comoros,-11.6455,43.3333,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,141,141,162,162,163,176,176,176,197,197,210,210,247,247,247,265,265,272,272,272,272,272,303,303,303,309,309,311,311,311,313,314,314,317,317,317,321,321,328,328
264,,Tajikistan,38.861,71.2761,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,4609,4690,4763,4834,4902,4971,5035,5097,5160,5221,5279,5338,5399,5457,5513,5567,5630,5691,5747,5799,5849,5900,5900,6005,6058,6058,6159,6213,6262,6315,6364,6410,6457,6506,6552,6596,6643,6695,6741,6786
265,,Lesotho,-29.61,28.2336,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,4,4,4,4,4,4,4,4,4,4,4,4,4,4,12,17,17,17,24,24,27,27,27,35,35,35,35,79,91,91,91,134,184,184,233,245,256,256,256,311


In [None]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 266 entries, 0 to 265
Columns: 182 entries, Province/State to 7/17/20
dtypes: float64(2), int64(178), object(2)
memory usage: 378.3+ KB


##Selecting Rows and Columns

In [None]:
df.columns

Index(['Province/State', 'Country/Region', 'Lat', 'Long', '1/22/20', '1/23/20',
       '1/24/20', '1/25/20', '1/26/20', '1/27/20',
       ...
       '7/8/20', '7/9/20', '7/10/20', '7/11/20', '7/12/20', '7/13/20',
       '7/14/20', '7/15/20', '7/16/20', '7/17/20'],
      dtype='object', length=182)

In [None]:
df.head()

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
0,,Afghanistan,33.93911,67.709953,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,...,20917,21459,22142,22890,23546,24102,24766,25527,26310,26874,27532,27878,28424,28833,29157,29481,29640,30175,30451,30616,30967,31238,31517,31836,32022,32324,32672,32951,33190,33384,33594,33908,34194,34366,34451,34455,34740,34994,35070,35229
1,,Albania,41.1533,20.1683,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,1263,1299,1341,1385,1416,1464,1521,1590,1672,1722,1788,1838,1891,1962,1995,2047,2114,2192,2269,2330,2402,2466,2535,2580,2662,2752,2819,2893,2964,3038,3106,3188,3278,3371,3454,3571,3667,3752,3851,3906
2,,Algeria,28.0339,1.6596,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,...,10265,10382,10484,10589,10698,10810,10919,11031,11147,11268,11385,11504,11631,11771,11920,12076,12248,12445,12685,12968,13273,13571,13907,14272,14657,15070,15500,15941,16404,16879,17348,17808,18242,18712,19195,19689,20216,20770,21355,21948
3,,Andorra,42.5063,1.5218,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,852,852,852,852,853,853,853,853,854,854,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,858,861,862,877,880
4,,Angola,-11.2027,17.8739,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,92,96,113,118,130,138,140,142,148,155,166,172,176,183,186,189,197,212,212,259,267,276,284,291,315,328,346,346,346,386,386,396,458,462,506,525,541,576,607,638


In [None]:
df['Country/Region']

0                Afghanistan
1                    Albania
2                    Algeria
3                    Andorra
4                     Angola
               ...          
261    Sao Tome and Principe
262                    Yemen
263                  Comoros
264               Tajikistan
265                  Lesotho
Name: Country/Region, Length: 266, dtype: object

In [None]:
df[['Country/Region', 'Lat', 'Long']]

Unnamed: 0,Country/Region,Lat,Long
0,Afghanistan,33.939110,67.709953
1,Albania,41.153300,20.168300
2,Algeria,28.033900,1.659600
3,Andorra,42.506300,1.521800
4,Angola,-11.202700,17.873900
...,...,...,...
261,Sao Tome and Principe,0.186400,6.613100
262,Yemen,15.552727,48.516388
263,Comoros,-11.645500,43.333300
264,Tajikistan,38.861000,71.276100


In [None]:
type(df['Lat'])

pandas.core.series.Series

In [None]:
type(df[['Country/Region', 'Lat', 'Long']])

pandas.core.frame.DataFrame

In [None]:
df.iloc[0]   # Oth row

Province/State            NaN
Country/Region    Afghanistan
Lat                   33.9391
Long                    67.71
1/22/20                     0
                     ...     
7/13/20                 34455
7/14/20                 34740
7/15/20                 34994
7/16/20                 35070
7/17/20                 35229
Name: 0, Length: 182, dtype: object

In [None]:
df.loc[0]  # Used to access row by row index. Here row index is also numerical

Province/State            NaN
Country/Region    Afghanistan
Lat                   33.9391
Long                    67.71
1/22/20                     0
                     ...     
7/13/20                 34455
7/14/20                 34740
7/15/20                 34994
7/16/20                 35070
7/17/20                 35229
Name: 0, Length: 182, dtype: object

In [None]:
df2 = pd.read_csv('/content/time_series_covid19_confirmed_global.csv', index_col = 'Province/State')

In [None]:
df2.head()

Unnamed: 0_level_0,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,2/27/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
Province/State,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1
,Afghanistan,33.93911,67.709953,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,1,...,20917,21459,22142,22890,23546,24102,24766,25527,26310,26874,27532,27878,28424,28833,29157,29481,29640,30175,30451,30616,30967,31238,31517,31836,32022,32324,32672,32951,33190,33384,33594,33908,34194,34366,34451,34455,34740,34994,35070,35229
,Albania,41.1533,20.1683,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,1263,1299,1341,1385,1416,1464,1521,1590,1672,1722,1788,1838,1891,1962,1995,2047,2114,2192,2269,2330,2402,2466,2535,2580,2662,2752,2819,2893,2964,3038,3106,3188,3278,3371,3454,3571,3667,3752,3851,3906
,Algeria,28.0339,1.6596,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,1,...,10265,10382,10484,10589,10698,10810,10919,11031,11147,11268,11385,11504,11631,11771,11920,12076,12248,12445,12685,12968,13273,13571,13907,14272,14657,15070,15500,15941,16404,16879,17348,17808,18242,18712,19195,19689,20216,20770,21355,21948
,Andorra,42.5063,1.5218,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,852,852,852,852,853,853,853,853,854,854,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,855,858,861,862,877,880
,Angola,-11.2027,17.8739,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,92,96,113,118,130,138,140,142,148,155,166,172,176,183,186,189,197,212,212,259,267,276,284,291,315,328,346,346,346,386,386,396,458,462,506,525,541,576,607,638


In [None]:
df2.loc["New South Wales"]

Country/Region    Australia
Lat                -33.8688
Long                151.209
1/22/20                   0
1/23/20                   0
                    ...    
7/13/20                3505
7/14/20                3517
7/15/20                3527
7/16/20                3535
7/17/20                3550
Name: New South Wales, Length: 181, dtype: object

In [None]:
df[df['7/17/20'] > 500000]

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
28,,Brazil,-14.235,-51.9253,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,...,707412,739503,772416,802828,828810,850514,867624,888271,923189,955377,978142,1032913,1067579,1083341,1106470,1145906,1188631,1228114,1274974,1313667,1344143,1368195,1402041,1448753,1496858,1539081,1577004,1603055,1623284,1668589,1713160,1755779,1800827,1839850,1864681,1884967,1926824,1966748,2012151,2046328
131,,India,20.593684,78.96288,0,0,0,0,0,0,0,0,1,1,1,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,...,265928,276146,286605,297535,308993,320922,332424,343091,354065,366946,380532,395048,410451,425282,440215,456183,473105,490401,508953,528859,548318,566840,585481,604641,625544,648315,673165,697413,719664,742417,767296,793802,820916,849522,878254,906752,936181,968857,1003832,1039084
187,,Russia,61.52401,105.318756,0,0,0,0,0,0,0,0,0,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,...,476043,484630,493023,501800,510761,519458,528267,536484,544725,552549,560321,568292,576162,583879,591465,598878,606043,613148,619936,626779,633563,640246,646929,653479,660231,666941,673564,680283,686852,693215,699749,706240,712863,719449,726036,732547,738787,745197,751612,758001
225,,US,40.0,-100.0,1,1,2,2,5,5,5,5,5,7,8,8,11,11,11,11,11,11,11,11,12,12,13,13,13,13,13,13,13,13,15,15,15,15,15,15,...,1961785,1979912,2000706,2023656,2048986,2074542,2094366,2114026,2137731,2163290,2191099,2222579,2255328,2281767,2312303,2347491,2382426,2422299,2467554,2510259,2549864,2590668,2636414,2687588,2742049,2795361,2841241,2891124,2936077,2996098,3054699,3117946,3185737,3245925,3304942,3364157,3431574,3498902,3576157,3647715


In [None]:
df3 = df[df['7/17/20'] > 500000]

In [None]:
df3[['Province/State', 'Country/Region', '7/17/20']]

Unnamed: 0,Province/State,Country/Region,7/17/20
28,,Brazil,2046328
131,,India,1039084
187,,Russia,758001
225,,US,3647715


In [None]:
df3[df3['Country/Region'] != 'Russia']

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
28,,Brazil,-14.235,-51.9253,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,...,707412,739503,772416,802828,828810,850514,867624,888271,923189,955377,978142,1032913,1067579,1083341,1106470,1145906,1188631,1228114,1274974,1313667,1344143,1368195,1402041,1448753,1496858,1539081,1577004,1603055,1623284,1668589,1713160,1755779,1800827,1839850,1864681,1884967,1926824,1966748,2012151,2046328
131,,India,20.593684,78.96288,0,0,0,0,0,0,0,0,1,1,1,2,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,3,...,265928,276146,286605,297535,308993,320922,332424,343091,354065,366946,380532,395048,410451,425282,440215,456183,473105,490401,508953,528859,548318,566840,585481,604641,625544,648315,673165,697413,719664,742417,767296,793802,820916,849522,878254,906752,936181,968857,1003832,1039084
225,,US,40.0,-100.0,1,1,2,2,5,5,5,5,5,7,8,8,11,11,11,11,11,11,11,11,12,12,13,13,13,13,13,13,13,13,15,15,15,15,15,15,...,1961785,1979912,2000706,2023656,2048986,2074542,2094366,2114026,2137731,2163290,2191099,2222579,2255328,2281767,2312303,2347491,2382426,2422299,2467554,2510259,2549864,2590668,2636414,2687588,2742049,2795361,2841241,2891124,2936077,2996098,3054699,3117946,3185737,3245925,3304942,3364157,3431574,3498902,3576157,3647715


In [None]:
df3[df3['Country/Region'] == 'Russia']

Unnamed: 0,Province/State,Country/Region,Lat,Long,1/22/20,1/23/20,1/24/20,1/25/20,1/26/20,1/27/20,1/28/20,1/29/20,1/30/20,1/31/20,2/1/20,2/2/20,2/3/20,2/4/20,2/5/20,2/6/20,2/7/20,2/8/20,2/9/20,2/10/20,2/11/20,2/12/20,2/13/20,2/14/20,2/15/20,2/16/20,2/17/20,2/18/20,2/19/20,2/20/20,2/21/20,2/22/20,2/23/20,2/24/20,2/25/20,2/26/20,...,6/8/20,6/9/20,6/10/20,6/11/20,6/12/20,6/13/20,6/14/20,6/15/20,6/16/20,6/17/20,6/18/20,6/19/20,6/20/20,6/21/20,6/22/20,6/23/20,6/24/20,6/25/20,6/26/20,6/27/20,6/28/20,6/29/20,6/30/20,7/1/20,7/2/20,7/3/20,7/4/20,7/5/20,7/6/20,7/7/20,7/8/20,7/9/20,7/10/20,7/11/20,7/12/20,7/13/20,7/14/20,7/15/20,7/16/20,7/17/20
187,,Russia,61.52401,105.318756,0,0,0,0,0,0,0,0,0,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,...,476043,484630,493023,501800,510761,519458,528267,536484,544725,552549,560321,568292,576162,583879,591465,598878,606043,613148,619936,626779,633563,640246,646929,653479,660231,666941,673564,680283,686852,693215,699749,706240,712863,719449,726036,732547,738787,745197,751612,758001


In [None]:
df3['Country/Region'] != 'Russia'

28      True
131     True
187    False
225     True
Name: Country/Region, dtype: bool

In [None]:
df3.values