In [None]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import warnings
warnings.filterwarnings('ignore')
import copy

# View the dimensions or shape of the data

In [None]:
# Read the CSV (path is relative to the working directory), then show the
# frame's (rows, columns) shape as the cell output.
df = pd.read_csv(filepath_or_buffer='world_alcohol.csv')
df.shape

(100, 5)

In [None]:
# Format the frame's shape as a one-line summary: shape[0] is the row count,
# shape[1] the column count.
f"rows:{df.shape[0]} columns:{df.shape[1]}"

'rows:100 columns:5'

In [None]:
# Label-based slice: every row from the start of the index through label 1
# (the end label is included), with all columns.
df.loc[:1, :]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.0
1,1986,Americas,Uruguay,Other,0.5


In [None]:
# First five rows, restricted to the contiguous column range that runs from
# 'Year' through 'WHO region' (both ends included).
df.head().loc[:, 'Year':'WHO region']

Unnamed: 0,Year,WHO region
0,1986,Western Pacific
1,1986,Americas
2,1985,Africa
3,1986,Americas
4,1987,Americas


In [None]:
# Pick the two columns by an explicit list of names and show the first five rows.
df.head()[['Year', 'WHO region']]

Unnamed: 0,Year,WHO region
0,1986,Western Pacific
1,1986,Americas
2,1985,Africa
3,1986,Americas
4,1987,Americas


In [None]:
# Draw five random rows. The fixed seed makes the same rows come back on
# every Restart & Run All instead of a different sample each time.
df.sample(n=5, random_state=42)

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
83,1986,Europe,Ukraine,Other,
73,1986,Eastern Mediterranean,Pakistan,Other,0.01
0,1986,Western Pacific,Viet Nam,Wine,0.0
35,1985,Americas,Saint Kitts and Nevis,Spirits,2.24
76,1985,Africa,Comoros,Beer,0.02


In [None]:
# Draw a random 2% of the rows. Seeded so the sample is reproducible when the
# notebook is re-run.
df.sample(frac=0.02, random_state=42)

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
71,1985,Africa,Mali,Other,0.57
39,1987,Africa,Burkina Faso,Spirits,0.01


Find and drop the rows that contain missing values

In [None]:
# Discard every row that has at least one missing value. The name is rebound
# instead of using inplace=True; the surviving rows keep their original index
# labels, so the index has gaps where rows were removed.
df = df.dropna()

In [None]:
# Missing-value count per column (isna is the same check as isnull).
df.isna().sum()

Unnamed: 0,0
Year,0
WHO region,0
Country,0
Beverage Types,0
Display Value,0


In [None]:
# List each WHO region once, keeping the first occurrence of every value.
# inplace=True is deliberately not used: on a selected column it acts on a
# temporary Series, leaves df unchanged and shows no output.
df['WHO region'].drop_duplicates()

alcohol consumption of a given year from the world alcohol consumption dataset.

In [None]:
# Number of records per year, most frequent year first.
df.loc[:, 'Year'].value_counts()

Unnamed: 0_level_0,count
Year,Unnamed: 1_level_1
1986,21
1987,20
1985,18
1984,18
1989,18


In [None]:
# First ten records whose year is either 1987 or 1989.
df[df['Year'].isin([1987, 1989])].head(10)

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
4,1987,Americas,Saint Kitts and Nevis,Beer,1.98
5,1987,Americas,Guatemala,Other,0.0
6,1987,Africa,Mauritius,Wine,0.13
10,1987,Africa,Botswana,Wine,0.2
11,1989,Americas,Guatemala,Beer,0.62
15,1987,Africa,Guinea-Bissau,Wine,0.07
17,1989,Africa,Seychelles,Beer,2.23
21,1989,Americas,Costa Rica,Spirits,4.51
28,1987,Western Pacific,Viet Nam,Beer,0.11
32,1989,Africa,Mauritius,Beer,1.6


Alcohol consumption details by the 'Americas' in the year '1989'

In [None]:
# Records reported for the 'Americas' region in 1989.
df.loc[df['Year'].eq(1989) & df['WHO region'].eq('Americas')]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
11,1989,Americas,Guatemala,Beer,0.62
21,1989,Americas,Costa Rica,Spirits,4.51
55,1989,Americas,Suriname,Wine,0.04
64,1989,Americas,Bolivia (Plurinational State of),Beer,1.26
78,1989,Americas,Jamaica,Other,0.0


Alcohol consumption details in the year '1986' where WHO region is 'Western Pacific' and country is 'Viet Nam'

In [None]:
# Records that satisfy all three conditions at once: year 1986, country
# 'Viet Nam', region 'Western Pacific'.
df.loc[
    (df['Year'] == 1986)
    & (df['Country'] == 'Viet Nam')
    & (df['WHO region'] == 'Western Pacific')
]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.0


alcohol consumption details in the year '1986' or '1989' where WHO region is 'Americas'

In [None]:
# 'Americas' records from either 1986 or 1989.
df.loc[df['WHO region'].eq('Americas') & df['Year'].isin([1986, 1989])]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
1,1986,Americas,Uruguay,Other,0.5
3,1986,Americas,Colombia,Beer,4.27
8,1986,Americas,Antigua and Barbuda,Spirits,1.55
11,1989,Americas,Guatemala,Beer,0.62
21,1989,Americas,Costa Rica,Spirits,4.51
47,1986,Americas,Mexico,Other,0.04
55,1989,Americas,Suriname,Wine,0.04
64,1989,Americas,Bolivia (Plurinational State of),Beer,1.26
74,1986,Americas,Bolivia (Plurinational State of),Spirits,2.06
78,1989,Americas,Jamaica,Other,0.0


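Consumption of beverages per person average >=5 and Beverage Types is Beer. Note: the groupby cell below does not filter rows; it counts records per beverage type on each side of the >=5 threshold, so the answer is the row where Display Value is True and Beverage Types is Beer.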

In [None]:
# Column labels of the frame (for a DataFrame, keys() returns the columns Index).
df.keys()

Index(['Year', 'WHO region', 'Country', 'Beverage Types', 'Display Value'], dtype='object')

In [None]:
# Count records per beverage type inside two groups - Display Value below 5
# (False) and Display Value of 5 or more (True) - then flatten the grouped
# result into a plain table. This counts rows; it does not filter them.
df.groupby(df['Display Value'].ge(5))['Beverage Types'].value_counts().reset_index()

Unnamed: 0,Display Value,Beverage Types,count
0,False,Wine,25
1,False,Beer,23
2,False,Other,22
3,False,Spirits,21
4,True,Wine,2
5,True,Beer,1
6,True,Other,1


Records where the average consumption per person is >=4 and Beverage Types is Beer, Wine or Spirits

In [None]:
# Records with a Display Value of at least 4 whose beverage type is one of
# Beer, Wine or Spirits.
df.loc[
    df['Display Value'].ge(4)
    & df['Beverage Types'].isin(['Beer', 'Wine', 'Spirits'])
]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
3,1986,Americas,Colombia,Beer,4.27
21,1989,Americas,Costa Rica,Spirits,4.51
41,1986,Europe,Czech Republic,Beer,6.82
57,1989,Europe,Croatia,Wine,5.1
91,1989,Europe,Bulgaria,Beer,4.43
96,1985,Europe,Luxembourg,Wine,7.38


In [None]:
# Records whose region name contains the lowercase sequence 'ea'. The match
# is case-sensitive and the pattern is treated as a regular expression (both
# are the defaults, spelled out here).
df.loc[df['WHO region'].str.contains('ea', case=True, regex=True)]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
13,1984,Eastern Mediterranean,Afghanistan,Other,0.0
25,1984,Eastern Mediterranean,Tunisia,Other,0.0
27,1984,Eastern Mediterranean,Bahrain,Beer,2.22
36,1987,Eastern Mediterranean,Egypt,Beer,0.07
38,1987,Eastern Mediterranean,Qatar,Other,0.0
52,1986,Eastern Mediterranean,Saudi Arabia,Wine,0.0
53,1984,Eastern Mediterranean,Kuwait,Beer,0.0
58,1984,Eastern Mediterranean,Somalia,Spirits,0.0
59,1989,Eastern Mediterranean,Syrian Arab Republic,Other,0.0
60,1987,Eastern Mediterranean,Iran (Islamic Republic of),Other,0.0


In [None]:
# Records that belong to any of the three listed WHO regions.
df.loc[
    df['WHO region'].isin([
        'Africa',
        'Eastern Mediterranean',
        'Europe',
    ])
]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
2,1985,Africa,Cte d'Ivoire,Wine,1.62
6,1987,Africa,Mauritius,Wine,0.13
7,1985,Africa,Angola,Spirits,0.39
9,1984,Africa,Nigeria,Other,6.10
10,1987,Africa,Botswana,Wine,0.20
...,...,...,...,...,...
92,1986,Africa,Eritrea,Spirits,0.00
94,1985,Europe,Ukraine,Spirits,3.06
95,1984,Africa,Niger,Other,0.00
96,1985,Europe,Luxembourg,Wine,7.38


In [None]:
# Regions to exclude; the ~ operator inverts the membership mask so only
# records from every other region remain.
who_region = [
    "Africa",
    "Eastern Mediterranean",
    "Europe",
]
df.loc[~df["WHO region"].isin(who_region), :]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.0
1,1986,Americas,Uruguay,Other,0.5
3,1986,Americas,Colombia,Beer,4.27
4,1987,Americas,Saint Kitts and Nevis,Beer,1.98
5,1987,Americas,Guatemala,Other,0.0
8,1986,Americas,Antigua and Barbuda,Spirits,1.55
11,1989,Americas,Guatemala,Beer,0.62
12,1985,Western Pacific,Lao People's Democratic Republic,Beer,0.0
14,1985,Western Pacific,Viet Nam,Spirits,0.05
16,1984,Americas,Costa Rica,Wine,0.06


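Filter all records where the average consumption of beverages per person is from .5 to 2.50. Note: the cell below does not apply this range; it counts the Wine records whose Display Value is greater than .2.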

In [None]:
# Keep the Wine records whose Display Value is greater than .2, then count
# the non-missing entries in each column of that subset.
df.loc[df['Beverage Types'].eq('Wine') & df['Display Value'].gt(.2)].count()

Unnamed: 0,0
Year,9
WHO region,9
Country,9
Beverage Types,9
Display Value,9


In [None]:
# Select rows by index label rather than by content: keep the rows whose
# label, written as text, ends in the digit 0.
df.loc[df.index.astype(str).str.contains('0$', regex=True)]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.0
10,1987,Africa,Botswana,Wine,0.2
20,1986,South-East Asia,Myanmar,Wine,0.0
30,1986,Africa,Sierra Leone,Other,4.48
40,1987,Europe,Austria,Spirits,1.9
50,1985,Europe,Switzerland,Other,0.3
60,1987,Eastern Mediterranean,Iran (Islamic Republic of),Other,0.0
70,1986,Africa,Madagascar,Spirits,1.02
80,1985,Africa,Malawi,Other,0.84
90,1989,Africa,Malawi,Wine,0.01


In [None]:
# Label-based slice on both axes: row labels 0 through 9 and the columns from
# 'Year' through 'Display Value'; both end labels are included.
df.loc[slice(0, 9), slice('Year', 'Display Value')]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.0
1,1986,Americas,Uruguay,Other,0.5
2,1985,Africa,Cte d'Ivoire,Wine,1.62
3,1986,Americas,Colombia,Beer,4.27
4,1987,Americas,Saint Kitts and Nevis,Beer,1.98
5,1987,Americas,Guatemala,Other,0.0
6,1987,Africa,Mauritius,Wine,0.13
7,1985,Africa,Angola,Spirits,0.39
8,1986,Americas,Antigua and Barbuda,Spirits,1.55
9,1984,Africa,Nigeria,Other,6.1


In [None]:
# Keep only the columns in which every value is truthy; a column holding a
# zero anywhere (such as a 0.0 consumption figure) is left out.
df.loc[:, df.all(axis='index')]

Unnamed: 0,Year,WHO region,Country,Beverage Types
0,1986,Western Pacific,Viet Nam,Wine
1,1986,Americas,Uruguay,Other
2,1985,Africa,Cte d'Ivoire,Wine
3,1986,Americas,Colombia,Beer
4,1987,Americas,Saint Kitts and Nevis,Beer
...,...,...,...,...
95,1984,Africa,Niger,Other
96,1985,Europe,Luxembourg,Wine
97,1984,South-East Asia,Indonesia,Wine
98,1984,Africa,Equatorial Guinea,Wine


In [None]:
# Keep the columns that contain at least one truthy (non-zero, non-empty) value.
df.loc[:, df.any(axis='index')]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.00
1,1986,Americas,Uruguay,Other,0.50
2,1985,Africa,Cte d'Ivoire,Wine,1.62
3,1986,Americas,Colombia,Beer,4.27
4,1987,Americas,Saint Kitts and Nevis,Beer,1.98
...,...,...,...,...,...
95,1984,Africa,Niger,Other,0.00
96,1985,Europe,Luxembourg,Wine,7.38
97,1984,South-East Asia,Indonesia,Wine,0.00
98,1984,Africa,Equatorial Guinea,Wine,0.00


In [None]:
# Keep the columns that have no missing values at all
# ("every value present" expressed as "not any value missing").
df.loc[:, ~df.isna().any()]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.00
1,1986,Americas,Uruguay,Other,0.50
2,1985,Africa,Cte d'Ivoire,Wine,1.62
3,1986,Americas,Colombia,Beer,4.27
4,1987,Americas,Saint Kitts and Nevis,Beer,1.98
...,...,...,...,...,...
95,1984,Africa,Niger,Other,0.00
96,1985,Europe,Luxembourg,Wine,7.38
97,1984,South-East Asia,Indonesia,Wine,0.00
98,1984,Africa,Equatorial Guinea,Wine,0.00


In [None]:
# Keep the columns that contain at least one missing value
# ("any value missing" expressed as "not every value present").
# The result has no columns once rows with missing values have been dropped.
df.loc[:, ~df.notna().all()]

0
1
2
3
4
...
95
96
97
98
99


In [None]:
# Return (without modifying df) the rows in which every column has a value,
# i.e. drop any row that has at least one missing entry.
df[df.notna().all(axis=1)]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
0,1986,Western Pacific,Viet Nam,Wine,0.00
1,1986,Americas,Uruguay,Other,0.50
2,1985,Africa,Cte d'Ivoire,Wine,1.62
3,1986,Americas,Colombia,Beer,4.27
4,1987,Americas,Saint Kitts and Nevis,Beer,1.98
...,...,...,...,...,...
95,1984,Africa,Niger,Other,0.00
96,1985,Europe,Luxembourg,Wine,7.38
97,1984,South-East Asia,Indonesia,Wine,0.00
98,1984,Africa,Equatorial Guinea,Wine,0.00


In [None]:
# Position-based selection: all rows, every second column starting with the
# first one (positions 0, 2, 4, ...).
df.iloc[:, ::2]

Unnamed: 0,Year,Country,Display Value
0,1986,Viet Nam,0.00
1,1986,Uruguay,0.50
2,1985,Cte d'Ivoire,1.62
3,1986,Colombia,4.27
4,1987,Saint Kitts and Nevis,1.98
...,...,...,...
95,1984,Niger,0.00
96,1985,Luxembourg,7.38
97,1984,Indonesia,0.00
98,1984,Equatorial Guinea,0.00


In [None]:
# Start at the row labelled 1, then take every fifth row after it. The step
# counts row positions, not labels, so labels jump unevenly wherever rows
# were removed from the index.
df.loc[1:].iloc[::5]

Unnamed: 0,Year,WHO region,Country,Beverage Types,Display Value
1,1986,Americas,Uruguay,Other,0.5
6,1987,Africa,Mauritius,Wine,0.13
11,1989,Americas,Guatemala,Beer,0.62
16,1984,Americas,Costa Rica,Wine,0.06
21,1989,Americas,Costa Rica,Spirits,4.51
27,1984,Eastern Mediterranean,Bahrain,Beer,2.22
33,1985,Africa,Mauritania,Other,0.0
38,1987,Eastern Mediterranean,Qatar,Other,0.0
43,1984,Western Pacific,China,Wine,0.03
49,1986,Europe,Malta,Wine,1.49
