# **Importing libraries**

In [23]:
#importing processing packages
import numpy as np
import pandas as pd
import scipy as sc

#importing visualization packages
import matplotlib.pyplot as plt
import plotly.express as px
import plotly.graph_objects as go
import seaborn as sns
import bokeh as bk

#importing warnings
import warnings
warnings.filterwarnings("ignore")

# **Importing Dataset**

In [24]:
# Load the pre-processed CSV produced in part 1 of this analysis.
# NOTE(review): this is an absolute, machine-specific path; the cell only runs
# on a machine where this exact file exists.
csv_path = "E:/Analyzing_Unemployment_rate_across_the_world/Business Case Studies/2ndpart.csv"
data = pd.read_csv(csv_path, na_values='NaN')
data.head()

Unnamed: 0.1,Unnamed: 0,Country Name,Country Code,1991,1992,1993,1994,1995,1996,1997,...,2019,2020,2021,code_3,continent,sub_region,average,91-20,20-21,21-22
0,0,Afghanistan,AFG,10.65,10.82,10.72,10.73,11.18,10.96,10.78,...,11.22,11.71,13.28,AFG,Asia,Southern Asia,11.14129,-0.16,-0.54,-0.36
1,1,Albania,ALB,10.31,30.01,25.26,20.84,14.61,13.93,16.88,...,11.47,13.33,11.82,ALB,Europe,Southern Europe,16.318065,-8.72,4.94,0.76
2,2,Algeria,DZA,20.6,24.38,26.23,27.74,31.84,28.53,25.43,...,10.51,12.55,12.7,DZA,Africa,Northern Africa,17.926129,-9.17,19.81,-2.59
3,3,Angola,AGO,4.21,4.21,4.23,4.16,4.11,4.1,4.09,...,7.42,8.33,8.53,AGO,Africa,Middle Africa,5.452258,0.18,-5.4,1.1
4,4,Argentina,ARG,5.44,6.36,10.1,11.76,18.8,17.11,14.82,...,9.84,11.46,10.9,ARG,Americas,South America,10.977742,-9.56,7.29,-3.75


# **Retrieving all Asian continent countries**

In [25]:
# Distinct country names present in the dataset
pd.unique(data['Country Name'])

array(['Afghanistan', 'Albania', 'Algeria', 'Angola', 'Argentina',
       'Armenia', 'Australia', 'Austria', 'Azerbaijan', 'Bahamas, The',
       'Bahrain', 'Bangladesh', 'Barbados', 'Belarus', 'Belgium',
       'Belize', 'Benin', 'Bhutan', 'Bolivia', 'Bosnia and Herzegovina',
       'Botswana', 'Brazil', 'Brunei Darussalam', 'Bulgaria',
       'Burkina Faso', 'Burundi', 'Cabo Verde', 'Cambodia', 'Cameroon',
       'Canada', 'Central African Republic', 'Chad', 'Chile', 'China',
       'Colombia', 'Comoros', 'Congo, Dem. Rep.', 'Congo, Rep.',
       'Costa Rica', "Cote d'Ivoire", 'Croatia', 'Cuba', 'Cyprus',
       'Czech Republic', 'Denmark', 'Djibouti', 'Dominican Republic',
       'Ecuador', 'Egypt, Arab Rep.', 'El Salvador', 'Equatorial Guinea',
       'Eritrea', 'Estonia', 'Eswatini', 'Ethiopia', 'Fiji', 'Finland',
       'France', 'French Polynesia', 'Gabon', 'Gambia, The', 'Georgia',
       'Germany', 'Ghana', 'Greece', 'Guam', 'Guatemala', 'Guinea',
       'Guinea-Bissau', 'Guya

In [26]:
# Keep only the rows whose continent is 'Asia' and discard the identifier
# columns that the rest of the notebook does not use.
# Filtering and dropping in a single expression produces a new frame, instead
# of calling drop(..., inplace=True) on a filtered slice of `data` (which
# raises SettingWithCopyWarning, hidden here by the global warnings filter).
data_asia = (
    data.loc[data['continent'] == 'Asia']
    .drop(columns=['Unnamed: 0', 'Country Code', 'code_3'])
)

data_asia.head()

Unnamed: 0,Country Name,1991,1992,1993,1994,1995,1996,1997,1998,1999,...,2018,2019,2020,2021,continent,sub_region,average,91-20,20-21,21-22
0,Afghanistan,10.65,10.82,10.72,10.73,11.18,10.96,10.78,10.8,10.81,...,11.15,11.22,11.71,13.28,Asia,Southern Asia,11.14129,-0.16,-0.54,-0.36
5,Armenia,1.6,1.8,5.3,6.6,6.7,9.3,10.8,9.4,11.2,...,18.97,18.3,21.21,20.9,Asia,Western Asia,12.922581,-9.45,-7.96,-2.2
8,Azerbaijan,0.9,1.8,4.5,6.3,7.2,8.1,9.1,10.0,10.9,...,4.9,4.85,6.46,6.58,Asia,Western Asia,6.592581,-10.88,6.15,-0.83
10,Bahrain,1.01,1.05,1.01,1.11,1.08,1.08,1.09,1.08,1.09,...,1.2,1.2,1.78,1.87,Asia,Western Asia,1.164839,-0.07,-0.05,-0.65
11,Bangladesh,2.2,2.33,2.36,2.38,2.48,2.51,2.69,2.9,3.06,...,4.41,4.44,5.41,5.23,Asia,Southern Asia,3.757419,-1.07,-0.11,-2.03


In [27]:
# Bar chart of the `average` column for every Asian country.
# The frame and column names are passed explicitly so the `labels` mapping
# refers to a column that is actually plotted; the previous keys
# ('index' / 'value') matched nothing, so the y axis was never relabelled.
fig = px.bar(data_asia, x='Country Name', y='average', height=500, width=1000,
             labels={'average': 'Unemployment Rate'},
             title='Unemployment Rate of ASIAN Countries')
fig.show()

# **Transposing Dataset**

In [28]:
# Reshape the Asian data to one row per year and one column per country.
#
# The non-year columns are removed and the country name is moved into the index
# BEFORE transposing, so the transposed frame holds only the yearly values and
# keeps a numeric dtype (transposing with the name row still present turns
# every column into object dtype). This also replaces the duplicated
# "row 0 becomes the header" assignment and the chain of in-place edits.
data_n = (
    data_asia
    .drop(columns=['continent', 'sub_region', 'average', '91-20', '20-21', '21-22'])
    .set_index('Country Name')
    .T                                   # rows: years, columns: countries
    .sort_index(axis=1)                  # countries in alphabetical order
    .reset_index()                       # former column labels (years) become a column
    .rename(columns={'index': 'year'})
)
data_n.head()

Country Name,year,Afghanistan,Armenia,Azerbaijan,Bahrain,Bangladesh,Bhutan,Brunei Darussalam,Cambodia,China,...,Tajikistan,Thailand,Timor-Leste,Turkiye,Turkmenistan,United Arab Emirates,Uzbekistan,Vietnam,West Bank and Gaza,"Yemen, Rep."
0,1991,10.65,1.6,0.9,1.01,2.2,1.41,4.7,0.73,2.37,...,1.9,2.63,3.54,8.21,1.4,1.87,1.9,2.09,11.6,8.32
1,1992,10.82,1.8,1.8,1.05,2.33,1.45,4.86,0.75,2.37,...,2.1,1.35,3.53,8.51,1.5,1.84,2.9,1.91,11.31,8.31
2,1993,10.72,5.3,4.5,1.01,2.36,1.41,4.82,0.8,2.69,...,6.2,1.49,3.52,8.96,1.5,1.85,4.9,1.97,11.29,8.35
3,1994,10.73,6.6,6.3,1.11,2.38,1.43,5.03,1.33,2.9,...,8.8,1.35,3.54,8.58,4.7,1.81,7.3,1.93,11.15,8.34
4,1995,11.18,6.7,7.2,1.08,2.48,1.45,5.18,0.78,3.0,...,10.3,1.1,3.53,7.64,8.3,1.8,7.8,1.9,11.1,8.96


# **ASIAN COUNTRIES**

**Visualizing the performance of every country over the years**
**Countries are divided into two halves. The first consists of Asian, Oceanian and Arab countries. The second consists of American, European and African countries.**

In [29]:
# One entry per distinct sub-region of data_asia, plus a parallel list holding
# the 'Country Name' Series of the countries in that sub-region.
sub_regions = list(data_asia['sub_region'].unique())
countries = [
    data_asia.loc[data_asia['sub_region'] == region, 'Country Name']
    for region in sub_regions
]

In [30]:
# One line chart per sub-region, one line per country.
# The `year` column is used explicitly for the x axis; plotting the selected
# country columns alone put the row position (0, 1, 2, ...) on the x axis and
# merely labelled it "Year".
for region, region_countries in zip(sub_regions, countries):
    fig = px.line(data_n, x='year', y=list(region_countries), title=region,
                  labels={'year': 'Year', 'value': 'Unemployment Rate'})
    fig.show()

In [31]:
# Copy of data_asia without the pre-computed summary columns
sample_data_asia = data_asia.drop(columns=['average', '91-20', '20-21', '21-22'])

**Checking for the performance of every country by classifying it as good or bad WRT each year**

In [35]:
# Subset of data_asia used for the crisis comparison: the country name
# (renamed to country_name), five selected years and the two region columns.
data_ac = (
    data_asia[['Country Name', '1995', '1997', '1999', '2002', '2004',
               'continent', 'sub_region']]
    .rename(columns={'Country Name': 'country_name'})
)
data_ac.head()



Unnamed: 0,country_name,1995,1997,1999,2002,2004,continent,sub_region
0,Afghanistan,11.18,10.78,10.81,11.26,10.99,Asia,Southern Asia
5,Armenia,6.7,10.8,11.2,10.78,10.34,Asia,Western Asia
8,Azerbaijan,7.2,9.1,10.9,10.04,7.99,Asia,Western Asia
10,Bahrain,1.08,1.09,1.09,1.11,1.09,Asia,Western Asia
11,Bangladesh,2.48,2.69,3.06,3.9,4.26,Asia,Southern Asia


In [37]:
# Differences measured against the 1997 rate.
#   pre_financial     = 1997 - 1995
#   post_financial    = 1997 - 1999
#   recovered_yr      = 1997 - 2002
#   recovered_yr_2004 = 1997 - 2004
# For the last three, a positive value means the later rate is below the 1997 rate.
data_ac = data_ac.assign(
    pre_financial=data_ac['1997'].sub(data_ac['1995']),
    post_financial=data_ac['1997'].sub(data_ac['1999']),
    recovered_yr=data_ac['1997'].sub(data_ac['2002']),
    recovered_yr_2004=data_ac['1997'].sub(data_ac['2004']),
)
data_ac.head()

Unnamed: 0,country_name,1995,1997,1999,2002,2004,continent,sub_region,pre_financial,post_financial,recovered_yr,recovered_yr_2004
0,Afghanistan,11.18,10.78,10.81,11.26,10.99,Asia,Southern Asia,-0.4,-0.03,-0.48,-0.21
5,Armenia,6.7,10.8,11.2,10.78,10.34,Asia,Western Asia,4.1,-0.4,0.02,0.46
8,Azerbaijan,7.2,9.1,10.9,10.04,7.99,Asia,Western Asia,1.9,-1.8,-0.94,1.11
10,Bahrain,1.08,1.09,1.09,1.11,1.09,Asia,Western Asia,0.01,0.0,-0.02,0.0
11,Bangladesh,2.48,2.69,3.06,3.9,4.26,Asia,Southern Asia,0.21,-0.37,-1.21,-1.57


In [38]:
# Countries whose 1999 rate is already below their 1997 rate
below_1997_in_1999 = data_ac['post_financial'].gt(0)
data_recovered_1999 = data_ac.loc[below_1997_in_1999]
data_recovered_1999.head()

Unnamed: 0,country_name,1995,1997,1999,2002,2004,continent,sub_region,pre_financial,post_financial,recovered_yr,recovered_yr_2004
27,Cambodia,0.78,0.91,0.9,1.1,1.13,Asia,South-Eastern Asia,0.13,0.01,-0.19,-0.22
78,Iraq,8.96,8.77,8.75,8.85,8.61,Asia,Western Asia,-0.19,0.02,-0.08,0.16
91,Lao PDR,2.6,2.38,2.11,1.8,1.51,Asia,South-Eastern Asia,-0.22,0.27,0.58,0.87
93,Lebanon,8.52,8.62,8.44,8.09,7.85,Asia,Western Asia,0.1,0.18,0.53,0.77
114,Myanmar,0.69,0.71,0.67,0.67,0.67,Asia,South-Eastern Asia,0.02,0.04,0.04,0.04


In [39]:
# Countries still above their 1997 rate in 1999 but below it by 2002
above_1997_in_1999 = data_ac['post_financial'].lt(0)
below_1997_in_2002 = data_ac['recovered_yr'].gt(0)
data_recovered_2002 = data_ac.loc[above_1997_in_1999 & below_1997_in_2002]
data_recovered_2002.head()

Unnamed: 0,country_name,1995,1997,1999,2002,2004,continent,sub_region,pre_financial,post_financial,recovered_yr,recovered_yr_2004
5,Armenia,6.7,10.8,11.2,10.78,10.34,Asia,Western Asia,4.1,-0.4,0.02,0.46
42,Cyprus,2.6,3.4,5.7,3.3,4.33,Asia,Western Asia,0.8,-2.3,0.1,-0.93
75,India,5.76,5.61,5.74,5.53,5.63,Asia,Southern Asia,-0.15,-0.13,0.08,-0.02
85,Kazakhstan,10.98,13.01,13.46,9.33,8.4,Asia,Central Asia,2.03,-0.45,3.68,4.61
116,Nepal,1.74,1.83,1.85,1.54,1.55,Asia,Southern Asia,0.09,-0.02,0.29,0.28


In [41]:
# Countries above their 1997 rate in both 1999 and 2002 but below it by 2004
still_above_1999 = data_ac['post_financial'].lt(0)
still_above_2002 = data_ac['recovered_yr'].lt(0)
below_1997_in_2004 = data_ac['recovered_yr_2004'].gt(0)
data_recovered_2004 = data_ac.loc[still_above_1999 & still_above_2002 & below_1997_in_2004]
data_recovered_2004.head()

Unnamed: 0,country_name,1995,1997,1999,2002,2004,continent,sub_region,pre_financial,post_financial,recovered_yr,recovered_yr_2004
8,Azerbaijan,7.2,9.1,10.9,10.04,7.99,Asia,Western Asia,1.9,-1.8,-0.94,1.11
131,Philippines,3.63,3.62,3.69,3.63,3.55,Asia,South-Eastern Asia,-0.01,-0.07,-0.01,0.07
161,Tajikistan,10.3,13.9,15.4,14.41,13.61,Asia,Central Asia,3.6,-1.5,-0.51,0.29
164,Timor-Leste,3.53,3.56,3.93,3.57,3.48,Asia,South-Eastern Asia,0.03,-0.37,-0.01,0.08


The Countries Most and Least Affected by the 1997 Asian Financial Crisis

In [43]:
# Working frame for the crisis-impact analysis: country name, the yearly rates
# for 1997-2003 and the region columns, plus a zero-filled diff_1997 column
# placed right after the country name.
affected_years = ['1997', '1998', '1999', '2000', '2001', '2002', '2003']
data_affected = (
    data_asia[['Country Name', *affected_years, 'continent', 'sub_region']]
    .rename(columns={'Country Name': 'country_name'})
)
data_affected.insert(1, 'diff_1997', 0)
data_affected.head()

Unnamed: 0,country_name,diff_1997,1997,1998,1999,2000,2001,2002,2003,continent,sub_region
0,Afghanistan,0,10.78,10.8,10.81,10.81,10.81,11.26,11.14,Asia,Southern Asia
5,Armenia,0,10.8,9.4,11.2,11.05,10.91,10.78,10.59,Asia,Western Asia
8,Azerbaijan,0,9.1,10.0,10.9,11.78,10.91,10.04,9.17,Asia,Western Asia
10,Bahrain,0,1.09,1.08,1.09,1.08,1.11,1.11,1.09,Asia,Western Asia
11,Bangladesh,0,2.69,2.9,3.06,3.27,3.62,3.9,4.32,Asia,Southern Asia


In [44]:
# Year-over-year change in unemployment rate for each country, 1997 through 2003
def diff_unp_rate(col_name,year1,year2):
    """Write data_affected[year1] - data_affected[year2] into data_affected[col_name].

    Operates on the module-level data_affected frame and returns nothing.
    """
    data_affected[col_name] = data_affected[year1].sub(data_affected[year2])

year1 = [str(year) for year in range(1997, 2003)]   # '1997' .. '2002'
year2 = [str(year) for year in range(1998, 2004)]   # '1998' .. '2003'
col_name = ['diff_' + year for year in year2]       # 'diff_1998' .. 'diff_2003'
for target, earlier, later in zip(col_name, year1, year2):
    diff_unp_rate(target, earlier, later)

In [46]:
data_affected.head()

Unnamed: 0,country_name,diff_1997,1997,1998,1999,2000,2001,2002,2003,continent,sub_region,diff_1998,diff_1999,diff_2000,diff_2001,diff_2002,diff_2003
0,Afghanistan,0,10.78,10.8,10.81,10.81,10.81,11.26,11.14,Asia,Southern Asia,-0.02,-0.01,0.0,0.0,-0.45,0.12
5,Armenia,0,10.8,9.4,11.2,11.05,10.91,10.78,10.59,Asia,Western Asia,1.4,-1.8,0.15,0.14,0.13,0.19
8,Azerbaijan,0,9.1,10.0,10.9,11.78,10.91,10.04,9.17,Asia,Western Asia,-0.9,-0.9,-0.88,0.87,0.87,0.87
10,Bahrain,0,1.09,1.08,1.09,1.08,1.11,1.11,1.09,Asia,Western Asia,0.01,-0.01,0.01,-0.03,0.0,0.02
11,Bangladesh,0,2.69,2.9,3.06,3.27,3.62,3.9,4.32,Asia,Southern Asia,-0.21,-0.16,-0.21,-0.35,-0.28,-0.42


In [49]:
# Keep only the country name and the diff_* columns; the raw yearly rates and
# the region columns are not needed for the cumulative sums that follow.
data_affected = data_affected.drop(
    columns=['1997', '1998', '1999', '2000', '2001', '2002', '2003',
             'continent', 'sub_region']
)
data_affected.head()

Unnamed: 0,country_name,diff_1997,diff_1998,diff_1999,diff_2000,diff_2001,diff_2002,diff_2003
0,Afghanistan,0,-0.02,-0.01,0.0,0.0,-0.45,0.12
5,Armenia,0,1.4,-1.8,0.15,0.14,0.13,0.19
8,Azerbaijan,0,-0.9,-0.9,-0.88,0.87,0.87,0.87
10,Bahrain,0,0.01,-0.01,0.01,-0.03,0.0,0.02
11,Bangladesh,0,-0.21,-0.16,-0.21,-0.35,-0.28,-0.42


In [50]:

def cum_freq(year1,year2):
    """Add column year1 of data_affected into column year2 (running total step).

    Operates on the module-level data_affected frame and returns nothing.
    """
    data_affected[year2] = data_affected[year1].add(data_affected[year2])

# Consecutive column pairs: each diff column is folded into the next one, so
# after the loop diff_YYYY holds the sum of the yearly changes from 1998 to YYYY.
diff_columns = ['diff_1998', 'diff_1999', 'diff_2000', 'diff_2001', 'diff_2002', 'diff_2003']
cumulative_frq1 = diff_columns[:-1]
cumulative_frq2 = diff_columns[1:]
for previous_col, current_col in zip(cumulative_frq1, cumulative_frq2):
    cum_freq(previous_col, current_col)

# Order the countries by their cumulative value in the diff_2003 column, smallest first
data_affected = data_affected.sort_values(by='diff_2003', ascending=True, axis=0)

In [51]:
data_affected.head()

Unnamed: 0,country_name,diff_1997,diff_1998,diff_1999,diff_2000,diff_2001,diff_2002,diff_2003
182,West Bank and Gaza,0,0.11,0.19,0.2,-10.66,-16.63,-12.17
72,"Hong Kong SAR, China",0,-2.36,-4.03,-2.7,-2.87,-5.06,-5.64
103,Maldives,0,-0.23,-0.47,-0.7,-1.73,-2.92,-4.12
80,Israel,0,-1.0,-1.43,-1.35,-2.06,-3.14,-3.76
169,Turkiye,0,-0.05,-0.85,0.34,-1.54,-3.52,-3.7


In [52]:
# Reshape the cumulative differences to one row per diff_* label and one
# column per country.
#
# The country name is moved into the index BEFORE transposing, so the result
# keeps a numeric dtype (transposing with the name row still present turns
# every column into object dtype). This also replaces the duplicated
# "row 0 becomes the header" assignment and the chain of in-place edits.
data_n1 = (
    data_affected
    .set_index('country_name')
    .T                                   # rows: diff_* labels, columns: countries
    .sort_index(axis=1)                  # countries in alphabetical order
    .reset_index()                       # diff_* labels become a regular column
    .rename(columns={'index': 'year'})
)
data_n1

country_name,year,Afghanistan,Armenia,Azerbaijan,Bahrain,Bangladesh,Bhutan,Brunei Darussalam,Cambodia,China,...,Tajikistan,Thailand,Timor-Leste,Turkiye,Turkmenistan,United Arab Emirates,Uzbekistan,Vietnam,West Bank and Gaza,"Yemen, Rep."
0,diff_1997,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,diff_1998,-0.02,1.4,-0.9,0.01,-0.21,0.0,-0.14,-0.03,-0.01,...,-2.6,-2.53,-0.05,-0.05,-1.2,-0.16,-2.4,0.58,0.11,-0.61
2,diff_1999,-0.03,-0.4,-1.8,0.0,-0.37,0.0,-0.38,0.01,-0.02,...,-1.5,-2.1,-0.37,-0.85,-1.7,-0.24,-2.4,0.54,0.19,-1.26
3,diff_2000,-0.03,-0.25,-2.68,0.01,-0.58,-0.19,-0.49,-0.06,-0.03,...,-1.23,-1.52,0.15,0.34,-0.54,-0.27,-1.33,0.61,0.2,-1.36
4,diff_2001,-0.03,-0.11,-1.81,-0.02,-0.93,-0.5,-0.59,-0.12,-0.57,...,-0.87,-1.73,0.19,-1.54,0.32,-0.51,-0.3,0.11,-10.66,-1.51
5,diff_2002,-0.48,0.02,-0.94,-0.02,-1.21,-0.49,-0.75,-0.19,-1.01,...,-0.51,-0.95,-0.01,-3.52,1.25,-0.67,0.75,0.75,-16.63,-1.64
6,diff_2003,-0.36,0.21,-0.07,0.0,-1.63,-0.4,-0.82,-0.2,-1.35,...,-0.12,-0.67,0.04,-3.7,2.01,-0.77,1.79,0.62,-12.17,-1.77


In [55]:
# One entry per distinct sub-region of data_asia, plus a parallel list holding
# the 'Country Name' Series of the countries in that sub-region.
sub_regions = list(data_asia['sub_region'].unique())
countries = [
    data_asia.loc[data_asia['sub_region'] == region, 'Country Name']
    for region in sub_regions
]

In [56]:
# One line chart per sub-region of the cumulative differences, one line per country.
# The `year` column (diff_1997 ... diff_2003) is used explicitly for the x axis;
# plotting the selected country columns alone put the row position (0..6) on
# the x axis and merely labelled it "Year".
for region, region_countries in zip(sub_regions, countries):
    fig = px.line(data_n1, x='year', y=list(region_countries), title=region,
                  labels={'year': 'Year', 'value': 'Unemployment Rate'})
    fig.show()

In [57]:
# data_affected is sorted by diff_2003 in ascending order; take the first ten
# and the last ten rows of that ordering.
data_first_10 = data_affected.iloc[:10]
data_last_10 = data_affected.iloc[-10:]
data_first_10

Unnamed: 0,country_name,diff_1997,diff_1998,diff_1999,diff_2000,diff_2001,diff_2002,diff_2003
182,West Bank and Gaza,0,0.11,0.19,0.2,-10.66,-16.63,-12.17
72,"Hong Kong SAR, China",0,-2.36,-4.03,-2.7,-2.87,-5.06,-5.64
103,Maldives,0,-0.23,-0.47,-0.7,-1.73,-2.92,-4.12
80,Israel,0,-1.0,-1.43,-1.35,-2.06,-3.14,-3.76
169,Turkiye,0,-0.05,-0.85,0.34,-1.54,-3.52,-3.7
145,Singapore,0,-0.91,-2.35,-1.2,-1.26,-3.15,-3.43
160,Syrian Arab Republic,0,-0.06,-0.21,-2.21,-4.24,-3.54,-2.89
99,"Macao SAR, China",0,-1.35,-3.09,-3.61,-3.13,-3.01,-2.74
90,Kyrgyz Republic,0,-1.4,-0.9,-0.04,-0.34,-5.05,-2.42
76,Indonesia,0,-0.78,-1.68,-1.4,-1.4,-1.92,-1.98


In [58]:
# Tag both ten-row selections with a single constant sub_region value so the
# per-sub-region plotting loop can be reused for them.
# assign() returns new frames; setting a column directly on the head()/tail()
# slices of data_affected triggers SettingWithCopyWarning (hidden here by the
# global warnings filter).
data_first_10 = data_first_10.assign(sub_region='asian')

data_last_10 = data_last_10.assign(sub_region='asian')

Visualizing the 10 countries that were affected the most (largest cumulative rise in unemployment since 1997)

In [59]:
# Reshape the first-ten selection to one row per diff_* label and one column
# per country.
#
# The constant sub_region column is dropped by name before transposing,
# instead of removing "row 7" by position afterwards, and the country name is
# moved into the index first so the transposed frame keeps a numeric dtype.
# This also replaces the duplicated "row 0 becomes the header" assignment.
data_first10 = (
    data_first_10
    .drop(columns='sub_region')
    .set_index('country_name')
    .T                                   # rows: diff_* labels, columns: countries
    .sort_index(axis=1)                  # countries in alphabetical order
    .reset_index()                       # diff_* labels become a regular column
    .rename(columns={'index': 'year'})
)

data_first10

country_name,year,"Hong Kong SAR, China",Indonesia,Israel,Kyrgyz Republic,"Macao SAR, China",Maldives,Singapore,Syrian Arab Republic,Turkiye,West Bank and Gaza
0,diff_1997,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,diff_1998,-2.36,-0.78,-1.0,-1.4,-1.35,-0.23,-0.91,-0.06,-0.05,0.11
2,diff_1999,-4.03,-1.68,-1.43,-0.9,-3.09,-0.47,-2.35,-0.21,-0.85,0.19
3,diff_2000,-2.7,-1.4,-1.35,-0.04,-3.61,-0.7,-1.2,-2.21,0.34,0.2
4,diff_2001,-2.87,-1.4,-2.06,-0.34,-3.13,-1.73,-1.26,-4.24,-1.54,-10.66
5,diff_2002,-5.06,-1.92,-3.14,-5.05,-3.01,-2.92,-3.15,-3.54,-3.52,-16.63
6,diff_2003,-5.64,-1.98,-3.76,-2.42,-2.74,-4.12,-3.43,-2.89,-3.7,-12.17


In [60]:
# Group the first-ten selection by its sub_region value (a single constant
# group) so the same plotting loop as for the full data can be used.
sub_regions = list(data_first_10['sub_region'].unique())
countries = [
    data_first_10.loc[data_first_10['sub_region'] == region, 'country_name']
    for region in sub_regions
]

# The diff_* values are (1997 rate - later rate), and data_affected is sorted
# ascending, so these ten rows are the countries whose unemployment rose the
# most after 1997; the title is corrected to say so.
# The `year` column is used explicitly for the x axis; previously the row
# position (0..6) was plotted and merely labelled "Year".
for region_countries in countries:
    fig = px.line(data_first10, x='year', y=list(region_countries),
                  title='Top 10 countries most affected (largest rise in unemployment since 1997)',
                  labels={'year': 'Year', 'value': 'Cumulative Unemployment Rate'},
                  height=800, width=1400
                  )
    fig.show()

Visualizing the 10 countries that were affected the least (smallest cumulative rise, or a fall, in unemployment since 1997)

In [61]:
# Reshape the last-ten selection to one row per diff_* label and one column
# per country.
#
# The constant sub_region column is dropped by name before transposing,
# instead of removing "row 7" by position afterwards, and the country name is
# moved into the index first so the transposed frame keeps a numeric dtype.
# This also replaces the duplicated "row 0 becomes the header" assignment.
data_last10 = (
    data_last_10
    .drop(columns='sub_region')
    .set_index('country_name')
    .T                                   # rows: diff_* labels, columns: countries
    .sort_index(axis=1)                  # countries in alphabetical order
    .reset_index()                       # diff_* labels become a regular column
    .rename(columns={'index': 'year'})
)

data_last10

country_name,year,Armenia,Kazakhstan,Lao PDR,Lebanon,Nepal,Philippines,Sri Lanka,Turkmenistan,Uzbekistan,Vietnam
0,diff_1997,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,diff_1998,1.4,-0.12,-0.04,0.13,0.05,-0.19,1.43,-1.2,-2.4,0.58
2,diff_1999,-0.4,-0.45,0.27,0.18,-0.02,-0.07,1.72,-1.7,-2.4,0.54
3,diff_2000,-0.25,0.26,0.32,0.31,-0.03,-0.03,2.86,-0.54,-1.33,0.61
4,diff_2001,-0.11,2.58,0.44,0.43,0.08,-0.08,2.7,0.32,-0.3,0.11
5,diff_2002,0.02,3.68,0.58,0.53,0.29,-0.01,1.84,1.25,0.75,0.75
6,diff_2003,0.21,4.23,0.72,0.63,0.23,0.09,2.38,2.01,1.79,0.62


In [62]:
# Group the last-ten selection by its sub_region value (a single constant
# group) so the same plotting loop as for the full data can be used.
sub_regions = list(data_last_10['sub_region'].unique())
countries = [
    data_last_10.loc[data_last_10['sub_region'] == region, 'country_name']
    for region in sub_regions
]

# The diff_* values are (1997 rate - later rate), and data_affected is sorted
# ascending, so these ten rows are the countries with the largest values, i.e.
# the ones least affected after 1997; the title is corrected to say so.
# The `year` column is used explicitly for the x axis; previously the row
# position (0..6) was plotted and merely labelled "Year".
for region_countries in countries:
    fig = px.line(data_last10, x='year', y=list(region_countries),
                  title='10 countries least affected (smallest rise in unemployment since 1997)',
                  labels={'year': 'Year', 'value': 'Cumulative Unemployment Rate'},
                  height=800, width=1400
                  )
    fig.show()