# World Values Analysis

## 1. Define question <br>

This project focuses on understanding the differences between attitudes to work around the world, and what drives those differences. Specifically:  <br> <br>
a) How do attitudes towards work differ around the globe? <br>
b) Are attitudes to work correlated to GDP and development efforts? <br>
c) If so, does increasing GDP lead or lag changing attitudes to work?

## 2. Get data

### Import necessary modules

In [3]:
import pandas as pd
from data_dictionary import *
pd.set_option('display.max_columns', 500)

### Import data

In [4]:
df = pd.read_stata('./world-values-survey-data/WVS_Longitudinal_1981_2014_stata_v2015_04_18.dta', convert_categoricals=False) # index_col='S025', 

### Do basic EDA 

#### Check shape and nulls; inspect header

In [5]:
df.shape

(341271, 1410)

In [6]:
nulls = df.isnull().sum().sum()
null_pct = nulls * 100 / df.shape[0]*df.shape[1]
print(f'{null_pct} of cells are null')

208712.60669673074 of cells are null


In [7]:
df.head()

Unnamed: 0,S001,S002,S002EVS,S003,S003A,S004,S006,S007,S007_01,S008,S009,S009A,S010,S010_01,S010_02,S010_03,S010_04,S011,S012,S013,S013B,S014,S015,S016,S017,S017A,S018,S018A,S019,S019A,S020,S021,S021A,S022,S023,S024,S024A,S025,S025A,S026,S027,S028,A001,A001_CO,A002,A002_CO,A003,A003_CO,A004,A004_CO,A005,A005_CO,A006,A006_CO,A007,A008,A009,A010,A011,A012,A013,A014,A015,A016,A017,A018,A019,A020,A021,A022,A023,A024,A025,A026,A026_01,A027,A028,A029,A030,A031,A032,A033,A034,A035,A036,A037,A038,A039,A040,A041,A042,A043,A043_01,A043_01F,A043_F,A043B,A044,A045,A046,A047,A048,A049,A050,A050_01,A050_02,A050_03,A050_04,A051,A052,A053,A054,A055,A056,A057,A058,A059,A060,A061,A062,A063,A064,A065,A066,A067,A068,A069,A070,A071,A071B,A071C,A072,A073,A074,A075,A076,A077,A078,A079,A080,A080_F,A081,A082,A083,A084,A085,A086,A087,A088,A088B,A088C,A089,A090,A091,A092,A093,A094,A095,A096,A097,A097_F,A098,A099,A100,A101,A102,A103,A104,A105,A106,A106B,A106C,A107,A108,A109,A110,A111,A112,A113,A114,A115,A116,A117,A118,A119,A120,A121,A122,A123,A124_01,A124_02,A124_03,A124_04,A124_05,A124_06,A124_07,A124_08,A124_09,A124_10,A124_11,A124_12,A124_13,A124_14,A124_15,A124_16,A124_17,A124_18,A124_19,A124_20,A124_21,A124_22,A124_23,A124_24,A124_25,A124_26,A124_27,A124_28,A124_29,A124_30,A124_31,A124_32,A124_33,A124_34,A124_35,A124_36,A124_37,A124_38,A124_39,A124_40,A124_41,A124_42,A124_43,A124_44,A124_45,A124_46,A124_47,A124_48,A124_49,A124_50,A124_51,A124_52,A124_53,A124_54,A124_55,A124_56,A124_57,A124_58,A124_59,A124_60,A124_61,A165,...,G032,G033,G034,G035,G036,G037,G038,G039,G040,G041,G042,G043,G044,G045,G046,G047,G048,G049,G050,G051,H001,H002_01,H002_02,H002_03,H002_04,H002_05,H003_01,H003_02,H003_03,H004,H005,H006_01,H006_02,H006_03,H006_04,H006_05,H006_06,H007,H008_01,H008_02,H008_03,H008_04,I001,I002,U001A,U001B,U002A,U002B,U003A,U003B,U004A,U004B,U005A,U005B,U006A,U006B,V001,V001A,V002,V002A,V003,V004A,V004B,V004C,V004D,V004E,V004R,V005,V006,V006_2,V006_3,V006_4,V007A,V007B,V007C,V007D,V008,V009,V010,V011,V012,V013,V014,V015,V016,V017,V018,W001,W001A,W002A,W002B,W002C,W002D,W002E,W002R,W003,W004,W005,W005_2,W005_3,W005_4,W006A,W006B,W006C,W006D,W007,W008,W009,W010,W011,X001,X002,X002_01,X002_01A,X002_02,X002_02A,X002_03,X003,X003R,X003R2,X004,X005,X006,X006_01,X006_02,X007,X007_01,X007_02,X008,X009,X009_01,X010,X011,X011_01,X011_02,X011A,X012,X013,X014,X015,X016,X017,X018,X019,X020,X021,X022,X022_01,X022_02A,X022_02B,X022_03A,X022_03B,X022_04A,X022_04B,X022_05A,X022_05B,X022_06A,X022_06B,X023,X023R,X024,X024B,X025,X025A,X025B,X025C,X025CS,X025CSWVS,X025LIT,X025R,X026,X027,X028,X028_01,X029,X030,X031,X032,X032R,X032R_01,X033,X033R,X034,X034R,X034R_01,X035_2,X035_3,X035_4,X036,X036A,X036B,X036C,X036D,X037,X037_01,X037_02,X038,X039,X040,X041,X042_2,X042_3,X042_4,X043,X044,X045,X045B,X046,X047,X047A,X047A_01,X047B,X047B_01,X047C,X047C_01,X047CS,X047D,X047R,X048,X048A,X048B,X048C,X048D,X048E,X048F,X048G,X048WVS,X049,X049CS,X050,X051,X052,X053,X054,X055,Y001,Y002,Y003,Y010,Y011,Y012,Y013,Y014,Y020,Y021,Y022,Y023,Y024,TRADRAT5,survself
0,2,1,-4,392,392,-4.0,1.0,1,3920120000.0,-4,JP,JP,-4.0,-4,-4,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,1.089722,1.089722,0.905084,0.905084,1.357627,1.357627,1981,39201210000.0,39201210000.0,-4,-4,3921,3921,3921981,3921981,20150418,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,-2,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,-2,-4,1,-4,1,0,-4,1,-4,0,0,-4,-4,1,0,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,0,0,0,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,0,0,0,-4,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,...,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,1933,-4,-4,-4,-4,-4,49,4,2,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-4,-4,2,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,17.0,6.0,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,-4.0,-2,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,25,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-3,-4,-4,-4,-4,7,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,392004,-4,-4,1,392001,-4,-4,-4,-4,,2,-1.0,,,0.901,,0.553333,,0.666667,,,0.35248,,
1,2,1,-4,392,392,-4.0,2.0,2,3920120000.0,-4,JP,JP,-4.0,-4,-4,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,1.089722,1.089722,0.905084,0.905084,1.357627,1.357627,1981,39201210000.0,39201210000.0,-4,-4,3921,3921,3921981,3921981,20150418,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,1,-4,1,-4,1,0,-4,1,-4,0,1,-4,-4,0,0,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,3,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,0,0,0,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,0,0,0,-4,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,...,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,1933,-4,-4,-4,-4,-4,49,4,2,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-4,-4,3,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,14.0,3.0,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,-4.0,-2,-4,3,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,41,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,-4,-4,-4,25,-4,-4,-4,-4,-2,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,392004,-4,-4,2,392001,-4,-4,-4,-4,,1,-1.0,0.36594,0.68776,0.556,0.0,0.22,0.398303,0.666667,,0.259259,0.136,0.515189,-0.548588
2,2,1,-4,392,392,-4.0,3.0,3,3920120000.0,-4,JP,JP,-4.0,-4,-4,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,1.089722,1.089722,0.905084,0.905084,1.357627,1.357627,1981,39201210000.0,39201210000.0,-4,-4,3921,3921,3921981,3921981,20150418,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,3,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,2,-4,0,-4,0,0,-4,1,-4,0,0,-4,-4,0,0,1,0,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,0,0,0,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,0,1,1,-4,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,...,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,1901,-4,-4,-4,-4,-4,81,6,3,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-4,-4,4,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,15.0,4.0,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,-4.0,-2,-4,7,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,41,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,-4,-4,-4,41,-4,-4,-4,-4,3,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,392004,-4,-4,2,392001,-4,-4,-4,-4,,1,2.0,0.34294,0.68776,0.244,0.0,0.44,0.141896,0.0,,0.0,0.136,0.241489,-1.603452
3,2,1,-4,392,392,-4.0,4.0,4,3920120000.0,-4,JP,JP,-4.0,-4,-4,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,1.089722,1.089722,0.905084,0.905084,1.357627,1.357627,1981,39201210000.0,39201210000.0,-4,-4,3921,3921,3921981,3921981,20150418,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,3,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,2,-4,0,-4,0,0,-4,1,-4,0,0,-4,-4,0,0,1,0,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,0,0,0,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,0,1,1,-4,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,...,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,1901,-4,-4,-4,-4,-4,81,6,3,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-4,-4,4,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,15.0,4.0,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,-4.0,-2,-4,7,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,41,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,-4,-4,-4,41,-4,-4,-4,-4,3,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,392004,-4,-4,2,392001,-4,-4,-4,-4,,1,2.0,0.34294,0.68776,0.244,0.0,0.44,0.141896,0.0,,0.0,0.136,0.241489,-1.603452
4,2,1,-4,392,392,-4.0,5.0,5,3920120000.0,-4,JP,JP,-4.0,-4,-4,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,1.089722,1.089722,0.905084,0.905084,1.357627,1.357627,1981,39201210000.0,39201210000.0,-4,-4,3921,3921,3921981,3921981,20150418,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,2,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,1,-4,1,-4,0,1,-4,0,-4,0,0,-4,-4,0,1,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,3,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,-4,0,0,0,0,0,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,0,1,0,-4,0,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,...,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,2,1917,-4,-4,-4,-4,-4,65,6,3,-4,-4,-4,-4,-4,5,-4,-4,-4,-4,-4,-4,4,-4,-4,1,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,17.0,6.0,-4,-4,-4.0,-4,-4,-4,-4,-4,-4,-4.0,-2,-4,5,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,41,-4,-4,-4,-4,-4,-4,-4,-4,-4,0,-4,-4,-4,-4,41,-4,-4,-4,-4,8,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,-4,392004,-4,-4,1,392001,-4,-4,-4,-4,,1,-1.0,0.43269,0.68776,0.823,0.0,0.22,0.29834,0.333333,,0.222222,0.136,0.129725,-0.37773


#### We can relabel the columns using the data dictionary found at  http://www.worldvaluessurvey.org/WVSDocumentationWVL.jsp

In [None]:
column_name_map = dict(zip())

In [9]:
new_column_labels = []

for i in df.columns:
    new_column_labels.append(column_name_map.get(i.lower(), i))

NameError: name 'column_name_map' is not defined

In [None]:
df.columns = new_column_labels

In [None]:
df.head()

#### Note that the country is listed as a code (column S003, referencing http://www.worldvaluessurvey.org/WVSDocumentationWVL.jsp). We want to add the name of the country

In [None]:
# Turn each country/ code combination into an item in a list, by splitting on new lines
country_list = country_list.split('\n')

# Create a list of country codes and country names
country_code_list = []
country_name_list = []
for country_pair in country_list:
    country_code_list.append(country_pair.split(':')[0])
    country_name_list.append(country_pair.split(':')[1])
    
# Turn the country code / name lookup into a dataframe, to allow a merge with the original dataframe
country_dictionary = {'country_code': country_code_list, 'country_name': country_name_list}
country_lookup = pd.DataFrame(country_dictionary)

In [None]:
# Merge country names into original dataframe
df['S003'] = df['S003'].astype(int) # match dtypes
country_lookup['country_code'] = country_lookup['country_code'].astype(int)
df = pd.merge(df, country_lookup, left_on='S003', right_on='country_code', how = 'left')
df.head()

In [None]:
# Also add a column for year, which is the last four digits of S0025 (note that S002 is the wave)
df['year'] = df['S025']%10000