In [1]:
import pandas as pd
import numpy as np

In [2]:
pd.options.display.max_columns = None
pd.options.display.max_rows = None

## I. Explore the data  
  
A. Study variable attributes 
 1. Identify variable name and survey item(s) it measures (Codebook available here: https://www.worldvaluessurvey.org/WVSDocumentationWV6.jsp (accessed on 5/25/2021))  
 2. % missing for each variable
 3. Quick descriptives (check for range of values, distribution shape, skew/outliers, potential errors, etc.)  
 4. Identify target variable (and drop duplicates) - don't forget to do feature engineering on the target variable; break out into varying levels of happiness  
  
B. Visualize the data (based on descriptives)
 1. Explore correlations between attributes
 2. Identify transformations that might be needed
 3. Identify extra data that may be useful (gini coefficient, GDP, etc.)
 4. Summarize findings

In [3]:
wvs_w6 = pd.read_csv('../data/Evaluating_Happiness/wvs_w6.csv', low_memory=False)

In [4]:
wvs_w6.shape

(89565, 442)

In [5]:
wvs_w6.head()

Unnamed: 0,V1,V2,V2A,cow,C_COW_ALPHA,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V44_ES,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V90,V91,V92,V93,V94,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V160A,V160B,V160C,V160D,V160E,V160F,V160G,V160H,V160I,V160J,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V218_ESMA,V217_ESMA,V219_ESMA,V220_ESMA,V221_ESMA,V222_ESMA,V223_ESMA,V224_ESMA,V225,V226,V227,V228,V228_LOCAL,V228_2,V228A,V228B,V228C,V228D,V228E,V228F,V228G,V228H,V228I,V228J,V228K,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V241,V242,X003R2,X003R,V243,V243_AU,V244,V244_AU,V245,V246,V247,V248,V248_CS,V249,V250,V251,V252,V253,V253_CS,V254,V255,N_REGION_ISO,V256,V256B,V256C,V257,V258,V258A,S018,S019,V260,V261,V262,V265,Y001,Y001_1,Y001_2,Y001_3,Y001_4,Y001_5,Y002,Y003,MN_35A,MN_163A,MN_163B,MN_163C,MN_228L,MN_228M,MN_228N,MN_228O,MN_228P,MN_228Q,MN_228R,MN_228S1,MN_228S2,MN_228S3,MN_228S4,MN_228S5,MN_228S6,MN_228S7,MN_228S8,MN_229A,MN_229B,MN_230A,MN_233A,MN_233B,MN_234A,MN_237A,MN_237B1,MN_237B2,MN_237B3,MN_237B4,MN_237B5,MN_237B6,MN_237B7,MN_237C1,MN_237C2,MN_237C3,MN_237C4,MN_237C5,MN_237C6,MN_249A1,MN_249A2,MN_249A3,sacsecval,secvalwgt,resemaval,weightb,I_AUTHORITY,I_NATIONALISM,I_DEVOUT,defiance,WEIGHT1A,I_RELIGIMP,I_RELIGBEL,I_RELIGPRAC,disbelief,WEIGHT2A,I_NORM1,I_NORM2,I_NORM3,relativism,WEIGHT3A,I_TRUSTARMY,I_TRUSTPOLICE,I_TRUSTCOURTS,scepticism,WEIGHT4A,I_INDEP,I_IMAGIN,I_NONOBED,autonomy,WEIGHT1B,I_WOMJOB,I_WOMPOL,I_WOMEDU,equality,WEIGHT2B,I_HOMOLIB,I_ABORTLIB,I_DIVORLIB,choice,WEIGHT3B,I_VOICE1,I_VOICE2,I_VOI2_00,voice,WEIGHT4B
0,6,12,12,615,ALG,DZA,1,1.0,1.0,1.0,,1.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,1.0,1.0,,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,7.0,4.0,,6.0,0.0,10.0,2.0,3.0,1.0,3.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,1.0,2.0,3.0,3.0,2.0,1.0,2.0,2.0,4.0,,,,,,,,,,,5.0,8.0,7.0,6.0,8.0,7.0,5.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,3.0,3.0,2.0,3.0,2.0,2.0,4.0,3.0,3.0,2.0,3.0,2.0,3.0,4.0,4.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,4.0,1.0,2.0,2.0,2.0,3.0,8.0,5.0,6.0,9.0,3.0,4.0,7.0,6.0,7.0,5.0,2.0,2.0,50000000.0,5.0,3.0,3.0,1.0,1.0,1.0,,,10.0,1.0,2.0,2.0,1.0,2.0,7.0,4.0,3.0,2.0,3.0,1.0,9.0,1.0,2.0,1.0,2.0,2.0,3.0,2.0,3.0,2.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,1.0,5.0,1.0,2.0,2.0,3.0,2.0,3.0,3.0,2.0,3.0,3.0,3.0,3.0,7.0,8.0,3.0,5.0,6.0,9.0,6.0,6.0,1.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,6.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,3.0,4.0,2.0,2.0,3.0,4.0,2.0,4.0,,,,,,,,,2.0,3.0,3.0,12005.0,12005.0,,3.0,4.0,3.0,3.0,3.0,3.0,4.0,4.0,4.0,2.0,1.0,6.0,,,,,,2.0,1.0,1.0,4.0,5.0,1.0,1993.0,21.0,1.0,1.0,2.0,,2.0,,1.0,1.0,110.0,7.0,,24.0,1.0,2.0,2.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,2.0,1,0,0,1,0,1.0,0.0,0.0,2.0,1.0,2.0,3.0,5.0,4.0,2.0,2.0,3.0,2.0,2.0,4.0,2.0,3.0,3.0,3.0,2.0,3.0,,,,,,,2.0,,,,,,,,,,,,,,1.0,2.0,1.0,0.221111,1.0,0.164352,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.333333,0.111111,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,0.33,0.33,0.44,1.0,1.0,0.0,0.0,0.333333,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.222222,0.074074,1.0,0.0,0.5,0.25,0.25,1.0
1,6,12,12,615,ALG,DZA,2,1.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,5.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,,1.0,,1.0,1.0,2.0,2.0,1.0,2.0,3.0,2.0,6.0,8.0,,6.0,0.0,10.0,2.0,1.0,2.0,3.0,4.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,2.0,1.0,1.0,1.0,3.0,2.0,2.0,2.0,2.0,2.0,1.0,1.0,2.0,3.0,,,,,,,,,,,5.0,7.0,5.0,5.0,4.0,4.0,6.0,1.0,3.0,3.0,3.0,3.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,3.0,2.0,2.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,3.0,1.0,3.0,2.0,1.0,2.0,8.0,8.0,8.0,9.0,2.0,6.0,4.0,2.0,4.0,4.0,3.0,1.0,50000000.0,5.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,10.0,1.0,1.0,1.0,1.0,4.0,6.0,4.0,4.0,1.0,2.0,3.0,8.0,2.0,3.0,2.0,1.0,2.0,2.0,4.0,4.0,2.0,3.0,2.0,4.0,1.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,4.0,8.0,4.0,6.0,4.0,8.0,3.0,4.0,7.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,3.0,5.0,1.0,2.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,4.0,3.0,4.0,2.0,3.0,3.0,,,,,,,,,3.0,2.0,3.0,12003.0,12003.0,,3.0,4.0,4.0,3.0,4.0,3.0,3.0,4.0,4.0,1.0,1.0,6.0,,,,,,2.0,2.0,2.0,3.0,6.0,2.0,1990.0,24.0,1.0,1.0,2.0,,2.0,,1.0,1.0,110.0,7.0,,25.0,1.0,1.0,2.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,2.0,0,1,0,0,1,2.0,-1.0,0.0,2.0,3.0,2.0,3.0,5.0,4.0,6.0,2.0,3.0,3.0,2.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,,,,,,,2.0,,,,,,,,,,,,,,2.0,,,0.276389,1.0,0.11,1.0,0.5,0.33,0.33,0.386667,1.0,0.33,0.0,0.166667,0.165556,1.0,1.0,0.0,0.0,0.333333,1.0,0.0,0.66,0.0,0.22,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.33,0.11,1.0,0.0,0.0,0.0,0.0,1.0,0.66,0.0,0.33,0.33,1.0
2,6,12,12,615,ALG,DZA,3,1.0,3.0,2.0,4.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,4.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,1.0,1.0,1.0,2.0,,1.0,,2.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,6.0,8.0,,6.0,0.0,6.0,2.0,4.0,1.0,2.0,1.0,4.0,1.0,2.0,2.0,2.0,1.0,2.0,1.0,1.0,4.0,3.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,,,3.0,3.0,3.0,,,,,,6.0,7.0,7.0,7.0,5.0,7.0,5.0,1.0,3.0,3.0,4.0,4.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,3.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,2.0,1.0,3.0,2.0,2.0,2.0,7.0,4.0,8.0,3.0,3.0,6.0,9.0,5.0,6.0,7.0,2.0,1.0,50000000.0,5.0,2.0,4.0,1.0,1.0,1.0,2.0,1.0,6.0,2.0,3.0,1.0,2.0,2.0,7.0,4.0,4.0,0.0,2.0,2.0,6.0,2.0,3.0,1.0,2.0,4.0,2.0,3.0,2.0,4.0,3.0,3.0,2.0,4.0,3.0,2.0,2.0,2.0,2.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,2.0,3.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,4.0,7.0,5.0,5.0,5.0,5.0,5.0,5.0,1.0,1.0,1.0,1.0,,1.0,4.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,3.0,2.0,,,,,2.0,,,,,,,,,,,,,4.0,3.0,4.0,2.0,2.0,4.0,3.0,1.0,1.0,,,,,,,,,2.0,2.0,3.0,,,,4.0,4.0,3.0,4.0,2.0,3.0,2.0,4.0,4.0,2.0,1.0,3.0,2.0,7.0,6.0,5.0,2.0,1.0,,1.0,4.0,6.0,2.0,1988.0,26.0,1.0,2.0,2.0,,2.0,,1.0,1.0,500.0,5.0,,18.0,1.0,1.0,1.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,1.0,0,0,1,0,0,2.0,-2.0,0.0,1.0,3.0,2.0,3.0,6.0,4.0,5.0,1.0,2.0,2.0,2.0,3.0,2.0,4.0,3.0,2.0,4.0,4.0,1.0,1.0,1.0,2.0,3.0,3.0,2.0,,,,,,,,,,,,,,1.0,2.0,1.0,0.304722,1.0,0.152361,1.0,0.5,0.0,0.0,0.166667,1.0,0.0,0.0,0.166667,0.055556,1.0,1.0,0.0,0.0,0.333333,1.0,0.33,1.0,0.66,0.663333,1.0,0.0,1.0,0.0,0.333333,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.333333,0.111111,1.0,0.33,0.0,0.165,0.165,1.0
3,6,12,12,615,ALG,DZA,4,1.0,1.0,3.0,4.0,3.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,,2.0,,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,6.0,8.0,,6.0,0.0,6.0,2.0,1.0,3.0,1.0,4.0,3.0,1.0,1.0,1.0,1.0,1.0,2.0,3.0,2.0,3.0,3.0,1.0,1.0,2.0,2.0,3.0,1.0,1.0,2.0,2.0,2.0,,,,,,,,,,,6.0,9.0,5.0,6.0,4.0,6.0,8.0,1.0,3.0,3.0,2.0,2.0,3.0,2.0,3.0,4.0,2.0,3.0,4.0,2.0,3.0,3.0,4.0,2.0,2.0,2.0,3.0,1.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,3.0,2.0,7.0,9.0,5.0,5.0,7.0,3.0,8.0,7.0,8.0,8.0,3.0,2.0,50000000.0,5.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,10.0,2.0,3.0,4.0,2.0,3.0,7.0,6.0,4.0,1.0,3.0,3.0,7.0,3.0,1.0,2.0,3.0,3.0,2.0,3.0,4.0,1.0,2.0,4.0,2.0,2.0,3.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,3.0,3.0,4.0,4.0,2.0,2.0,3.0,3.0,3.0,6.0,6.0,3.0,5.0,5.0,7.0,4.0,6.0,1.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,1.0,2.0,3.0,4.0,3.0,3.0,,,,,,,,,2.0,2.0,3.0,,,,2.0,4.0,3.0,3.0,2.0,3.0,2.0,2.0,2.0,1.0,3.0,1.0,1.0,8.0,5.0,6.0,2.0,1.0,,4.0,4.0,5.0,2.0,1986.0,28.0,1.0,2.0,2.0,,2.0,,1.0,1.0,500.0,6.0,,14.0,2.0,2.0,1.0,1.0,,12003.0,1.0,12005.0,12105.0,,,500.0,1.0,1.0,0.833333,1.25,5,,2014,,1.0,0,0,0,0,1,1.0,-1.0,0.0,2.0,2.0,2.0,3.0,7.0,5.0,6.0,2.0,3.0,2.0,2.0,3.0,2.0,2.0,4.0,3.0,3.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,2.0,,,,,,,,,,,,,,1.0,2.0,2.0,0.263056,1.0,0.096667,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.166667,0.055556,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,1.0,0.33,0.663333,1.0,0.0,0.0,0.0,0.0,1.0,0.5,0.33,0.33,0.386667,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0
4,6,12,12,615,ALG,DZA,5,1.0,1.0,1.0,2.0,1.0,1.0,1.0,3.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,1.0,1.0,2.0,2.0,1.0,1.0,2.0,,1.0,,1.0,1.0,1.0,2.0,1.0,3.0,2.0,2.0,6.0,6.0,,1.0,3.0,4.0,2.0,1.0,2.0,3.0,4.0,2.0,1.0,2.0,1.0,1.0,2.0,5.0,1.0,2.0,3.0,1.0,4.0,3.0,2.0,2.0,3.0,1.0,2.0,2.0,2.0,2.0,,,,,,,,,,,5.0,8.0,4.0,7.0,4.0,6.0,6.0,2.0,2.0,3.0,4.0,2.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,3.0,3.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,2.0,2.0,8.0,4.0,7.0,3.0,3.0,8.0,6.0,5.0,6.0,7.0,3.0,2.0,50000000.0,5.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,10.0,2.0,3.0,2.0,2.0,2.0,4.0,4.0,3.0,1.0,3.0,2.0,8.0,2.0,3.0,3.0,3.0,3.0,2.0,4.0,3.0,3.0,2.0,4.0,3.0,2.0,2.0,3.0,2.0,2.0,3.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,3.0,4.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,6.0,2.0,4.0,4.0,6.0,6.0,6.0,5.0,7.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,3.0,3.0,4.0,2.0,2.0,4.0,3.0,2.0,3.0,,,,,,,,,2.0,3.0,3.0,2.0,2.0,,3.0,3.0,4.0,2.0,3.0,3.0,4.0,3.0,3.0,1.0,2.0,3.0,2.0,5.0,6.0,9.0,2.0,2.0,1.0,2.0,3.0,7.0,2.0,1979.0,35.0,2.0,3.0,2.0,,2.0,,1.0,1.0,500.0,3.0,,8.0,1.0,1.0,1.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,2.0,0,1,0,0,1,2.0,1.0,0.0,2.0,3.0,3.0,3.0,4.0,7.0,4.0,2.0,2.0,3.0,2.0,3.0,1.0,4.0,3.0,1.0,3.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,2.0,,,,,,,,,,,,,,1.0,2.0,2.0,0.220833,1.0,0.239352,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,0.66,0.33,0.55,1.0,0.0,0.0,1.0,0.333333,1.0,0.0,0.0,0.66,0.22,1.0,0.0,0.0,0.222222,0.074074,1.0,0.66,0.0,0.33,0.33,1.0


In [6]:
wvs_w6.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 89565 entries, 0 to 89564
Columns: 442 entries, V1 to WEIGHT4B
dtypes: float64(428), int64(12), object(2)
memory usage: 302.0+ MB


In [7]:
wvs_w6.info(verbose=True)

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 89565 entries, 0 to 89564
Data columns (total 442 columns):
 #   Column           Dtype  
---  ------           -----  
 0   V1               int64  
 1   V2               int64  
 2   V2A              int64  
 3   cow              int64  
 4   C_COW_ALPHA      object 
 5   B_COUNTRY_ALPHA  object 
 6   V3               int64  
 7   V4               float64
 8   V5               float64
 9   V6               float64
 10  V7               float64
 11  V8               float64
 12  V9               float64
 13  V10              float64
 14  V11              float64
 15  V12              float64
 16  V13              float64
 17  V14              float64
 18  V15              float64
 19  V16              float64
 20  V17              float64
 21  V18              float64
 22  V19              float64
 23  V20              float64
 24  V21              float64
 25  V22              float64
 26  V23              float64
 27  V24            

### Codebook notes:  
  
- Weights (See https://www.worldvaluessurvey.org/WVSContents.jsp for further details): 
    - S018 and S019 are weighting factors that transform N's to 1000 and 1500, respectively
    - these variables are useful for cross-country comparisons 
    - useful for EDA and descriptive analyses; should arguably be dropped for random forest algorithm, **right?**
    - **QUESTION:** are weights useful for PCA and logistic regression?
    - **QUESTION:** I see weights, but not specific population or sample size info - do I need this?
        - sample size shouldn't be too difficult to obtain based on max V3 values for each country
        - population data shouldn't be difficult to obtain based on N preserving weightings (V258) and this formula  
        
        $$Weight = S018/1000 * Population$$  

In [8]:
# sample sizes for each participating country (if needed)
wvs_w6.groupby('C_COW_ALPHA')['V3'].count()

C_COW_ALPHA
ALG    1200
ARG    1030
ARM    1100
AUL    1477
AZE    1002
BLR    1535
BRA    1486
CHL    1000
CHN    2300
COL    1512
CYP    1000
ECU    1202
EGY    1523
EST    1533
GHA    1552
GMY    2046
GRG    1202
HAI    1996
HKG    1000
IND    4078
IRQ    1200
JOR    1200
JPN    2443
KUW    1303
KYR    1500
KZK    1500
LEB    1200
LIB    2131
MAL    1300
MEX    2000
MOR    1200
NEW     841
NIG    1759
NTH    1902
PAK    1200
PER    1210
PHI    1200
POL     966
PSE    1000
QAT    1060
ROK    1200
ROM    1503
RUS    2500
RWA    1527
SAF    3531
SIN    1972
SLV    1069
SPN    1189
SWD    1206
TAW    1238
THI    1200
TRI     999
TUN    1205
TUR    1605
UKR    1500
URU    1000
USA    2232
UZB    1500
YEM    1000
ZIM    1500
Name: V3, dtype: int64

In [9]:
# how many columns with null values?
wvs_w6.isna().sum().count()

442

In [10]:
# another approach for finding the number of columns with null values
#sum(map(any, wvs_w6.isnull()))

In [11]:
# how many null values in each column?
wvs_w6.isna().sum()

V1                     0
V2                     0
V2A                    0
cow                    0
C_COW_ALPHA            0
B_COUNTRY_ALPHA        0
V3                     0
V4                   341
V5                   545
V6                  1035
V7                  1620
V8                  1519
V9                  1348
V10                  758
V11                  326
V12                   14
V13                    6
V14                    7
V15                   17
V16                    9
V17                   13
V18                   12
V19                   18
V20                   15
V21                   19
V22                    3
V23                  586
V24                 2388
V25                  840
V26                  923
V27                  993
V28                 3211
V29                 3129
V30                 1118
V31                 2223
V32                 1055
V33                 1214
V34                 1197
V35                 9696
V36                 3979


In [52]:
# how many missings by country?
grouped_missings = wvs_w6.groupby('C_COW_ALPHA')
grouped_missings = -grouped_missings.count().sub(grouped_missings.size(), 0)

Unnamed: 0_level_0,V1,V2,V2A,cow,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V44_ES,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V90,V91,V92,V93,V94,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V160A,V160B,V160C,V160D,V160E,V160F,V160G,V160H,V160I,V160J,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V218_ESMA,V217_ESMA,V219_ESMA,V220_ESMA,V221_ESMA,V222_ESMA,V223_ESMA,V224_ESMA,V225,V226,V227,V228,V228_LOCAL,V228_2,V228A,V228B,V228C,V228D,V228E,V228F,V228G,V228H,V228I,V228J,V228K,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V241,V242,X003R2,X003R,V243,V243_AU,V244,V244_AU,V245,V246,V247,V248,V248_CS,V249,V250,V251,V252,V253,V253_CS,V254,V255,N_REGION_ISO,V256,V256B,V256C,V257,V258,V258A,S018,S019,V260,V261,V262,V265,Y001,Y001_1,Y001_2,Y001_3,Y001_4,Y001_5,Y002,Y003,MN_35A,MN_163A,MN_163B,MN_163C,MN_228L,MN_228M,MN_228N,MN_228O,MN_228P,MN_228Q,MN_228R,MN_228S1,MN_228S2,MN_228S3,MN_228S4,MN_228S5,MN_228S6,MN_228S7,MN_228S8,MN_229A,MN_229B,MN_230A,MN_233A,MN_233B,MN_234A,MN_237A,MN_237B1,MN_237B2,MN_237B3,MN_237B4,MN_237B5,MN_237B6,MN_237B7,MN_237C1,MN_237C2,MN_237C3,MN_237C4,MN_237C5,MN_237C6,MN_249A1,MN_249A2,MN_249A3,sacsecval,secvalwgt,resemaval,weightb,I_AUTHORITY,I_NATIONALISM,I_DEVOUT,defiance,WEIGHT1A,I_RELIGIMP,I_RELIGBEL,I_RELIGPRAC,disbelief,WEIGHT2A,I_NORM1,I_NORM2,I_NORM3,relativism,WEIGHT3A,I_TRUSTARMY,I_TRUSTPOLICE,I_TRUSTCOURTS,scepticism,WEIGHT4A,I_INDEP,I_IMAGIN,I_NONOBED,autonomy,WEIGHT1B,I_WOMJOB,I_WOMPOL,I_WOMEDU,equality,WEIGHT2B,I_HOMOLIB,I_ABORTLIB,I_DIVORLIB,choice,WEIGHT3B,I_VOICE1,I_VOICE2,I_VOI2_00,voice,WEIGHT4B
C_COW_ALPHA,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1,Unnamed: 278_level_1,Unnamed: 279_level_1,Unnamed: 280_level_1,Unnamed: 281_level_1,Unnamed: 282_level_1,Unnamed: 283_level_1,Unnamed: 284_level_1,Unnamed: 285_level_1,Unnamed: 286_level_1,Unnamed: 287_level_1,Unnamed: 288_level_1,Unnamed: 289_level_1,Unnamed: 290_level_1,Unnamed: 291_level_1,Unnamed: 292_level_1,Unnamed: 293_level_1,Unnamed: 294_level_1,Unnamed: 295_level_1,Unnamed: 296_level_1,Unnamed: 297_level_1,Unnamed: 298_level_1,Unnamed: 299_level_1,Unnamed: 300_level_1,Unnamed: 301_level_1,Unnamed: 302_level_1,Unnamed: 303_level_1,Unnamed: 304_level_1,Unnamed: 305_level_1,Unnamed: 306_level_1,Unnamed: 307_level_1,Unnamed: 308_level_1,Unnamed: 309_level_1,Unnamed: 310_level_1,Unnamed: 311_level_1,Unnamed: 312_level_1,Unnamed: 313_level_1,Unnamed: 314_level_1,Unnamed: 315_level_1,Unnamed: 316_level_1,Unnamed: 317_level_1,Unnamed: 318_level_1,Unnamed: 319_level_1,Unnamed: 320_level_1,Unnamed: 321_level_1,Unnamed: 322_level_1,Unnamed: 323_level_1,Unnamed: 324_level_1,Unnamed: 325_level_1,Unnamed: 326_level_1,Unnamed: 327_level_1,Unnamed: 328_level_1,Unnamed: 329_level_1,Unnamed: 330_level_1,Unnamed: 331_level_1,Unnamed: 332_level_1,Unnamed: 333_level_1,Unnamed: 334_level_1,Unnamed: 335_level_1,Unnamed: 336_level_1,Unnamed: 337_level_1,Unnamed: 338_level_1,Unnamed: 339_level_1,Unnamed: 340_level_1,Unnamed: 341_level_1,Unnamed: 342_level_1,Unnamed: 343_level_1,Unnamed: 344_level_1,Unnamed: 345_level_1,Unnamed: 346_level_1,Unnamed: 347_level_1,Unnamed: 348_level_1,Unnamed: 349_level_1,Unnamed: 350_level_1,Unnamed: 351_level_1,Unnamed: 352_level_1,Unnamed: 353_level_1,Unnamed: 354_level_1,Unnamed: 355_level_1,Unnamed: 356_level_1,Unnamed: 357_level_1,Unnamed: 358_level_1,Unnamed: 359_level_1,Unnamed: 360_level_1,Unnamed: 361_level_1,Unnamed: 362_level_1,Unnamed: 363_level_1,Unnamed: 364_level_1,Unnamed: 365_level_1,Unnamed: 366_level_1,Unnamed: 367_level_1,Unnamed: 368_level_1,Unnamed: 369_level_1,Unnamed: 370_level_1,Unnamed: 371_level_1,Unnamed: 372_level_1,Unnamed: 373_level_1,Unnamed: 374_level_1,Unnamed: 375_level_1,Unnamed: 376_level_1,Unnamed: 377_level_1,Unnamed: 378_level_1,Unnamed: 379_level_1,Unnamed: 380_level_1,Unnamed: 381_level_1,Unnamed: 382_level_1,Unnamed: 383_level_1,Unnamed: 384_level_1,Unnamed: 385_level_1,Unnamed: 386_level_1,Unnamed: 387_level_1,Unnamed: 388_level_1,Unnamed: 389_level_1,Unnamed: 390_level_1,Unnamed: 391_level_1,Unnamed: 392_level_1,Unnamed: 393_level_1,Unnamed: 394_level_1,Unnamed: 395_level_1,Unnamed: 396_level_1,Unnamed: 397_level_1,Unnamed: 398_level_1,Unnamed: 399_level_1,Unnamed: 400_level_1,Unnamed: 401_level_1,Unnamed: 402_level_1,Unnamed: 403_level_1,Unnamed: 404_level_1,Unnamed: 405_level_1,Unnamed: 406_level_1,Unnamed: 407_level_1,Unnamed: 408_level_1,Unnamed: 409_level_1,Unnamed: 410_level_1,Unnamed: 411_level_1,Unnamed: 412_level_1,Unnamed: 413_level_1,Unnamed: 414_level_1,Unnamed: 415_level_1,Unnamed: 416_level_1,Unnamed: 417_level_1,Unnamed: 418_level_1,Unnamed: 419_level_1,Unnamed: 420_level_1,Unnamed: 421_level_1,Unnamed: 422_level_1,Unnamed: 423_level_1,Unnamed: 424_level_1,Unnamed: 425_level_1,Unnamed: 426_level_1,Unnamed: 427_level_1,Unnamed: 428_level_1,Unnamed: 429_level_1,Unnamed: 430_level_1,Unnamed: 431_level_1,Unnamed: 432_level_1,Unnamed: 433_level_1,Unnamed: 434_level_1,Unnamed: 435_level_1,Unnamed: 436_level_1,Unnamed: 437_level_1,Unnamed: 438_level_1,Unnamed: 439_level_1,Unnamed: 440_level_1,Unnamed: 441_level_1
ALG,0,0,0,0,0,0,5,11,18,63,31,7,66,17,0,0,0,0,0,0,0,0,0,0,0,34,51,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1200,39,1200,88,86,104,58,49,42,67,107,39,57,1200,0,14,21,67,190,49,110,49,147,175,94,126,124,103,63,50,67,88,64,79,85,72,85,46,41,220,47,38,34,362,325,262,265,315,1125,1173,1128,1073,1165,655,94,114,44,88,49,83,9,24,25,44,116,136,79,71,100,74,261,63,132,150,215,242,165,135,182,199,259,224,163,1200,1200,1200,263,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,0,0,240,245,258,318,149,166,194,157,148,277,251,174,167,156,87,116,69,61,0,0,0,0,142,0,0,145,166,25,42,32,113,214,85,91,92,63,117,119,92,60,68,132,70,160,216,131,90,72,71,118,86,109,92,85,161,21,42,64,102,128,132,72,49,52,59,96,78,103,78,69,80,187,129,48,55,51,57,99,119,151,207,129,85,133,80,65,104,74,148,1200,84,62,1200,61,109,61,60,61,30,174,79,29,1200,1200,1200,1200,51,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,106,23,27,11,16,21,39,35,22,1200,1200,1200,1200,1200,1200,1200,1200,23,44,49,265,265,1200,387,527,429,470,430,427,483,469,519,0,0,0,595,622,628,658,627,120,417,120,122,0,0,0,0,0,0,0,1200,0,1200,0,0,1,1,1200,199,5,0,0,0,1200,3,0,0,0,1200,1200,0,0,0,0,0,0,1200,0,1200,179,0,0,0,0,0,110,0,0,182,221,229,0,0,0,0,0,0,97,38,44,48,70,34,35,33,226,475,475,595,633,633,595,0,775,775,775,775,775,775,775,775,775,775,775,775,775,398,423,507,35,0,27,0,124,32,104,23,0,7,142,0,3,0,80,104,74,71,0,71,63,132,59,0,0,0,0,0,0,39,49,42,33,0,148,84,62,76,0,99,175,199,75,0
ARG,0,0,0,0,0,0,2,2,6,14,17,18,11,6,0,0,0,0,0,0,0,0,0,0,0,10,34,5,0,0,0,1,1,1,2,1,1,748,0,0,0,0,0,0,0,0,0,1030,14,22,33,32,32,1030,52,34,47,69,21,26,1030,0,6,9,18,62,21,49,12,25,120,56,54,63,20,16,16,15,16,1030,22,19,16,16,15,8,107,16,21,16,62,79,55,70,113,823,998,873,909,959,201,51,100,63,61,55,77,5,12,12,15,96,90,12,38,43,18,49,13,17,20,36,46,40,34,39,33,121,182,77,1030,1030,1030,1030,1030,1030,146,1030,1030,1030,1030,1030,1030,1030,1030,1030,0,0,154,114,122,88,64,30,65,21,21,34,68,29,28,21,11,20,22,14,10,10,1,0,54,25,60,74,84,16,112,55,126,124,40,36,27,28,13,23,17,26,10,33,23,90,94,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,0,9,8,31,68,70,13,24,39,2,7,38,58,15,25,26,22,43,5,7,6,7,39,38,47,95,45,43,32,25,23,17,19,109,79,84,74,81,97,1030,15,19,19,12,46,15,16,1030,1030,1030,1030,1030,1030,1030,40,1030,1030,1030,1030,1030,1030,1030,1030,1030,60,19,23,9,9,17,26,22,13,1030,1030,1030,1030,1030,1030,1030,1030,11,22,23,264,264,1030,87,107,88,88,111,117,143,132,75,7,13,1030,259,108,109,113,5,4,5,52,23,47,0,0,0,0,0,8,1030,11,1030,5,11,8,0,1030,0,1,11,17,0,1030,1030,1030,0,0,1030,1030,0,0,0,0,0,0,0,0,1030,64,0,0,0,0,0,49,0,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,1030,6,0,7,0,63,41,32,9,0,18,54,1,3,0,25,17,19,14,0,38,13,17,14,0,0,0,0,0,0,14,52,34,20,0,109,84,74,71,0,42,49,73,18,0
ARM,0,0,0,0,0,0,7,5,26,7,18,1,8,2,0,0,0,0,0,0,0,0,0,0,0,4,15,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1100,1,0,2,4,17,29,38,10,27,47,42,49,1100,1,0,2,17,46,25,55,24,85,145,65,63,63,29,2,3,7,3,1100,10,10,4,21,1,22,102,4,4,0,11,13,7,17,18,1025,1083,1018,1068,1077,455,19,44,12,50,22,92,16,5,9,18,59,81,19,8,34,10,306,39,51,41,52,48,80,85,185,69,237,274,188,210,1100,1100,1100,1100,1100,1100,200,1100,1100,1100,1100,1100,1100,1100,1100,0,0,212,148,230,170,116,65,205,54,59,189,115,109,86,58,42,65,18,11,4,4,8,51,13,14,181,109,114,32,185,34,62,213,50,41,37,23,18,22,11,59,10,10,16,118,134,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,3,28,25,75,99,111,27,7,18,2,9,38,78,0,5,9,107,98,2,22,2,3,61,55,138,314,95,74,9,7,3,11,8,7,3,65,40,42,19,77,5,4,5,11,31,3,3,114,1100,1100,1100,1100,1100,1100,1100,1100,120,1100,1100,1100,1100,1100,1100,1100,33,2,3,0,9,6,6,5,4,1100,1100,1100,1100,1100,1100,1100,1100,0,7,10,281,281,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,0,207,212,214,212,213,0,19,11,24,8,0,0,0,0,0,4,1100,2,1100,0,0,0,2,1100,9,41,2,25,0,1100,0,18,0,0,1100,1100,0,0,0,0,0,0,0,0,1100,109,0,0,0,0,0,55,0,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,1100,0,0,2,0,63,32,17,7,0,1,13,8,1,0,7,11,8,5,0,8,39,51,33,0,0,0,0,0,0,1,38,10,2,0,7,65,40,25,0,51,46,70,27,0
AUL,0,0,0,0,0,0,8,51,56,72,69,57,13,12,0,0,0,0,0,0,0,0,0,0,0,15,11,30,43,43,47,48,47,48,37,55,46,521,0,0,0,0,0,0,0,0,0,1477,19,18,22,21,20,14,40,14,20,17,18,25,1477,12,8,18,26,46,26,46,18,28,35,45,51,39,33,30,29,29,29,1477,30,30,29,26,24,6,23,21,79,14,29,52,47,54,274,519,1264,1185,1244,1389,55,30,33,29,30,26,28,16,41,43,48,62,49,27,28,34,33,39,25,37,29,31,38,36,32,43,29,35,31,25,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,0,0,30,44,46,51,42,48,45,35,38,38,46,47,47,31,31,36,6,12,24,24,16,17,15,30,37,28,40,14,38,47,46,45,40,38,26,14,63,67,29,16,18,35,27,28,27,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,15,21,26,31,28,29,0,0,0,11,19,54,83,32,30,36,35,26,15,16,18,20,17,23,25,27,22,15,8,11,16,11,11,31,18,17,21,23,23,1477,9,13,9,8,54,40,29,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,62,1477,1477,1477,1477,84,22,59,19,30,45,43,32,29,1477,1477,1477,1477,1477,1477,1477,1477,12,22,29,71,71,1477,29,64,40,49,47,43,44,39,37,17,26,14,101,66,68,64,42,69,64,26,30,55,0,9,9,9,9,36,36,39,39,1477,13,13,425,77,211,82,17,1477,62,1477,20,1477,0,0,1477,1477,0,0,0,0,0,0,1477,0,1477,47,0,0,0,0,0,46,0,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,8,0,7,0,39,8,20,5,0,57,15,16,10,0,11,11,11,10,0,28,25,37,24,0,0,0,0,0,0,19,40,14,11,0,31,17,21,15,0,43,37,46,34,0
AZE,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,29,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1002,0,0,0,0,15,4,3,0,2,6,0,0,1002,0,0,2,0,2,0,2,0,2,73,19,10,14,0,0,0,0,0,1002,0,0,0,0,0,7,5,0,0,0,0,0,0,0,0,961,997,972,987,1000,1,0,2,0,0,0,1,6,5,7,33,52,50,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,0,0,0,33,62,46,42,0,0,0,0,0,0,0,0,0,0,0,18,0,0,0,0,0,0,0,0,0,0,0,68,25,40,68,4,3,4,1,6,3,3,1,0,0,0,0,0,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,4,19,9,14,23,18,1,0,0,0,0,9,24,2,23,23,9,6,0,5,12,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1002,1002,1002,1002,1002,1002,1002,1002,1002,0,1002,1002,1002,1002,1002,1002,1002,0,0,0,0,0,0,0,0,0,1002,1002,1002,1002,1002,1002,1002,1002,0,0,0,16,16,1002,34,82,44,90,43,58,97,103,46,0,0,0,240,240,240,240,240,0,0,0,3,0,0,0,0,0,0,0,1002,0,1002,0,0,0,0,1002,4,0,0,0,0,1002,0,0,0,0,0,1002,0,0,0,0,0,0,0,0,1002,4,0,0,0,0,0,2,0,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,0,0,0,0,14,0,15,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,0,0,0,0,0,0,0,1,2,3,0,0
BLR,0,0,0,0,0,0,6,13,23,20,14,19,84,21,0,0,0,0,0,0,0,0,0,0,0,4,116,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1535,86,66,107,118,15,10,13,13,10,8,1,3,1535,3,10,5,3,34,5,38,4,34,364,10,10,14,3,4,7,8,15,1535,5,7,7,6,5,8,41,3,4,8,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,58,5,5,3,4,3,32,5,3,7,9,14,13,7,3,5,5,18,6,7,8,14,17,15,12,14,16,18,27,20,1535,1535,1535,1535,1535,1535,1535,19,1535,1535,1535,1535,1535,1535,1535,1535,0,0,17,15,18,8,8,14,15,14,14,16,14,17,19,14,6,15,33,38,9,9,7,7,8,20,34,23,33,10,233,242,236,256,101,92,121,6,108,115,81,7,9,15,16,26,22,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,147,253,104,365,721,824,8,4,13,29,75,44,67,66,66,77,93,104,39,62,56,18,4,4,8,11,9,10,6,2,5,7,4,16,8,7,5,4,5,1535,6,3,2,2,14,30,10,1535,1535,1535,1535,1535,1535,1535,1535,1535,22,1535,1535,1535,1535,1535,1535,1535,32,9,18,4,12,20,32,18,18,1535,1535,1535,1535,1535,1535,1535,1535,7,34,37,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,0,1,25,26,30,32,8,917,921,11,16,0,0,0,0,0,0,1535,0,1535,0,0,0,0,1535,62,0,0,0,0,1535,19,0,0,0,0,1535,0,0,0,0,0,0,1535,0,1535,49,0,0,0,0,0,38,0,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,1535,2,0,1,0,14,98,15,4,0,19,8,7,3,0,2,7,4,1,0,3,6,7,3,0,0,0,0,0,0,86,13,13,7,0,16,7,5,1,0,32,28,47,13,0
BRA,0,0,0,0,0,0,1,3,6,11,3,2,1,1,0,0,0,0,0,0,0,0,0,0,0,3,11,6,24,14,16,12,15,14,7,14,11,12,0,0,0,0,0,0,0,0,0,1486,11,17,14,5,12,13,61,18,31,42,19,24,1486,6,1,1,69,150,29,111,16,94,88,34,60,27,17,8,7,8,5,3,6,5,4,8,3,7,118,7,5,4,41,118,41,38,61,848,1425,1258,1306,1360,298,28,53,16,81,25,52,6,9,3,12,36,80,14,83,19,9,86,6,5,15,16,35,12,43,42,9,57,89,53,1486,1486,1486,1486,1486,1486,387,1486,1486,1486,1486,1486,1486,1486,1486,1486,0,0,308,87,116,127,107,127,170,99,108,163,140,111,103,58,56,71,42,19,8,8,12,8,27,4,54,38,59,4,137,48,40,55,91,88,71,30,43,42,25,40,17,21,16,83,102,13,5,5,6,44,9,11,29,4,24,7,18,15,60,58,82,14,14,6,8,31,67,76,19,24,28,57,74,4,6,4,9,54,54,67,139,50,35,14,21,5,22,9,83,46,18,30,50,13,40,5,9,5,7,36,14,15,1486,1486,1486,1486,1486,1486,1486,141,1486,1486,1486,1486,1486,1486,1486,1486,1486,23,11,13,4,3,12,19,12,5,1486,1486,1486,1486,1486,1486,1486,1486,23,33,37,253,253,1486,146,287,176,127,195,214,130,189,59,40,46,0,326,163,160,164,86,75,52,47,20,27,0,0,0,0,0,10,1486,13,1486,0,2,0,8,1486,3,0,0,0,180,1486,0,0,0,0,1486,1486,5,0,0,0,0,0,1,0,1486,181,0,0,0,0,0,111,0,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,1486,2,0,9,0,27,13,12,1,0,2,27,12,8,0,21,22,9,10,0,83,6,5,5,0,0,0,0,0,0,11,61,18,11,0,83,18,30,19,0,86,126,163,49,0
CHL,0,0,0,0,0,0,0,11,8,12,25,8,3,1,0,0,0,0,0,0,0,0,0,0,0,12,29,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1000,16,19,38,30,35,48,43,37,60,87,8,31,1000,5,0,3,9,32,12,25,10,23,121,79,79,80,87,76,76,73,75,1000,77,86,82,84,79,6,54,27,20,17,25,32,17,27,40,789,961,769,836,850,291,16,73,20,27,20,34,1,23,36,65,146,140,11,8,15,11,84,11,15,15,14,22,30,26,20,20,34,80,45,1000,1000,1000,1000,1000,1000,165,1000,1000,1000,1000,1000,1000,1000,1000,1000,0,0,126,113,119,78,61,78,104,41,44,72,127,65,71,44,17,21,27,15,17,17,32,247,37,24,98,44,85,35,148,108,145,115,7,5,3,5,3,3,2,57,13,51,37,100,150,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,20,23,24,88,122,106,9,10,13,13,36,60,56,31,41,50,67,92,2,0,10,17,57,77,83,154,63,13,24,15,11,25,31,74,73,46,47,48,83,1000,20,18,24,4,54,28,15,1000,1000,1000,1000,1000,1000,1000,1000,157,1000,1000,1000,1000,1000,1000,1000,1000,96,3,15,4,4,14,9,7,7,1000,1000,1000,1000,1000,1000,1000,1000,2,26,25,197,197,1000,99,193,149,188,141,163,231,179,215,27,33,0,247,181,164,161,125,2,523,58,5,81,0,0,0,0,0,2,1000,2,1000,0,0,0,0,1000,20,12,0,0,0,1000,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1000,38,0,0,0,0,0,25,0,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000,2,0,8,0,80,9,35,15,0,8,37,32,4,0,15,25,31,17,0,8,11,15,2,0,0,0,0,0,0,16,43,37,18,0,74,46,47,45,0,19,23,35,7,0
CHN,0,0,0,0,0,0,29,51,101,190,107,239,28,15,0,0,0,0,0,0,0,0,0,0,0,48,104,22,0,3,2,3,1,3,2,1,3,164,0,0,0,0,0,0,0,0,0,2300,154,213,220,235,295,252,233,197,286,328,132,179,2300,0,0,55,248,248,225,229,253,254,155,132,165,281,122,122,132,139,130,128,132,133,141,137,138,247,323,48,49,48,113,113,113,113,129,2186,2234,2262,2263,2265,2300,170,333,177,179,178,355,132,173,227,285,1233,1111,740,223,337,261,867,226,274,203,295,265,367,328,466,325,677,754,779,2300,1449,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,0,0,1214,609,623,564,529,311,673,400,332,740,352,334,478,306,236,349,379,155,134,134,61,59,88,276,356,990,1484,374,551,1303,645,1435,346,346,348,465,376,412,372,451,387,478,453,731,780,570,433,398,476,497,458,514,507,491,574,215,257,298,392,348,426,280,305,370,215,246,251,301,333,377,366,492,771,347,355,366,378,458,486,710,755,539,448,364,369,366,436,409,446,418,437,408,467,418,489,391,378,365,283,622,326,308,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,594,2300,2300,2300,2300,330,192,197,188,202,200,205,201,198,2300,2300,2300,2300,2300,2300,2300,2300,186,272,301,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,0,875,884,915,911,855,15,972,144,108,245,0,0,0,0,0,2300,2300,2300,2300,2300,0,0,0,2300,294,15,2,6,0,2300,0,0,0,0,0,2300,0,0,0,0,0,0,0,0,2300,307,0,0,0,0,0,229,0,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,203,0,141,0,281,283,295,167,0,239,88,61,65,0,369,436,409,391,0,223,226,274,227,0,0,0,0,0,0,154,233,197,166,0,446,437,408,415,0,229,248,275,202,0
COL,0,0,0,0,0,0,0,2,2,7,2,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,11,0,1,0,6,0,2,5,2,4,3,4,0,0,0,0,0,0,0,0,0,1512,3,10,20,8,12,26,55,7,18,50,5,18,1512,0,3,1,12,32,6,11,2,7,49,24,24,14,4,2,2,4,2,3,7,6,6,2,4,1,22,3,2,2,24,8,5,3,19,1156,1315,1237,1403,1432,262,15,72,16,16,18,26,1,4,1,9,32,57,5,8,8,8,38,5,23,12,18,26,14,20,17,16,26,47,28,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,453,1512,1512,0,0,166,83,69,52,59,41,89,40,52,73,146,61,42,30,18,40,5,10,5,5,5,5,12,2,37,17,23,17,49,49,36,45,17,16,17,6,0,7,0,10,3,26,12,39,52,2,0,3,3,11,4,7,3,3,5,2,12,10,24,35,70,3,0,2,24,22,6,31,4,4,1512,21,27,0,1,2,3,10,20,13,53,20,13,8,6,2,4,1,39,18,10,20,32,6,64,3,1,2,1,22,8,2,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,461,1512,1512,1512,104,4,4,1,1,4,6,6,1,1512,1512,1512,1512,1512,1512,1512,1512,0,6,6,155,155,1512,92,184,123,70,116,128,84,134,106,0,0,0,122,123,123,123,122,3,555,14,15,17,0,0,0,0,0,0,1512,0,1512,0,0,0,16,1512,95,0,3,3,0,1512,2,5,0,0,1512,1512,0,0,0,0,0,0,1512,0,1512,23,0,0,0,0,0,11,0,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1,0,0,0,14,2,12,1,0,1,12,5,2,0,6,4,1,1,0,8,5,23,4,0,0,0,0,0,0,3,55,7,4,0,39,10,20,10,0,10,25,31,4,0


In [12]:
# calculate proportion missing
pct_missing = pd.DataFrame(wvs_w6.isna().sum())
pct_missing = pct_missing.reset_index().rename(columns = {'index':'variable', 0:'NA_count'})
pct_missing

Unnamed: 0,variable,NA_count
0,V1,0
1,V2,0
2,V2A,0
3,cow,0
4,C_COW_ALPHA,0
5,B_COUNTRY_ALPHA,0
6,V3,0
7,V4,341
8,V5,545
9,V6,1035


In [13]:
pct_missing['NA_pct'] = (pct_missing['NA_count'] / len(wvs_w6)) * 100
pct_missing['NA_pct'] = pct_missing['NA_pct'].round(decimals=2)
pct_missing

Unnamed: 0,variable,NA_count,NA_pct
0,V1,0,0.0
1,V2,0,0.0
2,V2A,0,0.0
3,cow,0,0.0
4,C_COW_ALPHA,0,0.0
5,B_COUNTRY_ALPHA,0,0.0
6,V3,0,0.0
7,V4,341,0.38
8,V5,545,0.61
9,V6,1035,1.16


In [14]:
# how many columns contain missing values?
print(np.count_nonzero(wvs_w6.isna().sum() != 0), 'columns contain missing values')

# how many columns do not?
print(np.count_nonzero(wvs_w6.isna().sum() == 0), 'columns DO NOT contain missing values')

414 columns contain missing values
28 columns DO NOT contain missing values


#### Observations so far:
This data set contains 28 columns without any missing information, and 414 columns (out of 442) that contain at least 1 missing value.

#### Next steps:
- figure out if these missing values matter for my analyses
- decide what to do about missing values

In [15]:
# list columns containing missing data
wvs_w6.columns[wvs_w6.isna().any()].tolist()

['V4',
 'V5',
 'V6',
 'V7',
 'V8',
 'V9',
 'V10',
 'V11',
 'V12',
 'V13',
 'V14',
 'V15',
 'V16',
 'V17',
 'V18',
 'V19',
 'V20',
 'V21',
 'V22',
 'V23',
 'V24',
 'V25',
 'V26',
 'V27',
 'V28',
 'V29',
 'V30',
 'V31',
 'V32',
 'V33',
 'V34',
 'V35',
 'V36',
 'V37',
 'V38',
 'V39',
 'V40',
 'V41',
 'V42',
 'V43',
 'V44',
 'V44_ES',
 'V45',
 'V46',
 'V47',
 'V48',
 'V49',
 'V50',
 'V51',
 'V52',
 'V53',
 'V54',
 'V55',
 'V56',
 'V56_NZ',
 'V57',
 'V58',
 'V59',
 'V60',
 'V61',
 'V62',
 'V63',
 'V64',
 'V65',
 'V66',
 'V67',
 'V68',
 'V69',
 'V70',
 'V71',
 'V72',
 'V73',
 'V74',
 'V74B',
 'V75',
 'V76',
 'V77',
 'V78',
 'V79',
 'V80',
 'V81',
 'V82',
 'V83',
 'V84',
 'V85',
 'V86',
 'V87',
 'V88',
 'V89',
 'V90',
 'V91',
 'V92',
 'V93',
 'V94',
 'V95',
 'V96',
 'V97',
 'V98',
 'V99',
 'V100',
 'V101',
 'V102',
 'V103',
 'V104',
 'V105',
 'V106',
 'V107',
 'V108',
 'V109',
 'V110',
 'V111',
 'V112',
 'V113',
 'V114',
 'V115',
 'V116',
 'V117',
 'V118',
 'V119',
 'V120',
 'V121',
 'V122',


In [16]:
# view variables containing missing values and % missing
pct_missing[pct_missing['NA_count'] != 0]

Unnamed: 0,variable,NA_count,NA_pct
7,V4,341,0.38
8,V5,545,0.61
9,V6,1035,1.16
10,V7,1620,1.81
11,V8,1519,1.7
12,V9,1348,1.51
13,V10,758,0.85
14,V11,326,0.36
15,V12,14,0.02
16,V13,6,0.01


In [17]:
# create list of variables where pct missing is 50% or higher
half_missing = pct_missing[pct_missing['NA_pct'] >= 50.00]['variable'].tolist()
half_missing

['V44_ES',
 'V56_NZ',
 'V74B',
 'V90',
 'V91',
 'V92',
 'V93',
 'V94',
 'V125_00',
 'V125_01',
 'V125_02',
 'V125_03',
 'V125_04',
 'V125_05',
 'V125_06',
 'V125_07',
 'V125_08',
 'V125_09',
 'V125_10',
 'V125_11',
 'V125_12',
 'V125_13',
 'V125_14',
 'V125_15',
 'V160A',
 'V160B',
 'V160C',
 'V160D',
 'V160E',
 'V160F',
 'V160G',
 'V160H',
 'V160I',
 'V160J',
 'V207A',
 'V215_01',
 'V215_02',
 'V215_03',
 'V215_04',
 'V215_05',
 'V215_06',
 'V215_07',
 'V215_08',
 'V215_10',
 'V215_11',
 'V215_12',
 'V215_13',
 'V215_14',
 'V215_15',
 'V215_16',
 'V215_17',
 'V215_18',
 'V218_ESMA',
 'V217_ESMA',
 'V219_ESMA',
 'V220_ESMA',
 'V221_ESMA',
 'V222_ESMA',
 'V223_ESMA',
 'V224_ESMA',
 'V228_2',
 'V243_AU',
 'V244_AU',
 'V248_CS',
 'V253_CS',
 'V256B',
 'V256C',
 'V265',
 'MN_35A',
 'MN_163A',
 'MN_163B',
 'MN_163C',
 'MN_228L',
 'MN_228M',
 'MN_228N',
 'MN_228O',
 'MN_228P',
 'MN_228Q',
 'MN_228R',
 'MN_228S1',
 'MN_228S2',
 'MN_228S3',
 'MN_228S4',
 'MN_228S5',
 'MN_228S6',
 'MN_228S7',
 

### Options for handling missing data:  
Advice from https://heartbeat.fritz.ai/data-handling-scenarios-part-2-working-with-missing-values-in-a-dataset-34b758cfc9fa and https://analyticsindiamag.com/5-ways-handle-missing-values-machine-learning-datasets/  
  
**Drop rows and columns with missing data**  
1. pros: 
  - quick and easy approach 
2. cons: 
  - could mean losing important information about the data along with the missing values
  - when using your model in production, the model will not automatically know how to handle missing data
3. when this makes sense: 
  - rows containing NULL values (missing values) are around 5% (or less) of the total data
  - NULL values in columns are significantly more than the other values present; it wouldn’t make sense to keep these, as they hold little or no descriptive information about the data  
  
**Mean/Median (numerical) & Mode (categorical) imputation**  
1. pros: 
  - easy to do
  - can be integrated into production or for a future unknown dataset
2. cons: 
  - distorts the distribution of the dataset
  - distorts the variance and covariance of the dataset
  - for mode imputation, may lead to an over-representation of the most frequent label if the missing values are quite large
3. when this makes sense: 
  - mean imputation works best for normally distributed distributions
  - median is better for skewed distributions 
  - mode imputation for categorical data works best if the missing values are missing at random
  - best to use this method when the missing values are around 5% (or less) of the total data
  
**Systematic Random Sampling Imputation**  
1. pros: 
  - does not distort variance or distribution 
2. cons: 
  - when replacing missing values in the test set as well, the imputed values from the train set will need to be stored in memory
3. when this makes sense: 
  - can be applied to both numerical and categorical variables
  - used when the values are missing at random
  - when we want to be able to reproduce the same value every time the variable is used (by using a random state)
  
### Remaining Questions:
Is "stratified" mean/median imputation an option?

In [18]:
# first step in droping columns with 50% or more missing observations
half_missing

['V44_ES',
 'V56_NZ',
 'V74B',
 'V90',
 'V91',
 'V92',
 'V93',
 'V94',
 'V125_00',
 'V125_01',
 'V125_02',
 'V125_03',
 'V125_04',
 'V125_05',
 'V125_06',
 'V125_07',
 'V125_08',
 'V125_09',
 'V125_10',
 'V125_11',
 'V125_12',
 'V125_13',
 'V125_14',
 'V125_15',
 'V160A',
 'V160B',
 'V160C',
 'V160D',
 'V160E',
 'V160F',
 'V160G',
 'V160H',
 'V160I',
 'V160J',
 'V207A',
 'V215_01',
 'V215_02',
 'V215_03',
 'V215_04',
 'V215_05',
 'V215_06',
 'V215_07',
 'V215_08',
 'V215_10',
 'V215_11',
 'V215_12',
 'V215_13',
 'V215_14',
 'V215_15',
 'V215_16',
 'V215_17',
 'V215_18',
 'V218_ESMA',
 'V217_ESMA',
 'V219_ESMA',
 'V220_ESMA',
 'V221_ESMA',
 'V222_ESMA',
 'V223_ESMA',
 'V224_ESMA',
 'V228_2',
 'V243_AU',
 'V244_AU',
 'V248_CS',
 'V253_CS',
 'V256B',
 'V256C',
 'V265',
 'MN_35A',
 'MN_163A',
 'MN_163B',
 'MN_163C',
 'MN_228L',
 'MN_228M',
 'MN_228N',
 'MN_228O',
 'MN_228P',
 'MN_228Q',
 'MN_228R',
 'MN_228S1',
 'MN_228S2',
 'MN_228S3',
 'MN_228S4',
 'MN_228S5',
 'MN_228S6',
 'MN_228S7',
 

In [19]:
len(half_missing)

110

#### Re-insert variables that shouldn't be dropped
- V74B (Schwartz value scale item)
- V207A (euthanasia justifiable); curious to see if this could be imputed
- V215_01 - V215_18; use these to create a "sense of belonging to political/economic union" variable (V215_B)

In [20]:
# create a for loop to re-insert variables into the list that shouldn't be dropped (at this point)
# original list: high_missings_list
# new list
vars_to_keep = ['V56_NZ', 'V74B', 'V207A', 'V215_01', 'V215_02', 'V215_03', 'V215_04', 'V215_05', 
                'V215_06', 'V215_07', 'V215_08', 'V215_10', 'V215_11', 'V215_12', 'V215_13', 'V215_14', 
                'V215_15', 'V215_16', 'V215_17', 'V215_18']

vars_to_drop = []

for variable in half_missing:
    if variable not in vars_to_keep:
        
        vars_to_drop.append(variable)

print(vars_to_drop)

['V44_ES', 'V90', 'V91', 'V92', 'V93', 'V94', 'V160A', 'V160B', 'V160C', 'V160D', 'V160E', 'V160F', 'V160G', 'V160H', 'V160I', 'V160J', 'V218_ESMA', 'V217_ESMA', 'V219_ESMA', 'V220_ESMA', 'V221_ESMA', 'V222_ESMA', 'V223_ESMA', 'V224_ESMA', 'V228_2', 'V243_AU', 'V244_AU', 'V248_CS', 'V253_CS', 'V256B', 'V256C', 'V265', 'MN_35A', 'MN_163A', 'MN_163B', 'MN_163C', 'MN_228L', 'MN_228M', 'MN_228N', 'MN_228O', 'MN_228P', 'MN_228Q', 'MN_228R', 'MN_228S1', 'MN_228S2', 'MN_228S3', 'MN_228S4', 'MN_228S5', 'MN_228S6', 'MN_228S7', 'MN_228S8', 'MN_229A', 'MN_229B', 'MN_230A', 'MN_233A', 'MN_233B', 'MN_234A', 'MN_237A', 'MN_237B1', 'MN_237B2', 'MN_237B3', 'MN_237B4', 'MN_237B5', 'MN_237B6', 'MN_237B7', 'MN_237C1', 'MN_237C2', 'MN_237C3', 'MN_237C4', 'MN_237C5', 'MN_237C6', 'MN_249A1', 'MN_249A2', 'MN_249A3']


In [21]:
len(vars_to_drop)

74

In [22]:
# view original imported data set
wvs_w6.head()

Unnamed: 0,V1,V2,V2A,cow,C_COW_ALPHA,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V44_ES,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V90,V91,V92,V93,V94,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V160A,V160B,V160C,V160D,V160E,V160F,V160G,V160H,V160I,V160J,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V218_ESMA,V217_ESMA,V219_ESMA,V220_ESMA,V221_ESMA,V222_ESMA,V223_ESMA,V224_ESMA,V225,V226,V227,V228,V228_LOCAL,V228_2,V228A,V228B,V228C,V228D,V228E,V228F,V228G,V228H,V228I,V228J,V228K,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V241,V242,X003R2,X003R,V243,V243_AU,V244,V244_AU,V245,V246,V247,V248,V248_CS,V249,V250,V251,V252,V253,V253_CS,V254,V255,N_REGION_ISO,V256,V256B,V256C,V257,V258,V258A,S018,S019,V260,V261,V262,V265,Y001,Y001_1,Y001_2,Y001_3,Y001_4,Y001_5,Y002,Y003,MN_35A,MN_163A,MN_163B,MN_163C,MN_228L,MN_228M,MN_228N,MN_228O,MN_228P,MN_228Q,MN_228R,MN_228S1,MN_228S2,MN_228S3,MN_228S4,MN_228S5,MN_228S6,MN_228S7,MN_228S8,MN_229A,MN_229B,MN_230A,MN_233A,MN_233B,MN_234A,MN_237A,MN_237B1,MN_237B2,MN_237B3,MN_237B4,MN_237B5,MN_237B6,MN_237B7,MN_237C1,MN_237C2,MN_237C3,MN_237C4,MN_237C5,MN_237C6,MN_249A1,MN_249A2,MN_249A3,sacsecval,secvalwgt,resemaval,weightb,I_AUTHORITY,I_NATIONALISM,I_DEVOUT,defiance,WEIGHT1A,I_RELIGIMP,I_RELIGBEL,I_RELIGPRAC,disbelief,WEIGHT2A,I_NORM1,I_NORM2,I_NORM3,relativism,WEIGHT3A,I_TRUSTARMY,I_TRUSTPOLICE,I_TRUSTCOURTS,scepticism,WEIGHT4A,I_INDEP,I_IMAGIN,I_NONOBED,autonomy,WEIGHT1B,I_WOMJOB,I_WOMPOL,I_WOMEDU,equality,WEIGHT2B,I_HOMOLIB,I_ABORTLIB,I_DIVORLIB,choice,WEIGHT3B,I_VOICE1,I_VOICE2,I_VOI2_00,voice,WEIGHT4B
0,6,12,12,615,ALG,DZA,1,1.0,1.0,1.0,,1.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,1.0,1.0,,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,7.0,4.0,,6.0,0.0,10.0,2.0,3.0,1.0,3.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,1.0,2.0,3.0,3.0,2.0,1.0,2.0,2.0,4.0,,,,,,,,,,,5.0,8.0,7.0,6.0,8.0,7.0,5.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,3.0,3.0,2.0,3.0,2.0,2.0,4.0,3.0,3.0,2.0,3.0,2.0,3.0,4.0,4.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,4.0,1.0,2.0,2.0,2.0,3.0,8.0,5.0,6.0,9.0,3.0,4.0,7.0,6.0,7.0,5.0,2.0,2.0,50000000.0,5.0,3.0,3.0,1.0,1.0,1.0,,,10.0,1.0,2.0,2.0,1.0,2.0,7.0,4.0,3.0,2.0,3.0,1.0,9.0,1.0,2.0,1.0,2.0,2.0,3.0,2.0,3.0,2.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,1.0,5.0,1.0,2.0,2.0,3.0,2.0,3.0,3.0,2.0,3.0,3.0,3.0,3.0,7.0,8.0,3.0,5.0,6.0,9.0,6.0,6.0,1.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,6.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,3.0,4.0,2.0,2.0,3.0,4.0,2.0,4.0,,,,,,,,,2.0,3.0,3.0,12005.0,12005.0,,3.0,4.0,3.0,3.0,3.0,3.0,4.0,4.0,4.0,2.0,1.0,6.0,,,,,,2.0,1.0,1.0,4.0,5.0,1.0,1993.0,21.0,1.0,1.0,2.0,,2.0,,1.0,1.0,110.0,7.0,,24.0,1.0,2.0,2.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,2.0,1,0,0,1,0,1.0,0.0,0.0,2.0,1.0,2.0,3.0,5.0,4.0,2.0,2.0,3.0,2.0,2.0,4.0,2.0,3.0,3.0,3.0,2.0,3.0,,,,,,,2.0,,,,,,,,,,,,,,1.0,2.0,1.0,0.221111,1.0,0.164352,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.333333,0.111111,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,0.33,0.33,0.44,1.0,1.0,0.0,0.0,0.333333,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.222222,0.074074,1.0,0.0,0.5,0.25,0.25,1.0
1,6,12,12,615,ALG,DZA,2,1.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,5.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,,1.0,,1.0,1.0,2.0,2.0,1.0,2.0,3.0,2.0,6.0,8.0,,6.0,0.0,10.0,2.0,1.0,2.0,3.0,4.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,2.0,1.0,1.0,1.0,3.0,2.0,2.0,2.0,2.0,2.0,1.0,1.0,2.0,3.0,,,,,,,,,,,5.0,7.0,5.0,5.0,4.0,4.0,6.0,1.0,3.0,3.0,3.0,3.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,3.0,2.0,2.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,3.0,1.0,3.0,2.0,1.0,2.0,8.0,8.0,8.0,9.0,2.0,6.0,4.0,2.0,4.0,4.0,3.0,1.0,50000000.0,5.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,10.0,1.0,1.0,1.0,1.0,4.0,6.0,4.0,4.0,1.0,2.0,3.0,8.0,2.0,3.0,2.0,1.0,2.0,2.0,4.0,4.0,2.0,3.0,2.0,4.0,1.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,4.0,8.0,4.0,6.0,4.0,8.0,3.0,4.0,7.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,3.0,5.0,1.0,2.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,4.0,3.0,4.0,2.0,3.0,3.0,,,,,,,,,3.0,2.0,3.0,12003.0,12003.0,,3.0,4.0,4.0,3.0,4.0,3.0,3.0,4.0,4.0,1.0,1.0,6.0,,,,,,2.0,2.0,2.0,3.0,6.0,2.0,1990.0,24.0,1.0,1.0,2.0,,2.0,,1.0,1.0,110.0,7.0,,25.0,1.0,1.0,2.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,2.0,0,1,0,0,1,2.0,-1.0,0.0,2.0,3.0,2.0,3.0,5.0,4.0,6.0,2.0,3.0,3.0,2.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,,,,,,,2.0,,,,,,,,,,,,,,2.0,,,0.276389,1.0,0.11,1.0,0.5,0.33,0.33,0.386667,1.0,0.33,0.0,0.166667,0.165556,1.0,1.0,0.0,0.0,0.333333,1.0,0.0,0.66,0.0,0.22,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.33,0.11,1.0,0.0,0.0,0.0,0.0,1.0,0.66,0.0,0.33,0.33,1.0
2,6,12,12,615,ALG,DZA,3,1.0,3.0,2.0,4.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,4.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,1.0,1.0,1.0,2.0,,1.0,,2.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,6.0,8.0,,6.0,0.0,6.0,2.0,4.0,1.0,2.0,1.0,4.0,1.0,2.0,2.0,2.0,1.0,2.0,1.0,1.0,4.0,3.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,,,3.0,3.0,3.0,,,,,,6.0,7.0,7.0,7.0,5.0,7.0,5.0,1.0,3.0,3.0,4.0,4.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,3.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,2.0,1.0,3.0,2.0,2.0,2.0,7.0,4.0,8.0,3.0,3.0,6.0,9.0,5.0,6.0,7.0,2.0,1.0,50000000.0,5.0,2.0,4.0,1.0,1.0,1.0,2.0,1.0,6.0,2.0,3.0,1.0,2.0,2.0,7.0,4.0,4.0,0.0,2.0,2.0,6.0,2.0,3.0,1.0,2.0,4.0,2.0,3.0,2.0,4.0,3.0,3.0,2.0,4.0,3.0,2.0,2.0,2.0,2.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,2.0,3.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,4.0,7.0,5.0,5.0,5.0,5.0,5.0,5.0,1.0,1.0,1.0,1.0,,1.0,4.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,3.0,2.0,,,,,2.0,,,,,,,,,,,,,4.0,3.0,4.0,2.0,2.0,4.0,3.0,1.0,1.0,,,,,,,,,2.0,2.0,3.0,,,,4.0,4.0,3.0,4.0,2.0,3.0,2.0,4.0,4.0,2.0,1.0,3.0,2.0,7.0,6.0,5.0,2.0,1.0,,1.0,4.0,6.0,2.0,1988.0,26.0,1.0,2.0,2.0,,2.0,,1.0,1.0,500.0,5.0,,18.0,1.0,1.0,1.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,1.0,0,0,1,0,0,2.0,-2.0,0.0,1.0,3.0,2.0,3.0,6.0,4.0,5.0,1.0,2.0,2.0,2.0,3.0,2.0,4.0,3.0,2.0,4.0,4.0,1.0,1.0,1.0,2.0,3.0,3.0,2.0,,,,,,,,,,,,,,1.0,2.0,1.0,0.304722,1.0,0.152361,1.0,0.5,0.0,0.0,0.166667,1.0,0.0,0.0,0.166667,0.055556,1.0,1.0,0.0,0.0,0.333333,1.0,0.33,1.0,0.66,0.663333,1.0,0.0,1.0,0.0,0.333333,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.333333,0.111111,1.0,0.33,0.0,0.165,0.165,1.0
3,6,12,12,615,ALG,DZA,4,1.0,1.0,3.0,4.0,3.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,,2.0,,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,6.0,8.0,,6.0,0.0,6.0,2.0,1.0,3.0,1.0,4.0,3.0,1.0,1.0,1.0,1.0,1.0,2.0,3.0,2.0,3.0,3.0,1.0,1.0,2.0,2.0,3.0,1.0,1.0,2.0,2.0,2.0,,,,,,,,,,,6.0,9.0,5.0,6.0,4.0,6.0,8.0,1.0,3.0,3.0,2.0,2.0,3.0,2.0,3.0,4.0,2.0,3.0,4.0,2.0,3.0,3.0,4.0,2.0,2.0,2.0,3.0,1.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,3.0,2.0,7.0,9.0,5.0,5.0,7.0,3.0,8.0,7.0,8.0,8.0,3.0,2.0,50000000.0,5.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,10.0,2.0,3.0,4.0,2.0,3.0,7.0,6.0,4.0,1.0,3.0,3.0,7.0,3.0,1.0,2.0,3.0,3.0,2.0,3.0,4.0,1.0,2.0,4.0,2.0,2.0,3.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,3.0,3.0,4.0,4.0,2.0,2.0,3.0,3.0,3.0,6.0,6.0,3.0,5.0,5.0,7.0,4.0,6.0,1.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,1.0,2.0,3.0,4.0,3.0,3.0,,,,,,,,,2.0,2.0,3.0,,,,2.0,4.0,3.0,3.0,2.0,3.0,2.0,2.0,2.0,1.0,3.0,1.0,1.0,8.0,5.0,6.0,2.0,1.0,,4.0,4.0,5.0,2.0,1986.0,28.0,1.0,2.0,2.0,,2.0,,1.0,1.0,500.0,6.0,,14.0,2.0,2.0,1.0,1.0,,12003.0,1.0,12005.0,12105.0,,,500.0,1.0,1.0,0.833333,1.25,5,,2014,,1.0,0,0,0,0,1,1.0,-1.0,0.0,2.0,2.0,2.0,3.0,7.0,5.0,6.0,2.0,3.0,2.0,2.0,3.0,2.0,2.0,4.0,3.0,3.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,2.0,,,,,,,,,,,,,,1.0,2.0,2.0,0.263056,1.0,0.096667,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.166667,0.055556,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,1.0,0.33,0.663333,1.0,0.0,0.0,0.0,0.0,1.0,0.5,0.33,0.33,0.386667,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0
4,6,12,12,615,ALG,DZA,5,1.0,1.0,1.0,2.0,1.0,1.0,1.0,3.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,1.0,1.0,2.0,2.0,1.0,1.0,2.0,,1.0,,1.0,1.0,1.0,2.0,1.0,3.0,2.0,2.0,6.0,6.0,,1.0,3.0,4.0,2.0,1.0,2.0,3.0,4.0,2.0,1.0,2.0,1.0,1.0,2.0,5.0,1.0,2.0,3.0,1.0,4.0,3.0,2.0,2.0,3.0,1.0,2.0,2.0,2.0,2.0,,,,,,,,,,,5.0,8.0,4.0,7.0,4.0,6.0,6.0,2.0,2.0,3.0,4.0,2.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,3.0,3.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,2.0,2.0,8.0,4.0,7.0,3.0,3.0,8.0,6.0,5.0,6.0,7.0,3.0,2.0,50000000.0,5.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,10.0,2.0,3.0,2.0,2.0,2.0,4.0,4.0,3.0,1.0,3.0,2.0,8.0,2.0,3.0,3.0,3.0,3.0,2.0,4.0,3.0,3.0,2.0,4.0,3.0,2.0,2.0,3.0,2.0,2.0,3.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,3.0,4.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,6.0,2.0,4.0,4.0,6.0,6.0,6.0,5.0,7.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,3.0,3.0,4.0,2.0,2.0,4.0,3.0,2.0,3.0,,,,,,,,,2.0,3.0,3.0,2.0,2.0,,3.0,3.0,4.0,2.0,3.0,3.0,4.0,3.0,3.0,1.0,2.0,3.0,2.0,5.0,6.0,9.0,2.0,2.0,1.0,2.0,3.0,7.0,2.0,1979.0,35.0,2.0,3.0,2.0,,2.0,,1.0,1.0,500.0,3.0,,8.0,1.0,1.0,1.0,1.0,,12003.0,1.0,12005.0,12105.0,,,110.0,1.0,1.0,0.833333,1.25,5,,2014,,2.0,0,1,0,0,1,2.0,1.0,0.0,2.0,3.0,3.0,3.0,4.0,7.0,4.0,2.0,2.0,3.0,2.0,3.0,1.0,4.0,3.0,1.0,3.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,2.0,,,,,,,,,,,,,,1.0,2.0,2.0,0.220833,1.0,0.239352,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,0.66,0.33,0.55,1.0,0.0,0.0,1.0,0.333333,1.0,0.0,0.0,0.66,0.22,1.0,0.0,0.0,0.222222,0.074074,1.0,0.66,0.0,0.33,0.33,1.0


In [23]:
# drop variables in the vars_to_drop list
cleaning_w6 = wvs_w6.drop(columns=vars_to_drop)

In [24]:
# check out current freq of missing values
cleaning_w6.isna().sum()

V1                     0
V2                     0
V2A                    0
cow                    0
C_COW_ALPHA            0
B_COUNTRY_ALPHA        0
V3                     0
V4                   341
V5                   545
V6                  1035
V7                  1620
V8                  1519
V9                  1348
V10                  758
V11                  326
V12                   14
V13                    6
V14                    7
V15                   17
V16                    9
V17                   13
V18                   12
V19                   18
V20                   15
V21                   19
V22                    3
V23                  586
V24                 2388
V25                  840
V26                  923
V27                  993
V28                 3211
V29                 3129
V30                 1118
V31                 2223
V32                 1055
V33                 1214
V34                 1197
V35                 9696
V36                 3979


In [25]:
# peek at data to ensure that correct columns are being dropped so far
cleaning_w6.head()

Unnamed: 0,V1,V2,V2A,cow,C_COW_ALPHA,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V225,V226,V227,V228,V228_LOCAL,V228A,V228B,V228C,V228D,V228E,V228F,V228G,V228H,V228I,V228J,V228K,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V241,V242,X003R2,X003R,V243,V244,V245,V246,V247,V248,V249,V250,V251,V252,V253,V254,V255,N_REGION_ISO,V256,V257,V258,V258A,S018,S019,V260,V261,V262,Y001,Y001_1,Y001_2,Y001_3,Y001_4,Y001_5,Y002,Y003,sacsecval,secvalwgt,resemaval,weightb,I_AUTHORITY,I_NATIONALISM,I_DEVOUT,defiance,WEIGHT1A,I_RELIGIMP,I_RELIGBEL,I_RELIGPRAC,disbelief,WEIGHT2A,I_NORM1,I_NORM2,I_NORM3,relativism,WEIGHT3A,I_TRUSTARMY,I_TRUSTPOLICE,I_TRUSTCOURTS,scepticism,WEIGHT4A,I_INDEP,I_IMAGIN,I_NONOBED,autonomy,WEIGHT1B,I_WOMJOB,I_WOMPOL,I_WOMEDU,equality,WEIGHT2B,I_HOMOLIB,I_ABORTLIB,I_DIVORLIB,choice,WEIGHT3B,I_VOICE1,I_VOICE2,I_VOI2_00,voice,WEIGHT4B
0,6,12,12,615,ALG,DZA,1,1.0,1.0,1.0,,1.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,1.0,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,7.0,4.0,,6.0,0.0,10.0,2.0,3.0,1.0,3.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,1.0,2.0,3.0,3.0,2.0,1.0,2.0,2.0,4.0,,,,,,5.0,8.0,7.0,6.0,8.0,7.0,5.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,3.0,3.0,2.0,3.0,2.0,2.0,4.0,3.0,3.0,2.0,3.0,2.0,3.0,4.0,4.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,4.0,1.0,2.0,2.0,2.0,3.0,8.0,5.0,6.0,9.0,3.0,4.0,7.0,6.0,7.0,5.0,2.0,2.0,50000000.0,5.0,3.0,3.0,1.0,1.0,1.0,,,10.0,1.0,2.0,2.0,1.0,2.0,7.0,4.0,3.0,2.0,3.0,1.0,9.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,1.0,5.0,1.0,2.0,2.0,3.0,2.0,3.0,3.0,2.0,3.0,3.0,3.0,3.0,7.0,8.0,3.0,5.0,6.0,9.0,6.0,6.0,1.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,6.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,3.0,4.0,2.0,2.0,3.0,4.0,2.0,4.0,2.0,3.0,3.0,12005.0,12005.0,3.0,4.0,3.0,3.0,3.0,3.0,4.0,4.0,4.0,2.0,1.0,6.0,,,,,,2.0,1.0,1.0,4.0,5.0,1.0,1993.0,21.0,1.0,1.0,2.0,2.0,1.0,1.0,110.0,7.0,24.0,1.0,2.0,2.0,1.0,12003.0,1.0,12005.0,12105.0,110.0,1.0,1.0,0.833333,1.25,5,,2014,2.0,1,0,0,1,0,1.0,0.0,0.221111,1.0,0.164352,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.333333,0.111111,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,0.33,0.33,0.44,1.0,1.0,0.0,0.0,0.333333,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.222222,0.074074,1.0,0.0,0.5,0.25,0.25,1.0
1,6,12,12,615,ALG,DZA,2,1.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,5.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,,1.0,1.0,2.0,2.0,1.0,2.0,3.0,2.0,6.0,8.0,,6.0,0.0,10.0,2.0,1.0,2.0,3.0,4.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,2.0,1.0,1.0,1.0,3.0,2.0,2.0,2.0,2.0,2.0,1.0,1.0,2.0,3.0,,,,,,5.0,7.0,5.0,5.0,4.0,4.0,6.0,1.0,3.0,3.0,3.0,3.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,3.0,2.0,2.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,3.0,1.0,3.0,2.0,1.0,2.0,8.0,8.0,8.0,9.0,2.0,6.0,4.0,2.0,4.0,4.0,3.0,1.0,50000000.0,5.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,10.0,1.0,1.0,1.0,1.0,4.0,6.0,4.0,4.0,1.0,2.0,3.0,8.0,2.0,3.0,2.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,4.0,8.0,4.0,6.0,4.0,8.0,3.0,4.0,7.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,3.0,5.0,1.0,2.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,4.0,3.0,4.0,2.0,3.0,3.0,3.0,2.0,3.0,12003.0,12003.0,3.0,4.0,4.0,3.0,4.0,3.0,3.0,4.0,4.0,1.0,1.0,6.0,,,,,,2.0,2.0,2.0,3.0,6.0,2.0,1990.0,24.0,1.0,1.0,2.0,2.0,1.0,1.0,110.0,7.0,25.0,1.0,1.0,2.0,1.0,12003.0,1.0,12005.0,12105.0,110.0,1.0,1.0,0.833333,1.25,5,,2014,2.0,0,1,0,0,1,2.0,-1.0,0.276389,1.0,0.11,1.0,0.5,0.33,0.33,0.386667,1.0,0.33,0.0,0.166667,0.165556,1.0,1.0,0.0,0.0,0.333333,1.0,0.0,0.66,0.0,0.22,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.33,0.11,1.0,0.0,0.0,0.0,0.0,1.0,0.66,0.0,0.33,0.33,1.0
2,6,12,12,615,ALG,DZA,3,1.0,3.0,2.0,4.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,4.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,,2.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,6.0,8.0,,6.0,0.0,6.0,2.0,4.0,1.0,2.0,1.0,4.0,1.0,2.0,2.0,2.0,1.0,2.0,1.0,1.0,4.0,3.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,,,3.0,3.0,3.0,6.0,7.0,7.0,7.0,5.0,7.0,5.0,1.0,3.0,3.0,4.0,4.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,3.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,2.0,1.0,3.0,2.0,2.0,2.0,7.0,4.0,8.0,3.0,3.0,6.0,9.0,5.0,6.0,7.0,2.0,1.0,50000000.0,5.0,2.0,4.0,1.0,1.0,1.0,2.0,1.0,6.0,2.0,3.0,1.0,2.0,2.0,7.0,4.0,4.0,0.0,2.0,2.0,6.0,2.0,3.0,1.0,2.0,4.0,2.0,2.0,2.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,2.0,3.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,4.0,7.0,5.0,5.0,5.0,5.0,5.0,5.0,1.0,1.0,1.0,1.0,,1.0,4.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,3.0,2.0,,,,,2.0,,,,,,,,,,,,,4.0,3.0,4.0,2.0,2.0,4.0,3.0,1.0,1.0,2.0,2.0,3.0,,,4.0,4.0,3.0,4.0,2.0,3.0,2.0,4.0,4.0,2.0,1.0,3.0,2.0,7.0,6.0,5.0,2.0,1.0,,1.0,4.0,6.0,2.0,1988.0,26.0,1.0,2.0,2.0,2.0,1.0,1.0,500.0,5.0,18.0,1.0,1.0,1.0,1.0,12003.0,1.0,12005.0,12105.0,110.0,1.0,1.0,0.833333,1.25,5,,2014,1.0,0,0,1,0,0,2.0,-2.0,0.304722,1.0,0.152361,1.0,0.5,0.0,0.0,0.166667,1.0,0.0,0.0,0.166667,0.055556,1.0,1.0,0.0,0.0,0.333333,1.0,0.33,1.0,0.66,0.663333,1.0,0.0,1.0,0.0,0.333333,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.333333,0.111111,1.0,0.33,0.0,0.165,0.165,1.0
3,6,12,12,615,ALG,DZA,4,1.0,1.0,3.0,4.0,3.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,6.0,8.0,,6.0,0.0,6.0,2.0,1.0,3.0,1.0,4.0,3.0,1.0,1.0,1.0,1.0,1.0,2.0,3.0,2.0,3.0,3.0,1.0,1.0,2.0,2.0,3.0,1.0,1.0,2.0,2.0,2.0,,,,,,6.0,9.0,5.0,6.0,4.0,6.0,8.0,1.0,3.0,3.0,2.0,2.0,3.0,2.0,3.0,4.0,2.0,3.0,4.0,2.0,3.0,3.0,4.0,2.0,2.0,2.0,3.0,1.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,3.0,2.0,7.0,9.0,5.0,5.0,7.0,3.0,8.0,7.0,8.0,8.0,3.0,2.0,50000000.0,5.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,10.0,2.0,3.0,4.0,2.0,3.0,7.0,6.0,4.0,1.0,3.0,3.0,7.0,3.0,1.0,2.0,3.0,3.0,1.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,3.0,3.0,4.0,4.0,2.0,2.0,3.0,3.0,3.0,6.0,6.0,3.0,5.0,5.0,7.0,4.0,6.0,1.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,1.0,2.0,3.0,4.0,3.0,3.0,2.0,2.0,3.0,,,2.0,4.0,3.0,3.0,2.0,3.0,2.0,2.0,2.0,1.0,3.0,1.0,1.0,8.0,5.0,6.0,2.0,1.0,,4.0,4.0,5.0,2.0,1986.0,28.0,1.0,2.0,2.0,2.0,1.0,1.0,500.0,6.0,14.0,2.0,2.0,1.0,1.0,12003.0,1.0,12005.0,12105.0,500.0,1.0,1.0,0.833333,1.25,5,,2014,1.0,0,0,0,0,1,1.0,-1.0,0.263056,1.0,0.096667,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.166667,0.055556,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,1.0,0.33,0.663333,1.0,0.0,0.0,0.0,0.0,1.0,0.5,0.33,0.33,0.386667,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0
4,6,12,12,615,ALG,DZA,5,1.0,1.0,1.0,2.0,1.0,1.0,1.0,3.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,1.0,1.0,2.0,2.0,1.0,1.0,2.0,1.0,,1.0,1.0,1.0,2.0,1.0,3.0,2.0,2.0,6.0,6.0,,1.0,3.0,4.0,2.0,1.0,2.0,3.0,4.0,2.0,1.0,2.0,1.0,1.0,2.0,5.0,1.0,2.0,3.0,1.0,4.0,3.0,2.0,2.0,3.0,1.0,2.0,2.0,2.0,2.0,,,,,,5.0,8.0,4.0,7.0,4.0,6.0,6.0,2.0,2.0,3.0,4.0,2.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,3.0,3.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,2.0,2.0,8.0,4.0,7.0,3.0,3.0,8.0,6.0,5.0,6.0,7.0,3.0,2.0,50000000.0,5.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,10.0,2.0,3.0,2.0,2.0,2.0,4.0,4.0,3.0,1.0,3.0,2.0,8.0,2.0,3.0,3.0,3.0,3.0,2.0,2.0,3.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,3.0,4.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,6.0,2.0,4.0,4.0,6.0,6.0,6.0,5.0,7.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,3.0,3.0,4.0,2.0,2.0,4.0,3.0,2.0,3.0,2.0,3.0,3.0,2.0,2.0,3.0,3.0,4.0,2.0,3.0,3.0,4.0,3.0,3.0,1.0,2.0,3.0,2.0,5.0,6.0,9.0,2.0,2.0,1.0,2.0,3.0,7.0,2.0,1979.0,35.0,2.0,3.0,2.0,2.0,1.0,1.0,500.0,3.0,8.0,1.0,1.0,1.0,1.0,12003.0,1.0,12005.0,12105.0,110.0,1.0,1.0,0.833333,1.25,5,,2014,2.0,0,1,0,0,1,2.0,1.0,0.220833,1.0,0.239352,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.333333,1.0,0.66,0.66,0.33,0.55,1.0,0.0,0.0,1.0,0.333333,1.0,0.0,0.0,0.66,0.22,1.0,0.0,0.0,0.222222,0.074074,1.0,0.66,0.0,0.33,0.33,1.0


In [26]:
# original shape for comparison
wvs_w6.shape

(89565, 442)

In [27]:
# current shape so far
cleaning_w6.shape

(89565, 368)

In [28]:
# Columns to drop
# drop a handful of item scales at the end of the data set since these come from items that appear earlier in the survey
# also dropping their associated weights
cleaning_w6 = cleaning_w6.drop(['Y001_1', 'Y001_2', 'Y001_3', 'Y001_4', 'Y001_5', 'Y001', 'Y002', 'Y003', 'sacsecval',
 'secvalwgt', 'resemaval', 'weightb', 'I_AUTHORITY', 'I_NATIONALISM', 'I_DEVOUT', 'defiance', 'I_RELIGIMP', 'I_RELIGBEL',
 'I_RELIGPRAC', 'disbelief', 'I_NORM1', 'I_NORM2', 'I_NORM3', 'relativism', 'I_TRUSTARMY', 'I_TRUSTPOLICE', 'I_TRUSTCOURTS',
 'scepticism', 'I_INDEP', 'I_IMAGIN', 'I_NONOBED',  'autonomy',  'I_WOMJOB', 'I_WOMPOL', 'I_WOMEDU', 'equality',
 'I_HOMOLIB', 'I_ABORTLIB', 'I_DIVORLIB', 'choice', 'I_VOICE1', 'I_VOICE2', 'I_VOI2_00', 'voice', 'WEIGHT1A',  'WEIGHT2A', 
 'WEIGHT3A',  'WEIGHT4A', 'WEIGHT1B',  'WEIGHT2B',  'WEIGHT3B', 'WEIGHT4B'], axis=1)

In [29]:
cleaning_w6.shape

(89565, 316)

In [30]:
# dropping interviewer observations and other items with high proportion of missings
cleaning_w6 = cleaning_w6.drop(['V228', # items assessing country-specific political party preferences
 'V228_LOCAL', 'V228A', 'V228B', 'V228C', 'V228D', 'V228E', 'V228F', 'V228G', 'V228H', 'V228I', 'V228J', 'V228K',

# keep these employment, income, and savings items
# 'V230', 'V231', 'V232', 'V233', 'V234', 'V236', 'V237', 'V239' (# scale of incomes)
                                
 'V241', # year of birth
                                
# these X003 items are age groups; drop them since I'll use and scale the actual age values (from V242) anyway
 'X003R2', 'X003R',
                                
# keep these immigrant status items
# 'V243', 'V244', 'V245', 'V246', 'V247'
# keeping highest education level ('V248') 
                                
 'V249',
# 'V250', # respondent lives with parents
# items assessing whether respondent was interested; would be nice/interesting to include, but missings here would be
# difficult to impute
 'V251',
 'V252',
 'V253', # size of town; interesting, but arguably hard to impute missing values
 'V254', # ethnic group
 'V255', # literacy; difficult to impute
                                
# region where interview was conducted
 'N_REGION_ISO',
 'V256', 
 'V257', # interview language
 'V260', # questionnaire version
 'V261'], # date of interview
axis=1)

In [31]:
print(cleaning_w6.shape)

(89565, 289)


In [32]:
cleaning_w6.head()

Unnamed: 0,V1,V2,V2A,cow,C_COW_ALPHA,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V225,V226,V227,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V242,V243,V244,V245,V246,V247,V248,V250,V258,V258A,S018,S019,V262
0,6,12,12,615,ALG,DZA,1,1.0,1.0,1.0,,1.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,1.0,2.0,2.0,1.0,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,7.0,4.0,,6.0,0.0,10.0,2.0,3.0,1.0,3.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,1.0,2.0,3.0,3.0,2.0,1.0,2.0,2.0,4.0,,,,,,5.0,8.0,7.0,6.0,8.0,7.0,5.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,3.0,3.0,2.0,3.0,2.0,2.0,4.0,3.0,3.0,2.0,3.0,2.0,3.0,4.0,4.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,4.0,1.0,2.0,2.0,2.0,3.0,8.0,5.0,6.0,9.0,3.0,4.0,7.0,6.0,7.0,5.0,2.0,2.0,50000000.0,5.0,3.0,3.0,1.0,1.0,1.0,,,10.0,1.0,2.0,2.0,1.0,2.0,7.0,4.0,3.0,2.0,3.0,1.0,9.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,1.0,5.0,1.0,2.0,2.0,3.0,2.0,3.0,3.0,2.0,3.0,3.0,3.0,3.0,7.0,8.0,3.0,5.0,6.0,9.0,6.0,6.0,1.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,6.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,3.0,4.0,2.0,2.0,3.0,4.0,2.0,4.0,2.0,3.0,3.0,6.0,,,,,,2.0,1.0,1.0,4.0,5.0,1.0,21.0,2.0,2.0,1.0,1.0,110.0,7.0,1.0,1.0,1.0,0.833333,1.25,2014
1,6,12,12,615,ALG,DZA,2,1.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,5.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,,1.0,1.0,2.0,2.0,1.0,2.0,3.0,2.0,6.0,8.0,,6.0,0.0,10.0,2.0,1.0,2.0,3.0,4.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,2.0,1.0,1.0,1.0,3.0,2.0,2.0,2.0,2.0,2.0,1.0,1.0,2.0,3.0,,,,,,5.0,7.0,5.0,5.0,4.0,4.0,6.0,1.0,3.0,3.0,3.0,3.0,3.0,1.0,1.0,1.0,2.0,2.0,3.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,3.0,2.0,2.0,3.0,,,,4.0,,,,,,,,,,,,,0.0,0.0,3.0,1.0,3.0,2.0,1.0,2.0,8.0,8.0,8.0,9.0,2.0,6.0,4.0,2.0,4.0,4.0,3.0,1.0,50000000.0,5.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,10.0,1.0,1.0,1.0,1.0,4.0,6.0,4.0,4.0,1.0,2.0,3.0,8.0,2.0,3.0,2.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,4.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,4.0,8.0,4.0,6.0,4.0,8.0,3.0,4.0,7.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,3.0,5.0,1.0,2.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,4.0,3.0,4.0,2.0,3.0,3.0,3.0,2.0,3.0,6.0,,,,,,2.0,2.0,2.0,3.0,6.0,2.0,24.0,2.0,2.0,1.0,1.0,110.0,7.0,1.0,1.0,1.0,0.833333,1.25,2014
2,6,12,12,615,ALG,DZA,3,1.0,3.0,2.0,4.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,4.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,,2.0,3.0,1.0,1.0,1.0,1.0,1.0,1.0,6.0,8.0,,6.0,0.0,6.0,2.0,4.0,1.0,2.0,1.0,4.0,1.0,2.0,2.0,2.0,1.0,2.0,1.0,1.0,4.0,3.0,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,,,3.0,3.0,3.0,6.0,7.0,7.0,7.0,5.0,7.0,5.0,1.0,3.0,3.0,4.0,4.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,3.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,2.0,1.0,3.0,2.0,2.0,2.0,7.0,4.0,8.0,3.0,3.0,6.0,9.0,5.0,6.0,7.0,2.0,1.0,50000000.0,5.0,2.0,4.0,1.0,1.0,1.0,2.0,1.0,6.0,2.0,3.0,1.0,2.0,2.0,7.0,4.0,4.0,0.0,2.0,2.0,6.0,2.0,3.0,1.0,2.0,4.0,2.0,2.0,2.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,2.0,3.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,4.0,7.0,5.0,5.0,5.0,5.0,5.0,5.0,1.0,1.0,1.0,1.0,,1.0,4.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,3.0,2.0,,,,,2.0,,,,,,,,,,,,,4.0,3.0,4.0,2.0,2.0,4.0,3.0,1.0,1.0,2.0,2.0,3.0,3.0,2.0,7.0,6.0,5.0,2.0,1.0,,1.0,4.0,6.0,2.0,26.0,2.0,2.0,1.0,1.0,500.0,5.0,1.0,1.0,1.0,0.833333,1.25,2014
3,6,12,12,615,ALG,DZA,4,1.0,1.0,3.0,4.0,3.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,1.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,6.0,8.0,,6.0,0.0,6.0,2.0,1.0,3.0,1.0,4.0,3.0,1.0,1.0,1.0,1.0,1.0,2.0,3.0,2.0,3.0,3.0,1.0,1.0,2.0,2.0,3.0,1.0,1.0,2.0,2.0,2.0,,,,,,6.0,9.0,5.0,6.0,4.0,6.0,8.0,1.0,3.0,3.0,2.0,2.0,3.0,2.0,3.0,4.0,2.0,3.0,4.0,2.0,3.0,3.0,4.0,2.0,2.0,2.0,3.0,1.0,2.0,4.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,3.0,2.0,7.0,9.0,5.0,5.0,7.0,3.0,8.0,7.0,8.0,8.0,3.0,2.0,50000000.0,5.0,2.0,1.0,1.0,1.0,1.0,2.0,1.0,10.0,2.0,3.0,4.0,2.0,3.0,7.0,6.0,4.0,1.0,3.0,3.0,7.0,3.0,1.0,2.0,3.0,3.0,1.0,2.0,2.0,2.0,2.0,2.0,5.0,5.0,5.0,1.0,5.0,2.0,3.0,3.0,3.0,4.0,4.0,2.0,2.0,3.0,3.0,3.0,6.0,6.0,3.0,5.0,5.0,7.0,4.0,6.0,1.0,1.0,1.0,1.0,,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,2.0,2.0,3.0,1.0,2.0,3.0,4.0,3.0,3.0,2.0,2.0,3.0,1.0,1.0,8.0,5.0,6.0,2.0,1.0,,4.0,4.0,5.0,2.0,28.0,2.0,2.0,1.0,1.0,500.0,6.0,2.0,1.0,1.0,0.833333,1.25,2014
4,6,12,12,615,ALG,DZA,5,1.0,1.0,1.0,2.0,1.0,1.0,1.0,3.0,2.0,1.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,8.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,1.0,1.0,2.0,2.0,1.0,1.0,2.0,1.0,,1.0,1.0,1.0,2.0,1.0,3.0,2.0,2.0,6.0,6.0,,1.0,3.0,4.0,2.0,1.0,2.0,3.0,4.0,2.0,1.0,2.0,1.0,1.0,2.0,5.0,1.0,2.0,3.0,1.0,4.0,3.0,2.0,2.0,3.0,1.0,2.0,2.0,2.0,2.0,,,,,,5.0,8.0,4.0,7.0,4.0,6.0,6.0,2.0,2.0,3.0,4.0,2.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,3.0,3.0,3.0,2.0,3.0,3.0,2.0,4.0,3.0,2.0,,,,3.0,,,,,,,,,,,,,0.0,0.0,3.0,2.0,3.0,4.0,2.0,2.0,8.0,4.0,7.0,3.0,3.0,8.0,6.0,5.0,6.0,7.0,3.0,2.0,50000000.0,5.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,10.0,2.0,3.0,2.0,2.0,2.0,4.0,4.0,3.0,1.0,3.0,2.0,8.0,2.0,3.0,3.0,3.0,3.0,2.0,2.0,3.0,3.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,3.0,3.0,4.0,4.0,4.0,2.0,3.0,3.0,3.0,3.0,6.0,2.0,4.0,4.0,6.0,6.0,6.0,5.0,7.0,1.0,1.0,1.0,,1.0,3.0,,1.0,1.0,4.0,5.0,1.0,1.0,2.0,2.0,2.0,,,,,2.0,,,,,,,,,,,,,3.0,3.0,4.0,2.0,2.0,4.0,3.0,2.0,3.0,2.0,3.0,3.0,3.0,2.0,5.0,6.0,9.0,2.0,2.0,1.0,2.0,3.0,7.0,2.0,35.0,2.0,2.0,1.0,1.0,500.0,3.0,1.0,1.0,1.0,0.833333,1.25,2014


In [33]:
cleaning_w6.describe()

Unnamed: 0,V1,V2,V2A,cow,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V225,V226,V227,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V242,V243,V244,V245,V246,V247,V248,V250,V258,V258A,S018,S019,V262
count,89565.0,89565.0,89565.0,89565.0,89565.0,89224.0,89020.0,88530.0,87945.0,88046.0,88217.0,88807.0,89239.0,89551.0,89559.0,89558.0,89548.0,89556.0,89552.0,89553.0,89547.0,89550.0,89546.0,89562.0,88979.0,87177.0,88725.0,88642.0,88572.0,86354.0,86436.0,88447.0,87342.0,88510.0,88351.0,88368.0,79869.0,85586.0,88024.0,85583.0,88019.0,84284.0,86724.0,85591.0,86724.0,89545.0,87949.0,81958.0,86109.0,86599.0,86372.0,85517.0,85467.0,86960.0,85653.0,84909.0,88117.0,86839.0,783.0,89321.0,87898.0,88917.0,86284.0,83948.0,86628.0,84730.0,86753.0,85039.0,80660.0,86291.0,86099.0,85781.0,86588.0,86970.0,87474.0,87079.0,83963.0,39887.0,86721.0,86433.0,87229.0,87239.0,87444.0,88450.0,83017.0,88510.0,88214.0,88568.0,78941.0,76604.0,78775.0,78248.0,69604.0,68199.0,86680.0,84267.0,87312.0,86411.0,87307.0,84963.0,88110.0,87502.0,87610.0,86435.0,82609.0,82376.0,86638.0,85168.0,86782.0,87546.0,78395.0,87487.0,86227.0,86387.0,83212.0,85068.0,83910.0,84193.0,83097.0,85542.0,82017.0,80238.0,82736.0,16200.0,4549.0,2694.0,1683.0,1940.0,4090.0,3693.0,10023.0,10984.0,5475.0,643.0,1077.0,3104.0,1059.0,1192.0,6760.0,89486.0,89559.0,78727.0,81514.0,80596.0,79608.0,82999.0,85771.0,83763.0,86199.0,86191.0,82246.0,84314.0,85442.0,84888.0,86728.0,87335.0,82553.0,85430.0,87889.0,88313.0,88292.0,84720.0,83840.0,84916.0,79847.0,77586.0,84131.0,82224.0,84679.0,80868.0,79806.0,81437.0,77151.0,81017.0,81365.0,80997.0,82868.0,81527.0,80928.0,82169.0,82351.0,83615.0,80683.0,82907.0,79820.0,78730.0,87721.0,85276.0,84613.0,82079.0,79575.0,76070.0,87467.0,87705.0,84874.0,88102.0,86791.0,84029.0,82574.0,86323.0,86323.0,82033.0,81254.0,83899.0,88242.0,87795.0,87915.0,87917.0,86673.0,86379.0,84827.0,83034.0,85969.0,86820.0,87105.0,87816.0,88175.0,84362.0,87834.0,82179.0,64335.0,84917.0,86965.0,77072.0,86881.0,41253.0,88091.0,88110.0,88064.0,88034.0,83823.0,86066.0,87145.0,15730.0,1112.0,1189.0,2916.0,1724.0,7650.0,4147.0,5515.0,1722.0,11516.0,10622.0,5646.0,6461.0,1051.0,2113.0,1221.0,0.0,83887.0,85354.0,85078.0,85515.0,85262.0,85013.0,84826.0,84974.0,85242.0,88318.0,83277.0,86232.0,88038.0,68158.0,73377.0,73173.0,73212.0,76199.0,85633.0,66325.0,83241.0,86883.0,86311.0,89474.0,89385.0,80830.0,80736.0,78665.0,80429.0,86800.0,88766.0,87836.0,89565.0,89565.0,89565.0,89565.0,89565.0
mean,6.0,471.966147,486.231943,494.832155,39943.26,1.094537,1.673961,1.888693,2.624129,1.516605,1.887856,1.854291,2.094499,1.485835,1.396242,1.287121,1.77,1.317031,1.605894,1.604871,1.590349,1.659296,1.583019,1.731281,6.834219,1.752985,0.513959,0.328806,0.237547,0.183431,0.185386,0.130677,0.16369,0.19286,0.110729,0.163419,0.134921,1.163765,1.81421,1.572018,1.747077,1.481681,1.807677,1.306399,1.728483,1.830376,2.028676,1.472852,2.096157,1.611554,1.654089,2.480595,2.419811,2.94126,2.552975,2.208894,7.071337,5.693248,1.761175,2.720749,1.858017,5.884454,1.700246,2.564754,2.051173,2.496542,1.874759,2.74193,1.330846,2.292464,1.3799,1.498164,2.780027,3.772163,2.381336,3.210544,2.462859,2.363427,2.908557,3.723532,2.54115,2.537294,2.531975,2.153488,1.53224,1.877178,1.931224,2.639881,2.322773,2.619302,2.411184,2.570162,2.605281,5.654482,5.280676,5.602976,4.451713,3.84267,4.192928,6.237645,1.208092,2.135003,2.059879,3.07055,2.76212,2.845671,2.14182,2.182686,2.613941,2.50899,2.715275,2.412107,2.428833,2.585655,2.932173,2.733531,2.588309,2.146912,2.514928,2.414159,2.386566,2.391473,2.332008,2.670556,2.456364,2.817001,3.063577,2.47268,2.852812,2.725968,2.382021,2.587673,2.322922,2.427683,2.640669,2.598905,2.749764,2.744128,3.232692,0.031279,0.034045,2.656039,2.632026,2.352958,3.08214,1.681382,6.306712,4.233623,8.006926,6.998004,4.4804,7.405354,5.982269,6.006809,7.880696,8.253232,5.997444,2.378251,1.833688,50864050.0,3.40605,4.107731,3.71448,1.365903,1.142222,1.378818,1.71435,1.713794,7.754496,2.384342,2.466957,2.566303,2.1418,5.369873,6.909334,5.67284,6.937443,2.764704,2.47887,3.04711,6.036247,2.337475,2.928857,3.163014,2.597557,2.536911,1.901814,3.148905,2.906043,3.472191,3.536877,3.361154,2.659277,3.009737,4.736456,4.685319,4.582399,2.078663,2.020297,2.094448,2.083906,2.236344,2.565191,1.650222,3.442692,3.409283,3.348678,3.086161,7.624116,7.747022,5.49878,5.378423,4.736696,7.253893,2.798301,2.641762,1.815991,2.271674,1.957192,3.274218,2.757597,3.22847,4.550589,4.563823,2.247292,3.310402,2.082914,2.948735,1.972611,1.556035,2.002732,1.78606,1.504848,2.244692,2.186151,2.121951,2.05144,2.008701,1.820784,2.19701,1.976609,2.588269,2.447725,1.816889,2.073858,2.017025,2.501427,1.17558,1.588043,,2.07441,2.80295,3.684537,1.551833,2.528899,2.839754,3.637705,3.30254,2.012846,2.007462,1.632251,1.595081,3.400668,1.986869,5.124589,4.619518,6.438398,1.6843,1.56407,1.25749,2.080705,3.313939,4.825017,1.522509,41.938804,1.920661,1.92006,1.042636,1.014037,2159.070265,5.650294,1.70043,0.999997,1.005937,0.669904,1.004856,2012.112198
std,0.0,245.114798,251.387109,251.203268,191843.1,0.346876,0.734792,0.837273,0.98591,0.796788,1.054521,0.741204,0.85171,0.499802,0.489118,0.452421,0.420835,0.465322,0.488661,0.488881,0.491772,0.473948,0.493062,0.443296,2.274908,0.431278,0.781936,0.664859,0.574433,0.487573,0.489744,0.420481,0.477121,0.517943,0.383026,0.48417,0.443735,0.370064,0.38894,0.494789,0.434689,0.499667,0.394128,0.461,0.444744,0.375304,0.90039,0.74715,0.845553,0.784604,0.753147,0.91738,0.997887,0.936599,0.987174,0.932282,2.251519,2.647946,0.426638,2.188875,1.789133,2.485472,0.992579,1.035385,1.034761,1.046136,1.166069,1.160827,0.47052,0.850311,0.606197,0.691646,1.412249,1.549026,1.307573,1.53361,1.24921,1.188178,1.457765,1.60135,1.357345,1.30127,1.429862,1.50874,0.562384,0.328235,0.253074,0.976105,0.778201,0.599865,0.71325,0.639849,0.593384,2.358175,2.977975,2.794246,2.919882,2.62259,2.88445,2.78805,0.508802,0.829647,0.805362,0.79549,0.862962,0.865,1.028706,0.938031,0.874388,0.881314,0.897022,0.945028,0.947158,0.957196,0.88299,0.936093,0.896902,0.863057,0.879427,0.939982,0.87925,0.900419,0.898237,0.819945,0.720749,0.925117,0.966809,1.084742,0.820887,0.878706,0.913339,0.947188,0.791473,0.741921,1.016563,0.985495,0.996538,0.886961,0.912909,0.289185,0.33297,0.959279,1.053171,0.93269,0.950176,0.779901,2.976814,2.960424,2.479094,2.754898,3.116436,2.575625,3.027969,3.003679,2.590198,2.114488,2.535919,0.87321,0.860794,31131380.0,3.014599,2.189,2.695868,0.586407,0.34928,0.485096,0.557491,0.561546,2.960739,1.068442,1.082328,1.014164,0.884948,2.378603,1.976169,2.660349,2.43349,1.11632,1.181345,1.055321,2.758472,0.911224,0.871462,0.811289,0.902446,0.889714,0.813611,0.911989,1.049022,0.780578,0.771827,0.960368,1.970775,1.999988,0.992336,1.076899,1.223123,1.138784,1.102335,1.106842,1.105828,1.172436,1.179069,0.476902,0.871608,0.885282,0.919773,1.038908,2.269153,2.223732,2.815202,2.745192,2.886767,2.356384,2.580357,2.420803,1.821476,2.185223,1.939492,3.038461,2.497447,2.765436,3.091655,3.36375,2.217978,2.978405,2.065761,2.609065,1.909986,0.784855,0.881643,0.794068,0.631844,0.886573,0.618109,0.654766,0.847615,0.991218,0.90807,0.902914,0.870045,0.87282,1.071946,0.782593,0.755517,0.704709,0.955559,0.419607,0.772364,,0.96294,1.593819,1.297602,1.129369,1.654349,1.820169,1.674299,1.778908,1.370702,0.929785,0.782287,0.779044,2.149471,0.876479,3.059375,2.832743,2.759067,0.464797,0.495881,0.437255,0.924673,0.998554,2.109361,0.499496,16.552421,0.270269,0.271201,0.202037,0.117645,1736.196124,2.421468,0.458072,0.446249,0.489467,0.350799,0.526198,1.241979
min,6.0,12.0,12.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,10000000.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,16.0,1.0,1.0,1.0,1.0,20.0,1.0,1.0,0.050687,0.0213,0.023785,0.035678,2010.0
25%,6.0,276.0,332.0,349.0,391.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,5.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,1.0,6.0,4.0,2.0,1.0,0.0,4.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,1.0,1.0,1.0,2.0,3.0,1.0,2.0,1.0,1.0,2.0,2.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,5.0,3.0,3.0,2.0,1.0,1.0,5.0,1.0,2.0,2.0,3.0,2.0,2.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,0.0,0.0,2.0,2.0,2.0,2.0,1.0,4.0,1.0,7.0,5.0,1.0,6.0,4.0,4.0,6.0,7.0,4.0,2.0,1.0,20000000.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,6.0,1.0,1.0,2.0,2.0,4.0,6.0,4.0,5.0,2.0,2.0,2.0,4.0,2.0,2.0,3.0,2.0,2.0,1.0,3.0,2.0,3.0,3.0,3.0,1.0,1.0,5.0,5.0,5.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,3.0,3.0,3.0,2.0,6.0,6.0,3.0,3.0,2.0,6.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,1.0,1.0,,1.0,1.0,3.0,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,2.0,5.0,1.0,1.0,1.0,1.0,3.0,3.0,1.0,28.0,2.0,2.0,1.0,1.0,1240.0,4.0,1.0,0.868382,0.87026,0.409333,0.613999,2011.0
50%,6.0,434.0,484.0,560.0,812.0,1.0,2.0,2.0,3.0,1.0,1.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,7.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,1.0,2.0,1.0,2.0,2.0,2.0,1.0,2.0,1.0,2.0,3.0,2.0,3.0,3.0,2.0,7.0,6.0,2.0,1.0,2.0,6.0,1.0,3.0,2.0,3.0,1.0,3.0,1.0,3.0,1.0,1.0,3.0,4.0,2.0,3.0,2.0,2.0,3.0,4.0,2.0,2.0,2.0,1.0,1.0,2.0,2.0,3.0,3.0,3.0,3.0,3.0,3.0,5.0,5.0,5.0,4.0,3.0,4.0,7.0,1.0,2.0,2.0,3.0,3.0,3.0,2.0,2.0,3.0,3.0,3.0,2.0,2.0,3.0,3.0,3.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,3.0,3.0,2.0,3.0,3.0,2.0,3.0,2.0,2.0,3.0,3.0,3.0,3.0,3.0,0.0,0.0,3.0,3.0,2.0,3.0,2.0,7.0,4.0,9.0,8.0,4.0,8.0,6.0,6.0,9.0,9.0,6.0,2.0,2.0,50000000.0,3.0,4.0,3.0,1.0,1.0,1.0,2.0,2.0,9.0,2.0,3.0,3.0,2.0,5.0,7.0,6.0,7.0,3.0,3.0,3.0,6.0,2.0,3.0,3.0,3.0,3.0,2.0,3.0,3.0,4.0,4.0,4.0,1.0,5.0,5.0,5.0,5.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,4.0,4.0,4.0,3.0,8.0,8.0,5.0,5.0,5.0,8.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,2.0,5.0,4.0,1.0,2.0,1.0,1.0,1.0,1.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,2.0,2.0,2.0,2.0,1.0,1.0,,2.0,2.0,4.0,1.0,2.0,2.0,5.0,4.0,1.0,2.0,1.0,1.0,3.0,2.0,5.0,5.0,7.0,2.0,2.0,1.0,2.0,3.0,5.0,2.0,40.0,2.0,2.0,1.0,1.0,1580.0,6.0,2.0,1.0,1.0,0.661376,0.992063,2012.0
75%,6.0,702.0,710.0,705.0,1356.0,1.0,2.0,2.0,3.0,2.0,3.0,2.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,8.0,2.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,3.0,2.0,2.0,3.0,3.0,4.0,3.0,3.0,9.0,8.0,2.0,6.0,3.0,8.0,2.0,3.0,3.0,3.0,3.0,4.0,2.0,3.0,2.0,2.0,4.0,5.0,3.0,4.0,3.0,3.0,4.0,5.0,3.0,3.0,3.0,3.0,2.0,2.0,2.0,3.0,3.0,3.0,3.0,3.0,3.0,7.0,8.0,8.0,7.0,5.0,6.0,8.0,1.0,3.0,2.0,4.0,3.0,4.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,4.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,4.0,4.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,4.0,3.0,4.0,0.0,0.0,3.0,4.0,3.0,4.0,2.0,9.0,6.0,10.0,10.0,7.0,10.0,9.0,9.0,10.0,10.0,8.0,3.0,2.0,70000000.0,5.0,6.0,7.0,2.0,1.0,2.0,2.0,2.0,10.0,3.0,3.0,3.0,3.0,7.0,8.0,8.0,9.0,4.0,3.0,4.0,8.0,3.0,4.0,4.0,3.0,3.0,2.0,4.0,4.0,4.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,3.0,3.0,3.0,3.0,3.0,4.0,2.0,4.0,4.0,4.0,4.0,10.0,10.0,8.0,7.0,7.0,9.0,4.0,4.0,2.0,3.0,2.0,5.0,4.0,5.0,7.0,8.0,3.0,5.0,2.0,5.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,2.0,3.0,3.0,2.0,3.0,2.0,3.0,3.0,2.0,3.0,2.0,3.0,1.0,2.0,,3.0,5.0,5.0,2.0,4.0,5.0,5.0,5.0,2.0,3.0,2.0,2.0,5.0,2.0,8.0,7.0,9.0,2.0,2.0,2.0,3.0,4.0,6.0,2.0,54.0,2.0,2.0,1.0,1.0,3580.0,8.0,2.0,1.0,1.0,0.833333,1.25,2013.0
max,6.0,887.0,901.0,920.0,1394604.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,10.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,3.0,3.0,3.0,4.0,4.0,4.0,4.0,4.0,4.0,10.0,10.0,2.0,6.0,8.0,10.0,4.0,4.0,4.0,4.0,4.0,4.0,2.0,3.0,3.0,3.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,6.0,5.0,3.0,2.0,2.0,4.0,3.0,3.0,3.0,3.0,3.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,4.0,4.0,100000000.0,9.0,7.0,8.0,3.0,2.0,2.0,4.0,4.0,10.0,4.0,4.0,4.0,4.0,10.0,10.0,10.0,10.0,4.0,4.0,4.0,10.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,4.0,4.0,4.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,5.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,4.0,,4.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,5.0,4.0,3.0,3.0,8.0,4.0,10.0,10.0,10.0,2.0,2.0,2.0,4.0,5.0,10.0,2.0,102.0,2.0,2.0,2.0,2.0,9900.0,9.0,2.0,22.790557,22.790557,10.694771,16.042156,2016.0


#### Additional variables that may need to be dropped:
- 'V258A' (sample weights for "splitted samples"; note, Germany is the only country in this data set that appears to have a splitted sample); when using weights, use 'V258' instead
- 'V2A' (use 'V2' instead) for country code
- 'C_COW_ALPHA'
- 'V144' (religious affiliation; I can't find the codes for these values, so I'm not sure how to interpret these); keep 'V144G' instead
- 'V1' (wave; there shouldn't be any variation here as these are all wave 6 data)
- 'V3' (interview number; unnecessary identifier)
- 'V23' (satisfaction with life question; redundant because using V10 as target variable instead)
- 'V262' (survey year)
- 'V247' (language spoken at home)

#### Variables to un-drop:
- Return V56_NZ to the data set (**done!**)
    - Next, use V56_NZ to fill V56 missing values if 'C_COW_ALPHA' = 'NEW'? (justify why or why not)
  
#### Thinking ahead to future steps:
- items may need to be normalized or re-scaled so that the ranges are more similar
- items may need to be reverse-coded to assist with interpretability for linear regression
- as mentioned earlier, create a new variable for V125 and V215 items
- retain and rename B_COUNTRY_ALPHA for country labels
- recode age variable 'V242'; create age categories based on groupings identified here: https://www.cia.gov/the-world-factbook/field/age-structure/

In [34]:
# what's the difference between V2 and V2A for countries that have splitted samples? Germany is the only one I'm seeing
# for this wave; there's variation in V2A values, but not in V2, COW_ALPHA or COUNTRY_ALPHA distinctions
# may not be worth it to hang on to splitted samples for this survey wave
cleaning_w6[cleaning_w6['C_COW_ALPHA'] == 'GMY'].sample(50)

Unnamed: 0,V1,V2,V2A,cow,C_COW_ALPHA,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V225,V226,V227,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V242,V243,V244,V245,V246,V247,V248,V250,V258,V258A,S018,S019,V262
21713,6,276,900,255,GMY,DEU,672,1.0,1.0,1.0,3.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,2.0,2.0,1.0,10.0,2.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,1.0,3.0,2.0,2.0,3.0,3.0,3.0,3.0,3.0,5.0,5.0,,1.0,0.0,5.0,2.0,3.0,2.0,3.0,1.0,4.0,1.0,2.0,1.0,1.0,4.0,4.0,2.0,2.0,2.0,,3.0,6.0,3.0,2.0,2.0,1.0,2.0,2.0,2.0,3.0,2.0,2.0,2.0,2.0,,5.0,5.0,5.0,8.0,5.0,7.0,6.0,1.0,2.0,2.0,3.0,3.0,,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,,,,,,,,,,,,,,,,0.0,0.0,2.0,4.0,4.0,4.0,1.0,5.0,1.0,10.0,6.0,4.0,5.0,3.0,1.0,10.0,10.0,8.0,2.0,2.0,80400035.0,8.0,6.0,8.0,1.0,1.0,2.0,1.0,2.0,5.0,3.0,3.0,2.0,2.0,5.0,6.0,7.0,10.0,2.0,2.0,2.0,10.0,3.0,4.0,3.0,3.0,3.0,1.0,4.0,4.0,4.0,4.0,4.0,1.0,1.0,5.0,5.0,5.0,,,4.0,3.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,10.0,10.0,4.0,5.0,5.0,10.0,1.0,1.0,1.0,,1.0,10.0,10.0,4.0,10.0,10.0,5.0,,1.0,1.0,1.0,1.0,3.0,1.0,1.0,2.0,,,,,,,,,,,,,,,,,3.0,1.0,2.0,1.0,1.0,1.0,5.0,5.0,1.0,1.0,1.0,1.0,7.0,3.0,3.0,3.0,1.0,2.0,2.0,1.0,1.0,3.0,5.0,2.0,48.0,2.0,2.0,1.0,1.0,1530.0,5.0,2.0,2.732429,3.9726,1.335498,2.003247,2013
20178,6,276,900,255,GMY,DEU,63,1.0,2.0,2.0,3.0,,3.0,2.0,3.0,1.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,2.0,2.0,1.0,8.0,2.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,2.0,2.0,2.0,2.0,1.0,1.0,2.0,1.0,1.0,3.0,2.0,3.0,1.0,1.0,3.0,4.0,2.0,3.0,1.0,8.0,4.0,,3.0,3.0,7.0,1.0,2.0,3.0,1.0,1.0,4.0,,3.0,1.0,1.0,1.0,5.0,1.0,1.0,,1.0,1.0,6.0,1.0,1.0,2.0,1.0,2.0,2.0,2.0,3.0,3.0,3.0,3.0,3.0,3.0,8.0,4.0,,5.0,1.0,3.0,3.0,2.0,2.0,2.0,2.0,2.0,,2.0,2.0,2.0,3.0,,1.0,3.0,3.0,3.0,3.0,2.0,,3.0,3.0,2.0,2.0,2.0,3.0,,,,,,,,,,,,,,,,0.0,0.0,3.0,4.0,4.0,4.0,1.0,5.0,1.0,10.0,8.0,1.0,,1.0,1.0,10.0,10.0,8.0,3.0,1.0,10000000.0,1.0,6.0,7.0,1.0,1.0,2.0,2.0,2.0,7.0,2.0,,1.0,1.0,5.0,7.0,6.0,4.0,4.0,3.0,2.0,6.0,2.0,4.0,4.0,2.0,3.0,2.0,4.0,4.0,4.0,4.0,4.0,1.0,1.0,5.0,5.0,5.0,,,4.0,3.0,4.0,3.0,,4.0,4.0,4.0,4.0,10.0,10.0,5.0,,1.0,10.0,1.0,1.0,1.0,,1.0,10.0,10.0,3.0,10.0,10.0,10.0,,1.0,1.0,1.0,1.0,4.0,1.0,1.0,3.0,,,,,,,,,,,,,,,,,1.0,4.0,2.0,1.0,1.0,1.0,5.0,5.0,1.0,3.0,2.0,2.0,4.0,1.0,1.0,1.0,3.0,2.0,1.0,,2.0,4.0,3.0,2.0,77.0,2.0,2.0,1.0,1.0,1530.0,2.0,2.0,1.264528,1.8385,0.618049,0.927074,2013
21886,6,276,900,255,GMY,DEU,989,3.0,1.0,1.0,4.0,2.0,4.0,1.0,1.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,9.0,2.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,1.0,3.0,1.0,4.0,4.0,4.0,3.0,1.0,4.0,10.0,3.0,,6.0,0.0,7.0,3.0,4.0,3.0,2.0,2.0,3.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,2.0,,4.0,3.0,2.0,5.0,3.0,5.0,2.0,2.0,2.0,2.0,4.0,3.0,3.0,3.0,3.0,3.0,4.0,1.0,1.0,2.0,7.0,4.0,7.0,3.0,4.0,2.0,4.0,4.0,4.0,4.0,2.0,3.0,2.0,1.0,1.0,2.0,3.0,4.0,4.0,2.0,4.0,3.0,4.0,2.0,1.0,1.0,4.0,,,,,,,,,,,,,,,,0.0,0.0,3.0,4.0,1.0,4.0,1.0,10.0,1.0,10.0,6.0,1.0,6.0,5.0,2.0,6.0,6.0,3.0,3.0,4.0,100000020.0,0.0,7.0,8.0,3.0,2.0,2.0,,,1.0,4.0,,3.0,4.0,7.0,4.0,7.0,6.0,1.0,0.0,1.0,1.0,4.0,2.0,4.0,3.0,4.0,4.0,3.0,2.0,4.0,4.0,4.0,1.0,1.0,5.0,5.0,5.0,1.0,4.0,3.0,2.0,4.0,1.0,1.0,4.0,4.0,4.0,3.0,10.0,10.0,1.0,1.0,1.0,10.0,6.0,4.0,1.0,,6.0,10.0,3.0,6.0,10.0,10.0,1.0,,1.0,1.0,1.0,3.0,1.0,4.0,3.0,4.0,,,,,,,,,,,,,,,,,1.0,4.0,3.0,3.0,1.0,1.0,1.0,1.0,1.0,3.0,3.0,3.0,1.0,2.0,4.0,6.0,8.0,2.0,1.0,,2.0,3.0,4.0,2.0,30.0,2.0,2.0,1.0,1.0,1530.0,3.0,2.0,2.194229,3.1901,1.072448,1.608672,2013
21951,6,276,901,255,GMY,DEU,1978,1.0,1.0,1.0,4.0,1.0,4.0,2.0,1.0,2.0,2.0,1.0,1.0,1.0,1.0,2.0,2.0,2.0,1.0,2.0,9.0,1.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,2.0,1.0,2.0,1.0,1.0,1.0,2.0,2.0,1.0,1.0,1.0,1.0,3.0,1.0,4.0,4.0,4.0,4.0,3.0,10.0,8.0,,6.0,0.0,10.0,3.0,2.0,1.0,4.0,4.0,1.0,1.0,3.0,3.0,2.0,3.0,2.0,3.0,1.0,1.0,,2.0,1.0,2.0,2.0,1.0,4.0,1.0,2.0,2.0,4.0,3.0,3.0,2.0,3.0,3.0,2.0,1.0,4.0,2.0,10.0,1.0,10.0,1.0,1.0,1.0,3.0,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,3.0,3.0,2.0,2.0,3.0,1.0,1.0,1.0,2.0,2.0,,,,,,,,,,,,,,,,0.0,0.0,3.0,3.0,2.0,2.0,1.0,4.0,5.0,3.0,5.0,9.0,7.0,6.0,7.0,5.0,7.0,7.0,2.0,4.0,100000020.0,0.0,7.0,8.0,2.0,2.0,2.0,2.0,2.0,2.0,4.0,4.0,3.0,2.0,7.0,6.0,9.0,9.0,0.0,2.0,1.0,2.0,2.0,4.0,3.0,4.0,4.0,1.0,4.0,3.0,4.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,3.0,3.0,3.0,2.0,3.0,4.0,2.0,4.0,4.0,4.0,4.0,10.0,7.0,8.0,6.0,3.0,8.0,1.0,1.0,1.0,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,,1.0,1.0,1.0,2.0,3.0,2.0,2.0,3.0,,,,,,,,,,,,,,,,,3.0,4.0,2.0,2.0,3.0,1.0,2.0,1.0,1.0,3.0,3.0,2.0,1.0,3.0,7.0,4.0,7.0,2.0,2.0,1.0,1.0,2.0,7.0,2.0,21.0,2.0,2.0,1.0,1.0,1530.0,7.0,1.0,0.464441,0.1723,0.227,0.340499,2013
20288,6,276,901,255,GMY,DEU,1154,2.0,1.0,1.0,3.0,1.0,2.0,2.0,1.0,1.0,2.0,1.0,2.0,1.0,1.0,2.0,2.0,2.0,2.0,1.0,9.0,2.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,1.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,3.0,1.0,3.0,1.0,2.0,2.0,3.0,4.0,4.0,4.0,8.0,5.0,,6.0,0.0,4.0,4.0,3.0,2.0,4.0,2.0,3.0,,3.0,3.0,1.0,5.0,5.0,2.0,3.0,3.0,,3.0,4.0,4.0,2.0,4.0,1.0,1.0,2.0,2.0,3.0,1.0,2.0,2.0,2.0,2.0,5.0,7.0,,1.0,8.0,8.0,8.0,1.0,2.0,2.0,3.0,,2.0,2.0,3.0,3.0,2.0,3.0,3.0,3.0,3.0,3.0,2.0,3.0,3.0,3.0,3.0,,,2.0,3.0,,,,,,,,,,,,,,,,0.0,0.0,3.0,4.0,3.0,4.0,2.0,9.0,1.0,9.0,8.0,1.0,9.0,3.0,1.0,10.0,8.0,8.0,3.0,2.0,10000000.0,1.0,2.0,3.0,1.0,2.0,2.0,2.0,2.0,6.0,3.0,3.0,3.0,3.0,8.0,8.0,7.0,8.0,2.0,3.0,4.0,7.0,3.0,4.0,4.0,4.0,4.0,2.0,3.0,4.0,4.0,4.0,4.0,1.0,5.0,5.0,5.0,5.0,1.0,,,4.0,4.0,2.0,1.0,4.0,4.0,4.0,4.0,9.0,9.0,5.0,,5.0,7.0,5.0,1.0,1.0,,1.0,1.0,1.0,1.0,,7.0,1.0,,1.0,1.0,1.0,2.0,2.0,2.0,2.0,3.0,,,,,,,,,,,,,,,,,2.0,3.0,5.0,3.0,2.0,1.0,5.0,2.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,3.0,5.0,2.0,2.0,1.0,1.0,3.0,4.0,1.0,22.0,2.0,2.0,1.0,1.0,1530.0,3.0,1.0,0.37943,0.1408,0.18545,0.278175,2013
20146,6,276,901,255,GMY,DEU,1395,1.0,2.0,2.0,2.0,,4.0,2.0,4.0,1.0,1.0,1.0,2.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,3.0,2.0,0.0,0.0,0.0,,0.0,0.0,,0.0,0.0,0.0,,1.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,2.0,3.0,2.0,3.0,1.0,1.0,2.0,4.0,4.0,4.0,4.0,5.0,1.0,,1.0,0.0,1.0,3.0,1.0,2.0,1.0,3.0,4.0,2.0,2.0,1.0,1.0,3.0,5.0,1.0,4.0,3.0,,2.0,6.0,1.0,2.0,2.0,4.0,1.0,1.0,2.0,1.0,2.0,3.0,3.0,3.0,2.0,5.0,1.0,1.0,1.0,1.0,5.0,10.0,1.0,1.0,2.0,3.0,2.0,2.0,4.0,2.0,4.0,2.0,4.0,1.0,,4.0,4.0,4.0,3.0,2.0,4.0,4.0,2.0,,3.0,4.0,,,,,,,,,,,,,,,,0.0,0.0,4.0,4.0,2.0,4.0,1.0,10.0,1.0,10.0,10.0,1.0,10.0,1.0,1.0,10.0,10.0,5.0,2.0,1.0,100000020.0,0.0,7.0,8.0,3.0,1.0,2.0,,,1.0,4.0,,2.0,4.0,5.0,5.0,5.0,10.0,2.0,2.0,0.0,10.0,2.0,4.0,3.0,4.0,2.0,1.0,4.0,4.0,4.0,4.0,4.0,5.0,5.0,5.0,5.0,5.0,,,1.0,2.0,4.0,1.0,1.0,4.0,4.0,4.0,4.0,9.0,10.0,1.0,5.0,1.0,10.0,1.0,1.0,1.0,,1.0,10.0,,5.0,8.0,10.0,10.0,,1.0,4.0,1.0,1.0,4.0,2.0,1.0,1.0,,,,,,,,,,,,,,,,,1.0,2.0,3.0,1.0,1.0,1.0,5.0,5.0,2.0,1.0,1.0,1.0,4.0,2.0,1.0,4.0,5.0,2.0,1.0,,2.0,4.0,2.0,1.0,75.0,2.0,2.0,1.0,1.0,1530.0,2.0,2.0,0.141788,0.0526,0.0693,0.10395,2013
21467,6,276,901,255,GMY,DEU,1757,1.0,1.0,1.0,3.0,1.0,3.0,1.0,2.0,1.0,2.0,1.0,2.0,2.0,1.0,1.0,2.0,2.0,2.0,2.0,9.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,3.0,3.0,2.0,2.0,1.0,4.0,4.0,4.0,4.0,10.0,7.0,,3.0,2.0,8.0,3.0,4.0,2.0,3.0,4.0,1.0,1.0,3.0,1.0,2.0,5.0,6.0,2.0,5.0,,2.0,4.0,6.0,5.0,2.0,6.0,1.0,1.0,2.0,2.0,4.0,1.0,3.0,1.0,2.0,2.0,5.0,3.0,6.0,2.0,5.0,9.0,7.0,1.0,2.0,2.0,3.0,3.0,3.0,3.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,3.0,3.0,2.0,2.0,3.0,3.0,,,,,,,,,,,,,,,,0.0,0.0,3.0,2.0,2.0,3.0,2.0,2.0,1.0,9.0,8.0,8.0,7.0,6.0,7.0,7.0,6.0,4.0,3.0,1.0,100000020.0,0.0,7.0,8.0,2.0,2.0,2.0,2.0,2.0,1.0,4.0,3.0,2.0,2.0,3.0,8.0,8.0,8.0,2.0,2.0,1.0,7.0,1.0,3.0,4.0,3.0,3.0,2.0,3.0,2.0,2.0,3.0,3.0,1.0,5.0,5.0,5.0,5.0,4.0,2.0,3.0,4.0,4.0,4.0,2.0,4.0,4.0,4.0,4.0,3.0,2.0,2.0,1.0,2.0,5.0,1.0,1.0,1.0,,1.0,7.0,2.0,1.0,2.0,4.0,1.0,,1.0,1.0,1.0,2.0,3.0,3.0,4.0,4.0,,,,,,,,,,,,,,,,,4.0,5.0,4.0,2.0,5.0,4.0,4.0,1.0,1.0,3.0,3.0,3.0,7.0,3.0,1.0,1.0,1.0,2.0,1.0,,4.0,4.0,1.0,1.0,44.0,2.0,2.0,1.0,1.0,1530.0,2.0,2.0,0.370837,0.1376,0.18125,0.271875,2013
20198,6,276,900,255,GMY,DEU,173,1.0,1.0,2.0,2.0,1.0,1.0,1.0,2.0,1.0,2.0,1.0,1.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,8.0,1.0,2.0,2.0,0.0,1.0,0.0,0.0,0.0,2.0,0.0,0.0,,1.0,1.0,1.0,1.0,1.0,1.0,2.0,1.0,1.0,3.0,2.0,2.0,1.0,3.0,3.0,3.0,3.0,3.0,3.0,6.0,7.0,,1.0,1.0,4.0,3.0,4.0,4.0,2.0,3.0,2.0,2.0,2.0,2.0,3.0,4.0,5.0,6.0,3.0,,1.0,4.0,4.0,5.0,2.0,3.0,1.0,3.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,,,1.0,6.0,6.0,6.0,8.0,7.0,1.0,2.0,2.0,3.0,2.0,2.0,2.0,3.0,2.0,3.0,2.0,2.0,2.0,3.0,3.0,3.0,2.0,,,3.0,2.0,3.0,2.0,2.0,,,,,,,,,,,,,,,,0.0,0.0,3.0,4.0,3.0,4.0,2.0,8.0,1.0,10.0,10.0,1.0,10.0,2.0,1.0,10.0,10.0,8.0,2.0,2.0,80400035.0,8.0,3.0,3.0,1.0,1.0,2.0,2.0,2.0,10.0,3.0,3.0,3.0,2.0,4.0,7.0,8.0,8.0,2.0,2.0,2.0,8.0,3.0,4.0,3.0,3.0,3.0,1.0,3.0,4.0,4.0,3.0,3.0,5.0,5.0,5.0,5.0,5.0,2.0,2.0,2.0,3.0,4.0,3.0,2.0,4.0,4.0,4.0,4.0,6.0,6.0,6.0,8.0,3.0,6.0,2.0,1.0,1.0,,1.0,10.0,8.0,8.0,8.0,10.0,6.0,,2.0,2.0,1.0,3.0,3.0,2.0,2.0,2.0,,,,,,,,,,,,,,,,,2.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,3.0,1.0,1.0,4.0,2.0,5.0,8.0,8.0,1.0,2.0,2.0,,4.0,2.0,2.0,70.0,2.0,2.0,1.0,1.0,1530.0,,2.0,3.138047,4.5623,1.533748,2.300621,2013
21449,6,276,901,255,GMY,DEU,1424,1.0,2.0,2.0,2.0,,4.0,1.0,3.0,1.0,2.0,1.0,2.0,1.0,1.0,2.0,2.0,2.0,2.0,1.0,10.0,2.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,,2.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,3.0,3.0,1.0,,4.0,4.0,4.0,4.0,1.0,8.0,7.0,,1.0,2.0,6.0,3.0,4.0,4.0,3.0,1.0,4.0,2.0,3.0,1.0,3.0,2.0,6.0,3.0,1.0,,2.0,5.0,6.0,2.0,1.0,2.0,1.0,1.0,2.0,2.0,1.0,3.0,3.0,2.0,2.0,3.0,3.0,3.0,5.0,3.0,1.0,2.0,6.0,1.0,3.0,1.0,3.0,2.0,2.0,4.0,4.0,3.0,3.0,2.0,2.0,2.0,2.0,4.0,3.0,3.0,1.0,2.0,3.0,1.0,1.0,1.0,2.0,,,,,,,,,,,,,,,,0.0,0.0,2.0,4.0,3.0,4.0,1.0,9.0,2.0,9.0,7.0,1.0,5.0,2.0,2.0,9.0,10.0,4.0,3.0,2.0,100000020.0,0.0,7.0,8.0,3.0,2.0,2.0,1.0,2.0,1.0,4.0,1.0,4.0,2.0,7.0,7.0,5.0,9.0,4.0,1.0,2.0,3.0,1.0,4.0,1.0,3.0,4.0,1.0,4.0,3.0,4.0,3.0,4.0,1.0,5.0,5.0,5.0,5.0,4.0,4.0,3.0,3.0,3.0,4.0,2.0,4.0,4.0,4.0,4.0,9.0,9.0,1.0,4.0,1.0,9.0,2.0,1.0,1.0,,4.0,5.0,3.0,3.0,4.0,8.0,2.0,,2.0,2.0,2.0,2.0,3.0,1.0,3.0,4.0,,,,,,,,,,,,,,,,,1.0,5.0,5.0,1.0,1.0,5.0,5.0,5.0,2.0,,1.0,1.0,4.0,3.0,10.0,10.0,9.0,1.0,2.0,2.0,1.0,3.0,4.0,1.0,77.0,1.0,1.0,2.0,1.0,1530.0,3.0,2.0,0.286235,0.1062,0.1399,0.20985,2013
20194,6,276,900,255,GMY,DEU,482,1.0,2.0,1.0,3.0,3.0,4.0,2.0,2.0,1.0,2.0,1.0,2.0,1.0,2.0,2.0,2.0,2.0,2.0,2.0,7.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,,1.0,2.0,2.0,2.0,2.0,2.0,1.0,2.0,2.0,3.0,1.0,3.0,1.0,2.0,,3.0,3.0,3.0,1.0,5.0,5.0,,1.0,2.0,5.0,1.0,3.0,1.0,2.0,4.0,2.0,2.0,,1.0,1.0,4.0,3.0,3.0,3.0,,2.0,3.0,5.0,5.0,3.0,4.0,1.0,,2.0,2.0,2.0,2.0,2.0,2.0,3.0,2.0,1.0,1.0,4.0,5.0,3.0,7.0,7.0,1.0,2.0,2.0,3.0,3.0,3.0,3.0,2.0,3.0,3.0,3.0,2.0,2.0,3.0,3.0,3.0,2.0,2.0,3.0,3.0,2.0,2.0,2.0,3.0,,,,,,,,,,,,,,,,0.0,0.0,2.0,3.0,2.0,3.0,1.0,10.0,3.0,6.0,10.0,1.0,10.0,6.0,1.0,10.0,5.0,5.0,2.0,3.0,100000020.0,0.0,7.0,8.0,2.0,2.0,2.0,,2.0,2.0,3.0,,2.0,,7.0,7.0,4.0,10.0,1.0,1.0,3.0,10.0,2.0,4.0,3.0,,3.0,2.0,4.0,4.0,4.0,4.0,4.0,1.0,5.0,5.0,5.0,5.0,4.0,4.0,2.0,3.0,4.0,3.0,2.0,4.0,4.0,4.0,4.0,10.0,6.0,5.0,5.0,9.0,5.0,1.0,1.0,1.0,,1.0,5.0,5.0,6.0,6.0,6.0,1.0,,1.0,1.0,1.0,2.0,2.0,2.0,2.0,3.0,,,,,,,,,,,,,,,,,2.0,2.0,5.0,1.0,1.0,5.0,4.0,4.0,2.0,1.0,1.0,1.0,4.0,2.0,1.0,5.0,1.0,1.0,2.0,2.0,1.0,4.0,3.0,1.0,63.0,2.0,2.0,1.0,1.0,1530.0,7.0,2.0,1.330307,1.9341,0.650199,0.975298,2013


In [35]:
# how many respondents from various countries did not respond to V56?
# are these values missing at random, or en masse for some samples?
cleaning_w6[~cleaning_w6.V56.notnull()]['C_COW_ALPHA'].value_counts()

NEW    841
JPN    216
CHN    179
RUS    147
NTH    116
MOR     88
LIB     87
UZB     75
YEM     73
KUW     63
SPN     60
ALG     57
ARM     49
TAW     45
PER     42
URU     41
GRG     37
SAF     36
POL     34
EST     32
ROM     32
TUN     31
CHL     31
USA     27
ARG     26
IND     25
AUL     25
BRA     24
SWD     23
GMY     19
COL     18
TUR     16
SLV     15
MEX     13
IRQ     13
HAI      9
ECU      8
QAT      8
PSE      7
CYP      7
TRI      6
ROK      5
JOR      5
THI      4
BLR      3
SIN      2
HKG      2
LEB      2
KYR      2
Name: C_COW_ALPHA, dtype: int64

In [36]:
# how many respondents from various countries responded to V56_NZ?
wvs_w6[wvs_w6.V56_NZ.notnull()]['C_COW_ALPHA'].value_counts()

# V56 is missing entirely for repondents from New Zeland; all responses to V56_NZ are from New Zeland
# responses have a different range/scale, but could possibly be meaningfully combined into the same variable...
# justify why or why not do this

NEW    783
Name: C_COW_ALPHA, dtype: int64

In [37]:
# what to do about age?
cleaning_w6.V242.value_counts()

# create age groups based on CIA.gov categories

25.0     2383
30.0     2362
23.0     2309
20.0     2252
24.0     2215
22.0     2147
40.0     2125
26.0     2112
35.0     2092
27.0     2069
28.0     2064
18.0     2062
19.0     1999
32.0     1983
21.0     1981
29.0     1911
31.0     1886
45.0     1854
42.0     1821
36.0     1815
50.0     1805
38.0     1804
33.0     1787
34.0     1660
37.0     1633
39.0     1606
43.0     1604
41.0     1532
46.0     1524
44.0     1511
47.0     1494
55.0     1486
52.0     1463
48.0     1438
49.0     1414
60.0     1405
51.0     1373
54.0     1288
53.0     1231
56.0     1220
58.0     1213
62.0     1157
57.0     1147
65.0     1024
63.0     1008
61.0      994
59.0      967
64.0      898
70.0      839
66.0      822
68.0      723
67.0      675
72.0      647
69.0      602
73.0      597
71.0      560
74.0      511
75.0      488
76.0      432
77.0      363
78.0      297
80.0      262
79.0      257
81.0      232
82.0      173
83.0      164
84.0      153
85.0      137
17.0       56
86.0       48
87.0       42
89.0  

In [54]:
# how many missings by country?
grouped_missings = cleaning_w6.groupby('C_COW_ALPHA')
-grouped_missings.count().sub(grouped_missings.size(), 0)

Unnamed: 0_level_0,V1,V2,V2A,cow,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V225,V226,V227,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V242,V243,V244,V245,V246,V247,V248,V250,V258,V258A,S018,S019,V262
C_COW_ALPHA,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1,Unnamed: 278_level_1,Unnamed: 279_level_1,Unnamed: 280_level_1,Unnamed: 281_level_1,Unnamed: 282_level_1,Unnamed: 283_level_1,Unnamed: 284_level_1,Unnamed: 285_level_1,Unnamed: 286_level_1,Unnamed: 287_level_1,Unnamed: 288_level_1
ALG,0,0,0,0,0,0,5,11,18,63,31,7,66,17,0,0,0,0,0,0,0,0,0,0,0,34,51,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,39,1200,88,86,104,58,49,42,67,107,39,57,1200,0,14,21,67,190,49,110,49,147,175,94,126,124,103,63,50,67,88,64,79,85,72,85,46,41,220,47,38,34,362,325,262,265,315,655,94,114,44,88,49,83,9,24,25,44,116,136,79,71,100,74,261,63,132,150,215,242,165,135,182,199,259,224,163,1200,1200,1200,263,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,0,0,240,245,258,318,149,166,194,157,148,277,251,174,167,156,87,116,69,61,0,0,0,0,142,0,0,145,166,25,42,32,113,214,85,91,92,63,117,119,92,60,68,132,70,160,216,21,42,64,102,128,132,72,49,52,59,96,78,103,78,69,80,187,129,48,55,51,57,99,119,151,207,129,85,133,80,65,104,74,148,1200,84,62,1200,61,109,61,60,61,30,174,79,29,1200,1200,1200,1200,51,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,1200,106,23,27,11,16,21,39,35,22,23,44,49,0,595,622,628,658,627,120,417,120,122,0,0,0,0,0,0,0,1,1,5,0,0,0,0,0
ARG,0,0,0,0,0,0,2,2,6,14,17,18,11,6,0,0,0,0,0,0,0,0,0,0,0,10,34,5,0,0,0,1,1,1,2,1,1,748,0,0,0,0,0,0,0,0,0,14,22,33,32,32,1030,52,34,47,69,21,26,1030,0,6,9,18,62,21,49,12,25,120,56,54,63,20,16,16,15,16,1030,22,19,16,16,15,8,107,16,21,16,62,79,55,70,113,201,51,100,63,61,55,77,5,12,12,15,96,90,12,38,43,18,49,13,17,20,36,46,40,34,39,33,121,182,77,1030,1030,1030,1030,1030,1030,146,1030,1030,1030,1030,1030,1030,1030,1030,1030,0,0,154,114,122,88,64,30,65,21,21,34,68,29,28,21,11,20,22,14,10,10,1,0,54,25,60,74,84,16,112,55,126,124,40,36,27,28,13,23,17,26,10,33,23,90,94,0,9,8,31,68,70,13,24,39,2,7,38,58,15,25,26,22,43,5,7,6,7,39,38,47,95,45,43,32,25,23,17,19,109,79,84,74,81,97,1030,15,19,19,12,46,15,16,1030,1030,1030,1030,1030,1030,1030,40,1030,1030,1030,1030,1030,1030,1030,1030,1030,60,19,23,9,9,17,26,22,13,11,22,23,1030,259,108,109,113,5,4,5,52,23,47,0,0,8,11,5,11,8,0,1,0,0,0,0,0
ARM,0,0,0,0,0,0,7,5,26,7,18,1,8,2,0,0,0,0,0,0,0,0,0,0,0,4,15,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,2,4,17,29,38,10,27,47,42,49,1100,1,0,2,17,46,25,55,24,85,145,65,63,63,29,2,3,7,3,1100,10,10,4,21,1,22,102,4,4,0,11,13,7,17,18,455,19,44,12,50,22,92,16,5,9,18,59,81,19,8,34,10,306,39,51,41,52,48,80,85,185,69,237,274,188,210,1100,1100,1100,1100,1100,1100,200,1100,1100,1100,1100,1100,1100,1100,1100,0,0,212,148,230,170,116,65,205,54,59,189,115,109,86,58,42,65,18,11,4,4,8,51,13,14,181,109,114,32,185,34,62,213,50,41,37,23,18,22,11,59,10,10,16,118,134,3,28,25,75,99,111,27,7,18,2,9,38,78,0,5,9,107,98,2,22,2,3,61,55,138,314,95,74,9,7,3,11,8,7,3,65,40,42,19,77,5,4,5,11,31,3,3,114,1100,1100,1100,1100,1100,1100,1100,1100,120,1100,1100,1100,1100,1100,1100,1100,33,2,3,0,9,6,6,5,4,0,7,10,0,207,212,214,212,213,0,19,11,24,8,0,0,4,2,0,0,0,2,41,0,0,0,0,0
AUL,0,0,0,0,0,0,8,51,56,72,69,57,13,12,0,0,0,0,0,0,0,0,0,0,0,15,11,30,43,43,47,48,47,48,37,55,46,521,0,0,0,0,0,0,0,0,0,19,18,22,21,20,14,40,14,20,17,18,25,1477,12,8,18,26,46,26,46,18,28,35,45,51,39,33,30,29,29,29,1477,30,30,29,26,24,6,23,21,79,14,29,52,47,54,274,55,30,33,29,30,26,28,16,41,43,48,62,49,27,28,34,33,39,25,37,29,31,38,36,32,43,29,35,31,25,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,0,0,30,44,46,51,42,48,45,35,38,38,46,47,47,31,31,36,6,12,24,24,16,17,15,30,37,28,40,14,38,47,46,45,40,38,26,14,63,67,29,16,18,35,27,28,27,15,21,26,31,28,29,0,0,0,11,19,54,83,32,30,36,35,26,15,16,18,20,17,23,25,27,22,15,8,11,16,11,11,31,18,17,21,23,23,1477,9,13,9,8,54,40,29,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,1477,62,1477,1477,1477,1477,84,22,59,19,30,45,43,32,29,12,22,29,14,101,66,68,64,42,69,64,26,30,55,0,9,36,39,1477,13,13,425,82,0,0,0,0,0
AZE,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,29,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15,4,3,0,2,6,0,0,1002,0,0,2,0,2,0,2,0,2,73,19,10,14,0,0,0,0,0,1002,0,0,0,0,0,7,5,0,0,0,0,0,0,0,0,1,0,2,0,0,0,1,6,5,7,33,52,50,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,1002,0,0,0,33,62,46,42,0,0,0,0,0,0,0,0,0,0,0,18,0,0,0,0,0,0,0,0,0,0,0,68,25,40,68,4,3,4,1,6,3,3,1,0,0,0,0,0,4,19,9,14,23,18,1,0,0,0,0,9,24,2,23,23,9,6,0,5,12,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1002,1002,1002,1002,1002,1002,1002,1002,1002,0,1002,1002,1002,1002,1002,1002,1002,0,0,0,0,0,0,0,0,0,0,0,0,0,240,240,240,240,240,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
BLR,0,0,0,0,0,0,6,13,23,20,14,19,84,21,0,0,0,0,0,0,0,0,0,0,0,4,116,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,86,66,107,118,15,10,13,13,10,8,1,3,1535,3,10,5,3,34,5,38,4,34,364,10,10,14,3,4,7,8,15,1535,5,7,7,6,5,8,41,3,4,8,1535,1535,1535,1535,1535,58,5,5,3,4,3,32,5,3,7,9,14,13,7,3,5,5,18,6,7,8,14,17,15,12,14,16,18,27,20,1535,1535,1535,1535,1535,1535,1535,19,1535,1535,1535,1535,1535,1535,1535,1535,0,0,17,15,18,8,8,14,15,14,14,16,14,17,19,14,6,15,33,38,9,9,7,7,8,20,34,23,33,10,233,242,236,256,101,92,121,6,108,115,81,7,9,15,16,26,22,147,253,104,365,721,824,8,4,13,29,75,44,67,66,66,77,93,104,39,62,56,18,4,4,8,11,9,10,6,2,5,7,4,16,8,7,5,4,5,1535,6,3,2,2,14,30,10,1535,1535,1535,1535,1535,1535,1535,1535,1535,22,1535,1535,1535,1535,1535,1535,1535,32,9,18,4,12,20,32,18,18,7,34,37,0,1,25,26,30,32,8,917,921,11,16,0,0,0,0,0,0,0,0,0,0,0,0,0,0
BRA,0,0,0,0,0,0,1,3,6,11,3,2,1,1,0,0,0,0,0,0,0,0,0,0,0,3,11,6,24,14,16,12,15,14,7,14,11,12,0,0,0,0,0,0,0,0,0,11,17,14,5,12,13,61,18,31,42,19,24,1486,6,1,1,69,150,29,111,16,94,88,34,60,27,17,8,7,8,5,3,6,5,4,8,3,7,118,7,5,4,41,118,41,38,61,298,28,53,16,81,25,52,6,9,3,12,36,80,14,83,19,9,86,6,5,15,16,35,12,43,42,9,57,89,53,1486,1486,1486,1486,1486,1486,387,1486,1486,1486,1486,1486,1486,1486,1486,1486,0,0,308,87,116,127,107,127,170,99,108,163,140,111,103,58,56,71,42,19,8,8,12,8,27,4,54,38,59,4,137,48,40,55,91,88,71,30,43,42,25,40,17,21,16,83,102,7,18,15,60,58,82,14,14,6,8,31,67,76,19,24,28,57,74,4,6,4,9,54,54,67,139,50,35,14,21,5,22,9,83,46,18,30,50,13,40,5,9,5,7,36,14,15,1486,1486,1486,1486,1486,1486,1486,141,1486,1486,1486,1486,1486,1486,1486,1486,1486,23,11,13,4,3,12,19,12,5,23,33,37,0,326,163,160,164,86,75,52,47,20,27,0,0,10,13,0,2,0,8,0,0,0,0,0,0
CHL,0,0,0,0,0,0,0,11,8,12,25,8,3,1,0,0,0,0,0,0,0,0,0,0,0,12,29,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,16,19,38,30,35,48,43,37,60,87,8,31,1000,5,0,3,9,32,12,25,10,23,121,79,79,80,87,76,76,73,75,1000,77,86,82,84,79,6,54,27,20,17,25,32,17,27,40,291,16,73,20,27,20,34,1,23,36,65,146,140,11,8,15,11,84,11,15,15,14,22,30,26,20,20,34,80,45,1000,1000,1000,1000,1000,1000,165,1000,1000,1000,1000,1000,1000,1000,1000,1000,0,0,126,113,119,78,61,78,104,41,44,72,127,65,71,44,17,21,27,15,17,17,32,247,37,24,98,44,85,35,148,108,145,115,7,5,3,5,3,3,2,57,13,51,37,100,150,20,23,24,88,122,106,9,10,13,13,36,60,56,31,41,50,67,92,2,0,10,17,57,77,83,154,63,13,24,15,11,25,31,74,73,46,47,48,83,1000,20,18,24,4,54,28,15,1000,1000,1000,1000,1000,1000,1000,1000,157,1000,1000,1000,1000,1000,1000,1000,1000,96,3,15,4,4,14,9,7,7,2,26,25,0,247,181,164,161,125,2,523,58,5,81,0,0,2,2,0,0,0,0,12,0,0,0,0,0
CHN,0,0,0,0,0,0,29,51,101,190,107,239,28,15,0,0,0,0,0,0,0,0,0,0,0,48,104,22,0,3,2,3,1,3,2,1,3,164,0,0,0,0,0,0,0,0,0,154,213,220,235,295,252,233,197,286,328,132,179,2300,0,0,55,248,248,225,229,253,254,155,132,165,281,122,122,132,139,130,128,132,133,141,137,138,247,323,48,49,48,113,113,113,113,129,2300,170,333,177,179,178,355,132,173,227,285,1233,1111,740,223,337,261,867,226,274,203,295,265,367,328,466,325,677,754,779,2300,1449,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,0,0,1214,609,623,564,529,311,673,400,332,740,352,334,478,306,236,349,379,155,134,134,61,59,88,276,356,990,1484,374,551,1303,645,1435,346,346,348,465,376,412,372,451,387,478,453,731,780,215,257,298,392,348,426,280,305,370,215,246,251,301,333,377,366,492,771,347,355,366,378,458,486,710,755,539,448,364,369,366,436,409,446,418,437,408,467,418,489,391,378,365,283,622,326,308,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,2300,594,2300,2300,2300,2300,330,192,197,188,202,200,205,201,198,186,272,301,0,875,884,915,911,855,15,972,144,108,245,0,0,2300,2300,2300,0,0,0,15,0,0,0,0,0
COL,0,0,0,0,0,0,0,2,2,7,2,1,1,1,0,0,0,0,0,0,0,0,0,0,0,0,11,0,1,0,6,0,2,5,2,4,3,4,0,0,0,0,0,0,0,0,0,3,10,20,8,12,26,55,7,18,50,5,18,1512,0,3,1,12,32,6,11,2,7,49,24,24,14,4,2,2,4,2,3,7,6,6,2,4,1,22,3,2,2,24,8,5,3,19,262,15,72,16,16,18,26,1,4,1,9,32,57,5,8,8,8,38,5,23,12,18,26,14,20,17,16,26,47,28,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,453,1512,1512,0,0,166,83,69,52,59,41,89,40,52,73,146,61,42,30,18,40,5,10,5,5,5,5,12,2,37,17,23,17,49,49,36,45,17,16,17,6,0,7,0,10,3,26,12,39,52,2,12,10,24,35,70,3,0,2,24,22,6,31,4,4,1512,21,27,0,1,2,3,10,20,13,53,20,13,8,6,2,4,1,39,18,10,20,32,6,64,3,1,2,1,22,8,2,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,1512,461,1512,1512,1512,104,4,4,1,1,4,6,6,1,0,6,6,0,122,123,123,123,122,3,555,14,15,17,0,0,0,0,0,0,0,16,0,0,0,0,0,0


In [60]:
# explore proportion of missings by country
# step 1: create a new dataframe
cleaning_missing_pct = cleaning_w6.isna()

In [63]:
# overwrite True/False values with underlying country codes to then groupby country
cleaning_missing_pct['C_COW_ALPHA'] = cleaning_w6['C_COW_ALPHA']

In [64]:
# check to see that things are looking the way they should
cleaning_missing_pct.head(2)

Unnamed: 0,V1,V2,V2A,cow,C_COW_ALPHA,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V225,V226,V227,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V242,V243,V244,V245,V246,V247,V248,V250,V258,V258A,S018,S019,V262
0,False,False,False,False,ALG,False,False,False,False,False,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,False,False,False,False,False,False,False,False,False,False,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,True,True,False,True,True,True,True,True,True,True,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,False,False,True,False,False,False,False,False,False,False,False,False,True,True,True,True,False,True,True,True,True,True,True,True,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False
1,False,False,False,False,ALG,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,False,False,False,False,False,False,False,False,False,False,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,True,True,False,True,True,True,True,True,True,True,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,True,False,False,True,False,False,False,False,False,False,False,False,False,True,True,True,True,False,True,True,True,True,True,True,True,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,True,True,True,True,True,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False,False


In [74]:
# solution: how many missings by country for each variable?
missing_grpby_country = (cleaning_missing_pct.groupby('C_COW_ALPHA').mean()*100).round(decimals=2)
missing_grpby_country

Unnamed: 0_level_0,V1,V2,V2A,cow,B_COUNTRY_ALPHA,V3,V4,V5,V6,V7,V8,V9,V10,V11,V12,V13,V14,V15,V16,V17,V18,V19,V20,V21,V22,V23,V24,V25,V26,V27,V28,V29,V30,V31,V32,V33,V34,V35,V36,V37,V38,V39,V40,V41,V42,V43,V44,V45,V46,V47,V48,V49,V50,V51,V52,V53,V54,V55,V56,V56_NZ,V57,V58,V59,V60,V61,V62,V63,V64,V65,V66,V67,V68,V69,V70,V71,V72,V73,V74,V74B,V75,V76,V77,V78,V79,V80,V81,V82,V83,V84,V85,V86,V87,V88,V89,V95,V96,V97,V98,V99,V100,V101,V102,V103,V104,V105,V106,V107,V108,V109,V110,V111,V112,V113,V114,V115,V116,V117,V118,V119,V120,V121,V122,V123,V124,V125_00,V125_01,V125_02,V125_03,V125_04,V125_05,V125_06,V125_07,V125_08,V125_09,V125_10,V125_11,V125_12,V125_13,V125_14,V125_15,V125_16,V125_17,V126,V127,V128,V129,V130,V131,V132,V133,V134,V135,V136,V137,V138,V139,V140,V141,V142,V143,V144,V144G,V145,V146,V147,V148,V149,V150,V151,V152,V153,V154,V155,V156,V157,V158,V159,V160,V161,V162,V163,V164,V165,V166,V167,V168,V169,V170,V171,V172,V173,V174,V175,V176,V177,V178,V179,V180,V181,V182,V183,V184,V185,V186,V187,V188,V189,V190,V191,V192,V193,V194,V195,V196,V197,V198,V199,V200,V201,V202,V203,V203A,V204,V205,V206,V207,V207A,V208,V209,V210,V211,V212,V213,V214,V215_01,V215_02,V215_03,V215_04,V215_05,V215_06,V215_07,V215_08,V215_10,V215_11,V215_12,V215_13,V215_14,V215_15,V215_16,V215_17,V215_18,V216,V217,V218,V219,V220,V221,V222,V223,V224,V225,V226,V227,V229,V230,V231,V232,V233,V234,V235,V236,V237,V238,V239,V240,V242,V243,V244,V245,V246,V247,V248,V250,V258,V258A,S018,S019,V262
C_COW_ALPHA,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1,Unnamed: 278_level_1,Unnamed: 279_level_1,Unnamed: 280_level_1,Unnamed: 281_level_1,Unnamed: 282_level_1,Unnamed: 283_level_1,Unnamed: 284_level_1,Unnamed: 285_level_1,Unnamed: 286_level_1,Unnamed: 287_level_1,Unnamed: 288_level_1
ALG,0.0,0.0,0.0,0.0,0.0,0.0,0.42,0.92,1.5,5.25,2.58,0.58,5.5,1.42,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.83,4.25,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.25,100.0,7.33,7.17,8.67,4.83,4.08,3.5,5.58,8.92,3.25,4.75,100.0,0.0,1.17,1.75,5.58,15.83,4.08,9.17,4.08,12.25,14.58,7.83,10.5,10.33,8.58,5.25,4.17,5.58,7.33,5.33,6.58,7.08,6.0,7.08,3.83,3.42,18.33,3.92,3.17,2.83,30.17,27.08,21.83,22.08,26.25,54.58,7.83,9.5,3.67,7.33,4.08,6.92,0.75,2.0,2.08,3.67,9.67,11.33,6.58,5.92,8.33,6.17,21.75,5.25,11.0,12.5,17.92,20.17,13.75,11.25,15.17,16.58,21.58,18.67,13.58,100.0,100.0,100.0,21.92,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,20.0,20.42,21.5,26.5,12.42,13.83,16.17,13.08,12.33,23.08,20.92,14.5,13.92,13.0,7.25,9.67,5.75,5.08,0.0,0.0,0.0,0.0,11.83,0.0,0.0,12.08,13.83,2.08,3.5,2.67,9.42,17.83,7.08,7.58,7.67,5.25,9.75,9.92,7.67,5.0,5.67,11.0,5.83,13.33,18.0,1.75,3.5,5.33,8.5,10.67,11.0,6.0,4.08,4.33,4.92,8.0,6.5,8.58,6.5,5.75,6.67,15.58,10.75,4.0,4.58,4.25,4.75,8.25,9.92,12.58,17.25,10.75,7.08,11.08,6.67,5.42,8.67,6.17,12.33,100.0,7.0,5.17,100.0,5.08,9.08,5.08,5.0,5.08,2.5,14.5,6.58,2.42,100.0,100.0,100.0,100.0,4.25,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,8.83,1.92,2.25,0.92,1.33,1.75,3.25,2.92,1.83,1.92,3.67,4.08,0.0,49.58,51.83,52.33,54.83,52.25,10.0,34.75,10.0,10.17,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.08,0.08,0.42,0.0,0.0,0.0,0.0,0.0
ARG,0.0,0.0,0.0,0.0,0.0,0.0,0.19,0.19,0.58,1.36,1.65,1.75,1.07,0.58,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.97,3.3,0.49,0.0,0.0,0.0,0.1,0.1,0.1,0.19,0.1,0.1,72.62,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.36,2.14,3.2,3.11,3.11,100.0,5.05,3.3,4.56,6.7,2.04,2.52,100.0,0.0,0.58,0.87,1.75,6.02,2.04,4.76,1.17,2.43,11.65,5.44,5.24,6.12,1.94,1.55,1.55,1.46,1.55,100.0,2.14,1.84,1.55,1.55,1.46,0.78,10.39,1.55,2.04,1.55,6.02,7.67,5.34,6.8,10.97,19.51,4.95,9.71,6.12,5.92,5.34,7.48,0.49,1.17,1.17,1.46,9.32,8.74,1.17,3.69,4.17,1.75,4.76,1.26,1.65,1.94,3.5,4.47,3.88,3.3,3.79,3.2,11.75,17.67,7.48,100.0,100.0,100.0,100.0,100.0,100.0,14.17,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,14.95,11.07,11.84,8.54,6.21,2.91,6.31,2.04,2.04,3.3,6.6,2.82,2.72,2.04,1.07,1.94,2.14,1.36,0.97,0.97,0.1,0.0,5.24,2.43,5.83,7.18,8.16,1.55,10.87,5.34,12.23,12.04,3.88,3.5,2.62,2.72,1.26,2.23,1.65,2.52,0.97,3.2,2.23,8.74,9.13,0.0,0.87,0.78,3.01,6.6,6.8,1.26,2.33,3.79,0.19,0.68,3.69,5.63,1.46,2.43,2.52,2.14,4.17,0.49,0.68,0.58,0.68,3.79,3.69,4.56,9.22,4.37,4.17,3.11,2.43,2.23,1.65,1.84,10.58,7.67,8.16,7.18,7.86,9.42,100.0,1.46,1.84,1.84,1.17,4.47,1.46,1.55,100.0,100.0,100.0,100.0,100.0,100.0,100.0,3.88,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,5.83,1.84,2.23,0.87,0.87,1.65,2.52,2.14,1.26,1.07,2.14,2.23,100.0,25.15,10.49,10.58,10.97,0.49,0.39,0.49,5.05,2.23,4.56,0.0,0.0,0.78,1.07,0.49,1.07,0.78,0.0,0.1,0.0,0.0,0.0,0.0,0.0
ARM,0.0,0.0,0.0,0.0,0.0,0.0,0.64,0.45,2.36,0.64,1.64,0.09,0.73,0.18,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.36,1.36,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.09,0.0,0.18,0.36,1.55,2.64,3.45,0.91,2.45,4.27,3.82,4.45,100.0,0.09,0.0,0.18,1.55,4.18,2.27,5.0,2.18,7.73,13.18,5.91,5.73,5.73,2.64,0.18,0.27,0.64,0.27,100.0,0.91,0.91,0.36,1.91,0.09,2.0,9.27,0.36,0.36,0.0,1.0,1.18,0.64,1.55,1.64,41.36,1.73,4.0,1.09,4.55,2.0,8.36,1.45,0.45,0.82,1.64,5.36,7.36,1.73,0.73,3.09,0.91,27.82,3.55,4.64,3.73,4.73,4.36,7.27,7.73,16.82,6.27,21.55,24.91,17.09,19.09,100.0,100.0,100.0,100.0,100.0,100.0,18.18,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,19.27,13.45,20.91,15.45,10.55,5.91,18.64,4.91,5.36,17.18,10.45,9.91,7.82,5.27,3.82,5.91,1.64,1.0,0.36,0.36,0.73,4.64,1.18,1.27,16.45,9.91,10.36,2.91,16.82,3.09,5.64,19.36,4.55,3.73,3.36,2.09,1.64,2.0,1.0,5.36,0.91,0.91,1.45,10.73,12.18,0.27,2.55,2.27,6.82,9.0,10.09,2.45,0.64,1.64,0.18,0.82,3.45,7.09,0.0,0.45,0.82,9.73,8.91,0.18,2.0,0.18,0.27,5.55,5.0,12.55,28.55,8.64,6.73,0.82,0.64,0.27,1.0,0.73,0.64,0.27,5.91,3.64,3.82,1.73,7.0,0.45,0.36,0.45,1.0,2.82,0.27,0.27,10.36,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,10.91,100.0,100.0,100.0,100.0,100.0,100.0,100.0,3.0,0.18,0.27,0.0,0.82,0.55,0.55,0.45,0.36,0.0,0.64,0.91,0.0,18.82,19.27,19.45,19.27,19.36,0.0,1.73,1.0,2.18,0.73,0.0,0.0,0.36,0.18,0.0,0.0,0.0,0.18,3.73,0.0,0.0,0.0,0.0,0.0
AUL,0.0,0.0,0.0,0.0,0.0,0.0,0.54,3.45,3.79,4.87,4.67,3.86,0.88,0.81,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.02,0.74,2.03,2.91,2.91,3.18,3.25,3.18,3.25,2.51,3.72,3.11,35.27,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.29,1.22,1.49,1.42,1.35,0.95,2.71,0.95,1.35,1.15,1.22,1.69,100.0,0.81,0.54,1.22,1.76,3.11,1.76,3.11,1.22,1.9,2.37,3.05,3.45,2.64,2.23,2.03,1.96,1.96,1.96,100.0,2.03,2.03,1.96,1.76,1.62,0.41,1.56,1.42,5.35,0.95,1.96,3.52,3.18,3.66,18.55,3.72,2.03,2.23,1.96,2.03,1.76,1.9,1.08,2.78,2.91,3.25,4.2,3.32,1.83,1.9,2.3,2.23,2.64,1.69,2.51,1.96,2.1,2.57,2.44,2.17,2.91,1.96,2.37,2.1,1.69,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,2.03,2.98,3.11,3.45,2.84,3.25,3.05,2.37,2.57,2.57,3.11,3.18,3.18,2.1,2.1,2.44,0.41,0.81,1.62,1.62,1.08,1.15,1.02,2.03,2.51,1.9,2.71,0.95,2.57,3.18,3.11,3.05,2.71,2.57,1.76,0.95,4.27,4.54,1.96,1.08,1.22,2.37,1.83,1.9,1.83,1.02,1.42,1.76,2.1,1.9,1.96,0.0,0.0,0.0,0.74,1.29,3.66,5.62,2.17,2.03,2.44,2.37,1.76,1.02,1.08,1.22,1.35,1.15,1.56,1.69,1.83,1.49,1.02,0.54,0.74,1.08,0.74,0.74,2.1,1.22,1.15,1.42,1.56,1.56,100.0,0.61,0.88,0.61,0.54,3.66,2.71,1.96,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,4.2,100.0,100.0,100.0,100.0,5.69,1.49,3.99,1.29,2.03,3.05,2.91,2.17,1.96,0.81,1.49,1.96,0.95,6.84,4.47,4.6,4.33,2.84,4.67,4.33,1.76,2.03,3.72,0.0,0.61,2.44,2.64,100.0,0.88,0.88,28.77,5.55,0.0,0.0,0.0,0.0,0.0
AZE,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.89,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.5,0.4,0.3,0.0,0.2,0.6,0.0,0.0,100.0,0.0,0.0,0.2,0.0,0.2,0.0,0.2,0.0,0.2,7.29,1.9,1.0,1.4,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.7,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.2,0.0,0.0,0.0,0.1,0.6,0.5,0.7,3.29,5.19,4.99,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,0.0,3.29,6.19,4.59,4.19,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.8,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.79,2.5,3.99,6.79,0.4,0.3,0.4,0.1,0.6,0.3,0.3,0.1,0.0,0.0,0.0,0.0,0.0,0.4,1.9,0.9,1.4,2.3,1.8,0.1,0.0,0.0,0.0,0.0,0.9,2.4,0.2,2.3,2.3,0.9,0.6,0.0,0.5,1.2,0.4,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,23.95,23.95,23.95,23.95,23.95,0.0,0.0,0.0,0.3,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
BLR,0.0,0.0,0.0,0.0,0.0,0.0,0.39,0.85,1.5,1.3,0.91,1.24,5.47,1.37,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.26,7.56,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.6,4.3,6.97,7.69,0.98,0.65,0.85,0.85,0.65,0.52,0.07,0.2,100.0,0.2,0.65,0.33,0.2,2.21,0.33,2.48,0.26,2.21,23.71,0.65,0.65,0.91,0.2,0.26,0.46,0.52,0.98,100.0,0.33,0.46,0.46,0.39,0.33,0.52,2.67,0.2,0.26,0.52,100.0,100.0,100.0,100.0,100.0,3.78,0.33,0.33,0.2,0.26,0.2,2.08,0.33,0.2,0.46,0.59,0.91,0.85,0.46,0.2,0.33,0.33,1.17,0.39,0.46,0.52,0.91,1.11,0.98,0.78,0.91,1.04,1.17,1.76,1.3,100.0,100.0,100.0,100.0,100.0,100.0,100.0,1.24,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,1.11,0.98,1.17,0.52,0.52,0.91,0.98,0.91,0.91,1.04,0.91,1.11,1.24,0.91,0.39,0.98,2.15,2.48,0.59,0.59,0.46,0.46,0.52,1.3,2.21,1.5,2.15,0.65,15.18,15.77,15.37,16.68,6.58,5.99,7.88,0.39,7.04,7.49,5.28,0.46,0.59,0.98,1.04,1.69,1.43,9.58,16.48,6.78,23.78,46.97,53.68,0.52,0.26,0.85,1.89,4.89,2.87,4.36,4.3,4.3,5.02,6.06,6.78,2.54,4.04,3.65,1.17,0.26,0.26,0.52,0.72,0.59,0.65,0.39,0.13,0.33,0.46,0.26,1.04,0.52,0.46,0.33,0.26,0.33,100.0,0.39,0.2,0.13,0.13,0.91,1.95,0.65,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,1.43,100.0,100.0,100.0,100.0,100.0,100.0,100.0,2.08,0.59,1.17,0.26,0.78,1.3,2.08,1.17,1.17,0.46,2.21,2.41,0.0,0.07,1.63,1.69,1.95,2.08,0.52,59.74,60.0,0.72,1.04,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
BRA,0.0,0.0,0.0,0.0,0.0,0.0,0.07,0.2,0.4,0.74,0.2,0.13,0.07,0.07,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.2,0.74,0.4,1.62,0.94,1.08,0.81,1.01,0.94,0.47,0.94,0.74,0.81,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.74,1.14,0.94,0.34,0.81,0.87,4.1,1.21,2.09,2.83,1.28,1.62,100.0,0.4,0.07,0.07,4.64,10.09,1.95,7.47,1.08,6.33,5.92,2.29,4.04,1.82,1.14,0.54,0.47,0.54,0.34,0.2,0.4,0.34,0.27,0.54,0.2,0.47,7.94,0.47,0.34,0.27,2.76,7.94,2.76,2.56,4.1,20.05,1.88,3.57,1.08,5.45,1.68,3.5,0.4,0.61,0.2,0.81,2.42,5.38,0.94,5.59,1.28,0.61,5.79,0.4,0.34,1.01,1.08,2.36,0.81,2.89,2.83,0.61,3.84,5.99,3.57,100.0,100.0,100.0,100.0,100.0,100.0,26.04,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,20.73,5.85,7.81,8.55,7.2,8.55,11.44,6.66,7.27,10.97,9.42,7.47,6.93,3.9,3.77,4.78,2.83,1.28,0.54,0.54,0.81,0.54,1.82,0.27,3.63,2.56,3.97,0.27,9.22,3.23,2.69,3.7,6.12,5.92,4.78,2.02,2.89,2.83,1.68,2.69,1.14,1.41,1.08,5.59,6.86,0.47,1.21,1.01,4.04,3.9,5.52,0.94,0.94,0.4,0.54,2.09,4.51,5.11,1.28,1.62,1.88,3.84,4.98,0.27,0.4,0.27,0.61,3.63,3.63,4.51,9.35,3.36,2.36,0.94,1.41,0.34,1.48,0.61,5.59,3.1,1.21,2.02,3.36,0.87,2.69,0.34,0.61,0.34,0.47,2.42,0.94,1.01,100.0,100.0,100.0,100.0,100.0,100.0,100.0,9.49,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,1.55,0.74,0.87,0.27,0.2,0.81,1.28,0.81,0.34,1.55,2.22,2.49,0.0,21.94,10.97,10.77,11.04,5.79,5.05,3.5,3.16,1.35,1.82,0.0,0.0,0.67,0.87,0.0,0.13,0.0,0.54,0.0,0.0,0.0,0.0,0.0,0.0
CHL,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.1,0.8,1.2,2.5,0.8,0.3,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.2,2.9,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.6,1.9,3.8,3.0,3.5,4.8,4.3,3.7,6.0,8.7,0.8,3.1,100.0,0.5,0.0,0.3,0.9,3.2,1.2,2.5,1.0,2.3,12.1,7.9,7.9,8.0,8.7,7.6,7.6,7.3,7.5,100.0,7.7,8.6,8.2,8.4,7.9,0.6,5.4,2.7,2.0,1.7,2.5,3.2,1.7,2.7,4.0,29.1,1.6,7.3,2.0,2.7,2.0,3.4,0.1,2.3,3.6,6.5,14.6,14.0,1.1,0.8,1.5,1.1,8.4,1.1,1.5,1.5,1.4,2.2,3.0,2.6,2.0,2.0,3.4,8.0,4.5,100.0,100.0,100.0,100.0,100.0,100.0,16.5,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,12.6,11.3,11.9,7.8,6.1,7.8,10.4,4.1,4.4,7.2,12.7,6.5,7.1,4.4,1.7,2.1,2.7,1.5,1.7,1.7,3.2,24.7,3.7,2.4,9.8,4.4,8.5,3.5,14.8,10.8,14.5,11.5,0.7,0.5,0.3,0.5,0.3,0.3,0.2,5.7,1.3,5.1,3.7,10.0,15.0,2.0,2.3,2.4,8.8,12.2,10.6,0.9,1.0,1.3,1.3,3.6,6.0,5.6,3.1,4.1,5.0,6.7,9.2,0.2,0.0,1.0,1.7,5.7,7.7,8.3,15.4,6.3,1.3,2.4,1.5,1.1,2.5,3.1,7.4,7.3,4.6,4.7,4.8,8.3,100.0,2.0,1.8,2.4,0.4,5.4,2.8,1.5,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,15.7,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,9.6,0.3,1.5,0.4,0.4,1.4,0.9,0.7,0.7,0.2,2.6,2.5,0.0,24.7,18.1,16.4,16.1,12.5,0.2,52.3,5.8,0.5,8.1,0.0,0.0,0.2,0.2,0.0,0.0,0.0,0.0,1.2,0.0,0.0,0.0,0.0,0.0
CHN,0.0,0.0,0.0,0.0,0.0,0.0,1.26,2.22,4.39,8.26,4.65,10.39,1.22,0.65,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.09,4.52,0.96,0.0,0.13,0.09,0.13,0.04,0.13,0.09,0.04,0.13,7.13,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.7,9.26,9.57,10.22,12.83,10.96,10.13,8.57,12.43,14.26,5.74,7.78,100.0,0.0,0.0,2.39,10.78,10.78,9.78,9.96,11.0,11.04,6.74,5.74,7.17,12.22,5.3,5.3,5.74,6.04,5.65,5.57,5.74,5.78,6.13,5.96,6.0,10.74,14.04,2.09,2.13,2.09,4.91,4.91,4.91,4.91,5.61,100.0,7.39,14.48,7.7,7.78,7.74,15.43,5.74,7.52,9.87,12.39,53.61,48.3,32.17,9.7,14.65,11.35,37.7,9.83,11.91,8.83,12.83,11.52,15.96,14.26,20.26,14.13,29.43,32.78,33.87,100.0,63.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,0.0,0.0,52.78,26.48,27.09,24.52,23.0,13.52,29.26,17.39,14.43,32.17,15.3,14.52,20.78,13.3,10.26,15.17,16.48,6.74,5.83,5.83,2.65,2.57,3.83,12.0,15.48,43.04,64.52,16.26,23.96,56.65,28.04,62.39,15.04,15.04,15.13,20.22,16.35,17.91,16.17,19.61,16.83,20.78,19.7,31.78,33.91,9.35,11.17,12.96,17.04,15.13,18.52,12.17,13.26,16.09,9.35,10.7,10.91,13.09,14.48,16.39,15.91,21.39,33.52,15.09,15.43,15.91,16.43,19.91,21.13,30.87,32.83,23.43,19.48,15.83,16.04,15.91,18.96,17.78,19.39,18.17,19.0,17.74,20.3,18.17,21.26,17.0,16.43,15.87,12.3,27.04,14.17,13.39,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,25.83,100.0,100.0,100.0,100.0,14.35,8.35,8.57,8.17,8.78,8.7,8.91,8.74,8.61,8.09,11.83,13.09,0.0,38.04,38.43,39.78,39.61,37.17,0.65,42.26,6.26,4.7,10.65,0.0,0.0,100.0,100.0,100.0,0.0,0.0,0.0,0.65,0.0,0.0,0.0,0.0,0.0
COL,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.13,0.13,0.46,0.13,0.07,0.07,0.07,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.73,0.0,0.07,0.0,0.4,0.0,0.13,0.33,0.13,0.26,0.2,0.26,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.2,0.66,1.32,0.53,0.79,1.72,3.64,0.46,1.19,3.31,0.33,1.19,100.0,0.0,0.2,0.07,0.79,2.12,0.4,0.73,0.13,0.46,3.24,1.59,1.59,0.93,0.26,0.13,0.13,0.26,0.13,0.2,0.46,0.4,0.4,0.13,0.26,0.07,1.46,0.2,0.13,0.13,1.59,0.53,0.33,0.2,1.26,17.33,0.99,4.76,1.06,1.06,1.19,1.72,0.07,0.26,0.07,0.6,2.12,3.77,0.33,0.53,0.53,0.53,2.51,0.33,1.52,0.79,1.19,1.72,0.93,1.32,1.12,1.06,1.72,3.11,1.85,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,29.96,100.0,100.0,0.0,0.0,10.98,5.49,4.56,3.44,3.9,2.71,5.89,2.65,3.44,4.83,9.66,4.03,2.78,1.98,1.19,2.65,0.33,0.66,0.33,0.33,0.33,0.33,0.79,0.13,2.45,1.12,1.52,1.12,3.24,3.24,2.38,2.98,1.12,1.06,1.12,0.4,0.0,0.46,0.0,0.66,0.2,1.72,0.79,2.58,3.44,0.13,0.79,0.66,1.59,2.31,4.63,0.2,0.0,0.13,1.59,1.46,0.4,2.05,0.26,0.26,100.0,1.39,1.79,0.0,0.07,0.13,0.2,0.66,1.32,0.86,3.51,1.32,0.86,0.53,0.4,0.13,0.26,0.07,2.58,1.19,0.66,1.32,2.12,0.4,4.23,0.2,0.07,0.13,0.07,1.46,0.53,0.13,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,30.49,100.0,100.0,100.0,6.88,0.26,0.26,0.07,0.07,0.26,0.4,0.4,0.07,0.0,0.4,0.4,0.0,8.07,8.13,8.13,8.13,8.07,0.2,36.71,0.93,0.99,1.12,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.06,0.0,0.0,0.0,0.0,0.0,0.0


In [72]:
# what's the largest proportion of missing values for any given country for each variable?
((cleaning_missing_pct.groupby('C_COW_ALPHA').mean()*100).max()).round(decimals=2)

V1                   0.00
V2                   0.00
V2A                  0.00
cow                  0.00
B_COUNTRY_ALPHA      0.00
V3                   0.00
V4                   4.58
V5                   3.45
V6                   6.75
V7                   9.00
V8                   7.64
V9                  13.55
V10                  5.50
V11                  2.18
V12                  0.44
V13                  0.12
V14                  0.16
V15                  0.56
V16                  0.24
V17                  0.40
V18                  0.36
V19                  0.60
V20                  0.48
V21                  0.64
V22                  0.10
V23                  2.84
V24                 10.80
V25                 16.04
V26                 17.11
V27                 17.65
V28                100.00
V29                100.00
V30                 19.49
V31                100.00
V32                 16.04
V33                 19.57
V34                 22.41
V35                100.00
V36         

Notes:
- features to drop (variables where 100% of values are missing for any given sample (cannot impute) or too many missings or simply unnecessary):
    - V28, V29, V31: membership items
    - V35: organizational membership
    - V36-V43: attitudes towards neighbors 
    - V46: attitudes when jobs are scarce 
    - V50: opinion on how woman working impacts children 
    - V85-V89: willingness to take political action 
    - V95: political leanings
    - V109: confidence in armed forces; 100% missing for Egypt only (N = 1523)
    - V112: confidence in labor unions
    - V118: confidence in civil service
    - V125_01-V125_17: confidence in political/economic union variables
    - V127-V130: political system variables
    - V135: essential characteristic of democracy; 100% missing for Egypt only (N = 1523)
    - V141: how democratic is govt; missing for multiple countries
    - V142: respect for human rights; missing for Uzbekistan only (N = 1500); would be nice to keep, but arguably not crucial
    - V145-V146, then V148-149: religious beliefs and practices; KEEP V147 (how religious are you)
    
- cases to drop (participating countries) due to too many missings:
    - Egypt (N = 1523)

- feature engineering notes: 
    - V56 and V56_NZ: people would try to take advantage; consolidate into one variable
    - V58: number of children; missing entirely for Hong Kong...contemplating just dropping them (N = 1000) to preserve this feature; alternatively I could pull in birthrate and other health/wellbeing data for all countries...we'll see; TBD
    - V60-V65: prioritizing country aims; missing entirely for Kuwait...contemplating dropping them as well (N = 1303)
    - V74 and V74B: Schwartz helpful value; consolidate into one variable based on whichever has fewer missings???
    - V81: priorities (protecting environment vs economic growth); 100% missing for TRI (N = 999) only; considering dropping them
    - V102-107: trust in various groups (family, neighborhood, etc.) items. New Zealand is the only country that has missings across the board (N = 841); contemplating dropping them
    

In [89]:
# what's going on with V74 and V74B for respondents from GMY? 
# it looks like they're responding to one item OR the other...maybe I can combine these into the same variable
cleaning_w6[cleaning_w6['C_COW_ALPHA'] == 'GMY'][['V74', 'V74B']].sample(20)

Unnamed: 0,V74,V74B
21034,1.0,
21492,3.0,
22127,,4.0
21429,,3.0
21534,4.0,
22051,,1.0
20215,4.0,
20918,3.0,
21840,5.0,
21858,4.0,


In [87]:
# how do V74 and V74B look for respondents from other countries with 100% missings on one or the other?
# countries where this is the case: from top - ARG, ARM, AUL, AZE, BLR, CHL...from bottom - ZIM, UZB, USA, URU, UKR, TUR
# it looks like they're responding to one item OR the other...maybe I can combine these into the same variable
cleaning_w6[cleaning_w6['C_COW_ALPHA'] == 'ZIM'][['V74', 'V74B']].sample(20)

Unnamed: 0,V74,V74B
88396,2.0,
89396,1.0,
88417,1.0,
88252,1.0,
88074,2.0,
88531,2.0,
88926,1.0,
89075,1.0,
88824,1.0,
89115,2.0,


In [73]:
# sample sizes for reference
cleaning_w6.groupby('C_COW_ALPHA')['V3'].count()

C_COW_ALPHA
ALG    1200
ARG    1030
ARM    1100
AUL    1477
AZE    1002
BLR    1535
BRA    1486
CHL    1000
CHN    2300
COL    1512
CYP    1000
ECU    1202
EGY    1523
EST    1533
GHA    1552
GMY    2046
GRG    1202
HAI    1996
HKG    1000
IND    4078
IRQ    1200
JOR    1200
JPN    2443
KUW    1303
KYR    1500
KZK    1500
LEB    1200
LIB    2131
MAL    1300
MEX    2000
MOR    1200
NEW     841
NIG    1759
NTH    1902
PAK    1200
PER    1210
PHI    1200
POL     966
PSE    1000
QAT    1060
ROK    1200
ROM    1503
RUS    2500
RWA    1527
SAF    3531
SIN    1972
SLV    1069
SPN    1189
SWD    1206
TAW    1238
THI    1200
TRI     999
TUN    1205
TUR    1605
UKR    1500
URU    1000
USA    2232
UZB    1500
YEM    1000
ZIM    1500
Name: V3, dtype: int64