# PRELIMINARIES

In [1]:
import pandas as pd
import missingno as msn
import os

# Notebook-wide pandas display options:
#   - never truncate columns or rows when rendering a frame
#   - render floats with two decimal places
pd.options.display.max_columns = None
pd.options.display.max_rows = None
pd.options.display.float_format = '{:.2f}'.format

# DATA LOADING

In [2]:
# Reading this file with the defaults raises a DtypeWarning.
# low_memory=False makes pandas read the whole file before inferring
# column dtypes, which avoids the warning at the cost of noticeably
# higher memory use while parsing.
# The leading '..' in the relative path climbs one directory level.
orig_df = pd.read_csv(
    '../data/raw/GlobalFindexDatabase2025.csv',
    low_memory=False,
)

Check DataFrame info: the DataFrame occupies at least 28.6 MB in memory (the `+` in the output means the object columns are not fully counted)

In [3]:
# Print a compact summary: index range, column count, dtype breakdown and memory usage
orig_df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 8564 entries, 0 to 8563
Columns: 437 entries, countrynewwb to con32h_s
dtypes: float64(430), int64(1), object(6)
memory usage: 28.6+ MB


`describe()` tells us that the indicators are expressed as aggregates (weighted averages): their values all lie between 0 and 1

In [4]:
# Summary statistics (count, mean, std, min, quartiles, max) for the numeric columns;
# with default arguments the object (text) columns are left out of the result
orig_df.describe()

Unnamed: 0,year,pop_adult,account_t_d,fiaccount_t_d,mobileaccount_t_d,borrow_any_t_d,fin4_d,dig_acc,fin11_2a,fin11a,fin11b,fin11c,fin11f,fin11d,fin11e,fin14a,fin14b,fin14c,fin14d,fin13_1a,fin13_1b,fin26a,fin26b,fin27a,fin27b,fin17f,fin17a_17a1_d,fin17a,fin17b,fin17c,fin22d,fin22e,fin22a_22a1_22g_d,fin22a,fin22a_1,fin22b,fin22c,fin24sav,fin24fam,fin24work,fin24bor,fin24sell,fin24other,fin24aVD,fin24aSD,fin24aND,fin24aSD_ND,fin24aP,fin24aN,fin24sav_SD_ND,fin24fam_SD_ND,fin24work_SD_ND,fin24bor_SD_ND,fin24sell_SD_ND,fin24other_SD_ND,fin24sav_VD,fin24fam_VD,fin24work_VD,fin24bor_VD,fin24sell_VD,fin24other_VD,fh1,fin28,fh2,fin29,fin31a_31b,fin30,fin31a,fin31b,fin31d,fin32_33_34a,fin32_33_34b,fin32_33_34c,fin32_33_34d,fin32_33_acc,fin32_33,fin32_n33_34a,fin32_n33_34b,fin32_n33_34c,fin32_n33_34d,fin32_n33_acc,fin32_n33,fin32,fin32_acc,fin34a,fin34b,fin34c,fin34d,fin37_38_39a,fin37_38_39b,fin37_38_39c,fin37_38_39d,fin37_38_39_acc,fin37_38,fin37_39a,fin37_39b,fin37_39c,fin37_39d,fin37_39_acc,fin37,fin38_39a,fin38_39b,fin38_39c,fin38_39d,fin38_39_acc,fin38,fin2_t_d,fin42,fin42_acc,fin43a,fin43b,fin43c,fin43d,fin45a,fin45c,fin45d,fin45e,fin45b,fin25e2,fin9b,fin10,fin22g,fin22h,inactive_t_d,fing2p_acc,fing2p_card,fing2p_cash,fing2p_fin,fing2p_mob,fing2p,g20_made,g20_received,g20_any,merchant_pay,save_any_t_d,fin11_1,fin5w,fin5m,fin5lm,fin5n,fin6w,fin6m,fin6lm,fin6n,fin11_0,fin9a,fin17dw,fin17dm,fin17dlm,fin17e,fin7,fin3,fin19,fin20,fin21,fin24ba,fin24bb,fin24bc,fin24bd,fin24c,fin24d1,fin24d2,fin24d3,fin25e1,fin25e2b,fin25e3w,fin25e3m,fin25e3lm,fin25e4a,fin25e4b,fin25e4c,fin25e4d,fin25e4e,fh2a,fin31c,fin36a,fin36b,fin40a,fin40b,fin36Aa,fin36Ab,fin8,fin13aw,fin13am,fin13alm,fin13an,fin13bw,fin13bm,fin13blm,fin13bn,fin13cw,fin13cm,fin13clm,fin13cn,fin13e,fin13f,fin13f_1,fin15,fin16,fin22f,fin41,fin35,fin44,fh1_fh2,fin28_29,fin31d_s,fin32_n33_34c_s,fin34c_s,fin43c_s,fin32_acc_s,fin34a_s,fin32_33_acc_s,inactive_t_d_s,fing2p_fin_s,fin32_33_34a_s,fin32_n33_acc_s,fin37_39_acc_s,fin37_3
9c_s,fin31a_31b_s,fin31a_s,fin31b_s,fin32_n33_34a_s,fin37_39a_s,fin34d_s,fin32_33_34d_s,fin32_n33_34d_s,fing2p_card_s,fin37_39d_s,fin42_acc_s,fin32_33_34c_s,fin37_38_39c_s,fin38_39c_s,fing2p_acc_s,fing2p_cash_s,fin37_38_39a_s,fin37_38_39_acc_s,fin38_39a_s,fin38_39_acc_s,fin34b_s,fin32_n33_34b_s,fin43b_s,fin27b_s,fin27a_s,fin22h_s,fin28_29_s,fin28_s,fin29_s,fing2p_mob_s,fin37_38_39d_s,fin37_38_39b_s,fin37_39b_s,fin11_2a_s,fin11b_s,fin11f_s,fin11d_s,fin11e_s,fin9b_s,fin11_1_s,fin5m_s,fin6m_s,fin9a_s,fin5w_s,fin6w_s,fin17dm_s,fin17dlm_s,fin25e3w_s,fin25e3m_s,fin24d1_s,fin14d_s,fin24d2_s,fin11a_s,fin11c_s,fin5lm_s,fin6lm_s,fin17dw_s,fin14c_s,fin13_1a_s,fin13_1b_s,fin13am_s,fin13alm_s,fin13bm_s,fin13blm_s,fin13cm_s,fin13clm_s,fin21_s,fin14b_s,fin13cw_s,fin13f_s,fin14a_s,fin25e3lm_s,fin13aw_s,fin13bw_s,fin24d3_s,fin5n_s,fin6n_s,fin13f_1_s,fin32_33_34b_s,con1,con2a,con2b,con2c,con2d,con2e,con2f,con2g,con3a,con3b,con3c,con3d,con3e,con3f,con3g,con4,con5a,con5b,con6,con7,con8,con9a,con9b,con10,con11,con12d,con12w,con12m,con12lm,con13,con14,con15,con16,con17a,con17b,con17c,con17d,con18,con19,con20,con21,con22,con23,internet,con26d,con26w,con26m,con26lm,con27,con28d,con28w,con28m,con28lm,con28n,con29,con30a,con30b,con30c,con30d,con30e,con30f,con30g,con30h,con31a,con31b,con31c,con31d,con31e,con31f,con31g,con31h,con32a,con32b,con32c,con32d,con32e,con32f,con32g,con32h,con10_s,con11_s,con12d_s,con14_s,con16_s,con17a_s,con17b_s,con18_s,con19_s,con20_s,con21_s,con26d_s,con27_s,con28m_s,con30a_s,con30b_s,con30c_s,con30d_s,con30e_s,con30f_s,con30g_s,con30h_s,con31a_s,con31b_s,con31f_s,con2a_s,con15_s,con17d_s,con29_s,con31d_s,con31h_s,con32a_s,con3a_s,con4_s,con28d_s,con28w_s,con23_s,con31c_s,con2b_s,con2d_s,con26w_s,con2c_s,con2e_s,con2g_s,con5b_s,con12m_s,con26lm_s,con12w_s,con2f_s,con13_s,con26m_s,con28lm_s,con5a_s,con17c_s,con32h_s
count,8564.0,7880.0,8474.0,8382.0,2514.0,6412.0,1123.0,1375.0,620.0,440.0,512.0,356.0,380.0,608.0,740.0,277.0,265.0,336.0,454.0,322.0,239.0,3170.0,1959.0,1223.0,659.0,442.0,6192.0,5712.0,1002.0,2932.0,4038.0,1673.0,4956.0,4603.0,344.0,6044.0,958.0,2419.0,2996.0,2493.0,856.0,1130.0,257.0,2908.0,3036.0,2695.0,3036.0,6454.0,5090.0,1857.0,2795.0,1709.0,373.0,399.0,257.0,313.0,2326.0,565.0,311.0,585.0,257.0,2378.0,1478.0,2506.0,1642.0,3940.0,6220.0,3386.0,2538.0,4941.0,1669.0,569.0,577.0,597.0,1801.0,2169.0,3114.0,795.0,2441.0,697.0,3536.0,5796.0,6188.0,4398.0,3946.0,1024.0,2999.0,807.0,2353.0,471.0,713.0,415.0,2602.0,3534.0,2299.0,599.0,769.0,617.0,2609.0,3864.0,1591.0,405.0,569.0,405.0,1643.0,1973.0,7180.0,3508.0,717.0,557.0,491.0,2789.0,405.0,838.0,1327.0,1399.0,933.0,395.0,1710.0,985.0,4211.0,2867.0,1027.0,869.0,3114.0,747.0,769.0,3618.0,702.0,4020.0,5780.0,5778.0,6152.0,1754.0,6402.0,176.0,316.0,1009.0,472.0,172.0,616.0,949.0,532.0,160.0,68.0,1021.0,172.0,781.0,604.0,478.0,232.0,1159.0,847.0,571.0,307.0,1255.0,1399.0,1387.0,1387.0,1195.0,777.0,729.0,204.0,829.0,2498.0,646.0,382.0,180.0,232.0,100.0,100.0,1189.0,100.0,853.0,100.0,135.0,724.0,352.0,280.0,20.0,20.0,1057.0,169.0,334.0,335.0,37.0,145.0,310.0,334.0,37.0,193.0,298.0,323.0,37.0,264.0,205.0,73.0,205.0,73.0,1209.0,100.0,100.0,196.0,2560.0,1874.0,423.0,182.0,236.0,216.0,371.0,328.0,122.0,29.0,233.0,109.0,288.0,200.0,21.0,325.0,274.0,186.0,248.0,170.0,25.0,4.0,14.0,1.0,6.0,15.0,2.0,30.0,16.0,260.0,35.0,187.0,211.0,115.0,120.0,42.0,21.0,8.0,37.0,86.0,72.0,150.0,114.0,129.0,13.0,1.0,6.0,4.0,46.0,37.0,26.0,45.0,56.0,73.0,9.0,76.0,71.0,76.0,18.0,43.0,56.0,42.0,44.0,22.0,56.0,35.0,52.0,31.0,24.0,31.0,36.0,6.0,25.0,24.0,17.0,25.0,25.0,23.0,25.0,22.0,24.0,17.0,19.0,13.0,14.0,20.0,6.0,11.0,9.0,8.0,6.0,5.0,3.0,1.0,1969.0,598.0,275.0,145.0,289.0,121.0,157.0,277.0,433.0,85.0,85.0,85.0,85.0,85.0,85.0,409.0,97.0,217.0,85.0,85.0,301.0,1945.0,1170.0,181.0,1102.0,1102.0,142.0,97.0,85.0,95.0,1102.0,104.0,1102.0,1102.0,1102.0,97.
0,265.0,1102.0,1102.0,865.0,828.0,85.0,528.0,1969.0,1006.0,406.0,95.0,109.0,1078.0,253.0,646.0,720.0,97.0,85.0,301.0,1054.0,1054.0,1090.0,1054.0,1018.0,310.0,874.0,598.0,790.0,589.0,193.0,564.0,85.0,241.0,85.0,336.0,646.0,85.0,85.0,85.0,85.0,85.0,85.0,97.0,8.0,85.0,85.0,85.0,85.0,85.0,85.0,85.0,85.0,65.0,62.0,77.0,83.0,53.0,81.0,81.0,84.0,81.0,78.0,19.0,66.0,43.0,59.0,42.0,13.0,43.0,8.0,15.0,18.0,40.0,21.0,47.0,29.0,27.0,14.0,47.0,37.0,9.0,16.0,17.0,27.0,5.0,3.0,16.0,11.0,1.0,2.0,5.0,6.0,1.0,1.0,1.0,1.0,1.0,1.0
mean,2017.75,38015962.82,0.61,0.58,0.28,0.51,0.35,0.46,0.23,0.18,0.21,0.15,0.17,0.28,0.18,0.2,0.19,0.2,0.31,0.21,0.15,0.32,0.33,0.24,0.12,0.15,0.28,0.27,0.21,0.19,0.19,0.13,0.25,0.25,0.11,0.28,0.1,0.22,0.36,0.18,0.11,0.14,0.02,0.33,0.32,0.26,0.55,0.7,0.35,0.22,0.21,0.14,0.07,0.07,0.01,0.04,0.18,0.1,0.05,0.09,0.01,0.24,0.2,0.29,0.21,0.31,0.51,0.31,0.18,0.32,0.11,0.01,0.01,0.02,0.12,0.12,0.23,0.06,0.13,0.04,0.23,0.26,0.32,0.28,0.28,0.08,0.14,0.07,0.23,0.05,0.08,0.01,0.24,0.27,0.19,0.03,0.05,0.03,0.19,0.21,0.14,0.01,0.05,0.0,0.14,0.18,0.49,0.22,0.05,0.01,0.03,0.2,0.0,0.15,0.27,0.32,0.19,0.13,0.32,0.3,0.26,0.24,0.22,0.08,0.27,0.06,0.09,0.25,0.05,0.3,0.47,0.4,0.53,0.33,0.5,0.09,0.12,0.31,0.15,0.08,0.22,0.22,0.15,0.08,0.01,0.27,0.08,0.15,0.13,0.16,0.12,0.36,0.19,0.14,0.13,0.19,0.27,0.17,0.3,0.27,0.19,0.2,0.08,0.28,0.35,0.28,0.12,0.08,0.1,0.01,0.02,0.27,0.01,0.2,0.01,0.06,0.19,0.11,0.12,0.01,0.0,0.29,0.16,0.17,0.19,0.01,0.15,0.15,0.21,0.03,0.18,0.15,0.2,0.02,0.21,0.17,0.12,0.13,0.09,0.3,0.02,0.04,0.09,0.37,0.26,0.66,0.62,0.54,0.82,0.72,0.7,0.95,0.25,0.71,0.93,0.75,0.78,0.63,0.56,0.53,0.39,0.75,0.75,0.45,0.82,0.49,0.2,0.41,0.45,0.72,0.49,0.54,0.75,0.41,0.7,0.75,0.77,0.8,0.41,0.49,0.4,0.54,0.77,0.83,0.62,0.67,0.64,0.42,0.2,0.42,0.41,0.48,0.44,0.32,0.55,0.42,0.51,0.25,0.53,0.39,0.47,0.21,0.35,0.49,0.4,0.64,0.29,0.6,0.53,0.63,0.38,0.31,0.28,0.27,0.31,0.32,0.57,0.39,0.34,0.38,0.29,0.42,0.29,0.39,0.79,0.3,0.33,0.3,0.31,0.45,0.28,0.29,0.25,0.23,0.21,0.6,0.72,0.87,0.19,0.13,0.09,0.12,0.06,0.08,0.12,0.17,0.01,0.01,0.02,0.01,0.01,0.02,0.12,0.05,0.09,0.01,0.02,0.12,0.69,0.26,0.09,0.61,0.72,0.08,0.03,0.02,0.05,0.63,0.38,0.57,0.41,0.31,0.04,0.12,0.49,0.41,0.19,0.21,0.01,0.13,0.73,0.49,0.11,0.04,0.05,0.46,0.13,0.18,0.31,0.05,0.0,0.12,0.47,0.46,0.52,0.44,0.32,0.11,0.21,0.16,0.24,0.13,0.1,0.13,0.03,0.11,0.04,0.11,0.22,0.01,0.01,0.03,0.0,0.01,0.01,0.04,0.54,0.76,0.88,0.75,0.68,0.49,0.39,0.59,0.82,0.23,0.27,0.73,0.77,0.62,0.74,0.72,0.82,0.69,0.51,0.18,0.33,0.23,0.45,0.28,0.31,0.75,0.92,0.17
,0.19,0.26,0.25,0.38,0.62,0.46,0.39,0.41,0.16,0.18,0.53,0.49,0.22,0.36,0.39,0.42,0.84,0.19,0.25,0.15,0.37,0.43,0.24,0.22,0.79,0.16,0.41
std,4.7,126950906.09,0.28,0.3,0.19,0.15,0.2,0.22,0.12,0.09,0.1,0.07,0.1,0.16,0.07,0.11,0.1,0.12,0.16,0.08,0.06,0.22,0.23,0.19,0.09,0.1,0.18,0.18,0.14,0.1,0.09,0.06,0.17,0.17,0.1,0.12,0.08,0.15,0.13,0.09,0.06,0.07,0.02,0.14,0.09,0.17,0.18,0.22,0.2,0.16,0.09,0.08,0.05,0.05,0.01,0.04,0.07,0.06,0.04,0.06,0.01,0.13,0.11,0.13,0.12,0.22,0.22,0.24,0.12,0.18,0.08,0.02,0.02,0.05,0.08,0.08,0.15,0.07,0.07,0.07,0.15,0.14,0.18,0.2,0.2,0.08,0.07,0.1,0.15,0.09,0.08,0.03,0.15,0.16,0.13,0.08,0.06,0.06,0.14,0.13,0.1,0.01,0.07,0.01,0.1,0.12,0.3,0.13,0.06,0.02,0.05,0.12,0.0,0.05,0.09,0.1,0.1,0.06,0.22,0.19,0.2,0.19,0.18,0.08,0.16,0.08,0.08,0.16,0.09,0.17,0.28,0.23,0.27,0.22,0.18,0.04,0.08,0.18,0.07,0.08,0.15,0.1,0.07,0.07,0.02,0.16,0.07,0.07,0.05,0.11,0.07,0.23,0.12,0.08,0.08,0.07,0.06,0.04,0.09,0.16,0.12,0.13,0.06,0.18,0.14,0.19,0.06,0.06,0.06,0.01,0.01,0.12,0.01,0.09,0.01,0.04,0.13,0.06,0.07,0.02,0.0,0.17,0.1,0.07,0.06,0.01,0.1,0.06,0.07,0.02,0.11,0.05,0.06,0.01,0.12,0.12,0.1,0.05,0.04,0.14,0.01,0.02,0.06,0.16,0.15,0.23,0.17,0.18,0.13,0.19,0.2,0.06,0.1,0.14,0.07,0.17,0.12,0.21,0.24,0.26,0.19,0.17,0.13,0.14,0.07,0.11,,0.18,0.2,0.05,0.16,0.15,0.14,0.15,0.14,0.14,0.14,0.13,0.12,0.13,0.15,0.23,0.14,0.1,0.14,0.11,0.13,0.14,,0.14,0.16,0.11,0.13,0.11,0.19,0.16,0.14,0.12,0.16,0.12,0.13,0.06,0.11,0.09,0.1,0.12,0.12,0.13,0.13,0.14,0.1,0.08,0.1,0.1,0.06,0.13,0.14,0.09,0.1,0.11,0.08,0.12,0.07,0.11,0.09,0.09,0.1,0.11,0.1,0.19,0.09,0.08,0.07,0.03,0.02,0.16,,0.12,0.11,0.09,0.08,0.08,0.06,0.05,0.06,0.1,0.01,0.01,0.02,0.01,0.01,0.01,0.05,0.04,0.06,0.01,0.02,0.06,0.23,0.14,0.06,0.15,0.16,0.05,0.04,0.02,0.11,0.2,0.15,0.21,0.15,0.12,0.05,0.06,0.17,0.17,0.09,0.11,0.01,0.05,0.24,0.25,0.04,0.03,0.04,0.18,0.09,0.11,0.17,0.04,0.0,0.06,0.21,0.2,0.23,0.2,0.16,0.05,0.12,0.07,0.12,0.05,0.06,0.06,0.02,0.05,0.02,0.05,0.11,0.01,0.01,0.02,0.0,0.01,0.0,0.05,0.22,0.09,0.1,0.15,0.17,0.14,0.14,0.12,0.07,0.09,0.12,0.17,0.14,0.22,0.13,0.1,0.11,0.11,0.13,0.05,0.11,0.07,0.1,0.1,0.14,0.1,0.02,0.03,0.05,0.08,0.13,0.11,0.11,0.1
2,0.09,0.15,0.04,0.05,0.16,0.08,0.06,0.1,0.16,0.1,0.08,,0.14,0.03,0.16,,,,,,
min,2011.0,228016.0,0.0,0.0,0.0,0.07,0.02,0.03,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.01,0.02,0.03,0.03,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.01,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.01,0.0,0.0,0.03,0.05,0.01,0.1,0.0,0.0,0.0,0.02,0.0,0.0,0.0,0.0,0.0,0.01,0.0,0.0,0.0,0.0,0.02,0.0,0.04,0.0,0.0,0.03,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.07,0.03,0.01,0.0,0.02,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.01,0.0,0.01,0.0,0.06,0.0,0.0,0.02,0.02,0.0,0.0,0.01,0.01,0.0,0.0,0.01,0.0,0.0,0.01,0.0,0.01,0.02,0.01,0.0,0.0,0.04,0.1,0.06,0.05,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.02,0.0,0.03,0.0,0.01,0.0,0.0,0.01,0.0,0.0,0.03,0.01,0.01,0.01,0.0,0.01,0.01,0.01,0.0,0.01,0.01,0.01,0.0,0.01,0.0,0.0,0.03,0.01,0.0,0.0,0.0,0.0,0.05,0.0,0.13,0.22,0.17,0.34,0.27,0.17,0.62,0.13,0.32,0.67,0.34,0.39,0.24,0.14,0.14,0.13,0.26,0.37,0.27,0.76,0.29,0.2,0.21,0.24,0.69,0.27,0.36,0.24,0.18,0.3,0.32,0.39,0.45,0.14,0.28,0.22,0.17,0.37,0.57,0.29,0.43,0.28,0.24,0.2,0.25,0.26,0.27,0.18,0.18,0.22,0.14,0.21,0.18,0.22,0.2,0.25,0.12,0.11,0.3,0.21,0.28,0.15,0.18,0.24,0.23,0.16,0.21,0.12,0.13,0.25,0.12,0.12,0.24,0.12,0.14,0.1,0.15,0.18,0.13,0.58,0.1,0.12,0.18,0.11,0.15,0.1,0.19,0.17,0.18,0.17,0.45,0.72,0.26,0.01,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.01,0.0,0.0,0.0,0.0,0.0,0.07,0.0,0.0,0.1,0.12,0.02,0.0,0.0,0.0,0.09,0.06,0.04,0.05,0.05,0.0,0.01,0.07,0.04,0.04,0.02,0.0,0.01,0.04,0.02,0.02,0.01,0.0,0.05,0.0,0.01,0.01,0.01,0.0,0.0,0.04,0.06,0.05,0.04,0.01,0.01,0.01,0.02,0.0,0.01,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.2,0.54,0.21,0.34,0.26,0.21,0.11,0.32,0.67,0.11,0.11,0.28,0.34,0.18,0.35,0.43,0.32,0.36,0.23,0.12,0.13,0.13,0.3,0.13,0.12,0.52,0.89,0.13,0.13,0.16,0.13,0.2,0.45,0.28,0.18,0.18,0.11,0.11,0.29,0.35,0.13,0.28,0.23,0.25,0.67,0.19,0.15,0.12,0.22,0.43,0.24,0.22,0.79,0.16,0.41
25%,2014.0,3739546.0,0.37,0.31,0.13,0.4,0.18,0.28,0.14,0.11,0.13,0.12,0.11,0.14,0.12,0.12,0.12,0.12,0.19,0.14,0.11,0.14,0.14,0.09,0.05,0.07,0.14,0.13,0.11,0.11,0.12,0.09,0.13,0.13,0.03,0.19,0.03,0.12,0.29,0.12,0.08,0.1,0.01,0.22,0.25,0.14,0.42,0.53,0.17,0.11,0.14,0.09,0.03,0.02,0.0,0.02,0.14,0.04,0.02,0.03,0.0,0.15,0.11,0.18,0.12,0.14,0.32,0.13,0.09,0.17,0.04,0.0,0.0,0.0,0.05,0.06,0.1,0.0,0.09,0.0,0.11,0.15,0.18,0.12,0.11,0.01,0.09,0.0,0.13,0.0,0.02,0.0,0.13,0.15,0.1,0.0,0.01,0.0,0.11,0.12,0.06,0.0,0.0,0.0,0.07,0.09,0.22,0.12,0.01,0.0,0.0,0.11,0.0,0.12,0.2,0.24,0.12,0.09,0.14,0.15,0.11,0.1,0.08,0.02,0.15,0.0,0.02,0.14,0.0,0.16,0.24,0.21,0.3,0.15,0.36,0.06,0.05,0.16,0.1,0.02,0.11,0.14,0.1,0.02,0.0,0.15,0.02,0.1,0.1,0.08,0.05,0.16,0.11,0.09,0.07,0.13,0.23,0.15,0.23,0.16,0.12,0.12,0.02,0.14,0.25,0.13,0.08,0.04,0.05,0.0,0.01,0.18,0.0,0.13,0.0,0.03,0.09,0.07,0.06,0.0,0.0,0.15,0.08,0.12,0.15,0.01,0.08,0.1,0.16,0.01,0.1,0.11,0.15,0.01,0.12,0.09,0.04,0.1,0.06,0.19,0.01,0.03,0.04,0.25,0.15,0.49,0.51,0.41,0.74,0.57,0.54,0.92,0.17,0.63,0.9,0.62,0.72,0.5,0.35,0.31,0.24,0.61,0.67,0.34,0.76,0.44,0.2,0.31,0.34,0.7,0.38,0.47,0.68,0.31,0.62,0.68,0.68,0.72,0.33,0.39,0.29,0.36,0.68,0.79,0.52,0.59,0.54,0.31,0.2,0.31,0.29,0.4,0.38,0.25,0.36,0.31,0.41,0.19,0.4,0.32,0.38,0.16,0.28,0.44,0.34,0.54,0.21,0.54,0.47,0.58,0.31,0.27,0.19,0.19,0.28,0.23,0.51,0.32,0.28,0.31,0.23,0.36,0.24,0.33,0.77,0.23,0.26,0.23,0.23,0.35,0.23,0.23,0.21,0.23,0.21,0.51,0.72,0.83,0.11,0.07,0.02,0.06,0.02,0.03,0.07,0.09,0.0,0.0,0.01,0.0,0.0,0.01,0.09,0.02,0.03,0.0,0.01,0.07,0.55,0.14,0.03,0.51,0.64,0.05,0.01,0.01,0.01,0.48,0.27,0.41,0.29,0.22,0.01,0.07,0.36,0.28,0.12,0.13,0.01,0.1,0.58,0.27,0.09,0.02,0.02,0.33,0.06,0.12,0.16,0.02,0.0,0.09,0.31,0.3,0.33,0.27,0.19,0.07,0.12,0.11,0.14,0.1,0.05,0.09,0.01,0.07,0.02,0.08,0.13,0.0,0.0,0.02,0.0,0.0,0.0,0.01,0.34,0.7,0.86,0.66,0.57,0.39,0.28,0.49,0.79,0.16,0.17,0.61,0.68,0.47,0.65,0.66,0.81,0.62,0.43,0.14,0.25,0.18,0.36,0.2,0.18,0.69,0.9,0.15,0.15,0.19,0.18,0.3,0.53,0.37,0.35
,0.31,0.14,0.15,0.39,0.43,0.18,0.31,0.31,0.35,0.82,0.19,0.2,0.13,0.28,0.43,0.24,0.22,0.79,0.16,0.41
50%,2017.0,8517166.0,0.62,0.57,0.24,0.49,0.32,0.45,0.21,0.17,0.2,0.15,0.15,0.23,0.16,0.18,0.17,0.16,0.28,0.21,0.14,0.27,0.26,0.18,0.12,0.12,0.23,0.22,0.19,0.17,0.17,0.12,0.2,0.2,0.08,0.27,0.1,0.17,0.36,0.17,0.11,0.14,0.02,0.33,0.31,0.21,0.55,0.76,0.33,0.16,0.19,0.13,0.05,0.05,0.01,0.03,0.18,0.1,0.03,0.1,0.01,0.22,0.18,0.25,0.19,0.24,0.52,0.23,0.16,0.3,0.11,0.0,0.01,0.0,0.11,0.12,0.2,0.02,0.13,0.01,0.2,0.23,0.29,0.23,0.22,0.06,0.13,0.01,0.19,0.01,0.05,0.01,0.2,0.23,0.16,0.0,0.03,0.01,0.16,0.17,0.13,0.0,0.01,0.0,0.14,0.17,0.44,0.19,0.02,0.01,0.01,0.18,0.0,0.15,0.28,0.3,0.17,0.13,0.26,0.27,0.2,0.19,0.17,0.04,0.23,0.02,0.07,0.22,0.01,0.26,0.41,0.34,0.5,0.27,0.49,0.1,0.11,0.26,0.14,0.05,0.19,0.22,0.13,0.04,0.01,0.24,0.06,0.15,0.13,0.14,0.11,0.31,0.16,0.12,0.13,0.17,0.26,0.17,0.3,0.23,0.16,0.16,0.07,0.23,0.35,0.25,0.12,0.07,0.1,0.01,0.02,0.26,0.01,0.19,0.01,0.05,0.16,0.11,0.12,0.0,0.0,0.26,0.14,0.16,0.19,0.01,0.13,0.14,0.22,0.02,0.16,0.15,0.21,0.01,0.18,0.14,0.09,0.13,0.09,0.29,0.02,0.03,0.07,0.34,0.23,0.68,0.63,0.53,0.83,0.75,0.73,0.96,0.24,0.74,0.96,0.77,0.79,0.62,0.54,0.49,0.36,0.77,0.75,0.43,0.81,0.51,0.2,0.39,0.39,0.72,0.48,0.52,0.78,0.39,0.71,0.77,0.78,0.82,0.41,0.47,0.34,0.5,0.8,0.85,0.63,0.68,0.64,0.38,0.2,0.44,0.41,0.46,0.44,0.32,0.6,0.41,0.5,0.21,0.5,0.37,0.44,0.21,0.36,0.5,0.39,0.66,0.24,0.6,0.54,0.64,0.38,0.3,0.28,0.24,0.31,0.3,0.59,0.37,0.33,0.42,0.27,0.46,0.28,0.41,0.8,0.3,0.29,0.26,0.3,0.54,0.31,0.29,0.24,0.24,0.21,0.58,0.72,0.91,0.16,0.12,0.06,0.11,0.04,0.08,0.11,0.15,0.0,0.0,0.02,0.01,0.0,0.01,0.12,0.03,0.1,0.01,0.02,0.11,0.76,0.23,0.1,0.64,0.75,0.07,0.01,0.01,0.01,0.65,0.39,0.58,0.41,0.3,0.02,0.13,0.49,0.4,0.16,0.19,0.01,0.12,0.82,0.49,0.11,0.03,0.03,0.45,0.13,0.16,0.3,0.04,0.0,0.13,0.47,0.45,0.54,0.44,0.3,0.11,0.19,0.16,0.23,0.13,0.09,0.13,0.03,0.11,0.03,0.11,0.22,0.01,0.0,0.03,0.0,0.01,0.0,0.02,0.58,0.76,0.91,0.78,0.68,0.5,0.4,0.57,0.83,0.21,0.25,0.8,0.82,0.65,0.76,0.73,0.83,0.7,0.53,0.16,0.3,0.22,0.43,0.26,0.36,0.77,0.91,0.16,0.19,0.25,0.2,0.37,0.63,0
.46,0.4,0.39,0.15,0.17,0.53,0.51,0.21,0.31,0.39,0.44,0.85,0.19,0.25,0.14,0.33,0.43,0.24,0.22,0.79,0.16,0.41
75%,2022.0,25903954.0,0.88,0.87,0.41,0.6,0.5,0.63,0.29,0.23,0.27,0.19,0.2,0.41,0.22,0.26,0.27,0.25,0.42,0.27,0.19,0.48,0.5,0.35,0.18,0.2,0.39,0.37,0.28,0.26,0.23,0.16,0.32,0.33,0.17,0.36,0.15,0.26,0.44,0.23,0.14,0.18,0.03,0.44,0.38,0.33,0.69,0.9,0.51,0.28,0.26,0.17,0.1,0.11,0.02,0.05,0.23,0.14,0.06,0.12,0.01,0.32,0.26,0.37,0.29,0.45,0.69,0.48,0.25,0.45,0.16,0.01,0.02,0.01,0.16,0.17,0.35,0.1,0.17,0.04,0.34,0.34,0.44,0.41,0.42,0.13,0.18,0.1,0.31,0.04,0.13,0.01,0.31,0.36,0.24,0.02,0.09,0.02,0.25,0.27,0.19,0.01,0.08,0.0,0.19,0.25,0.77,0.3,0.07,0.02,0.04,0.27,0.0,0.18,0.34,0.38,0.23,0.17,0.47,0.42,0.39,0.35,0.31,0.13,0.36,0.09,0.14,0.35,0.07,0.41,0.68,0.57,0.77,0.49,0.63,0.12,0.17,0.42,0.19,0.13,0.31,0.29,0.18,0.12,0.02,0.35,0.13,0.2,0.16,0.21,0.18,0.55,0.24,0.18,0.18,0.23,0.3,0.19,0.36,0.33,0.24,0.26,0.12,0.38,0.44,0.4,0.16,0.12,0.14,0.02,0.02,0.35,0.02,0.25,0.01,0.08,0.26,0.15,0.17,0.0,0.0,0.38,0.21,0.22,0.24,0.02,0.2,0.2,0.27,0.04,0.24,0.19,0.24,0.02,0.29,0.2,0.17,0.15,0.12,0.4,0.02,0.06,0.14,0.48,0.36,0.86,0.76,0.67,0.93,0.89,0.88,0.99,0.29,0.82,0.98,0.9,0.87,0.8,0.79,0.79,0.51,0.91,0.85,0.56,0.87,0.56,0.2,0.47,0.55,0.74,0.56,0.58,0.85,0.48,0.82,0.85,0.9,0.91,0.49,0.61,0.54,0.74,0.87,0.91,0.72,0.75,0.73,0.53,0.2,0.54,0.53,0.56,0.51,0.36,0.7,0.51,0.62,0.23,0.64,0.45,0.55,0.25,0.41,0.57,0.47,0.74,0.35,0.68,0.61,0.72,0.46,0.33,0.35,0.34,0.33,0.4,0.68,0.46,0.35,0.47,0.33,0.52,0.34,0.47,0.84,0.36,0.42,0.31,0.37,0.58,0.35,0.36,0.28,0.25,0.22,0.67,0.72,0.96,0.25,0.18,0.16,0.18,0.09,0.11,0.16,0.23,0.01,0.01,0.03,0.02,0.01,0.02,0.15,0.05,0.13,0.02,0.03,0.15,0.88,0.36,0.14,0.73,0.84,0.11,0.03,0.02,0.02,0.79,0.47,0.74,0.53,0.38,0.04,0.16,0.62,0.54,0.24,0.26,0.02,0.16,0.93,0.71,0.14,0.04,0.07,0.58,0.2,0.22,0.41,0.05,0.0,0.16,0.63,0.59,0.7,0.6,0.44,0.15,0.28,0.21,0.34,0.16,0.13,0.17,0.03,0.14,0.05,0.14,0.3,0.02,0.01,0.04,0.01,0.01,0.01,0.04,0.7,0.82,0.93,0.89,0.83,0.6,0.47,0.69,0.87,0.29,0.31,0.86,0.86,0.79,0.84,0.77,0.89,0.76,0.6,0.2,0.4,0.26,0.53,0.34,0.41,0.82,0.93,0.18,0.23,0
.31,0.25,0.46,0.7,0.52,0.46,0.5,0.2,0.22,0.65,0.54,0.27,0.38,0.47,0.48,0.88,0.19,0.3,0.16,0.39,0.43,0.24,0.22,0.79,0.16,0.41
max,2024.0,1176678702.0,1.0,1.0,0.94,0.96,0.86,0.98,0.65,0.44,0.55,0.39,0.63,0.75,0.55,0.51,0.48,0.57,0.75,0.4,0.31,0.96,0.95,0.92,0.52,0.52,0.88,0.88,0.69,0.57,0.68,0.36,0.94,0.94,0.4,0.75,0.38,0.77,0.85,0.6,0.33,0.34,0.1,0.78,0.61,0.9,0.98,1.0,0.92,0.75,0.75,0.5,0.27,0.2,0.07,0.17,0.47,0.26,0.17,0.25,0.07,0.71,0.62,0.76,0.66,0.89,0.95,0.89,0.66,0.92,0.44,0.15,0.25,0.38,0.44,0.44,0.78,0.39,0.5,0.41,0.8,0.85,0.96,0.95,0.94,0.49,0.54,0.62,0.86,0.51,0.4,0.22,0.89,0.89,0.85,0.5,0.39,0.38,0.87,0.89,0.62,0.09,0.37,0.04,0.62,0.8,1.0,0.78,0.25,0.1,0.21,0.72,0.01,0.36,0.56,0.7,0.67,0.3,0.97,0.86,0.93,0.91,0.77,0.41,0.9,0.43,0.43,0.89,0.53,0.92,1.0,0.99,1.0,0.97,0.97,0.18,0.34,0.85,0.35,0.3,0.78,0.55,0.39,0.29,0.1,0.83,0.27,0.44,0.34,0.65,0.3,0.97,0.66,0.49,0.39,0.54,0.49,0.36,0.58,0.83,0.62,0.71,0.21,0.93,0.81,0.84,0.34,0.26,0.32,0.05,0.07,0.66,0.06,0.52,0.05,0.2,0.7,0.29,0.4,0.04,0.01,0.87,0.46,0.4,0.36,0.04,0.42,0.35,0.39,0.08,0.5,0.31,0.37,0.06,0.58,0.62,0.35,0.39,0.19,0.66,0.07,0.1,0.27,0.86,0.76,1.0,0.98,0.98,1.0,1.0,0.99,1.0,0.63,0.98,1.0,1.0,0.99,0.94,0.98,0.98,0.94,0.99,0.99,0.81,0.89,0.7,0.2,0.71,0.96,0.76,0.92,0.99,0.99,0.86,0.97,0.99,0.99,0.99,0.67,0.71,0.63,0.89,0.98,0.98,0.94,0.89,0.95,0.7,0.2,0.56,0.57,0.79,0.71,0.7,0.9,0.89,0.88,0.55,0.83,0.75,0.89,0.34,0.73,0.65,0.62,0.89,0.56,0.85,0.8,0.87,0.54,0.48,0.52,0.57,0.4,0.65,0.75,0.55,0.55,0.52,0.45,0.59,0.46,0.53,0.94,0.46,0.46,0.61,0.55,0.6,0.41,0.4,0.39,0.27,0.23,0.76,0.72,1.0,0.58,0.38,0.33,0.38,0.28,0.24,0.31,0.48,0.05,0.04,0.08,0.08,0.03,0.06,0.26,0.21,0.22,0.06,0.08,0.31,1.0,0.7,0.26,0.9,0.98,0.25,0.16,0.09,0.44,0.98,0.81,0.98,0.84,0.67,0.2,0.3,0.96,0.92,0.53,0.66,0.06,0.29,1.0,0.97,0.26,0.18,0.18,0.96,0.36,0.87,0.79,0.17,0.0,0.3,0.98,0.97,0.98,0.94,0.9,0.29,0.76,0.44,0.57,0.36,0.26,0.36,0.09,0.33,0.1,0.44,0.5,0.06,0.03,0.07,0.03,0.06,0.02,0.26,0.8,0.95,0.97,0.97,0.95,0.81,0.74,0.82,0.97,0.54,0.71,0.96,0.97,0.94,0.98,0.94,0.98,0.91,0.77,0.31,0.65,0.47,0.65,0.57,0.57,0.95,0.95,0.23,0.32,0.51,0.67,0.61,0.89,0
.68,0.51,0.87,0.29,0.26,0.8,0.61,0.35,0.54,0.56,0.62,0.97,0.19,0.34,0.2,0.66,0.43,0.24,0.22,0.79,0.16,0.41


Check shape

In [5]:
# (number of rows, number of columns)
orig_df.shape

(8564, 437)

The shape tells us that there are 8564 rows with 437 columns.

In [6]:
# dtype of every column, listed in column order
orig_df.dtypes

countrynewwb          object
codewb                object
year                   int64
pop_adult            float64
regionwb24_hi         object
incomegroupwb24       object
group                 object
group2                object
account_t_d          float64
fiaccount_t_d        float64
mobileaccount_t_d    float64
borrow_any_t_d       float64
fin4_d               float64
dig_acc              float64
fin11_2a             float64
fin11a               float64
fin11b               float64
fin11c               float64
fin11f               float64
fin11d               float64
fin11e               float64
fin14a               float64
fin14b               float64
fin14c               float64
fin14d               float64
fin13_1a             float64
fin13_1b             float64
fin26a               float64
fin26b               float64
fin27a               float64
fin27b               float64
fin17f               float64
fin17a_17a1_d        float64
fin17a               float64
fin17b        

Check first 5 rows

In [7]:
# head() returns the first 5 rows by default
orig_df.head()

Unnamed: 0,countrynewwb,codewb,year,pop_adult,regionwb24_hi,incomegroupwb24,group,group2,account_t_d,fiaccount_t_d,mobileaccount_t_d,borrow_any_t_d,fin4_d,dig_acc,fin11_2a,fin11a,fin11b,fin11c,fin11f,fin11d,fin11e,fin14a,fin14b,fin14c,fin14d,fin13_1a,fin13_1b,fin26a,fin26b,fin27a,fin27b,fin17f,fin17a_17a1_d,fin17a,fin17b,fin17c,fin22d,fin22e,fin22a_22a1_22g_d,fin22a,fin22a_1,fin22b,fin22c,fin24sav,fin24fam,fin24work,fin24bor,fin24sell,fin24other,fin24aVD,fin24aSD,fin24aND,fin24aSD_ND,fin24aP,fin24aN,fin24sav_SD_ND,fin24fam_SD_ND,fin24work_SD_ND,fin24bor_SD_ND,fin24sell_SD_ND,fin24other_SD_ND,fin24sav_VD,fin24fam_VD,fin24work_VD,fin24bor_VD,fin24sell_VD,fin24other_VD,fh1,fin28,fh2,fin29,fin31a_31b,fin30,fin31a,fin31b,fin31d,fin32_33_34a,fin32_33_34b,fin32_33_34c,fin32_33_34d,fin32_33_acc,fin32_33,fin32_n33_34a,fin32_n33_34b,fin32_n33_34c,fin32_n33_34d,fin32_n33_acc,fin32_n33,fin32,fin32_acc,fin34a,fin34b,fin34c,fin34d,fin37_38_39a,fin37_38_39b,fin37_38_39c,fin37_38_39d,fin37_38_39_acc,fin37_38,fin37_39a,fin37_39b,fin37_39c,fin37_39d,fin37_39_acc,fin37,fin38_39a,fin38_39b,fin38_39c,fin38_39d,fin38_39_acc,fin38,fin2_t_d,fin42,fin42_acc,fin43a,fin43b,fin43c,fin43d,fin45a,fin45c,fin45d,fin45e,fin45b,fin25e2,fin9b,fin10,fin22g,fin22h,inactive_t_d,fing2p_acc,fing2p_card,fing2p_cash,fing2p_fin,fing2p_mob,fing2p,g20_made,g20_received,g20_any,merchant_pay,save_any_t_d,fin11_1,fin5w,fin5m,fin5lm,fin5n,fin6w,fin6m,fin6lm,fin6n,fin11_0,fin9a,fin17dw,fin17dm,fin17dlm,fin17e,fin7,fin3,fin19,fin20,fin21,fin24ba,fin24bb,fin24bc,fin24bd,fin24c,fin24d1,fin24d2,fin24d3,fin25e1,fin25e2b,fin25e3w,fin25e3m,fin25e3lm,fin25e4a,fin25e4b,fin25e4c,fin25e4d,fin25e4e,fh2a,fin31c,fin36a,fin36b,fin40a,fin40b,fin36Aa,fin36Ab,fin8,fin13aw,fin13am,fin13alm,fin13an,fin13bw,fin13bm,fin13blm,fin13bn,fin13cw,fin13cm,fin13clm,fin13cn,fin13e,fin13f,fin13f_1,fin15,fin16,fin22f,fin41,fin35,fin44,fh1_fh2,fin28_29,fin31d_s,fin32_n33_34c_s,fin34c_s,fin43c_s,fin32_acc_s,fin34a_s,fin32_33_acc_s,inactive_t_d_s,fin
g2p_fin_s,fin32_33_34a_s,fin32_n33_acc_s,fin37_39_acc_s,fin37_39c_s,fin31a_31b_s,fin31a_s,fin31b_s,fin32_n33_34a_s,fin37_39a_s,fin34d_s,fin32_33_34d_s,fin32_n33_34d_s,fing2p_card_s,fin37_39d_s,fin42_acc_s,fin32_33_34c_s,fin37_38_39c_s,fin38_39c_s,fing2p_acc_s,fing2p_cash_s,fin37_38_39a_s,fin37_38_39_acc_s,fin38_39a_s,fin38_39_acc_s,fin34b_s,fin32_n33_34b_s,fin43b_s,fin27b_s,fin27a_s,fin22h_s,fin28_29_s,fin28_s,fin29_s,fing2p_mob_s,fin37_38_39d_s,fin37_38_39b_s,fin37_39b_s,fin11_2a_s,fin11b_s,fin11f_s,fin11d_s,fin11e_s,fin9b_s,fin11_1_s,fin5m_s,fin6m_s,fin9a_s,fin5w_s,fin6w_s,fin17dm_s,fin17dlm_s,fin25e3w_s,fin25e3m_s,fin24d1_s,fin14d_s,fin24d2_s,fin11a_s,fin11c_s,fin5lm_s,fin6lm_s,fin17dw_s,fin14c_s,fin13_1a_s,fin13_1b_s,fin13am_s,fin13alm_s,fin13bm_s,fin13blm_s,fin13cm_s,fin13clm_s,fin21_s,fin14b_s,fin13cw_s,fin13f_s,fin14a_s,fin25e3lm_s,fin13aw_s,fin13bw_s,fin24d3_s,fin5n_s,fin6n_s,fin13f_1_s,fin32_33_34b_s,con1,con2a,con2b,con2c,con2d,con2e,con2f,con2g,con3a,con3b,con3c,con3d,con3e,con3f,con3g,con4,con5a,con5b,con6,con7,con8,con9a,con9b,con10,con11,con12d,con12w,con12m,con12lm,con13,con14,con15,con16,con17a,con17b,con17c,con17d,con18,con19,con20,con21,con22,con23,internet,con26d,con26w,con26m,con26lm,con27,con28d,con28w,con28m,con28lm,con28n,con29,con30a,con30b,con30c,con30d,con30e,con30f,con30g,con30h,con31a,con31b,con31c,con31d,con31e,con31f,con31g,con31h,con32a,con32b,con32c,con32d,con32e,con32f,con32g,con32h,con10_s,con11_s,con12d_s,con14_s,con16_s,con17a_s,con17b_s,con18_s,con19_s,con20_s,con21_s,con26d_s,con27_s,con28m_s,con30a_s,con30b_s,con30c_s,con30d_s,con30e_s,con30f_s,con30g_s,con30h_s,con31a_s,con31b_s,con31f_s,con2a_s,con15_s,con17d_s,con29_s,con31d_s,con31h_s,con32a_s,con3a_s,con4_s,con28d_s,con28w_s,con23_s,con31c_s,con2b_s,con2d_s,con26w_s,con2c_s,con2e_s,con2g_s,con5b_s,con12m_s,con26lm_s,con12w_s,con2f_s,con13_s,con26m_s,con28lm_s,con5a_s,con17c_s,con32h_s
0,Afghanistan,AFG,2011,14575546.0,South Asia (excluding high income),Low income,all,all,0.09,0.09,,,,,,,,,,,,,,,,,,,,,,,0.03,0.03,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.05,,,,,,,,,,,,,,0.01,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,Albania,ALB,2011,2281010.0,Europe & Central Asia (excluding high income),Upper middle income,all,all,0.28,0.28,,,,,,,,,,,,,,,,,,,,,,,0.09,0.09,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.21,,,,,,,,,,,,,,0.11,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,Algeria,DZA,2011,26251587.0,Middle East & North Africa (excluding high inc...,Lower middle income,all,all,0.33,0.33,,,,,,,,,,,,,,,,,,,,,,,0.04,0.04,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.14,,,,,,,,,,,,,,0.01,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,Angola,AGO,2011,12779501.0,Sub-Saharan Africa (excluding high income),Lower middle income,all,all,0.39,0.39,,,,,,,,,,,,,,,,,,,,,,,0.16,0.16,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.3,,,,,,,,,,,,,,0.15,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,Argentina,ARG,2011,30685516.0,Latin America & Caribbean (excluding high income),Upper middle income,all,all,0.33,0.33,,,,,,,,,,,,,,,,,,,,,,,0.04,0.04,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.3,,,,,,,,,,,,,,0.22,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


The first 5 rows tell us the following:
1. There are 8 dimensions (`countrynewwb`, `codewb`, `year`, `pop_adult`, `regionwb24_hi`, `incomegroupwb24`, `group`, and `group2`)
2. Then the rest of the columns must be the indicators (we will investigate next)

## Indicator Check
According to the Global Findex data, there are "almost 300 indicators on topics such as mobile phone ownership, internet use, digital safety, account ownership, payments, saving, credit, and financial resilience."

In [8]:
# Columns that identify or describe a row (economy, year, population, grouping)
# rather than measure something; everything else is treated as an indicator.
dimensions = [
    'countrynewwb', 'codewb', 'year', 'pop_adult',
    'regionwb24_hi', 'incomegroupwb24', 'group', 'group2',
]

# Keep the original column order while dropping the dimension columns
columns = list(orig_df.columns)
indicators = [name for name in columns if name not in dimensions]

print(
    f"There are {len(indicators)} indicators in the dataset.",
    "Indicator list:",
    indicators,
    sep="\n",
)

There are 429 indicators in the dataset.
Indicator list:
['account_t_d', 'fiaccount_t_d', 'mobileaccount_t_d', 'borrow_any_t_d', 'fin4_d', 'dig_acc', 'fin11_2a', 'fin11a', 'fin11b', 'fin11c', 'fin11f', 'fin11d', 'fin11e', 'fin14a', 'fin14b', 'fin14c', 'fin14d', 'fin13_1a', 'fin13_1b', 'fin26a', 'fin26b', 'fin27a', 'fin27b', 'fin17f', 'fin17a_17a1_d', 'fin17a', 'fin17b', 'fin17c', 'fin22d', 'fin22e', 'fin22a_22a1_22g_d', 'fin22a', 'fin22a_1', 'fin22b', 'fin22c', 'fin24sav', 'fin24fam', 'fin24work', 'fin24bor', 'fin24sell', 'fin24other', 'fin24aVD', 'fin24aSD', 'fin24aND', 'fin24aSD_ND', 'fin24aP', 'fin24aN', 'fin24sav_SD_ND', 'fin24fam_SD_ND', 'fin24work_SD_ND', 'fin24bor_SD_ND', 'fin24sell_SD_ND', 'fin24other_SD_ND', 'fin24sav_VD', 'fin24fam_VD', 'fin24work_VD', 'fin24bor_VD', 'fin24sell_VD', 'fin24other_VD', 'fh1', 'fin28', 'fh2', 'fin29', 'fin31a_31b', 'fin30', 'fin31a', 'fin31b', 'fin31d', 'fin32_33_34a', 'fin32_33_34b', 'fin32_33_34c', 'fin32_33_34d', 'fin32_33_acc', 'fin32_33', 'f

There are 429 indicators in the list. We have gone through the Glossary of these indicators and have found that some of them are the same indicator but with different expressions. For example, `con26d`, `con26w`, and `con26m` are internet use, aggregated daily, weekly, and monthly respectively. Therefore we think that there might be 300 **unique** indicators in the list, while the rest are different aggregations of the data.

## Country Check

In [9]:
# Distinct World Bank country/economy codes, in order of first appearance
countries = orig_df['codewb'].unique()
print(
    f"There are {len(countries)} countries in the dataset.",
    "Country list:",
    countries,
    sep="\n",
)

There are 174 countries in the dataset.
Country list:
['AFG' 'ALB' 'DZA' 'AGO' 'ARG' 'ARM' 'AUS' 'AUT' 'AZE' 'BHR' 'BGD' 'BLR'
 'BEL' 'BEN' 'BOL' 'BIH' 'BWA' 'BRA' 'BGR' 'BFA' 'BDI' 'KHM' 'CMR' 'CAN'
 'CAF' 'TCD' 'CHL' 'CHN' 'COL' 'COM' 'COD' 'COG' 'CRI' 'HRV' 'CYP' 'CZE'
 'DNK' 'DJI' 'DOM' 'ECU' 'EGY' 'SLV' 'EST' 'SWZ' 'FIN' 'FRA' 'GAB' 'GEO'
 'DEU' 'GHA' 'GRC' 'GTM' 'GIN' 'HTI' 'HND' 'HKG' 'HUN' 'IND' 'IDN' 'IRN'
 'IRQ' 'IRL' 'ISR' 'ITA' 'JAM' 'JPN' 'JOR' 'KAZ' 'KEN' 'KOR' 'XKX' 'KWT'
 'KGZ' 'LAO' 'LVA' 'LBN' 'LSO' 'LBR' 'LTU' 'LUX' 'MDG' 'MWI' 'MYS' 'MLI'
 'MLT' 'MRT' 'MUS' 'MEX' 'MDA' 'MNG' 'MNE' 'NPL' 'NLD' 'NZL' 'NIC' 'NER'
 'NGA' 'MKD' 'OMN' 'PAK' 'PAN' 'PRY' 'PER' 'PHL' 'POL' 'PRT' 'QAT' 'ROU'
 'RUS' 'RWA' 'SAU' 'SEN' 'SRB' 'SLE' 'SGP' 'SVK' 'SVN' 'ZAF' 'ESP' 'LKA'
 'SDN' 'SWE' 'SYR' 'TWN' 'TJK' 'TZA' 'THA' 'TGO' 'TTO' 'TUR' 'TKM' 'UGA'
 'UKR' 'ARE' 'GBR' 'USA' 'URY' 'UZB' 'VEN' 'VNM' 'PSE' 'YEM' 'ZMB' 'ZWE'
 'BLZ' 'BTN' 'CIV' 'ETH' 'MMR' 'NAM' 'NOR' 'PRI' 'SOM' 'CHE' 'TUN' 'GM

For this analysis, we are interested in the ASEAN 5, plus Singapore and the global average (`WLD`) as a benchmark:
1. `PHL`: Philippines
2. `IDN`: Indonesia
3. `THA`: Thailand
4. `VNM`: Vietnam
5. `MYS`: Malaysia
6. `SGP`: Singapore
7. `WLD`: World

## Year Check

In [10]:
# Distinct survey years present in the raw data, in order of first appearance
years = orig_df['year'].unique()
# The count here is of years, so the message is labelled "years" (it previously said "countries").
print(f"There are {len(years)} years in the dataset.")
print("Year list:")
print(years)

There are 6 countries in the dataset.
Year list:
[2011 2014 2017 2021 2022 2024]


This confirms that the data spans 13 years (2011–2024). We are only interested in the last 10 years, so we will exclude 2011 from our analysis.

# DATA PREPARATION
In this section, we'll prepare the dataset we're going to use for our analysis.

1. We will keep only the rows for the ASEAN 5, Singapore, and World (filtering on the `codewb` column).
2. We will remove 2011 from the `year` values.
3. We will keep the following indicators (please see the next section)

## SECTION HERE ON INDICATORS TO USE

In [11]:
# Work on an independent copy so that orig_df keeps the raw data as loaded
df = orig_df.copy(deep=True)

In [12]:
# Country codes kept for the analysis (matched against the `codewb` column)
asean_5 = [
    'PHL',  # Philippines
    'IDN',  # Indonesia
    'THA',  # Thailand
    'VNM',  # Vietnam
    'MYS',  # Malaysia
    'SGP',  # Singapore
    'WLD',  # World
]

In [13]:
# Keep only the rows whose country code is in the asean_5 list
df = df.loc[df['codewb'].isin(asean_5)]

In [14]:
# Drop the 2011 survey wave; every other year is kept
df = df.loc[df['year'].ne(2011)]

In [15]:
# (rows, columns) of df after the country and year filters
df.shape

(319, 437)

We're down to 319 rows!

In [16]:
# Confirm that only the selected country codes remain after filtering
countries = df['codewb'].unique()
print(
    f"There are {len(countries)} countries in the dataset.",
    "Country list:",
    countries,
    sep="\n",
)

There are 7 countries in the dataset.
Country list:
['IDN' 'MYS' 'PHL' 'SGP' 'THA' 'VNM' 'WLD']


In [17]:
# Confirm which survey years remain after dropping 2011
years = df['year'].unique()
# The count here is of years, so the message is labelled "years" (it previously said "countries").
print(f"There are {len(years)} years in the dataset.")
print("Year list:")
print(years)

There are 5 countries in the dataset.
Year list:
[2014 2017 2021 2022 2024]


In [18]:
# Summarise the filtered frame (row count, column count, dtypes, memory).
# DataFrame.info() writes its report to stdout and returns None, so it is
# called directly; wrapping it in print() adds a stray "None" line.
df.info()

<class 'pandas.core.frame.DataFrame'>
Index: 319 entries, 202 to 7936
Columns: 437 entries, countrynewwb to con32h_s
dtypes: float64(430), int64(1), object(6)
memory usage: 1.1+ MB
None


## Saving processed data for analysis

In [19]:
# Destination of the filtered dataset used by the analysis
file_path = '../data/processed/global_findex_for_analysis.csv'

# An existing file is never overwritten. If the filters above change,
# delete the old CSV before re-running, otherwise it stays stale.
if not os.path.exists(file_path):
    # to_csv does not create missing parent folders, so make sure the
    # output directory exists (e.g. on a fresh checkout).
    os.makedirs(os.path.dirname(file_path), exist_ok=True)
    df.to_csv(file_path, index=False)
    print("File saved successfully!")
else:
    print("File already exists. Skipping save.")

File already exists. Skipping save.


We have now filtered the data for what we need for our analysis. We will then investigate the missingness of the data and see how we must handle them.

# HANDLING MISSINGNESS
(Draft still but):
1. "If the variable is not gonna be needed, it does not matter whether the particular item is missing or not and should be excluded in the subset of dataframe before applying listwise deletion." - so by selecting the variables that we need, we already have handled an important part here.
2. Since this is a survey, I think the data is **MCAR**. Most likely, the data is missing simply because the variable was not measured in that year. My hunch is that most of the missing values fall in years when the indicator was not collected (will have to confirm).