## Extract HH variables for equity stratifiers
### **Residence, Region, Wealth, Ethnicity of HoH**

In [3]:
# %load std_imports.py
from pathlib import Path

import numpy as np
import pandas as pd

import json
import pyreadstat

from std_utils import (
    read_file,
    run_quality_assurance,
    generate_HHID,
    merge_hh_hl_data,
    subset_hl_df,
    standardize_col_names,
    standardize_col_values,
    create_elderly_hoh,
    save_merge,
    export_analyzed_data
)

# Notebook display limits: show up to 1500 rows, and do not cap the number
# of columns (None disables the limit).
pd.options.display.max_rows = 1500
pd.options.display.max_columns = None


In [4]:
# Run configuration read by the per-year processing loop
country = 'VNM'        # country identifier handed to every std_utils helper
recode = 'household'   # recode identifier handed to every std_utils helper

# The same four stratifier variables go to both the column-name and the
# column-value standardization steps; the lists are kept as separate objects.
var_rename = ['residence', 'region', 'wealth', 'eth_hoh']
var_replace = list(var_rename)

# -------------------------------------------------------------------
# Survey years to process, in this order
year_list = ['2000', '2006', '2011', '2014', '2021']
# -------------------------------------------------------------------


In [5]:
for year in year_list:
    # Positional arguments shared by every std_utils call for this survey year
    survey_args = (country, year, recode)

    # Load the file for this year
    df = read_file(*survey_args)

    # Build the HHID used to merge HH and HL data. The return value is not
    # captured, so this presumably adds HHID to df in place — TODO confirm
    # against std_utils.generate_HHID.
    generate_HHID(df, *survey_args)

    # Harmonize column names, then column values, for the stratifier variables
    df = standardize_col_names(df, *survey_args, var_rename)
    df = standardize_col_values(df, *survey_args, var_replace)

    # Hand the standardized frame to save_merge (merge folder)
    save_merge(df, *survey_args)

The file -- hh_2000.sav -- has the following shape: Rows: 7628; Columns: 54
HHID is unique
The file -- hh_2006.sav -- has the following shape: Rows: 8356; Columns: 102
HHID is unique
The file -- hh_2011.sav -- has the following shape: Rows: 11874; Columns: 127
HHID is unique
The file -- hh_2014.sav -- has the following shape: Rows: 10200; Columns: 147
HHID is unique
The file -- hh_2021.sav -- has the following shape: Rows: 14000; Columns: 382
HHID is unique
