## Extract HL variables for equity stratifiers
### **Age and Sex HoH**

In [1]:
# %load std_imports.py
from pathlib import Path

import numpy as np
import pandas as pd

import json
import pyreadstat

from std_utils import (
    read_file,
    run_quality_assurance,
    generate_HHID,
    merge_hh_hl_data,
    subset_hl_df,
    standardize_col_names,
    standardize_col_values,
    create_elderly_hoh,
    save_merge,
    export_analyzed_data
)

# Display settings for this notebook: show up to 1500 rows and never
# truncate the column list when a frame is rendered.
pd.options.display.max_rows = 1500
pd.options.display.max_columns = None


In [2]:
# Run configuration read by the per-year processing loop.
country = "VNM"   # passed to the std_utils helpers on every call
recode = "listing"   # passed alongside country and year to the std_utils helpers
var_subset = "relationship_hoh"   # key given to subset_hl_df
var_rename = ["elderly_hoh", "sex_hoh"]   # given to standardize_col_names; the first entry also goes to create_elderly_hoh
var_replace = ["sex_hoh"]   # given to standardize_col_values

# -------------------------------------------------------------------
# Survey rounds to process, stored as strings.
year_list = [str(survey_year) for survey_year in (2000, 2006, 2011, 2014, 2021)]
# -------------------------------------------------------------------


In [3]:
# Run the same pipeline for every entry in year_list: read the file, build
# the HHID key, subset, standardize names and values, derive the elderly-HoH
# variable, then save the result to the merge folder.
# `df` is rebound on each pass, so after the loop only the object from the
# last year remains in the notebook namespace.
for year in year_list:

    # Read file for this country / year / recode combination
    df = read_file(country, year, recode)

    # Create HHID to facilitate merge of HH and HL data
    # NOTE(review): the return value is discarded here, unlike every step
    # below; presumably generate_HHID adds the key to df in place -- TODO confirm.
    generate_HHID(df, country, year, recode)

    # Subset df using the var_subset key ('relationship_hoh')
    df = subset_hl_df(df, country, year, recode, var_subset)

    # Standardize column names (var_rename lists the names involved)
    df = standardize_col_names(df, country, year, recode, var_rename)

    # Standardize column values (var_replace lists the columns involved)
    df = standardize_col_values(df, country, year, recode, var_replace)

    # Create Elderly HoH; var_rename[0] is 'elderly_hoh'
    df = create_elderly_hoh(df, var_rename[0])

    # Save to merge folder
    save_merge(df, country, year, recode)

The file -- hl_2000.sav -- has the following shape: Rows: 35657; Columns: 99
HHID is NOT unique
The merge variable *HHID* is unique: True
The file -- hl_2006.sav -- has the following shape: Rows: 36573; Columns: 154
HHID is NOT unique
The merge variable *HHID* is unique: True
The file -- hl_2011.sav -- has the following shape: Rows: 44831; Columns: 64
HHID is NOT unique
The merge variable *HHID* is unique: True
The file -- hl_2014.sav -- has the following shape: Rows: 39380; Columns: 50
HHID is NOT unique
The merge variable *HHID* is unique: True
The file -- hl_2021.sav -- has the following shape: Rows: 47821; Columns: 73
HHID is NOT unique
The merge variable *HHID* is unique: True
