# LEEP 2024 Multi-Country CEA

In [1]:
import numpy as np
import pandas as pd
import squigglepy as sq
# from squigglepy.numbers import K

pd.set_option('display.float_format', lambda x: f'{x:,.3f}')
idx = pd.IndexSlice

COUNTRIES = ["Malawi", "Madagascar", "Sierra Leone", "Liberia", "Angola", "Pakistan",
             "Niger", "Zimbabwe", "Bolivia", "Ghana", "Nigeria", "Cote d'Ivoire", "Senegal"]
SCENARIOS = ["Counterfactual", "LEEP intervention"]
YEARS = range(2021, 2101)

# N = 100*K
N = 10
SAMPLES = range(N)

SAMPLE_YEAR_INDEX = pd.MultiIndex.from_product(
    [SAMPLES, YEARS], names=["Sample", "Year"])
SCENARIO_SAMPLE_INDEX = pd.MultiIndex.from_product(
    [SCENARIOS, SAMPLES], names=["Scenario", "Sample"])
SCENARIO_SAMPLE_YEAR_INDEX = pd.MultiIndex.from_product(
    [SCENARIOS, SAMPLES, YEARS], names=["Scenario", "Sample", "Year"])

## Inputs

### Population

The population and projected future population estimates for each country are from the [UN population projections](https://population.un.org/wpp/Download/Standard/CSV/).

In [2]:
# TODO(drw): Could use uncertainty estimates here?
population = pd.read_csv('population.csv', index_col=0)
population.head()

Unnamed: 0_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
2021,19889742,28915652,8420642,5193422,34503776,231402110,25252722,15993525,12079474,32833036,213401330,27478250,16876726
2022,20405318,29611718,8605723,5302690,35588996,235824860,26207982,16320539,12224114,33475870,218541220,28160548,17316452
2023,20931750,30325736,8791092,5418378,36684212,240485660,27202844,16665407,12388575,34121990,223804640,28873040,17763164
2024,21475962,31056608,8977979,5536954,37804630,245209810,28238976,17020320,12567344,34777524,229152220,29603304,18221560
2025,22033992,31797310,9165381,5657236,38942796,249948880,29315974,17375286,12746151,35439790,234573600,30344186,18687806


### Births

Projections of future annual births in each country are from the [UN population projections](https://population.un.org/wpp/Download/Standard/Population/).

In [3]:
# TODO(drw): Could use uncertainty estimates here?
births = pd.read_csv('births.csv', index_col=0)
births.head()

Unnamed: 0_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
2021,653703,895045,264106,162685,1338792,6374741,1144371,488807,263820,904679,7923294,932943,549984
2022,665678,906130,265023,164452,1359723,6424944,1180654,491195,264070,906677,8002758,943133,555696
2023,678962,918152,266774,166979,1381742,6474370,1216927,493840,263936,909913,8109136,959962,562482
2024,687950,927190,267219,169153,1404185,6512176,1256001,496655,265235,911299,8234399,974998,568369
2025,698306,937701,268121,171399,1426882,6559877,1296167,498207,266191,916924,8321052,989981,575820


### Decline in lead market share once enforcement/compliance begins

We estimate that, once enforcement/compliance begins, the market share captured by lead-based paint will decline at a rate of 20% annually. This is a conservative estimate relative to our compliance goal: in the majority of our target countries, we aim to achieve 50% compliance a year after regulation is implemented and enforcement begins. [Follow up study](https://leadelimination.org/malawi-follow-up-study/) data from Malawi suggests that our compliance goals are achievable, as do preliminary reports of manufacturers representing >50% of market share switching to lead-free alternatives in Pakistan, Ghana, and Zimbabwe.

In [4]:
decline_in_lead_market_share_once_enforcement_compliance_begins = pd.Series(
    sq.norm(-0.3, -0.1) @ N)
decline_in_lead_market_share_once_enforcement_compliance_begins.head()

0   -0.199
1   -0.091
2   -0.178
3   -0.187
4   -0.198
dtype: float64

### % of new painted homes that use some colored solvent based lead paint

To develop this estimate, we surveyed members of the LEEP team to understand their best guess of the portion of homes that use some coloured solvent-based paints in the countries where they work. We averaged the estimates provided by LEEP’s team members, which gave us the estimate that coloured solvent-based paint is used in 80% of new painted homes in the LMICs included in this model. We are uncertain of this estimate given the difficulty of approximating this input across the variety of painting practices used in LMICs.

In [5]:
pct_of_new_painted_homes_that_use_some_colored_solvent_based_lead_paint = pd.Series(
    sq.lognorm(0.65, 0.9) @ N)
pct_of_new_painted_homes_that_use_some_colored_solvent_based_lead_paint.head()

0   0.627
1   0.910
2   0.843
3   0.742
4   0.684
dtype: float64

### Lead market share of colored solvent based paints (2021)

In [6]:
lead_market_share_of_colored_solvent_based_paints_2021 = pd.DataFrame(
    np.array(
        [sq.lognorm(0.60, 0.83) @ N,
         sq.lognorm(0.60, 0.83) @ N,
         sq.lognorm(0.32, 0.44) @ N,
         sq.lognorm(0.60, 0.83) @ N,
         sq.lognorm(0.48, 0.66) @ N,
         sq.lognorm(0.52, 0.72) @ N,
         sq.lognorm(0.32, 0.44) @ N,
         sq.lognorm(0.52, 0.72) @ N,
         sq.lognorm(0.32, 0.44) @ N,
         sq.lognorm(0.16, 0.22) @ N,
         sq.lognorm(0.68, 0.94) @ N,
         sq.lognorm(0.60, 0.83) @ N,
         sq.lognorm(0.60, 0.83) @ N]).T,
    columns=COUNTRIES)
lead_market_share_of_colored_solvent_based_paints_2021.head()

Unnamed: 0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
0,0.605,0.787,0.422,0.659,0.539,0.646,0.42,0.572,0.381,0.219,0.742,0.756,0.601
1,0.786,0.661,0.39,0.688,0.565,0.627,0.349,0.509,0.362,0.183,0.859,0.722,0.691
2,0.764,0.637,0.364,0.716,0.597,0.576,0.395,0.544,0.369,0.194,0.724,0.613,0.558
3,0.753,0.651,0.444,0.727,0.505,0.586,0.387,0.592,0.375,0.19,0.749,0.775,0.603
4,0.592,0.654,0.339,0.685,0.714,0.57,0.374,0.581,0.345,0.185,0.762,0.821,0.74


### Annual time discount rate

We discount future costs and benefits at a rate of 4% per year, in line with [GiveWell](https://docs.google.com/spreadsheets/d/1B1fODKVbnGP4fejsZCVNvBm5zvI1jC7DhkaJpFk6zfo/edit#gid=1362437801). There is debate over the appropriate discount rate. [Haacker, Hallett, and Atun (2020)](https://academic.oup.com/heapol/article/35/1/107/5591528) found that 85% of 188 global health CEAs used a discount of 3% for both health and costs. Given the 100-year timeframe of this model, this is an important factor (e.g. a value of 1 in year 1 discounted by 4% per year would be 0.46 in year 20, 0.14 in year 50, and 0.06 by year 70; whereas using a discount rate of 3% would give a value of 0.55 in year 20, 0.23 in year 50, and 0.13 by year 70).

In [7]:
annual_time_discount_rate = pd.Series(sq.norm(0.03, 0.05) @ N)
annual_time_discount_rate.head()

0   0.049
1   0.038
2   0.034
3   0.049
4   0.040
dtype: float64

### Discount factor

In [8]:
discount_factor = pd.DataFrame(
    np.array(
        [1/(1 + annual_time_discount_rate)**(year - YEARS[0]) for year in YEARS]).T,
    columns=YEARS)
discount_factor.head()

Unnamed: 0,2021,2022,2023,2024,2025,2026,2027,2028,2029,2030,...,2091,2092,2093,2094,2095,2096,2097,2098,2099,2100
0,1.0,0.953,0.909,0.866,0.826,0.787,0.75,0.715,0.682,0.65,...,0.035,0.033,0.032,0.03,0.029,0.028,0.026,0.025,0.024,0.023
1,1.0,0.963,0.928,0.894,0.861,0.829,0.799,0.769,0.741,0.714,...,0.073,0.07,0.067,0.065,0.063,0.06,0.058,0.056,0.054,0.052
2,1.0,0.967,0.935,0.904,0.875,0.846,0.818,0.791,0.765,0.74,...,0.096,0.093,0.09,0.087,0.084,0.081,0.078,0.076,0.073,0.071
3,1.0,0.954,0.909,0.867,0.827,0.789,0.752,0.717,0.684,0.652,...,0.036,0.034,0.033,0.031,0.03,0.028,0.027,0.026,0.025,0.024
4,1.0,0.962,0.925,0.889,0.855,0.822,0.79,0.76,0.731,0.703,...,0.064,0.062,0.06,0.057,0.055,0.053,0.051,0.049,0.047,0.045


### Increase in BLL from living in a home with lead paint

In [9]:
increase_in_bll_from_living_in_a_home_with_lead_paint = pd.Series(
    sq.norm(0.7, 3.0) @ N)
increase_in_bll_from_living_in_a_home_with_lead_paint.head()

0   2.281
1   1.927
2   0.800
3   0.735
4   2.151
dtype: float64

### Implied % of childhood BLL caused by lead paint initially

In [10]:
# TODO(drw): This formula references non-inputs

### Probability of success

We calculate a probability of success for each country, which encapsulates our estimate of the likelihood that our intervention that country is likely to succeed in its implementation, and hence that its associated benefits will be realised. These figures were estimated by the LEEP team based on knowledge of each country and an assessment of current progress towards implementation in each country. Overall, our probability of success estimates are relatively high, since they mostly capture the “stochastic” possibility of failure due to events such as unexplained government withdrawal / reversal, or political instability, which we feel to be relatively unlikely. The possibility of implementation being delayed, on the other hand, is already captured in our uncertainty intervals around intervention start dates.

We multiply total discounted benefits by these probabilities of success to get total expected discounted benefits, and calculate the final cost-effectiveness number as total discounted costs divided by total expected discounted benefits. We choose only to weight benefits, and not costs, by the probabilities of success, in order to be conservative and reflect the possibility that failure occurs even despite government and LEEP costs having already been incurred.


In [11]:
probability_of_success = pd.DataFrame(
    np.array(
        [sq.lognorm(0.85, 0.95) @ N,
         sq.lognorm(0.75, 0.85) @ N,
         sq.lognorm(0.70, 0.80) @ N,
         sq.lognorm(0.65, 0.75) @ N,
         sq.lognorm(0.75, 0.85) @ N,
         sq.lognorm(0.85, 0.95) @ N,
         sq.lognorm(0.70, 0.80) @ N,
         sq.lognorm(0.75, 0.85) @ N,
         sq.lognorm(0.70, 0.80) @ N,
         sq.lognorm(0.75, 0.85) @ N,
         sq.lognorm(0.75, 0.85) @ N,
         sq.lognorm(0.70, 0.80) @ N,
         sq.lognorm(0.70, 0.80) @ N,]).T,
    columns=COUNTRIES)

probability_of_success.head()

Unnamed: 0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
0,0.894,0.824,0.74,0.694,0.772,0.834,0.761,0.859,0.811,0.793,0.814,0.737,0.708
1,0.872,0.822,0.693,0.671,0.824,0.88,0.775,0.803,0.727,0.814,0.82,0.754,0.775
2,0.836,0.779,0.743,0.688,0.774,0.932,0.746,0.815,0.728,0.808,0.741,0.778,0.748
3,0.901,0.821,0.76,0.67,0.807,0.925,0.803,0.793,0.78,0.799,0.776,0.784,0.754
4,0.853,0.763,0.722,0.731,0.783,0.913,0.722,0.792,0.746,0.827,0.823,0.775,0.75


## Births with averted lead paint exposure

### Number of homes painted

#### People per household

We use recent data on average household size from the [Global Data Lab](https://globaldatalab.org/areadata/table/hhsize/AGO+CIV+GHA+LBR+MDG+MWI+NER+NGA+SEN+SLE+ZWE+BOL+PAK/?levels=1+4). We assume that average household size will decrease at a constant rate of 1% annually across countries. Average household size in high income countries is approximately 2.5, thus we treat this value as a long term minimum assumption in our estimates. Our estimate for people per household is used to calculate the total number of homes within a country. Our model is relatively insensitive to this input because the proportion of homes exposed to lead paint has a greater effect on our final estimate of cost-effectiveness than the absolute number of homes within the country.

In [12]:
PEOPLE_PER_HOUSEHOLD_INIT = pd.Series([3.96, 4.18, 9.01, 4.33, 6.45, 8.21, 7.45, 3.27, 4.86, 4.22, 6.86, 2.81, 10.8],
                                      index=COUNTRIES)
PEOPLE_PER_HOUSEHOLD_MIN = 2.5
PEOPLE_PER_HOUSEHOLD_RATE = -0.01

people_per_household = pd.DataFrame(
    np.array(
        [np.maximum(
            PEOPLE_PER_HOUSEHOLD_INIT * (1 + PEOPLE_PER_HOUSEHOLD_RATE)**(year - YEARS[0]), PEOPLE_PER_HOUSEHOLD_MIN)
         for year in YEARS]),
    index=YEARS, columns=COUNTRIES)
people_per_household.head()

Unnamed: 0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
2021,3.96,4.18,9.01,4.33,6.45,8.21,7.45,3.27,4.86,4.22,6.86,2.81,10.8
2022,3.92,4.138,8.92,4.287,6.386,8.128,7.375,3.237,4.811,4.178,6.791,2.782,10.692
2023,3.881,4.097,8.831,4.244,6.322,8.047,7.302,3.205,4.763,4.136,6.723,2.754,10.585
2024,3.842,4.056,8.742,4.201,6.258,7.966,7.229,3.173,4.716,4.095,6.656,2.727,10.479
2025,3.804,4.015,8.655,4.159,6.196,7.886,7.156,3.141,4.668,4.054,6.59,2.699,10.374


#### Number of homes

In [13]:
number_of_homes = (population / people_per_household)
number_of_homes.head()

Unnamed: 0_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Year,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
2021,5022662.121,6917620.096,934588.457,1199404.619,5349422.636,28185397.077,3389627.114,4890986.239,2485488.477,7780340.284,31108065.598,9778736.655,1562659.815
2022,5204907.152,7155700.063,964777.968,1237009.821,5573407.877,29014242.301,3553383.771,5041404.566,2540656.358,8012798.602,32179111.818,10122775.082,1619570.894
2023,5393118.513,7402265.856,995514.626,1276765.132,5802953.503,29886539.953,3725526.432,5199933.415,2600846.349,8249953.699,33286994.276,10483729.418,1678132.239
2024,5589228.4,7657238.157,1026947.425,1317884.758,6040594.647,30781451.838,3906493.336,5364316.387,2665027.225,8493381.351,34426618.705,10857461.081,1738826.363
2025,5792382.371,7919054.298,1058973.162,1360114.973,6285309.045,31693285.257,4096446.4,5531506.548,2730247.458,8742545.685,35597068.878,11241606.869,1801332.079


#### Growth in the paint market

We use data from a [variety of sources](https://docs.google.com/spreadsheets/d/1bIiee05WlPt4B7NV3uvol2vu5JVbwOvL/edit#gid=508218074)  – IndustryArc, European Coatings, and Emerald Group, among others – to calculate an initial paint market growth rate of 5.5%. We arrive at this estimate by considering the average of the paint market growth rates from these sources, which is 5.75%. However, these growth rates correspond to a range of different countries and regions, and reflect growth in the paint market as a whole, rather than in the portion of the market that is specifically captured by home-use paints. Therefore, to be more conservative, we choose 5.5% as the initial value in 2021. 5.5% is also in line with a 20-year average of the World Bank’s estimate for real [GDP growth](https://data.worldbank.org/indicator/NY.GDP.MKTP.KD.ZG?locations=XO) in low- and middle-income countries (LMICs), which we would expect to approximate future GDP growth and correlate with paint market growth.

We assume that the paint market growth rate decreases by 0.03% per year (i.e. 5.5% in year 1, 5.47% in year 2). We expect that once all existing homes within a country are painted, then growth in the paint market will be roughly equal to population growth from that point forward. To reflect our expectation that growth in the paint market will converge with population growth in the long term, we treat the population growth rate in each country as the long term minimum for paint market growth.

This figure is a simplification in that we use one estimate of paint market growth rate for all countries within our model, rather than calculating unique growth rates for each country.


In [14]:
growth_in_the_paint_market = pd.Series(sq.norm(0.025, 0.08) @ N)
growth_in_the_paint_market.head()

0   0.031
1   0.027
2   0.078
3   0.055
4   0.038
dtype: float64

#### % population urban

We use UN population projections of urban populations to determine the proportion of each country’s population that lives in an urban area. We use the UN’s estimate for the urban percentage of the population in 2020.

In our Malawi CEA, we assumed that the proportion of homes that are painted is equal to the proportion of the population that lives in urban areas. In our current CEA, we update this starting assumption such that in Year 1, the proportion of homes that are painted is equal to the sum of 75% of the urban population and 25% of the rural (non-urban) population. In our model, the urban population percentage is only used to calculate the percentage of homes painted in Year 1 (2021). In future years, our estimate for the percentage of homes painted is calculated using a different formula that is primarily dependent on changes in the paint market growth rate, rather than urban population projections. We use this approach because we are uncertain about how urban-rural classification will correspond with home painting rates in future years. For example, it is possible that the proportion of homes painted in rural areas will increase significantly as countries continue to experience economic growth.


In [15]:
pct_population_urban = pd.DataFrame(
    np.array(
        [sq.lognorm(0.165, 0.183) @ N,
         sq.lognorm(0.371, 0.410) @ N,
         sq.lognorm(0.409, 0.452) @ N,
         sq.lognorm(0.494, 0.546) @ N,
         sq.lognorm(0.637, 0.704) @ N,
         sq.lognorm(0.353, 0.391) @ N,
         sq.lognorm(0.162, 0.179) @ N,
         sq.lognorm(0.304, 0.336) @ N,
         sq.lognorm(0.665, 0.735) @ N,
         sq.lognorm(0.542, 0.599) @ N,
         sq.lognorm(0.494, 0.546) @ N,
         sq.lognorm(0.494, 0.546) @ N,
         sq.lognorm(0.456, 0.504) @ N]).T,
    columns=COUNTRIES)
pct_population_urban.head()

Unnamed: 0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
0,0.174,0.397,0.423,0.529,0.687,0.387,0.172,0.312,0.714,0.559,0.526,0.545,0.485
1,0.167,0.397,0.429,0.52,0.65,0.367,0.161,0.329,0.721,0.554,0.536,0.514,0.508
2,0.178,0.381,0.433,0.509,0.677,0.361,0.173,0.329,0.675,0.57,0.51,0.547,0.463
3,0.166,0.388,0.436,0.514,0.655,0.354,0.169,0.338,0.742,0.553,0.538,0.532,0.501
4,0.168,0.403,0.421,0.536,0.628,0.355,0.171,0.313,0.722,0.552,0.525,0.524,0.478


#### Number of painted homes

In [16]:
PCT_OF_HOMES_PAINTED_URBAN = 0.75
PCT_OF_HOMES_PAINTED_RURAL = 0.25
PCT_OF_HOMES_PAINTED_INIT = PCT_OF_HOMES_PAINTED_URBAN*pct_population_urban + \
    PCT_OF_HOMES_PAINTED_RURAL*(1 - pct_population_urban)

number_of_painted_homes = pd.DataFrame(
    index=SAMPLE_YEAR_INDEX, columns=COUNTRIES)
number_of_painted_homes.loc[idx[:, YEARS[0]], :] = \
    (number_of_homes.loc[YEARS[0]] * PCT_OF_HOMES_PAINTED_INIT).values

for year in YEARS[1:]:
    number_of_painted_homes.loc[idx[:, year], :] = np.minimum(
        number_of_painted_homes.loc[idx[:, year - 1], :].mul(
            1 + growth_in_the_paint_market, level=0, axis=0).values,
        number_of_homes.loc[year].values)

number_of_painted_homes.head()
# number_of_painted_homes.loc[idx[:, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Year,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
0,2021,1693518.804,3103990.56,431533.294,617092.464,3175575.448,12504775.594,1138164.042,1985755.036,1508917.649,4118972.587,15962331.629,5111339.815,769299.95
0,2022,1746555.295,3201199.263,445047.765,636418.153,3275025.999,12896391.807,1173808.303,2047943.587,1556172.925,4247967.82,16462229.273,5271413.342,793392.373
0,2023,1801252.748,3301452.284,458985.474,656349.072,3377591.077,13300272.394,1210568.848,2112079.716,1604908.11,4381002.84,16977782.377,5436499.945,818239.305
0,2024,1857663.179,3404844.963,473359.675,676904.174,3483368.219,13716801.444,1248480.635,2178224.419,1655169.55,4518204.162,17509481.229,5606756.621,843864.377
0,2025,1915840.234,3511475.624,488184.037,698103.007,3592458.019,14146375.073,1287579.718,2246440.597,1707005.045,4659702.263,18057831.471,5782345.281,870291.958


#### % of homes painted

In [17]:
pct_of_homes_painted = number_of_painted_homes / number_of_homes
pct_of_homes_painted.head()
# pct_of_homes_painted.loc[idx[:, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Year,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
0,2021,0.337,0.449,0.462,0.514,0.594,0.444,0.336,0.406,0.607,0.529,0.513,0.523,0.492
0,2022,0.336,0.447,0.461,0.514,0.588,0.444,0.33,0.406,0.613,0.53,0.512,0.521,0.49
0,2023,0.334,0.446,0.461,0.514,0.582,0.445,0.325,0.406,0.617,0.531,0.51,0.519,0.488
0,2024,0.332,0.445,0.461,0.514,0.577,0.446,0.32,0.406,0.621,0.532,0.509,0.516,0.485
0,2025,0.331,0.443,0.461,0.513,0.572,0.446,0.314,0.406,0.625,0.533,0.507,0.514,0.483


#### New painted homes

In [18]:
# TODO(drw): I'm a little skeptical that new paint will grow exponentially and suddenly hit a ceiling
new_painted_homes = number_of_painted_homes.groupby("Sample").diff()
new_painted_homes.head()
# new_painted_homes.loc[idx[:, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Year,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
0,2021,,,,,,,,,,,,,
0,2022,53036.491,97208.704,13514.472,19325.69,99450.551,391616.212,35644.261,62188.55,47255.275,128995.233,499897.644,160073.527,24092.422
0,2023,54697.453,100253.021,13937.709,19930.919,102565.077,403880.588,36760.545,64136.13,48735.185,133035.02,515553.104,165086.603,24846.933
0,2024,56410.431,103392.678,14374.201,20555.102,105777.142,416529.05,37911.787,66144.702,50261.441,137201.322,531698.852,170256.675,25625.072
0,2025,58177.055,106630.661,14824.362,21198.833,109089.8,429573.629,39099.083,68216.178,51835.495,141498.101,548350.242,175588.66,26427.581


#### % of prior year painted homes repainted

In our [first cost-effectiveness analysis](https://my.causal.app/models/61262) evaluating LEEP’s Malawi program, we used a conservative estimate for the repainting rate (2%) due to the relative lack of information available to inform this approximation. Since the original Malawi CEA was published, we have conducted informal surveys within our program countries to gather more information about repainting rates from relevant stakeholders. Data from these surveys suggest that repainting actually occurs about every 5-20 years within focus countries – implying a repainting rate within the range of 5-20%. In this CEA, we estimate the repainting rate at 4%. This is still a conservative estimate. In the future, we hope to conduct more formal data collection procedures that will allow us to further hone this estimate.

In [19]:
pct_of_prior_year_painted_homes_repainted = pd.Series(
    sq.lognorm(0.02, 0.1) @ N)
pct_of_prior_year_painted_homes_repainted.head()

0   0.059
1   0.089
2   0.034
3   0.058
4   0.057
dtype: float64

#### Number of homes repainted

In [20]:
number_of_homes_repainted = pd.DataFrame(
    index=SAMPLE_YEAR_INDEX, columns=COUNTRIES)

for year in YEARS[1:]:
    number_of_homes_repainted.loc[idx[:, year], :] = \
        number_of_painted_homes.loc[idx[:, year], :].mul(
        pct_of_prior_year_painted_homes_repainted, level=0, axis=0).values

number_of_homes_repainted.head()
# number_of_homes_repainted.loc[idx[:, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Year,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
0,2021,,,,,,,,,,,,,
0,2022,102289.814,187483.372,26064.937,37272.85,191807.153,755297.882,68745.967,119941.103,91139.765,248789.053,964136.876,308728.782,46466.298
0,2023,105493.258,193354.851,26881.221,38440.137,197814.042,778951.797,70898.907,123697.338,93994.019,256580.462,994331.071,318397.344,47921.498
0,2024,108797.025,199410.209,27723.069,39643.979,204009.05,803346.489,73119.272,127571.209,96937.661,264615.878,1025470.867,328368.699,49422.271
0,2025,112204.258,205655.205,28591.282,40885.523,210398.069,828505.158,75409.172,131566.399,99973.49,272902.941,1057585.879,338652.331,50970.045


### Scenarios

#### Start of enforcement/compliance

The predicted start dates for enforcement/compliance in the counterfactual v.s. LEEP scenarios reflect a best guess estimate for the number of years that compliance to regulation is brought forward due to LEEP’s activities.

Our estimate for the year in which enforcement/compliance begins in the counterfactual scenario is based on our understanding of how much progress a country has made toward implementing lead paint regulation, as well as any barriers or catalysts identified, independent of LEEP intervention. We expect that enforcement of lead paint regulation will be initiated more quickly in countries where governments are already aware of the threats of lead poisoning and/or have already drafted regulation that bans lead paint manufacturing. For example, in Pakistan, where implementation has already begun, the start date for enforcement/compliance under the LEEP scenario is 2023 versus 2028 in the counterfactual scenario. In Angola, the start date is 2025 under the LEEP scenario and 2032 under the counterfactual scenario.

Historically, LMIC governments have very rarely implemented lead paint regulation without externally funded paint studies and advocacy. Of 38 LMICs with lead paint regulation, we were only able to identify one in Africa (Algeria), five in Latin America (all upper-middle income countries), and five in Europe (as a result of EU laws) that implemented lead paint regulation without an externally )funded paint study and advocacy. At present, support for progress toward lead paint regulation in LMICs is very limited, in part because the SAICM’s [Global Environment Facility Project](https://www.saicm.org/Implementation/GEFProject/tabid/7893/language/en-US/Default.aspx) has come to an end.
Under the LEEP scenario, we assume countries that have made more progress toward implementing lead paint regulation prior to intervention will achieve compliance objectives sooner with LEEP’s support than those that have made less regulatory progress. Our estimate for the LEEP scenario is also informed by observed progress within a given country since LEEP started working there. 


In [21]:
start_of_enforcement_compliance = pd.Series([2031, 2024], index=SCENARIOS)
start_of_enforcement_compliance.head()

Counterfactual       2031
LEEP intervention    2024
dtype: int64

#### Lead market share of colored solvent based paint

For each country, we estimate the proportion of paint within the coloured solvent-based paint market that has a lead concentration greater than 90 parts per million (ppm). Estimates are primarily based on studies conducted by LEEP and by [IPEN](https://ipen.org/) that evaluate lead content among paints produced and sold within a given country. We use domestic and regional industry data to inform our estimates for countries in which a formal paint study has not been conducted. We adjust estimates slightly to reflect any information available about the relative market share of different brands within a given country. It is possible that we overestimate the value of this input because the paint studies that inform this estimate primarily test yellow and red paints, which are more likely to contain lead than other coloured paints, such as blue paint.

At the same time, because we only consider the contribution of the coloured solvent-based paint market to overall lead paint exposure, our approach is also at risk of underestimating the overall number of homes that contain lead paint. For simplicity, we ignore the contribution of both white paints and water-based paints, which on average are less likely to contain high levels of lead. However, evidence indicates that these types of paint may still, in some cases, contain high levels of lead. Across studies of solvent-based paints in the countries included in this CEA, 26% of white paints had lead content >90 ppm. In a study of water-based paints [in Nigeria](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6221508/), all tested samples had lead content >90 ppm. LEEP typically does not test the lead content of water-based paints, but has also identified high lead levels in some countries. 

In [22]:
lead_market_share_of_colored_solvent_based_paint = pd.DataFrame(
    index=SCENARIO_SAMPLE_YEAR_INDEX, columns=COUNTRIES)

for scenario in SCENARIOS:
    lead_market_share_of_colored_solvent_based_paint.loc[idx[scenario, :, YEARS[0]], :] = \
        lead_market_share_of_colored_solvent_based_paints_2021.values

    for year in YEARS[1:]:
        if year < start_of_enforcement_compliance[scenario]:
            lead_market_share_of_colored_solvent_based_paint.loc[idx[scenario, :, year], :] = \
                lead_market_share_of_colored_solvent_based_paint.loc[idx[scenario,
                                                                         :, year - 1], :].values
        else:
            lead_market_share_of_colored_solvent_based_paint.loc[idx[scenario, :, year], :] = \
                lead_market_share_of_colored_solvent_based_paint.loc[idx[scenario, :, year - 1], :].mul(
                (1 + decline_in_lead_market_share_once_enforcement_compliance_begins), level=1, axis=0).values

lead_market_share_of_colored_solvent_based_paint.head()
# lead_market_share_of_colored_solvent_based_paint.loc[idx['Counterfactual', :, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Scenario,Sample,Year,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
Counterfactual,0,2021,0.605,0.787,0.422,0.659,0.539,0.646,0.42,0.572,0.381,0.219,0.742,0.756,0.601
Counterfactual,0,2022,0.605,0.787,0.422,0.659,0.539,0.646,0.42,0.572,0.381,0.219,0.742,0.756,0.601
Counterfactual,0,2023,0.605,0.787,0.422,0.659,0.539,0.646,0.42,0.572,0.381,0.219,0.742,0.756,0.601
Counterfactual,0,2024,0.605,0.787,0.422,0.659,0.539,0.646,0.42,0.572,0.381,0.219,0.742,0.756,0.601
Counterfactual,0,2025,0.605,0.787,0.422,0.659,0.539,0.646,0.42,0.572,0.381,0.219,0.742,0.756,0.601


#### Number of homes with lead paint

In [23]:
# TODO(drw): Verify that % of new painted homes is used here as an approx. of lead paint in existing homes
PCT_OF_PAINTED_HOMES_WITH_LEAD_PAINT_INIT = pd.DataFrame(
    index=SCENARIO_SAMPLE_INDEX, columns=COUNTRIES)
for scenario in SCENARIOS:
    PCT_OF_PAINTED_HOMES_WITH_LEAD_PAINT_INIT.loc[idx[scenario, :], :] = \
        lead_market_share_of_colored_solvent_based_paint.loc[idx[scenario, :, YEARS[0]], :].mul(
        pct_of_new_painted_homes_that_use_some_colored_solvent_based_lead_paint, level=1, axis=0).values

number_of_homes_with_lead_paint = pd.DataFrame(
    index=SCENARIO_SAMPLE_YEAR_INDEX, columns=COUNTRIES)

for scenario in SCENARIOS:
    number_of_homes_with_lead_paint.loc[idx[scenario, :, YEARS[0]], :] = \
        PCT_OF_PAINTED_HOMES_WITH_LEAD_PAINT_INIT.loc[idx[scenario, :], :] * \
        number_of_painted_homes.loc[idx[:, YEARS[0]], :]

    for year in YEARS[1:]:
        number_of_homes_with_lead_paint.loc[idx[scenario, :, year], :] = \
            number_of_homes_with_lead_paint.loc[idx[scenario, :, year - 1], :].mul(
            (1 - pct_of_prior_year_painted_homes_repainted), level=1, axis=0).values + \
            (lead_market_share_of_colored_solvent_based_paint.loc[idx[scenario, :, year], :] *
             (number_of_homes_repainted.loc[idx[:, year], :] + new_painted_homes.loc[idx[:, year], :])).mul(
            pct_of_new_painted_homes_that_use_some_colored_solvent_based_lead_paint, level=1, axis=0).values

number_of_homes_with_lead_paint.head()
# number_of_homes_with_lead_paint.loc[idx['LEEP intervention', :, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Scenario,Sample,Year,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
Counterfactual,0,2021,641548.285,1530151.799,114182.634,254842.663,1072064.245,5064590.029,299865.801,711766.621,360602.872,564947.542,7420604.983,2422731.391,289478.579
Counterfactual,0,2022,662816.561,1580878.599,117967.957,263291.075,1107604.764,5232488.695,309806.796,735362.739,372557.392,583676.391,7666609.037,2503048.528,299075.223
Counterfactual,0,2023,684681.988,1633029.658,121859.561,271976.694,1144143.156,5405101.461,320026.906,759621.367,384847.56,602931.09,7919520.16,2585620.733,308941.312
Counterfactual,0,2024,707167.303,1686659.207,125861.493,280908.551,1181717.416,5582607.823,330536.757,784567.731,397486.155,622731.663,8179601.349,2670533.872,319087.107
Counterfactual,0,2025,730295.719,1741822.611,129977.884,290095.867,1220366.335,5765191.032,341347.2,810227.583,410486.226,643098.55,8447121.101,2757875.605,329523.08


#### % of total homes with lead paint

In [24]:
pct_of_total_homes_with_lead_paint = number_of_homes_with_lead_paint/number_of_homes

pct_of_total_homes_with_lead_paint.head()
# pct_of_total_homes_with_lead_paint.loc[idx['Counterfactual', :, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Scenario,Sample,Year,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
Counterfactual,0,2021,0.128,0.221,0.122,0.212,0.2,0.18,0.088,0.146,0.145,0.073,0.239,0.248,0.185
Counterfactual,0,2022,0.127,0.221,0.122,0.213,0.199,0.18,0.087,0.146,0.147,0.073,0.238,0.247,0.185
Counterfactual,0,2023,0.127,0.221,0.122,0.213,0.197,0.181,0.086,0.146,0.148,0.073,0.238,0.247,0.184
Counterfactual,0,2024,0.127,0.22,0.123,0.213,0.196,0.181,0.085,0.146,0.149,0.073,0.238,0.246,0.184
Counterfactual,0,2025,0.126,0.22,0.123,0.213,0.194,0.182,0.083,0.146,0.15,0.074,0.237,0.245,0.183


#### Births in homes with lead paint

In [25]:
births_in_homes_with_lead_paint_counterfactual = pct_of_total_homes_with_lead_paint*births

births_in_homes_with_lead_paint_counterfactual.head()
# births_in_homes_with_lead_paint_counterfactual.loc[idx[:, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Scenario,Sample,Year,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
Counterfactual,0,2021,83497.96,197980.62,32266.95,34566.382,268303.915,1145467.265,101237.604,71134.223,38275.876,65690.723,1890044.714,231141.34,101883.075
Counterfactual,0,2022,84770.466,200187.475,32405.613,35002.749,270218.097,1158687.74,102936.991,71647.989,38722.762,66045.084,1906641.089,233207.559,102616.629
Counterfactual,0,2023,86197.448,202555.471,32655.434,35569.891,272432.073,1170915.964,104535.396,72141.581,39054.643,66499.141,1929296.034,236757.126,103551.987
Counterfactual,0,2024,87041.665,204232.064,32750.053,36055.144,274699.755,1181065.951,106272.931,72639.169,39559.536,66816.115,1956454.154,239813.448,104299.787
Counterfactual,0,2025,88041.474,206250.487,32909.05,36557.308,277045.845,1193279.388,108006.534,72974.885,40021.185,67448.603,1974570.832,242869.59,105336.48


### Births with averted lead paint exposure vs. counterfactual

In [26]:
births_with_averted_lead_paint_exposure_vs_counterfactual = \
    births_in_homes_with_lead_paint_counterfactual.loc[idx['Counterfactual', :, :], :].droplevel(0) - \
    births_in_homes_with_lead_paint_counterfactual.loc[idx['LEEP intervention', :, :], :].droplevel(
        0)

births_with_averted_lead_paint_exposure_vs_counterfactual.head()
# births_with_averted_lead_paint_exposure_vs_counterfactual.loc[idx[:, :], 'Pakistan'].unstack(level=-1).T.plot()

Unnamed: 0_level_0,Unnamed: 1_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Year,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
0,2021,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
0,2022,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
0,2023,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
0,2024,1535.11,3601.937,577.596,635.886,4844.74,20829.86,1874.282,1281.1,697.691,1178.402,34504.987,4229.468,1839.482
0,2025,4207.803,9857.416,1572.836,1747.199,13240.969,57030.904,5162.002,3487.719,1912.749,3223.599,94371.495,11607.569,5034.391


### Total number of births with averted lead paint exposure

In [27]:
total_number_of_births_with_averted_lead_paint_exposure = \
    births_with_averted_lead_paint_exposure_vs_counterfactual.groupby(
        level=0).sum()

total_number_of_births_with_averted_lead_paint_exposure.head()

Unnamed: 0_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
0,703196.706,1690005.166,255546.91,301174.946,2236898.329,9794461.941,891502.39,623629.942,328468.743,576506.618,15624177.937,2321430.22,890529.041
1,1225695.781,1932731.617,320694.648,423343.395,3073055.47,12584137.668,983771.599,778526.769,426439.727,657445.605,24608588.842,3017142.79,1429982.891
2,3325329.303,4772359.978,743411.927,1062983.675,8028661.202,29115172.87,3158698.352,2194803.963,809825.784,1615521.571,49584367.177,6392002.908,2836674.342
3,1631542.968,2609216.309,509656.641,613426.291,3832682.892,16071306.838,1541209.902,1254710.283,580262.651,930104.709,29875360.373,4410425.902,1716058.746
4,859213.309,1780256.102,257032.301,396751.901,3544144.341,10478836.343,998353.479,800244.625,376361.291,611119.201,20147283.868,3121418.249,1372155.898


### Total expected number of births with averted lead paint exposure

In [28]:
total_expected_number_of_births_with_averted_lead_paint_exposure = \
    total_number_of_births_with_averted_lead_paint_exposure * \
    probability_of_success

total_expected_number_of_births_with_averted_lead_paint_exposure.head()

Unnamed: 0_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
0,628659.68,1393369.734,189210.554,209097.215,1725951.489,8173387.244,678663.723,535637.3,266229.28,457182.185,12712697.641,1711258.3,630454.464
1,1069162.263,1588536.065,222346.87,284130.707,2531057.225,11069103.409,761992.823,624783.324,310074.272,535297.513,20189496.391,2274481.256,1108487.253
2,2779311.412,3716705.422,552249.276,730935.132,6216469.071,27125791.165,2355744.867,1789574.457,589276.386,1305290.767,36719014.376,4972369.781,2123025.028
3,1470077.255,2141442.616,387213.496,411157.858,3093590.372,14859494.596,1237458.672,994689.368,452585.531,743311.758,23197506.761,3456155.56,1294673.659
4,732553.983,1358626.067,185600.057,289996.087,2775667.013,9566213.886,720608.53,633513.025,280726.231,505212.551,16580623.881,2418642.076,1028535.267


### Number of homes with averted lead paint vs. counterfactual

In [29]:
number_of_homes_with_averted_lead_paint_vs_counterfactual = \
    number_of_homes_with_lead_paint.loc[idx['Counterfactual', :, :], :].droplevel(0) - \
    number_of_homes_with_lead_paint.loc[idx['LEEP intervention', :, :], :].droplevel(
        0)

number_of_homes_with_averted_lead_paint_vs_counterfactual.head()

Unnamed: 0_level_0,Unnamed: 1_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Year,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1
0,2021,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
0,2022,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
0,2023,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
0,2024,12471.95,29746.751,2219.755,4954.241,20841.349,98457.616,5829.509,13837.022,7010.261,10982.802,144259.471,47098.848,5627.577
0,2025,34903.331,83247.661,6212.088,13864.674,58325.482,275538.202,16314.15,38723.548,19618.541,30735.88,403716.814,131808.31,15749.035


### Total number of homes with averted lead paint

In [30]:
total_number_of_homes_with_averted_lead_paint = \
    number_of_homes_with_averted_lead_paint_vs_counterfactual.groupby(
        level=0).sum()

total_number_of_homes_with_averted_lead_paint.head()

Unnamed: 0_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
0,9248737.146,22059090.327,1646088.006,3673879.794,15455174.061,73012524.68,4322948.147,10260990.612,5197699.935,8144403.61,106977488.877,34926459.06,4173203.091
1,17306641.097,26952401.209,2225974.601,5532212.443,22834392.327,100620505.988,5131222.9,13549868.259,7182979.801,9879474.101,181871585.57,47041013.293,7150929.697
2,50770495.193,70901735.963,5495925.752,14685553.468,63616213.682,248346199.933,18241897.871,40064216.349,14144399.988,25376357.714,391360341.483,102618748.827,15161837.78
3,22039085.012,34858349.298,3361281.309,7645133.07,27136404.199,122615675.063,7681310.831,21039795.006,9221879.514,13356011.821,209519414.328,66995544.028,8224169.36
4,11434118.482,23494835.057,1676329.653,4895398.403,24786947.505,79033522.887,4900645.216,13289991.108,6013386.086,8722522.276,139710022.853,47249099.448,6501020.743


### Total expected number of homes with averted lead paint

In [31]:
total_expected_number_of_homes_with_averted_lead_paint = \
    total_number_of_homes_with_averted_lead_paint * \
    probability_of_success

total_expected_number_of_homes_with_averted_lead_paint.head()

Unnamed: 0_level_0,Malawi,Madagascar,Sierra Leone,Liberia,Angola,Pakistan,Niger,Zimbabwe,Bolivia,Ghana,Nigeria,Cote d'Ivoire,Senegal
Sample,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
0,8268395.016,18187204.061,1218786.887,2550670.439,11924941.04,60928271.655,3290880.784,8813190.219,4212820.664,6458687.757,87042817.61,25746280.213,2954439.888
1,15096411.235,22152512.533,1543332.539,3712993.883,18807064.901,88506563.99,3974454.055,10874040.652,5222912.157,8043947.487,149211957.83,35461995.151,5543223.258
2,42433997.911,55218145.262,4082690.778,10098167.284,49257057.289,231377199.305,13604736.03,32667108.059,10292288.882,20503301.234,289816464.81,79827617.89,11347429.134
3,19857986.114,28609032.707,2553745.765,5124261.189,21903434.519,113370180.745,6167430.333,16679595.819,7192758.711,10673723.639,162686841.922,52499923.396,6204691.688
4,9748579.254,17930395.127,1210458.289,3578171.592,19412390.109,72150338.012,3537270.936,10521010.959,4485358.212,7210913.562,114977252.342,36611133.412,4873009.776
