In [1]:
# Load the respondent-level extract that the rest of this notebook cleans.
campers.ipv <- read.csv(file = "/work/campers_ipv_wealth.csv")

Important Demographics:

V012	Respondent's current age
V013	Age in 5-year groups
V024	Region
V106	Highest educational level
V149	Educational attainment
V190	Wealth index combined
V191	Wealth index factor score combined (5 decimals)
V190A	Wealth index for urban/rural
V191A	Wealth index factor score for urban/rural (5 decimals)

V501	Current marital status
V502	Currently/formerly/never in union

V701	Husband/partner's education level
V704	Husband/partner's occupation
V705	Husband/partner's occupation (grouped)
V714	Respondent currently working
V716	Respondent's occupation
V717	Respondent's occupation (grouped)
V729	Husband/partner's educational attainment
V730	Husband/partner's age
V731	Respondent worked in last 12 months




In [2]:
# Demographic columns that must be non-missing for a respondent to be kept.
# Rows lacking any of them are dropped in the next cell, on the reasoning that
# such gaps may come from measurement or recording errors.
# The wealth factor scores V191 / V191A from the list above are not checked.
demographics <- c(
    # respondent: age, region, education, wealth index
    "V012", "V013", "V024", "V106", "V149", "V190", "V190A",
    # marital / union status
    "V501", "V502",
    # partner and respondent: education, occupation, employment, partner's age
    "V701", "V704", "V705", "V714", "V716", "V717", "V729", "V730", "V731"
)


In [3]:
# Keep only respondents with a value in every column named in `demographics`.
# NOTE(review): the codebook below lists "Not applicable" as a blank value for
# V701, V704, V716 and V730; if those blanks are read in as NA, these rows are
# dropped here as well, not just recording errors -- confirm this is intended.
rows.with.all.demographics <- complete.cases(campers.ipv[demographics])
campers.ipv.clean <- campers.ipv[rows.with.all.demographics, ]

In [4]:
# Show the row count before and after dropping rows with missing
# demographics, to see how many rows were removed.

nrow(campers.ipv)
nrow(campers.ipv.clean)

##### V106_VS1	Highest educational level				
		No education	0		
		Primary	1		
		Secondary	2		
		Higher	3		
		Don't know	8		
		Missing	9		Missing

##### V501_VS1	Current marital status				
		Never in union	0		
		Married	1		
		Living with partner	2		
		Widowed	3		
		Divorced	4		
		No longer living together/separated	5		
		Missing	9		Missing

##### V701_VS1	Husband/partner's education level				
		No education	0		
		Primary	1		
		Secondary	2		
		Higher	3		
		Don't know	8		
		Missing	9		Missing
		Not applicable	 		Not Applicable

##### V704_VS1	Husband/partner's occupation				
		Not working and didn't work in last 12 months	0		
		Occupation code (range, low to high)	1	9995	
		Other	9996		
		Don't know	9998		
		Missing	9999		Missing
		Not applicable	    		Not Applicable

##### V716_VS1	Respondent's occupation				
		Not working and didn't work in last 12 months	0		
		Occupation code (range, low to high)	1	9995	
		Other	9996		
		Don't know	9998		
		Missing	9999		Missing
		Not applicable	    		Not Applicable

##### V730_VS1	Husband/partner's age				
		Age in years (range, low to high)	15	95	
		96+	96		
			97		
		Don't know	98		
		Missing	99		Missing
		Not applicable	  		Not Applicable


In [5]:
# Drop respondents whose answer to any of the variables below is coded
# "Don't know" or "Missing" (codes taken from the value tables above): such
# answers carry incomplete information and may affect the accuracy of
# estimates.
campers.ipv.final.data <- with(campers.ipv.clean, {
    # Respondent's and partner's education: 8 = Don't know, 9 = Missing
    education.known <- V106 < 8 & V701 < 8
    # Marital status: 9 = Missing
    marital.known <- V501 < 9
    # Partner's and respondent's occupation: 9998 = Don't know, 9999 = Missing
    occupation.known <- V704 < 9998 & V716 < 9998
    # Partner's age: 98 = Don't know, 99 = Missing
    partner.age.known <- V730 < 98

    all.known <- education.known & marital.known &
        occupation.known & partner.age.known

    # -1 removes the first column by position.
    # NOTE(review): the preview further down starts at CASEID, so the dropped
    # column is presumably a row-index column from an earlier CSV export --
    # confirm against the input file.
    campers.ipv.clean[all.known, -1]
})

In [6]:
# Show the row count at each cleaning stage (raw, after dropping missing
# demographics, after dropping "Don't know"/"Missing" codes), followed by the
# number of columns in the final data set.

nrow(campers.ipv)
nrow(campers.ipv.clean)
nrow(campers.ipv.final.data)
ncol(campers.ipv.final.data)

# Final number of observations, as recorded by the original author:
# 14232 women respondents

In [7]:
# Open the cleaned data set in the notebook's data viewer for a visual check.
View(campers.ipv.final.data)

Unnamed: 0_level_0,CASEID,V000,V001,V002,V003,V004,V005,V006,V007,V008,...,D110D,D110E,D110F,D110G,D110H,D111,D112,D112A,D113,D114
Unnamed: 0_level_1,<chr>,<chr>,<int>,<int>,<int>,<int>,<int>,<int>,<int>,<int>,...,<int>,<int>,<int>,<int>,<lgl>,<int>,<int>,<int>,<int>,<int>
1,00010007 2,PH7,1,7,2,1,361799,8,2017,1412,...,,,,,,0,0,,0,
2,00010010 2,PH7,1,10,2,1,361799,8,2017,1412,...,,,,,,0,0,,0,
3,00010013 2,PH7,1,13,2,1,361799,8,2017,1412,...,,,,,,0,0,,0,
5,00010015 7,PH7,1,15,7,1,361799,8,2017,1412,...,,,,,,,,,,
6,00010018 9,PH7,1,18,9,1,361799,8,2017,1412,...,,,,,,,,,,
7,00010022 4,PH7,1,22,4,1,361799,8,2017,1412,...,,,,,,0,0,,0,
8,00010025 2,PH7,1,25,2,1,361799,8,2017,1412,...,,,,,,0,0,,0,
9,00010029 2,PH7,1,29,2,1,361799,8,2017,1412,...,,,,,,0,0,,0,
10,00020007 2,PH7,2,7,2,2,416591,8,2017,1412,...,,,,,,0,0,,0,
11,00020016 2,PH7,2,16,2,2,416591,8,2017,1412,...,,,,,,0,0,,0,


In [8]:
# Save the cleaned data set for later analysis.
# write.csv keeps its default row.names = TRUE here, so the row names are
# written as an extra leading column; this is left unchanged so that anything
# reading the file sees the same layout as before.
write.csv(
    x = campers.ipv.final.data,
    file = "/work/campers_ipv_final_data_wealth.csv"
)

<a style='text-decoration:none;line-height:16px;display:flex;color:#5B5B62;padding:10px;justify-content:end;' href='https://deepnote.com?utm_source=created-in-deepnote-cell&projectId=8672f010-76e5-4fe5-a087-2513d801c0e9' target="_blank">
Created in <span style='font-weight:600;margin-left:4px;'>Deepnote</span></a>