## Predatory Inclusion in Non-Profit and For-Profit Online Education
### By Christian Michael Smith, Amber D. Villalobos (equal authors), Laura T. Hamilton, and Charlie Eaton

### Code by Christian Smith

### Merge Data for Tables 3 and 5

In [1]:
***(A) PREPARE DATA ON LOAN PROGRESS OUTCOMES FROM SCORECARD***

* Reads the Scorecard CSV, keeps the institution id together with every
* bbrr*/dbrr* column, stamps the rows with a year, and writes repay2013.dta
* so it can be merged on unitid/year later.
quietly {
	* The clear option discards whatever dataset is currently in memory
	insheet using MERGED2018_19_PP.csv, clear
	keep unitid bbrr* dbrr*
	* NOTE(review): the 2018_19 file is tagged as year 2013 -- presumably the
	* panel year these outcomes are meant to attach to; confirm.
	generate year = 2013
	save repay2013.dta, replace
}



**********(B) PERFORM FINAL MERGE**********

* Stacks the hd<year>a files for 2012-2020 into one unitid-by-year dataset,
* then merges the remaining per-year files onto it one at a time.
* Every merge is 1:1 on unitid/year with the update option, so values already
* present in memory are kept and only missing values are filled from the
* using file. The merge order below is therefore deliberate; do not reorder.
quietly {
	* --- Base panel: one hd file per year, tagged with its year ---
	use hd2012a, clear
	generate year = 2012
	forvalues yr = 2013/2020 {
		append using hd`yr'a
		* Rows still missing year are presumably the ones just appended
		* (assumes the hd files carry no year variable of their own)
		replace year = `yr' if year == .
	}

	* --- Files available for 2012-2020 ---
	forvalues yr = 2012/2020 {
		merge 1:1 unitid year using ef`yr'a_dist, nogenerate update
		* first/under/trad contribute only variables starting with f/u/t,
		* i.e. the first letter of each file stub
		foreach stub in first under trad {
			local firstletter = substr("`stub'", 1, 1)
			merge 1:1 unitid year using `stub'`yr', nogenerate keepusing(`firstletter'*) update
		}
		merge 1:1 unitid year using adm`yr', nogenerate update
	}

	* --- Files available for 2012-2019 ---
	forvalues yr = 2012/2019 {
		foreach stub in efia sfa ret {
			merge 1:1 unitid year using `stub'`yr', nogenerate update
		}
	}

	* --- Files available for 2012-2014 ---
	forvalues yr = 2012/2014 {
		merge 1:1 unitid year using gr`yr', nogenerate update
	}

	* --- Scorecard repayment extract (rows carry year 2013 only) ---
	merge 1:1 unitid year using repay2013, nogenerate update
}



**********(C) CREATE / CLEAN VARIABLES AND SAVE ANALYTIC DATASET**********

*Miscellaneous data-cleaning and variable construction
* Works on the merged unitid-by-year dataset currently in memory. Builds
* sector indicators, percentage composition measures, an online-enrollment
* share, log enrollment, acceptance rate and total loan amount, then converts
* the Scorecard bbrr2_fed_ug_* columns to numeric and rescales them by 100.
qui {
	* --- Sector indicators (control==3 is treated as for-profit) ---
	gen forprofit = (control==3)
	gen nonprofit = (control!=3)
	gen allcontrols = 1
	* A logical expression evaluates to 0/1 even when control is missing,
	* so blank both indicators out where control is system-missing
	foreach var in forprofit nonprofit {
		replace `var' = . if control==.
	}
	label define forprofit_lab 0 "Nonprofit (public or private)" 1 "For-profit"
	label values forprofit forprofit_lab
	label define nonprofit_lab 0 "For-profit" 1 "Nonprofit (public or private)"
	label values nonprofit nonprofit_lab

	* --- Composition percentages: count / matching total * 100 ---
	* f-prefixed counts (no suffix on the new variable)
	gen blackpct = fefbkaat / feftotlt * 100
	gen latinxpct = fefhispt / feftotlt * 100
	gen aianpct = fefaiant / feftotlt * 100
	gen asiapct = fefasiat / feftotlt * 100
	* u-prefixed counts (_u suffix)
	gen blackpct_u = uefbkaat / ueftotlt * 100
	gen latinxpct_u = uefhispt / ueftotlt * 100
	gen aianpct_u = uefaiant / ueftotlt * 100
	gen asiapct_u = uefasiat / ueftotlt * 100
	gen malepct_u = ueftotlm / ueftotlt * 100
	* t-prefixed counts (_t suffix)
	gen blackpct_t = tefbkaat / teftotlt * 100
	gen latinxpct_t = tefhispt / teftotlt * 100
	gen aianpct_t = tefaiant / teftotlt * 100
	gen asiapct_t = tefasiat / teftotlt * 100
	gen malepct_t = teftotlm / teftotlt * 100

	* --- Recodes ---
	* hbcu becomes a 0/1 flag: 1 stays 1, anything else (missing included) becomes 0
	replace hbcu = (hbcu==1)
	* -3 is treated as a missing-value code for these two variables
	replace locale = . if locale==-3
	replace hdegofr1  = . if hdegofr1 ==-3
	sort unitid year

	* --- Enrollment, admissions and loan measures ---
	gen pctonline = efdeexc / efdetot * 100
	gen pctonline10 = pctonline/10
	gen logenrl = ln(ueftotlt)
	gen acceptrate = 100*admssn/applcn
	* Any missing acceptance rate is set to 100
	* NOTE(review): presumably intended for institutions without admissions
	* data (e.g. open admission); this also covers applcn==0 -- confirm.
	replace acceptrate = 100 if acceptrate==.
	gen totloan_a = floan_a+oloan_a

	* --- Scorecard repayment columns: strip sentinels, make numeric, x100 ---
	foreach var in bbrr2_fed_ug_dflt bbrr2_fed_ug_dlnq bbrr2_fed_ug_fbr bbrr2_fed_ug_dfr bbrr2_fed_ug_noprog bbrr2_fed_ug_makeprog bbrr2_fed_ug_paidinfull bbrr2_fed_ug_discharge {
		* The sentinel cleanup compares against string literals, which
		* aborts with a type mismatch if the column was imported as numeric
		* (no "NULL"/"PrivacySuppressed" entries present). Only run it, and
		* destring, when the column really is a string.
		capture confirm string variable `var'
		if _rc == 0 {
			replace `var' = "" if `var'=="NULL"
			replace `var' = "" if `var'=="PrivacySuppressed"
			destring `var', replace
		}
		* Rescale by 100 (presumably proportion -> percent; confirm)
		replace `var' = 100*`var'
	}
}

*Save final analytic dataset
save d_t3_t5_ipeds_scorecard, replace



. qui {

. qui {

. save d_t3_t5_ipeds_scorecard, replace
(file d_t3_t5_ipeds_scorecard.dta not found)
file d_t3_t5_ipeds_scorecard.dta saved
