## Table of Contents

### 1. Importing libraries
### 2. Importing data
##### 1. Create list of columns to import from data set
##### 2. Import data from specific columns
### 3. Data cleaning and consistency checks
##### 1. Dropping columns
##### 2. Renaming columns
##### 3. Mixed-type columns
##### 4. Missing values
##### 5. Duplicate values
### 4. Get info about data set
### 5. Export data

# 01. Importing libraries

In [1]:
# Import libraries
import pandas as pd
import numpy as np
import os

# 02. Importing data

## 01. Create list of columns to import from data set

In [2]:
# Create path shortcut
path = r'/Users/taraperrigeold/Documents/Documents - Tara Perrige’s MacBook Pro/CareerFoundry/College Cost Analysis'

In [3]:
# Check output
path

'/Users/taraperrigeold/Documents/Documents - Tara Perrige’s MacBook Pro/CareerFoundry/College Cost Analysis'

In [4]:
# Create vars_list of columns to import from data dictionary file
vars_list = ['dev-category', 'VARIABLE NAME']

In [5]:
# Check output
vars_list

['dev-category', 'VARIABLE NAME']

In [6]:
# Import dev-category and VARIABLE NAME columns from collegescorecarddatadictionary excel file
df_guide = pd.read_excel(os.path.join(path, '02 Data', 'Original Data', 'collegescorecarddatadictionary_2021-04-01.xlsx'), sheet_name = 'institution_data_dictionary', usecols = vars_list)

In [7]:
# Check output
df_guide.head(15)

Unnamed: 0,dev-category,VARIABLE NAME
0,root,UNITID
1,root,OPEID
2,root,OPEID6
3,school,INSTNM
4,school,CITY
5,school,STABBR
6,school,ZIP
7,school,ACCREDAGENCY
8,school,INSTURL
9,school,NPCURL


In [8]:
# Find number of missing values in VARIABLE NAME
df_guide.isnull().sum()

dev-category     126
VARIABLE NAME    257
dtype: int64

In [9]:
# Look at null values
df_guide.isnull()

Unnamed: 0,dev-category,VARIABLE NAME
0,False,False
1,False,False
2,False,False
3,False,False
4,False,False
...,...,...
2635,False,False
2636,False,False
2637,False,False
2638,False,False


In [10]:
# Create subset where dev-category is null
df_dev_nan = df_guide[df_guide['dev-category'].isnull() == True]

In [11]:
# Check output
df_dev_nan.head(15)

Unnamed: 0,dev-category,VARIABLE NAME
154,,
155,,
156,,
157,,
158,,
159,,
160,,
161,,
162,,
163,,


In [12]:
# Check number of missing values in subset
df_dev_nan.isnull().sum()

dev-category     126
VARIABLE NAME    126
dtype: int64

In [13]:
# Update df_guide to remove rows with missing values in dev-category
df_guide = df_guide[df_guide['dev-category'].isnull() == False]

In [14]:
# Check that df_guide is 126 fewer rows
df_guide.shape

(2514, 2)

In [15]:
# Look at missing values in VARIABLE NAME
df_guide[df_guide['VARIABLE NAME'].isnull() == True]

Unnamed: 0,dev-category,VARIABLE NAME
13,school,
16,school,
17,school,
18,school,
19,school,
...,...,...
150,school,
151,school,
152,school,
1984,school,


In [16]:
# Update df_guide to remove rows with missing values
df_guide = df_guide[df_guide['VARIABLE NAME'].isnull() == False]

In [17]:
# Check that df_guide is 131 rows fewer
df_guide.shape

(2383, 2)

In [18]:
# Get variable counts for dev-category
df_guide['dev-category'].value_counts(dropna = False)

completion    1218
repayment      464
academics      247
student        117
aid            106
earnings        79
cost            77
school          44
admissions      25
root             6
Name: dev-category, dtype: int64

In [19]:
# Create new dataframe of only categories I want
df_small = df_guide[df_guide['dev-category'].isin(['root', 'school', 'admissions', 'student', 'cost', 'aid'])]

In [20]:
# Check output
df_small.head(15)

Unnamed: 0,dev-category,VARIABLE NAME
0,root,UNITID
1,root,OPEID
2,root,OPEID6
3,school,INSTNM
4,school,CITY
5,school,STABBR
6,school,ZIP
7,school,ACCREDAGENCY
8,school,INSTURL
9,school,NPCURL


In [21]:
# Check value counts
df_small['dev-category'].value_counts(dropna = False)

student       117
aid           106
cost           77
school         44
admissions     25
root            6
Name: dev-category, dtype: int64

In [22]:
# Check new shape
df_small.shape

(375, 2)

In [23]:
# Double-check no mixed-type columns
for col in df_small.columns.tolist():
    weird = (df_small[[col]].applymap(type) != df_small[[col]].iloc[0].apply(type)).any(axis = 1)
    if len (df_small[weird]) > 0:
        print(col)

In [24]:
# Check data type of VARIABLE NAME
df_small['VARIABLE NAME'].dtype

dtype('O')

In [25]:
# Create new variables list
new_vars = df_small['VARIABLE NAME'].to_list()

In [26]:
# Check output
new_vars

['UNITID',
 'OPEID',
 'OPEID6',
 'INSTNM',
 'CITY',
 'STABBR',
 'ZIP',
 'ACCREDAGENCY',
 'INSTURL',
 'NPCURL',
 'SCH_DEG',
 'HCM2',
 'MAIN',
 'NUMBRANCH',
 'PREDDEG',
 'HIGHDEG',
 'CONTROL',
 'ST_FIPS',
 'REGION',
 'LOCALE',
 'LOCALE2',
 'LATITUDE',
 'LONGITUDE',
 'CCBASIC',
 'CCUGPROF',
 'CCSIZSET',
 'HBCU',
 'PBI',
 'ANNHI',
 'TRIBAL',
 'AANAPII',
 'HSI',
 'NANTI',
 'MENONLY',
 'WOMENONLY',
 'RELAFFIL',
 'ADM_RATE',
 'ADM_RATE_ALL',
 'SATVR25',
 'SATVR75',
 'SATMT25',
 'SATMT75',
 'SATWR25',
 'SATWR75',
 'SATVRMID',
 'SATMTMID',
 'SATWRMID',
 'ACTCM25',
 'ACTCM75',
 'ACTEN25',
 'ACTEN75',
 'ACTMT25',
 'ACTMT75',
 'ACTWR25',
 'ACTWR75',
 'ACTCMMID',
 'ACTENMID',
 'ACTMTMID',
 'ACTWRMID',
 'SAT_AVG',
 'SAT_AVG_ALL',
 'DISTANCEONLY',
 'UGDS',
 'UG',
 'UGDS_WHITE',
 'UGDS_BLACK',
 'UGDS_HISP',
 'UGDS_ASIAN',
 'UGDS_AIAN',
 'UGDS_NHPI',
 'UGDS_2MOR',
 'UGDS_NRA',
 'UGDS_UNKN',
 'UGDS_WHITENH',
 'UGDS_BLACKNH',
 'UGDS_API',
 'UGDS_AIANOLD',
 'UGDS_HISPOLD',
 'UG_NRA',
 'UG_UNKN',
 'UG_WHIT

## 02. Import data from specific columns

In [27]:
# Import college scorecard data set, but only columns in list
df = pd.read_csv(os.path.join(path, '02 Data', 'Original Data', 'Most-Recent-Cohorts-All-Data-Elements.csv'), usecols = new_vars)

  has_raised = await self.run_ast_nodes(code_ast.body, cell_name,


In [28]:
# Check output
df.head(15)

Unnamed: 0,UNITID,OPEID,OPEID6,INSTNM,CITY,STABBR,ZIP,ACCREDAGENCY,INSTURL,NPCURL,...,PLUS_DEBT_INST_NOSTAFFANY_MD,PLUS_DEBT_ALL_NOSTAFFANY_N,PLUS_DEBT_ALL_NOSTAFFANY_MD,LPSTAFFORD_CNT,LPSTAFFORD_AMT,LPPPLUS_CNT,LPPPLUS_AMT,LPGPLUS_CNT,LPGPLUS_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,www.aamu.edu/,www.aamu.edu/admissions-aid/tuition-fees/net-p...,...,12688,46,11067,31374,922456254,5201,113949554,1004,15578483,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,https://www.uab.edu,https://uab.studentaidcalculator.com/survey.aspx,...,PrivacySuppressed,22,18300,56997,1720042015,3727,87421879,3461,134126588,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,www.amridgeuniversity.edu,www2.amridgeuniversity.edu:9091/,...,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,4463,174222020,16,309618,298,16290781,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,www.uah.edu,finaid.uah.edu/,...,PrivacySuppressed,15,PrivacySuppressed,19702,407184805,1397,29789762,144,2377759,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,www.alasu.edu,www.alasu.edu/cost-aid/tuition-costs/net-price...,...,13000,30,12466,34246,947070736,4602,95359062,587,12174367,1005
5,100751,105100,1051,The University of Alabama,Tuscaloosa,AL,35487-0100,Southern Association of Colleges and Schools C...,www.ua.edu/,financialaid.ua.edu/net-price-calculator/,...,33072,80,31384,75084,1771875477,11535,619905869,2035,69504249,1051
6,100760,100700,1007,Central Alabama Community College,Alexander City,AL,35010,Southern Association of Colleges and Schools C...,www.cacc.edu,https://www.cacc.edu/net-price-calculator/,...,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,5297,68476891,14,96386,PrivacySuppressed,PrivacySuppressed,1007
7,100812,100800,1008,Athens State University,Athens,AL,35611,Southern Association of Colleges and Schools C...,www.athens.edu,www.athens.edu/financial-aid/net-price-calcula...,...,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,12034,234452111,171,1713456,PrivacySuppressed,PrivacySuppressed,1008
8,100830,831000,8310,Auburn University at Montgomery,Montgomery,AL,36117-3596,Southern Association of Colleges and Schools C...,www.aum.edu,www.aum.edu/current-students/financial-informa...,...,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,23340,493759303,1289,16701421,165,1883514,8310
9,100858,100900,1009,Auburn University,Auburn,AL,36849,Southern Association of Colleges and Schools C...,www.auburn.edu,https://www.auburn.edu/admissions/costcalc/fre...,...,36506,53,32255,48346,1258831243,6151,307762305,1968,82412571,1009


In [29]:
# Change options to display all columns
pd.options.display.max_columns = None

In [30]:
# Check output
df.head(15)

Unnamed: 0,UNITID,OPEID,OPEID6,INSTNM,CITY,STABBR,ZIP,ACCREDAGENCY,INSTURL,NPCURL,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UG,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,UGDS_WHITENH,UGDS_BLACKNH,UGDS_API,UGDS_AIANOLD,UGDS_HISPOLD,UG_NRA,UG_UNKN,UG_WHITENH,UG_BLACKNH,UG_API,UG_AIANOLD,UG_HISPOLD,PPTUG_EF,PPTUG_EF2,CURROPER,NPT4_PUB,NPT4_PRIV,NPT4_PROG,NPT4_OTHER,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT41_PROG,NPT42_PROG,NPT43_PROG,NPT44_PROG,NPT45_PROG,NPT41_OTHER,NPT42_OTHER,NPT43_OTHER,NPT44_OTHER,NPT45_OTHER,NPT4_048_PUB,NPT4_048_PRIV,NPT4_048_PROG,NPT4_048_OTHER,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NPT4_3075_PROG,NPT4_3075_OTHER,NPT4_75UP_PROG,NPT4_75UP_OTHER,NUM4_PUB,NUM4_PRIV,NUM4_PROG,NUM4_OTHER,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,NUM41_PROG,NUM42_PROG,NUM43_PROG,NUM44_PROG,NUM45_PROG,NUM41_OTHER,NUM42_OTHER,NUM43_OTHER,NUM44_OTHER,NUM45_OTHER,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGE_ENTRY_SQ,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,LNFAMINC,LNFAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,FSEND_COUNT,FSEND_1,FSEND_2,FSEND_3,FSEND_4,FSEND_5,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,PPLUS_PCT_LOW,PPLUS_PCT_HIGH,PPLUS_PCT_LOW_POOLED_SUPP,PPLUS_PCT_HIGH_POOLED_SUPP,POOLYRS_PLUSPCT,PLUS_DEBT_INST_N,PLUS_DEBT_INST_MD,PLUS_DEBT_ALL_N,PLUS_DEBT_ALL_MD,PLUS_DEBT_INST_COMP_N,PLUS_DEBT_INST_COMP_MD,PLUS_DEBT_INST_COMP_MDPAY10,PLUS_DEBT_INST_COMP_MD_SUPP,PLUS_DEBT_INST_COMP_MDPAY10_SUPP,PLUS_DEBT_ALL_COMP_N,PLUS_DEBT_ALL_COMP_MD,PLUS_DEBT_ALL_COMP_MDPAY10,PLUS_DEBT_ALL_COMP_MD_SUPP,PLUS_DEBT_ALL_COMP_MDPAY10_SUPP,PLUS_DEBT_INST_NOCOMP_N,PLUS_DEBT_INST_NOCOMP_MD,PLUS_DEBT_ALL_NOCOMP_N,PLUS_DEBT_ALL_NOCOMP_MD,PLUS_DEBT_INST_MALE_N,PLUS_DEBT_INST_MALE_MD,PLUS_DEBT_ALL_MALE_N,PLUS_DEBT_ALL_MALE_MD,PLUS_DEBT_INST_NOMALE_N,PLUS_DEBT_INST_NOMALE_MD,PLUS_DEBT_ALL_NOMALE_N,PLUS_DEBT_ALL_NOMALE_MD,PLUS_DEBT_INST_PELL_N,PLUS_DEBT_INST_PELL_MD,PLUS_DEBT_ALL_PELL_N,PLUS_DEBT_ALL_PELL_MD,PLUS_DEBT_INST_NOPELL_N,PLUS_DEBT_INST_NOPELL_MD,PLUS_DEBT_ALL_NOPELL_N,PLUS_DEBT_ALL_NOPELL_MD,PLUS_DEBT_INST_STAFFTHIS_N,PLUS_DEBT_INST_STAFFTHIS_MD,PLUS_DEBT_ALL_STAFFTHIS_N,PLUS_DEBT_ALL_STAFFTHIS_MD,PLUS_DEBT_INST_NOSTAFFTHIS_N,PLUS_DEBT_INST_NOSTAFFTHIS_MD,PLUS_DEBT_ALL_NOSTAFFTHIS_N,PLUS_DEBT_ALL_NOSTAFFTHIS_MD,PLUS_DEBT_INST_STAFFANY_N,PLUS_DEBT_INST_STAFFANY_MD,PLUS_DEBT_ALL_STAFFANY_N,PLUS_DEBT_ALL_STAFFANY_MD,PLUS_DEBT_INST_NOSTAFFANY_N,PLUS_DEBT_INST_NOSTAFFANY_MD,PLUS_DEBT_ALL_NOSTAFFANY_N,PLUS_DEBT_ALL_NOSTAFFANY_MD,LPSTAFFORD_CNT,LPSTAFFORD_AMT,LPPPLUS_CNT,LPPPLUS_AMT,LPGPLUS_CNT,LPGPLUS_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,www.aamu.edu/,www.aamu.edu/admissions-aid/tuition-fees/net-p...,3.0,0,1,1,3,4,1,1,5,12.0,,34.783368,-86.568502,18.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8986,0.8986,430.0,520.0,420.0,510.0,370.0,457.0,475.0,465.0,414.0,16.0,19.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,957.0,957.0,0.0,4990.0,,0.0186,0.912,0.0088,0.0018,0.0022,0.0016,0.0118,0.007,0.0361,,,,,,,,,,,,,0.0587,,1,14444.0,,,,13893.0,13976.0,15995.0,18957.0,17140.0,,,,,,,,,,,,,,,,13913.0,,,,14684.0,,18281.0,,,,,,592.0,,,,375.0,113.0,61.0,27.0,16.0,,,,,,,,,,,,,,,,22489.0,,9744.0,18354.0,,7413.0,5384.0,7101.0,0.7411,0.7067,0.8987,0.6087,,1.0,,0.7503,0.0758,0.6020087884,0.0988700565,0.5691396726,0.9015873016,0.3658280922,0.1898932831,0.1051475204,0.0621468927,0.0408035154,0.2034134448,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0666666667,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0164220825,0.3494060098,0.6341719078,0.7291274325,0.5668549906,0.4579409918,0.3631512869,34779.085684,10340.346032,15500,33375,10250,15500,16000,14518,15000,19000,17500,10250,17500,14250,15000,16421,3606,1076,2530,2185,1034,387,3191,415,3162,444,2074,1532,2895,711,346.376038474076,3085,47750,32208,5500,3381,3186,2871,315,3186,2862,3186,0.8860640301,0.8527934714,20.283741368,,0.07999999821186,0.5640301318,0.0091023227,0.9011299435,0.003138732,0.3658280922,32362.826114,23553.0,10340.346032,,,46.8400001525878,47.9799995422363,1.48000001907348,3.78999996185302,13.0,6.8600001335144,94.7399978637695,49720.22,14.8800001144409,4.84000015258789,10.75,,,,,,,15500,33375,346.376038474076,AAMU,1,0.4076,0.5924,12/12/1965,5039.0,2.0,153.0,963.0,SACSCC,0.5978,,0.25,,2698.0,,44.0,,2.0,2.0,0.5978,,0.25,,1.0,1,,,,,,,,,,,,,0.7057,0.7143,5343.0,1165.0,1288.0,2.0,0.7083,0.7287,2698.0,20.0,25.0,20.0,30.0,2.0,1318,14838,1573,13840,399,17396,187.073011318144,17396,187.073011318144,513,16106,173.200616250289,16106,173.200616250289,919,13628,1060,12978,569,15000,650,14275,749,14608,923,13489,1115,13563,1323,12859,203,17628,250,17175,1276,14985,1475,14288,42,12448,98,9451,1277,14970,1527,14000,41,12688,46,11067,31374,922456254,5201,113949554,1004,15578483,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,https://www.uab.edu,https://uab.studentaidcalculator.com/survey.aspx,3.0,0,1,1,3,4,1,1,5,12.0,,33.505697,-86.799345,15.0,9.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9211,0.9211,490.0,620.0,490.0,620.0,,,555.0,555.0,,21.0,29.0,22.0,31.0,19.0,26.0,,,25.0,27.0,23.0,,1220.0,1220.0,0.0,13186.0,,0.5717,0.2553,0.0334,0.0633,0.0034,0.0002,0.0457,0.0213,0.0058,,,,,,,,,,,,,0.2425,,1,17005.0,,,,14550.0,15379.0,17892.0,19978.0,20110.0,,,,,,,,,,,,,,,,14830.0,,,,16587.0,,20050.0,,,,,,1229.0,,,,421.0,214.0,198.0,180.0,216.0,,,,,,,,,,,,,,,,24347.0,,8568.0,19704.0,,13177.0,16454.0,10717.0,0.7766,0.3632,0.6009,0.8186,,0.4648,,0.5127,0.2296,0.4276131917,0.3214086082,0.3487095003,0.5942028986,0.341223671,0.1798024967,0.1423514067,0.114589156,0.1356437488,0.1699615596,0.1537616694,0.142778693,0.1847885777,0.2005797101,0.1182608696,0.0550724638,0.031884058,0.0222668004,0.3189568706,0.658776329,0.5135084777,0.2634618968,0.1652692379,0.1076951742,61110.800384,30607.18029,15000,22500,9500,16226,15250,14000,15000,16000,17500,12500,15000,15000,15104,15000,7504,3730,3774,3168,2281,2055,5123,2381,4714,2790,4804,2700,5286,2218,233.511936049938,6302,37540,26082,6250,3500,5367,3642,1725,5367,4985,5367,0.8574622694,0.6249301286,23.60797466,,0.25999999046325,0.6390907397,0.1050866406,0.6785913918,0.0031675051,0.341223671,51306.674306,34489.0,30607.18029,,,69.0199966430664,27.7600002288818,1.10000002384185,2.02999997138977,15.9300003051757,8.55000019073486,96.5,55735.22,10.9099998474121,3.45000004768371,10.8599996566772,,,,,,,15000,22500,233.511936049938,,1,0.393,0.607,12/1/1965,13134.0,2.0,650.0,8087.0,SACSCC,0.8303,,0.4514,,4130.0,,144.0,,2.0,2.0,0.8303,,0.4514,,1.0,1,,,,,,,,,,,,,0.3788,0.535,14445.0,10498.0,2228.0,2.0,0.3891,0.5414,4176.0,5.0,10.0,5.0,10.0,2.0,1090,16145,2175,15235,578,19870,213.677899223472,19870,213.677899223472,1125,16954,182.319834093344,16954,182.319834093344,512,13978,1050,14458,362,15247,712,15000,728,16944,1463,15859,647,13892,1247,12373,443,20084,928,21617,1071,16307,1811,15076,19,12000,364,16617,1079,PrivacySuppressed,2153,15200,11,PrivacySuppressed,22,18300,56997,1720042015,3727,87421879,3461,134126588,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,www.amridgeuniversity.edu,www2.amridgeuniversity.edu:9091/,3.0,0,1,1,3,4,2,1,5,12.0,,32.362609,-86.17401,20.0,5.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,74.0,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,351.0,,0.2393,0.7151,0.0171,0.0057,0.0057,0.0,0.0,0.0,0.0171,,,,,,,,,,,,,0.5014,,1,,15322.0,,,,,,,,15322.0,,,,,,,,,,,,,,,,15322.0,,,,,,,,,,,,5.0,,,,,,,,5.0,0.0,0.0,0.0,0.0,,,,,,,,,,,17680.0,,6900.0,6900.0,,14273.0,4206.0,4292.0,1.0,0.7673,0.0035,,,,,0.8962,0.8302,0.7736486486,0.8952702703,PrivacySuppressed,PrivacySuppressed,0.5125,0.1148648649,0.0641891892,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.05,0.4625,0.4875,0.5945945946,0.3378378378,0.2432432432,0.1587837838,25211.032258,20596.158491,10500,27334,9500,9500,19000,25000,7646,12038,9500,15509,9500,17025,11500,9500,514,92,422,397,91,26,60,454,464,50,327,187,458,56,283.680678221734,398,38455,24250,4750,3166,296,31,265,296,240,296,0.9560810811,0.8648648649,33.672297297,,0.82999998331069,0.6486486486,0.2364864865,0.1047297297,0.0405405405,0.5125,21079.472973,15033.5,20596.158491,,,70.8799972534179,22.5300006866455,1.28999996185302,6.94000005722046,13.2299995422363,7.01000022888183,94.0899963378906,53683.7,10.6499996185302,3.59999990463256,10.8400001525878,,,,,,,10500,27334,283.680678221734,Southern Christian University Regions University,1,0.3191,0.6809,3/26/1987,318.0,1.0,,404.0,SACSCC,0.2143,,0.1429,,14.0,,14.0,,4.0,4.0,PrivacySuppressed,,PrivacySuppressed,,2.0,1,,,,,,,,,,,,,1.0,1.0,440.0,527.0,5.0,4.0,PrivacySuppressed,PrivacySuppressed,24.0,0.0,5.0,0.0,5.0,2.0,PrivacySuppressed,PrivacySuppressed,88,5599,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,29,5730,61.6192432083794,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,59,5597,PrivacySuppressed,PrivacySuppressed,24,5798,PrivacySuppressed,PrivacySuppressed,64,5367,PrivacySuppressed,PrivacySuppressed,74,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,14,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,78,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,10,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,4463,174222020,16,309618,298,16290781,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,www.uah.edu,finaid.uah.edu/,3.0,0,1,1,3,4,1,1,5,12.0,,34.724557,-86.640449,16.0,15.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8087,0.8087,560.0,700.0,450.0,680.0,,,630.0,565.0,,25.0,31.0,25.0,34.0,24.0,30.0,,,28.0,30.0,27.0,,1314.0,1314.0,0.0,7458.0,,0.7167,0.0969,0.0528,0.0381,0.0095,0.0008,0.0296,0.0223,0.0333,,,,,,,,,,,,,0.1443,,1,20909.0,,,,17561.0,18991.0,21396.0,23204.0,23406.0,,,,,,,,,,,,,,,,18147.0,,,,20356.0,,23315.0,,,,,,585.0,,,,134.0,93.0,122.0,107.0,129.0,,,,,,,,,,,,,,,,23441.0,,10714.0,22362.0,,8677.0,9242.0,9442.0,0.6544,0.2698,0.6176,0.8288,,0.0909,,0.4192,0.1842,0.374633738,0.2515696944,0.26901566,0.6888519135,0.3101321586,0.1377145249,0.1469233989,0.1506906656,0.1900376727,0.1448545861,0.1605145414,0.1817673378,0.2438478747,0.1164725458,0.1064891847,0.0582362729,0.0299500832,0.0198237885,0.29030837,0.6898678414,0.5290916702,0.2737547091,0.1573880285,0.1025533696,72240.892617,27941.821963,14476,21607,9000,16250,14750,12500,12750,18569,17014,11899,15250,13333,14943,13102,3021,1374,1647,1168,827,1026,2067,954,1808,1213,1375,1646,1997,1024,224.244106765823,2626,36250,26750,5500,3472,2389,1788,601,2389,2270,2389,0.8652155714,0.5571368774,22.727919632,,0.28999999165534,0.4763499372,0.1004604437,0.7484303056,PrivacySuppressed,0.3101321586,61096.588949,44787.0,27941.821963,,,76.3799972534179,18.9799995422363,1.41999995708465,2.54999995231628,17.6700000762939,8.90999984741211,95.2699966430664,58688.62,9.36999988555908,3.64000010490417,10.9300003051757,,,,,,,14476,21607,224.244106765823,UAH University of Alabama Huntsville,1,0.5796,0.4204,12/1/1965,7090.0,2.0,213.0,2065.0,SACSCC,0.8269,,0.35,,2531.0,,40.0,,2.0,4.0,0.8269,,0.35,,1.0,1,,,,,,,,,,,,,0.2707,0.4556,8145.0,2443.0,1341.0,2.0,0.2378,0.4402,2544.0,0.0,10.0,0.0,10.0,2.0,386,13524,655,14577,151,17030,183.137122484939,17030,183.137122484939,233,16550,177.975301064341,16550,177.975301064341,235,12000,422,13538,206,11500,323,13441,180,15937,332,15227,225,12033,385,12139,161,16268,270,17311,369,PrivacySuppressed,533,14383,17,PrivacySuppressed,122,15178,373,PrivacySuppressed,640,PrivacySuppressed,13,PrivacySuppressed,15,PrivacySuppressed,19702,407184805,1397,29789762,144,2377759,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,www.alasu.edu,www.alasu.edu/cost-aid/tuition-costs/net-price...,3.0,0,1,1,3,4,1,1,5,12.0,,32.364317,-86.295677,19.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9774,0.9774,440.0,520.0,420.0,510.0,,,480.0,465.0,,16.0,20.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,972.0,972.0,0.0,3903.0,,0.0167,0.9352,0.0095,0.0041,0.0013,0.0005,0.0102,0.0102,0.0123,,,,,,,,,,,,,0.0666,,1,13043.0,,,,11344.0,14855.0,18390.0,18863.0,14833.0,,,,,,,,,,,,,,,,12113.0,,,,16104.0,,17819.0,,,,,,523.0,,,,346.0,97.0,53.0,20.0,7.0,,,,,,,,,,,,,,,,21476.0,,11068.0,19396.0,,10160.0,8527.0,7754.0,0.5826,0.7448,0.865,0.5868,,0.125,,0.7845,0.0848,0.6146166134,0.107428115,0.5776286353,0.9219330855,0.3434343434,0.178514377,0.1126198083,0.052715655,0.0415335463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0188246097,0.3246097337,0.6565656566,0.6625399361,0.4972044728,0.3841853035,0.2903354633,34468.571812,8551.802974,18679,32000,11161,18750,18500,18246,17500,23925,19056,12000,19500,15525,19000,17500,3609,1149,2460,2299,965,345,3162,447,3237,372,2276,1333,2899,710,332.105864604357,3486,45000,32263,5784,3500,2504,2235,269,2504,2178,2504,0.8889776358,0.874600639,20.130990415,,0.10999999940395,0.6134185304,0.0079872204,0.892571885,PrivacySuppressed,0.3434343434,31684.382188,22080.5,8551.802974,,,42.6899986267089,52.3199996948242,1.40999996662139,4.09000015258789,11.8100004196167,6.76000022888183,94.5299987792968,46065.2,16.9599990844726,4.80999994277954,10.6700000762939,,,,,,,18679,32000,332.105864604357,,1,0.371,0.629,12/1/1965,4208.0,2.0,,510.0,SACSCC,0.5898,,0.25,,2094.0,,36.0,,2.0,2.0,0.5898,,0.25,,1.0,1,,,,,,,,,,,,,0.7792,0.7539,4732.0,642.0,951.0,2.0,0.7684,0.7464,2094.0,20.0,25.0,20.0,25.0,2.0,1362,15351,1486,15351,463,18918,203.440286739288,18918,203.440286739288,499,18952,203.80591575658,18952,203.80591575658,899,14078,987,14136,500,15212,548,15351,862,15505,938,15360,1183,14851,1289,14787,179,21686,197,21686,1335,15408,1430,15424,27,13000,56,12698,1335,15408,1456,15403,27,13000,30,12466,34246,947070736,4602,95359062,587,12174367,1005
5,100751,105100,1051,The University of Alabama,Tuscaloosa,AL,35487-0100,Southern Association of Colleges and Schools C...,www.ua.edu/,financialaid.ua.edu/net-price-calculator/,3.0,0,1,1,3,4,1,1,5,12.0,,33.211875,-87.545978,15.0,14.0,16.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.5906,0.5906,540.0,640.0,520.0,640.0,480.0,600.0,590.0,580.0,540.0,23.0,31.0,23.0,34.0,21.0,29.0,7.0,8.0,27.0,29.0,25.0,8.0,1252.0,1252.0,0.0,32177.0,,0.7774,0.0999,0.0499,0.0116,0.0035,0.001,0.0338,0.0183,0.0045,,,,,,,,,,,,,0.0836,,1,22232.0,,,,18515.0,20541.0,22457.0,24789.0,25199.0,,,,,,,,,,,,,,,,19212.0,,,,21592.0,,25065.0,,,,,,1267.0,,,,339.0,178.0,216.0,175.0,359.0,,,,,,,,,,,,,,,,29424.0,,10780.0,29230.0,,14198.0,10770.0,10225.0,0.7454,0.1802,0.807,0.8788,,0.6364,,0.3863,0.0725,0.261546724,0.1429645542,0.2037849355,0.6078136739,0.2257126887,0.1279269603,0.1374865736,0.1316863588,0.3413533835,0.1245770147,0.1376112295,0.1414964281,0.3925303923,0.1480090158,0.1367392938,0.0728775357,0.0345604808,0.0081609838,0.2175517049,0.7742873113,0.5377013963,0.3714285714,0.2766917293,0.2022556391,101976.77516,31119.872276,17500,23250,9500,17750,17750,17250,17500,15845,19500,15000,18500,16000,18000,16750,11447,6542,4905,2961,2958,5528,9733,1714,5520,5927,6713,4734,6580,4867,241.295667251603,10443,34000,27000,7439,4500,9310,7979,1331,9310,8945,9310,0.9107411386,0.4526315789,21.137701396,,0.10000000149011,0.6152524168,0.0537056928,0.8570354458,0.0039742213,0.2257126887,91846.749624,66733.5,31119.872276,,,75.3499984741211,21.0599994659423,1.20000004768371,2.41000008583068,16.4799995422363,9.21000003814697,96.0800018310547,57928.41,10.0500001907348,3.25999999046325,10.8999996185302,,,,,,,17500,23250,241.295667251603,,1,0.4443,0.5557,12/1/1965,33196.0,2.0,851.0,5362.0,SACSCC,0.8748,,0.6,,14921.0,,40.0,,2.0,2.0,0.8748,,0.6,,1.0,1,,,,,,,,,,,,,0.1656,0.4145,36237.0,6331.0,7351.0,2.0,0.1678,0.4094,14863.0,5.0,15.0,5.0,15.0,2.0,3068,41756,3730,36147,1747,55028,591.759810692967,55028,591.759810692967,2107,43707,470.016101729256,43707,470.016101729256,1321,33915,1623,27904,1150,36606,1399,31291,1918,44134,2331,38700,1405,36528,1807,27226,1663,45333,1923,43134,2984,42055,3431,38264,84,30692,299,17000,2992,41843,3650,36409,76,33072,80,31384,75084,1771875477,11535,619905869,2035,69504249,1051
6,100760,100700,1007,Central Alabama Community College,Alexander City,AL,35010,Southern Association of Colleges and Schools C...,www.cacc.edu,https://www.cacc.edu/net-price-calculator/,2.0,0,1,1,1,2,1,1,5,32.0,,32.92478,-85.945266,2.0,2.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,1211.0,,0.725,0.2337,0.0239,0.0041,0.0041,0.0,0.0058,0.0017,0.0017,,,,,,,,,,,,,0.3922,,1,3254.0,,,,2228.0,2904.0,5456.0,8063.0,7501.0,,,,,,,,,,,,,,,,2421.0,,,,3732.0,,7849.0,,,,,,228.0,,,,130.0,52.0,25.0,13.0,8.0,,,,,,,,,,,,,,,,8824.0,,4740.0,8610.0,,1771.0,6801.0,6291.0,0.3966,0.4381,0.6969,,0.5473,,0.3409,0.2104,0.1777,0.6074766355,0.3056074766,0.5235531629,0.7981651376,0.5496760259,0.1757009346,0.114953271,0.0654205607,0.0364485981,0.199192463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.122324159,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0496760259,0.5,0.4503239741,0.4439252336,0.2429906542,0.1682242991,0.1130841121,36871.779273,16898.397554,7678,12500,6027,8000,7544,6256,5699,12500,8000,5625,9000,5500,7750,6500,612,145,467,318,182,112,376,236,472,140,423,189,543,69,129.728853361077,851,27362,13500,3250,1750,1070,743,327,1070,926,1070,0.408411215,0.8691588785,23.071028037,,0.41999998688697,0.6037383178,0.0962616822,0.6943925234,PrivacySuppressed,0.5496760259,30767.764486,22217.0,16898.397554,,,71.5100021362304,26.8999996185302,0.2199999988079,1.00999999046325,7.96999979019165,4.55000019073486,98.8499984741211,43985.14,13.5500001907348,3.75999999046325,10.6800003051757,,,,,,,7678,12500,129.728853361077,,2,0.4154,0.5846,2/14/1969,1835.0,1.0,470.0,,SACSCC,,0.5893,,0.3695,,689.0,,92.0,2.0,2.0,,0.5893,,0.3695,1.0,1,,,,,,,,,,,,,0.5817,0.1748,2417.0,,349.0,2.0,0.5893,0.2076,689.0,0.0,5.0,0.0,5.0,2.0,PrivacySuppressed,PrivacySuppressed,38,6000,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,14,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,24,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,20,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,18,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,5297,68476891,14,96386,PrivacySuppressed,PrivacySuppressed,1007
7,100812,100800,1008,Athens State University,Athens,AL,35611,Southern Association of Colleges and Schools C...,www.athens.edu,www.athens.edu/financial-aid/net-price-calcula...,3.0,0,1,1,3,4,1,1,5,31.0,,34.806793,-86.964698,22.0,5.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,2732.0,,0.7657,0.127,0.0311,0.0073,0.0143,0.0011,0.0212,0.0,0.0322,,,,,,,,,,,,,0.5593,,1,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,6817.0,7988.0,8538.0,0.4601,0.4223,,,,,,0.5079,0.6377,0.4928385417,0.7213541667,0.3107476636,0.5631768953,0.4774964838,0.203125,0.1569010417,0.1009114583,0.0462239583,0.2079439252,0.1845794393,0.1565420561,0.1401869159,0.2012635379,0.1462093863,0.0794223827,0.0099277978,0.047116737,0.4303797468,0.5225035162,0.5826822917,0.1875,0.07421875,0.0403645833,56488.670561,31522.732852,13750,19500,10833,15250,13750,12500,11000,16666,15813,11750,14939,12500,14372,12501,1907,882,1025,909,667,331,532,1375,1359,548,1342,565,1540,367,202.37701124328,1786,34231,25000,6341,3500,1536,428,1108,1536,1422,1536,0.81640625,0.720703125,30.384765625,,0.61000001430511,0.705078125,0.361328125,0.2786458333,PrivacySuppressed,0.4774964838,38479.38737,29645.5,31522.732852,,,83.8899993896484,12.2600002288818,0.64999997615814,2.40000009536743,11.8900003433227,6.17000007629394,96.9599990844726,50752.1,10.4399995803833,3.38000011444091,10.8000001907348,,,,,,,13750,19500,202.37701124328,,1,0.3086,0.6914,12/1/1965,2967.0,,153.0,159.0,SACSCC,,,,,,,,,,,,,,,1.0,1,,,,,,,,,,,,,,,3947.0,165.0,0.0,4.0,,,0.0,0.0,5.0,0.0,5.0,2.0,56,8098,273,11625,38,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,109,10021,107.763775949593,10021,107.763775949593,18,PrivacySuppressed,164,12795,20,8070,93,13128,36,8098,180,11072,28,6897,170,10010,28,8673,103,13729,PrivacySuppressed,PrivacySuppressed,179,9325,PrivacySuppressed,PrivacySuppressed,94,15500,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,12034,234452111,171,1713456,PrivacySuppressed,PrivacySuppressed,1008
8,100830,831000,8310,Auburn University at Montgomery,Montgomery,AL,36117-3596,Southern Association of Colleges and Schools C...,www.aum.edu,www.aum.edu/current-students/financial-informa...,3.0,0,1,1,3,4,1,1,5,12.0,,32.36736,-86.177544,18.0,9.0,13.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9281,0.9281,510.0,570.0,480.0,570.0,,,540.0,525.0,,19.0,23.0,18.0,24.0,16.0,22.0,,,21.0,21.0,19.0,,1084.0,1084.0,0.0,4529.0,,0.452,0.4131,0.0117,0.0221,0.004,0.0007,0.0393,0.0488,0.0084,,,,,,,,,,,,,0.2168,,1,12680.0,,,,10877.0,12321.0,14734.0,15871.0,15341.0,,,,,,,,,,,,,,,,11257.0,,,,13318.0,,15642.0,,,,,,415.0,,,,199.0,71.0,50.0,54.0,41.0,,,,,,,,,,,,,,,,18291.0,,8404.0,17812.0,,7582.0,6289.0,7678.0,0.9655,0.4584,0.5739,0.6699,,0.6,,0.5539,0.2244,0.4892262488,0.2272282076,0.4283903676,0.6961206897,0.38189609,0.1885406464,0.1307541626,0.110675808,0.0808031342,0.2015209125,0.1432192649,0.1292775665,0.0975918885,0.1443965517,0.088362069,0.0474137931,0.0237068966,0.0230316015,0.3588644885,0.61810391,0.5710088149,0.3506366308,0.2277179236,0.152301665,46985.570342,24991.892241,12250,24826,7514,11802,12500,12235,11189,13838,13000,11000,12982,10440,12375,12000,2776,996,1780,1485,813,478,2042,734,2098,678,1951,825,2183,593,257.651881083368,2522,37250,23500,5500,2750,2042,1578,464,2042,1867,2042,0.8932419197,0.7257590597,22.199804114,,0.31999999284744,0.6929480901,0.0729676787,0.7727717924,0.0048971596,0.38189609,41987.986288,29671.5,24991.892241,,,59.9700012207031,37.2099990844726,0.91000002622604,1.62000000476837,14.7200002670288,9.09000015258789,96.8499984741211,50723.81,13.0,3.78999996185302,10.7799997329711,,,,,,,12250,24826,257.651881083368,AUM||Auburn University at Montgomery|Auburn Mo...,1,0.348,0.652,1/1/1968,4313.0,2.0,103.0,579.0,SACSCC,0.676,,0.5166,,1185.0,,60.0,,2.0,2.0,0.676,,0.5166,,1.0,1,,,,,,,,,,,,,0.5183,0.5518,5246.0,787.0,627.0,2.0,0.524,0.5966,1185.0,0.0,10.0,5.0,10.0,2.0,379,7998,643,9765,140,8567,92.1277585630342,8567,92.1277585630342,253,11000,118.291740888686,11000,118.291740888686,239,7500,390,9000,117,8000,175,9424,262,7605,468,9963,307,7500,500,8233,72,10000,143,14900,PrivacySuppressed,PrivacySuppressed,568,9475,PrivacySuppressed,PrivacySuppressed,75,10966,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,23340,493759303,1289,16701421,165,1883514,8310
9,100858,100900,1009,Auburn University,Auburn,AL,36849,Southern Association of Colleges and Schools C...,www.auburn.edu,https://www.auburn.edu/admissions/costcalc/fre...,3.0,0,1,1,3,4,1,1,5,13.0,,32.599378,-85.488258,15.0,14.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.7543,0.7543,580.0,650.0,570.0,660.0,520.0,620.0,615.0,615.0,570.0,25.0,30.0,25.0,33.0,23.0,28.0,7.0,8.0,28.0,29.0,26.0,8.0,1289.0,1289.0,0.0,24147.0,,0.8078,0.055,0.0342,0.0236,0.0038,0.0005,0.0225,0.049,0.0036,,,,,,,,,,,,,0.0791,,1,23696.0,,,,18617.0,20546.0,23110.0,26329.0,27395.0,,,,,,,,,,,,,,,,19348.0,,,,21872.0,,27016.0,,,,,,1140.0,,,,254.0,155.0,166.0,201.0,364.0,,,,,,,,,,,,,,,,31282.0,,11276.0,30524.0,,15908.0,11058.0,10428.0,0.8553,0.1537,0.7973,0.8999,,0.7458,,0.3169,0.0377,0.2520373683,0.0858676208,0.2028701892,0.775462963,0.1726471191,0.1208507255,0.129397734,0.1530510833,0.3446630888,0.1213307241,0.1358991085,PrivacySuppressed,PrivacySuppressed,0.1157407407,0.0601851852,PrivacySuppressed,PrivacySuppressed,0.0065614107,0.1660857084,0.8273528809,0.4514013119,0.2790697674,0.1868415822,0.1297952693,98805.666232,21278.891204,17014,21281,8250,17750,17750,16250,16849,18581,19000,15000,17750,16250,16750,17500,6671,4322,2349,1467,1661,3543,6037,634,3007,3664,3392,3279,3248,3423,220.860778270166,5807,33474,26000,7500,4500,5031,4599,432,5031,4877,5031,0.887696283,0.4362949712,20.516795866,,0.07000000029802,0.531504671,0.0222619758,0.9141323792,0.0023852117,0.1726471191,92148.626516,72031.0,21278.891204,,,75.9000015258789,19.7999992370605,1.64999997615814,2.89000010490417,17.9300003051757,10.8199996948242,94.9199981689453,59005.4,9.59000015258789,3.14000010490417,10.8999996185302,,,,,,,17014,21281,220.860778270166,,1,0.5115,0.4885,9/8/1987,23964.0,2.0,481.0,5812.0,SACSCC,0.9073,,0.7959,,9245.0,,98.0,,2.0,2.0,0.9073,,0.7959,,1.0,1,,,,,,,,,,,,,0.1409,0.3039,25195.0,6650.0,4771.0,2.0,0.1343,0.3134,9258.0,5.0,10.0,5.0,10.0,2.0,1571,38301,1985,32236,1052,46902,504.374475560106,46902,504.374475560106,1308,38924,418.58070203193,38924,418.58070203193,519,26842,677,24642,734,35973,925,29933,837,41754,1060,33884,691,32100,890,26286,880,43764,1095,37994,1517,38642,1783,34082,54,34035,202,21459,1522,38580,1932,32168,49,36506,53,32255,48346,1258831243,6151,307762305,1968,82412571,1009


In [31]:
# Get info
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6806 entries, 0 to 6805
Columns: 375 entries, UNITID to FEDSCHCD
dtypes: float64(196), int64(14), object(165)
memory usage: 19.5+ MB


# 03. Data cleaning and consistency checks

## 01. Dropping columns

In [32]:
# In order to remove columns having to do with PLUS loans, create list of just columns with PLUS
plus_col = [col for col in df if 'PLUS' in col]

In [33]:
# Check output
plus_col

['PPLUS_PCT_LOW',
 'PPLUS_PCT_HIGH',
 'PPLUS_PCT_LOW_POOLED_SUPP',
 'PPLUS_PCT_HIGH_POOLED_SUPP',
 'POOLYRS_PLUSPCT',
 'PLUS_DEBT_INST_N',
 'PLUS_DEBT_INST_MD',
 'PLUS_DEBT_ALL_N',
 'PLUS_DEBT_ALL_MD',
 'PLUS_DEBT_INST_COMP_N',
 'PLUS_DEBT_INST_COMP_MD',
 'PLUS_DEBT_INST_COMP_MDPAY10',
 'PLUS_DEBT_INST_COMP_MD_SUPP',
 'PLUS_DEBT_INST_COMP_MDPAY10_SUPP',
 'PLUS_DEBT_ALL_COMP_N',
 'PLUS_DEBT_ALL_COMP_MD',
 'PLUS_DEBT_ALL_COMP_MDPAY10',
 'PLUS_DEBT_ALL_COMP_MD_SUPP',
 'PLUS_DEBT_ALL_COMP_MDPAY10_SUPP',
 'PLUS_DEBT_INST_NOCOMP_N',
 'PLUS_DEBT_INST_NOCOMP_MD',
 'PLUS_DEBT_ALL_NOCOMP_N',
 'PLUS_DEBT_ALL_NOCOMP_MD',
 'PLUS_DEBT_INST_MALE_N',
 'PLUS_DEBT_INST_MALE_MD',
 'PLUS_DEBT_ALL_MALE_N',
 'PLUS_DEBT_ALL_MALE_MD',
 'PLUS_DEBT_INST_NOMALE_N',
 'PLUS_DEBT_INST_NOMALE_MD',
 'PLUS_DEBT_ALL_NOMALE_N',
 'PLUS_DEBT_ALL_NOMALE_MD',
 'PLUS_DEBT_INST_PELL_N',
 'PLUS_DEBT_INST_PELL_MD',
 'PLUS_DEBT_ALL_PELL_N',
 'PLUS_DEBT_ALL_PELL_MD',
 'PLUS_DEBT_INST_NOPELL_N',
 'PLUS_DEBT_INST_NOPELL_MD',
 'PLUS

In [34]:
# Drop columns from dataframe that are in list
df.drop(columns = plus_col, inplace = True)

In [35]:
# Check new dataframe
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6806 entries, 0 to 6805
Columns: 316 entries, UNITID to FEDSCHCD
dtypes: float64(191), int64(14), object(111)
memory usage: 16.4+ MB


In [36]:
# Drop URL columns - INSTURL and NPCURL
df = df.drop(columns = ['INSTURL', 'NPCURL'])

In [37]:
# Check output
df.head()

Unnamed: 0,UNITID,OPEID,OPEID6,INSTNM,CITY,STABBR,ZIP,ACCREDAGENCY,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UG,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,UGDS_WHITENH,UGDS_BLACKNH,UGDS_API,UGDS_AIANOLD,UGDS_HISPOLD,UG_NRA,UG_UNKN,UG_WHITENH,UG_BLACKNH,UG_API,UG_AIANOLD,UG_HISPOLD,PPTUG_EF,PPTUG_EF2,CURROPER,NPT4_PUB,NPT4_PRIV,NPT4_PROG,NPT4_OTHER,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT41_PROG,NPT42_PROG,NPT43_PROG,NPT44_PROG,NPT45_PROG,NPT41_OTHER,NPT42_OTHER,NPT43_OTHER,NPT44_OTHER,NPT45_OTHER,NPT4_048_PUB,NPT4_048_PRIV,NPT4_048_PROG,NPT4_048_OTHER,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NPT4_3075_PROG,NPT4_3075_OTHER,NPT4_75UP_PROG,NPT4_75UP_OTHER,NUM4_PUB,NUM4_PRIV,NUM4_PROG,NUM4_OTHER,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,NUM41_PROG,NUM42_PROG,NUM43_PROG,NUM44_PROG,NUM45_PROG,NUM41_OTHER,NUM42_OTHER,NUM43_OTHER,NUM44_OTHER,NUM45_OTHER,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGE_ENTRY_SQ,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,LNFAMINC,LNFAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,FSEND_COUNT,FSEND_1,FSEND_2,FSEND_3,FSEND_4,FSEND_5,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.783368,-86.568502,18.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8986,0.8986,430.0,520.0,420.0,510.0,370.0,457.0,475.0,465.0,414.0,16.0,19.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,957.0,957.0,0.0,4990.0,,0.0186,0.912,0.0088,0.0018,0.0022,0.0016,0.0118,0.007,0.0361,,,,,,,,,,,,,0.0587,,1,14444.0,,,,13893.0,13976.0,15995.0,18957.0,17140.0,,,,,,,,,,,,,,,,13913.0,,,,14684.0,,18281.0,,,,,,592.0,,,,375.0,113.0,61.0,27.0,16.0,,,,,,,,,,,,,,,,22489.0,,9744.0,18354.0,,7413.0,5384.0,7101.0,0.7411,0.7067,0.8987,0.6087,,1.0,,0.7503,0.0758,0.6020087884,0.0988700565,0.5691396726,0.9015873016,0.3658280922,0.1898932831,0.1051475204,0.0621468927,0.0408035154,0.2034134448,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0666666667,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0164220825,0.3494060098,0.6341719078,0.7291274325,0.5668549906,0.4579409918,0.3631512869,34779.085684,10340.346032,15500,33375,10250,15500,16000,14518,15000,19000,17500,10250,17500,14250,15000,16421,3606,1076,2530,2185,1034,387,3191,415,3162,444,2074,1532,2895,711,346.376038474076,3085,47750,32208,5500,3381,3186,2871,315,3186,2862,3186,0.8860640301,0.8527934714,20.283741368,,0.07999999821186,0.5640301318,0.0091023227,0.9011299435,0.003138732,0.3658280922,32362.826114,23553.0,10340.346032,,,46.8400001525878,47.9799995422363,1.48000001907348,3.78999996185302,13.0,6.8600001335144,94.7399978637695,49720.22,14.8800001144409,4.84000015258789,10.75,,,,,,,15500,33375,346.376038474076,AAMU,1,0.4076,0.5924,12/12/1965,5039.0,2.0,153.0,963.0,SACSCC,0.5978,,0.25,,2698.0,,44.0,,2.0,2.0,0.5978,,0.25,,1.0,1,,,,,,,,,,,,,0.7057,0.7143,5343.0,1165.0,1288.0,2.0,0.7083,0.7287,2698.0,31374,922456254,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,33.505697,-86.799345,15.0,9.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9211,0.9211,490.0,620.0,490.0,620.0,,,555.0,555.0,,21.0,29.0,22.0,31.0,19.0,26.0,,,25.0,27.0,23.0,,1220.0,1220.0,0.0,13186.0,,0.5717,0.2553,0.0334,0.0633,0.0034,0.0002,0.0457,0.0213,0.0058,,,,,,,,,,,,,0.2425,,1,17005.0,,,,14550.0,15379.0,17892.0,19978.0,20110.0,,,,,,,,,,,,,,,,14830.0,,,,16587.0,,20050.0,,,,,,1229.0,,,,421.0,214.0,198.0,180.0,216.0,,,,,,,,,,,,,,,,24347.0,,8568.0,19704.0,,13177.0,16454.0,10717.0,0.7766,0.3632,0.6009,0.8186,,0.4648,,0.5127,0.2296,0.4276131917,0.3214086082,0.3487095003,0.5942028986,0.341223671,0.1798024967,0.1423514067,0.114589156,0.1356437488,0.1699615596,0.1537616694,0.142778693,0.1847885777,0.2005797101,0.1182608696,0.0550724638,0.031884058,0.0222668004,0.3189568706,0.658776329,0.5135084777,0.2634618968,0.1652692379,0.1076951742,61110.800384,30607.18029,15000,22500,9500,16226,15250,14000,15000,16000,17500,12500,15000,15000,15104,15000,7504,3730,3774,3168,2281,2055,5123,2381,4714,2790,4804,2700,5286,2218,233.511936049938,6302,37540,26082,6250,3500,5367,3642,1725,5367,4985,5367,0.8574622694,0.6249301286,23.60797466,,0.25999999046325,0.6390907397,0.1050866406,0.6785913918,0.0031675051,0.341223671,51306.674306,34489.0,30607.18029,,,69.0199966430664,27.7600002288818,1.10000002384185,2.02999997138977,15.9300003051757,8.55000019073486,96.5,55735.22,10.9099998474121,3.45000004768371,10.8599996566772,,,,,,,15000,22500,233.511936049938,,1,0.393,0.607,12/1/1965,13134.0,2.0,650.0,8087.0,SACSCC,0.8303,,0.4514,,4130.0,,144.0,,2.0,2.0,0.8303,,0.4514,,1.0,1,,,,,,,,,,,,,0.3788,0.535,14445.0,10498.0,2228.0,2.0,0.3891,0.5414,4176.0,56997,1720042015,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,2,1,5,12.0,,32.362609,-86.17401,20.0,5.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,74.0,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,351.0,,0.2393,0.7151,0.0171,0.0057,0.0057,0.0,0.0,0.0,0.0171,,,,,,,,,,,,,0.5014,,1,,15322.0,,,,,,,,15322.0,,,,,,,,,,,,,,,,15322.0,,,,,,,,,,,,5.0,,,,,,,,5.0,0.0,0.0,0.0,0.0,,,,,,,,,,,17680.0,,6900.0,6900.0,,14273.0,4206.0,4292.0,1.0,0.7673,0.0035,,,,,0.8962,0.8302,0.7736486486,0.8952702703,PrivacySuppressed,PrivacySuppressed,0.5125,0.1148648649,0.0641891892,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.05,0.4625,0.4875,0.5945945946,0.3378378378,0.2432432432,0.1587837838,25211.032258,20596.158491,10500,27334,9500,9500,19000,25000,7646,12038,9500,15509,9500,17025,11500,9500,514,92,422,397,91,26,60,454,464,50,327,187,458,56,283.680678221734,398,38455,24250,4750,3166,296,31,265,296,240,296,0.9560810811,0.8648648649,33.672297297,,0.82999998331069,0.6486486486,0.2364864865,0.1047297297,0.0405405405,0.5125,21079.472973,15033.5,20596.158491,,,70.8799972534179,22.5300006866455,1.28999996185302,6.94000005722046,13.2299995422363,7.01000022888183,94.0899963378906,53683.7,10.6499996185302,3.59999990463256,10.8400001525878,,,,,,,10500,27334,283.680678221734,Southern Christian University Regions University,1,0.3191,0.6809,3/26/1987,318.0,1.0,,404.0,SACSCC,0.2143,,0.1429,,14.0,,14.0,,4.0,4.0,PrivacySuppressed,,PrivacySuppressed,,2.0,1,,,,,,,,,,,,,1.0,1.0,440.0,527.0,5.0,4.0,PrivacySuppressed,PrivacySuppressed,24.0,4463,174222020,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.724557,-86.640449,16.0,15.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8087,0.8087,560.0,700.0,450.0,680.0,,,630.0,565.0,,25.0,31.0,25.0,34.0,24.0,30.0,,,28.0,30.0,27.0,,1314.0,1314.0,0.0,7458.0,,0.7167,0.0969,0.0528,0.0381,0.0095,0.0008,0.0296,0.0223,0.0333,,,,,,,,,,,,,0.1443,,1,20909.0,,,,17561.0,18991.0,21396.0,23204.0,23406.0,,,,,,,,,,,,,,,,18147.0,,,,20356.0,,23315.0,,,,,,585.0,,,,134.0,93.0,122.0,107.0,129.0,,,,,,,,,,,,,,,,23441.0,,10714.0,22362.0,,8677.0,9242.0,9442.0,0.6544,0.2698,0.6176,0.8288,,0.0909,,0.4192,0.1842,0.374633738,0.2515696944,0.26901566,0.6888519135,0.3101321586,0.1377145249,0.1469233989,0.1506906656,0.1900376727,0.1448545861,0.1605145414,0.1817673378,0.2438478747,0.1164725458,0.1064891847,0.0582362729,0.0299500832,0.0198237885,0.29030837,0.6898678414,0.5290916702,0.2737547091,0.1573880285,0.1025533696,72240.892617,27941.821963,14476,21607,9000,16250,14750,12500,12750,18569,17014,11899,15250,13333,14943,13102,3021,1374,1647,1168,827,1026,2067,954,1808,1213,1375,1646,1997,1024,224.244106765823,2626,36250,26750,5500,3472,2389,1788,601,2389,2270,2389,0.8652155714,0.5571368774,22.727919632,,0.28999999165534,0.4763499372,0.1004604437,0.7484303056,PrivacySuppressed,0.3101321586,61096.588949,44787.0,27941.821963,,,76.3799972534179,18.9799995422363,1.41999995708465,2.54999995231628,17.6700000762939,8.90999984741211,95.2699966430664,58688.62,9.36999988555908,3.64000010490417,10.9300003051757,,,,,,,14476,21607,224.244106765823,UAH University of Alabama Huntsville,1,0.5796,0.4204,12/1/1965,7090.0,2.0,213.0,2065.0,SACSCC,0.8269,,0.35,,2531.0,,40.0,,2.0,4.0,0.8269,,0.35,,1.0,1,,,,,,,,,,,,,0.2707,0.4556,8145.0,2443.0,1341.0,2.0,0.2378,0.4402,2544.0,19702,407184805,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,32.364317,-86.295677,19.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9774,0.9774,440.0,520.0,420.0,510.0,,,480.0,465.0,,16.0,20.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,972.0,972.0,0.0,3903.0,,0.0167,0.9352,0.0095,0.0041,0.0013,0.0005,0.0102,0.0102,0.0123,,,,,,,,,,,,,0.0666,,1,13043.0,,,,11344.0,14855.0,18390.0,18863.0,14833.0,,,,,,,,,,,,,,,,12113.0,,,,16104.0,,17819.0,,,,,,523.0,,,,346.0,97.0,53.0,20.0,7.0,,,,,,,,,,,,,,,,21476.0,,11068.0,19396.0,,10160.0,8527.0,7754.0,0.5826,0.7448,0.865,0.5868,,0.125,,0.7845,0.0848,0.6146166134,0.107428115,0.5776286353,0.9219330855,0.3434343434,0.178514377,0.1126198083,0.052715655,0.0415335463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0188246097,0.3246097337,0.6565656566,0.6625399361,0.4972044728,0.3841853035,0.2903354633,34468.571812,8551.802974,18679,32000,11161,18750,18500,18246,17500,23925,19056,12000,19500,15525,19000,17500,3609,1149,2460,2299,965,345,3162,447,3237,372,2276,1333,2899,710,332.105864604357,3486,45000,32263,5784,3500,2504,2235,269,2504,2178,2504,0.8889776358,0.874600639,20.130990415,,0.10999999940395,0.6134185304,0.0079872204,0.892571885,PrivacySuppressed,0.3434343434,31684.382188,22080.5,8551.802974,,,42.6899986267089,52.3199996948242,1.40999996662139,4.09000015258789,11.8100004196167,6.76000022888183,94.5299987792968,46065.2,16.9599990844726,4.80999994277954,10.6700000762939,,,,,,,18679,32000,332.105864604357,,1,0.371,0.629,12/1/1965,4208.0,2.0,,510.0,SACSCC,0.5898,,0.25,,2094.0,,36.0,,2.0,2.0,0.5898,,0.25,,1.0,1,,,,,,,,,,,,,0.7792,0.7539,4732.0,642.0,951.0,2.0,0.7684,0.7464,2094.0,34246,947070736,1005


In [38]:
# Check new size
df.shape

(6806, 314)

In [39]:
# Get descriptive stats
df.describe()

Unnamed: 0,UNITID,OPEID,OPEID6,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UG,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,UGDS_WHITENH,UGDS_BLACKNH,UGDS_API,UGDS_AIANOLD,UGDS_HISPOLD,UG_NRA,UG_UNKN,UG_WHITENH,UG_BLACKNH,UG_API,UG_AIANOLD,UG_HISPOLD,PPTUG_EF,PPTUG_EF2,CURROPER,NPT4_PUB,NPT4_PRIV,NPT4_PROG,NPT4_OTHER,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT41_PROG,NPT42_PROG,NPT43_PROG,NPT44_PROG,NPT45_PROG,NPT41_OTHER,NPT42_OTHER,NPT43_OTHER,NPT44_OTHER,NPT45_OTHER,NPT4_048_PUB,NPT4_048_PRIV,NPT4_048_PROG,NPT4_048_OTHER,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NPT4_3075_PROG,NPT4_3075_OTHER,NPT4_75UP_PROG,NPT4_75UP_OTHER,NUM4_PUB,NUM4_PRIV,NUM4_PROG,NUM4_OTHER,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,NUM41_PROG,NUM42_PROG,NUM43_PROG,NUM44_PROG,NUM45_PROG,NUM41_OTHER,NUM42_OTHER,NUM43_OTHER,NUM44_OTHER,NUM45_OTHER,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,AGE_ENTRY_SQ,LNFAMINC,LNFAMINC_IND,FSEND_COUNT,FSEND_1,FSEND_2,FSEND_3,FSEND_4,FSEND_5,ICLEVEL,UGDS_MEN,UGDS_WOMEN,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,SCUGFFN_POOLED
count,6806.0,6806.0,6806.0,6524.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6331.0,0.0,6331.0,6331.0,6331.0,6331.0,6331.0,6323.0,6323.0,6323.0,6323.0,6323.0,6323.0,6323.0,6331.0,6331.0,911.0,2006.0,2242.0,1239.0,1239.0,1242.0,1242.0,732.0,732.0,1239.0,1242.0,732.0,1273.0,1273.0,1199.0,1199.0,1199.0,1199.0,325.0,325.0,1273.0,1199.0,1199.0,325.0,1298.0,1426.0,6331.0,6041.0,0.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6013.0,0.0,6806.0,1878.0,3727.0,0.0,0.0,1869.0,1795.0,1745.0,1559.0,1338.0,3661.0,2944.0,2669.0,2172.0,1814.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1875.0,3698.0,0.0,0.0,1818.0,3082.0,1587.0,2326.0,0.0,0.0,0.0,0.0,1878.0,3728.0,0.0,0.0,1878.0,1878.0,1878.0,1878.0,1878.0,3727.0,3727.0,3727.0,3727.0,3727.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3431.0,2175.0,3865.0,3621.0,2361.0,6304.0,6304.0,4012.0,3623.0,6014.0,5705.0,2098.0,3194.0,1309.0,1798.0,6014.0,5872.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6806.0,6041.0,6041.0,6014.0,5880.0,2867.0,2073.0,2201.0,3253.0,1615.0,1936.0,2418.0,3293.0,2001.0,2019.0,5711.0,4020.0,6425.0,6806.0,2403.0,1908.0,1513.0,1158.0,839.0,638.0,2403.0,1908.0,1513.0,1158.0,839.0,638.0,5740.0,5740.0,6030.0,2072.0,6024.0,6032.0,6032.0
mean,2126810.0,1784672.0,16671.262269,1.938228,0.007934,0.785336,3.523509,1.833823,2.222892,2.08757,29.032912,4.613135,19.884378,,37.374743,-90.314421,9.922287,3.684568,4.520771,0.015815,0.015973,0.005693,0.005535,0.025621,0.072908,0.004428,0.009635,0.005528,55.613611,0.678958,0.681198,516.617433,613.322034,510.353462,609.377617,463.353825,569.61612,565.009685,559.904992,516.523224,20.609584,25.958366,19.718098,26.309425,19.367807,25.386155,6.581538,8.390769,23.535742,23.264387,22.643036,7.698462,1141.174114,1147.656381,0.008214,2522.160735,,0.49179,0.179735,0.181379,0.037811,0.013504,0.004573,0.03077,0.021385,0.035911,,,,,,,,,,,,,0.228367,,0.950485,10010.15229,19153.949826,,,8192.315677,8887.431198,11253.812607,13787.00449,15273.18012,17300.208959,18373.194293,20440.384039,23315.191068,26398.55237,,,,,,,,,,,8435.453867,17485.478908,,,9982.357536,19155.016223,14193.072464,24612.271281,,,,,525.988818,141.060622,,,228.787007,92.435037,77.924388,57.394569,69.447817,60.220016,18.163671,17.48323,16.382345,28.848135,,,,,,,,,,,26956.896823,20229.456092,15476.787322,18906.769125,15733.626853,11099.011104,8477.335343,6858.799103,0.593839,0.471843,0.694014,0.727493,0.691617,0.453604,0.550197,0.462107,0.381475,,,,,,,,,,1.815898,0.352605,0.64425,2925.16445,1.354252,680.179281,1486.300531,0.718455,0.693193,0.463474,0.555272,1298.507031,447.711206,54.583208,380.435859,2.466468,3.178607,2.055409,1.035557,17189.837703,13769.241614,12338.627231,12947.160622,13358.454112,13505.871473,11579.242613,10311.824423,9341.637806,9267.105354,9177.20143,9241.785266,0.570178,0.526082,3788.561526,1886.294884,452.09595,2.306034,901.83687
std,7640544.0,2739965.0,14847.499904,0.900211,0.088726,0.410619,8.75141,1.070275,1.362394,0.835281,16.769898,2.179201,9.614376,,5.851418,17.979595,11.066478,5.808817,6.424307,0.12477,0.125382,0.075246,0.0742,0.158014,0.260007,0.066403,0.097692,0.074153,21.578581,0.217596,0.213015,65.9955,59.956409,70.706483,72.226097,82.233472,81.296986,61.946404,70.163575,80.596669,3.971297,3.725738,4.494545,4.438807,3.681928,3.615055,1.195528,0.921908,3.801546,4.376404,3.577571,1.034064,125.516704,125.000305,0.090263,5657.459316,,0.283737,0.217884,0.227826,0.079448,0.071663,0.031879,0.038606,0.06313,0.072023,,,,,,,,,,,,,0.255692,,0.216957,5289.529286,8034.427512,,,4445.243251,4441.244657,4638.79014,4953.010675,5513.770411,7335.639646,7468.678637,7452.874567,7266.69814,9000.447445,,,,,,,,,,,4483.830171,7361.061127,,,4627.898333,7501.934667,5407.004051,8284.018676,,,,,655.80164,264.21544,,,298.260338,117.326822,102.589175,95.948682,152.780283,153.150652,33.249969,34.010776,35.9908,81.71666,,,,,,,,,,,15831.620491,6873.577043,13333.765877,12621.628174,8127.867242,12995.482144,14025.056252,2534.714614,0.290545,0.217235,0.272367,0.169951,0.18127,0.305215,0.25166,0.279112,0.236839,,,,,,,,,,0.834446,0.242507,0.244392,6115.386037,0.478327,1260.876649,3102.072006,0.163226,0.159387,0.253207,0.221719,2285.935515,924.771122,206.174696,846.201554,0.845854,0.984043,0.836425,0.339294,8662.22446,9743.432766,9639.341214,11254.483046,11487.770831,11630.885604,4954.846521,5202.005336,5050.927486,5394.351573,5285.5678,5494.356963,0.239364,0.320575,8322.875304,4045.939627,925.426065,0.720068,1829.955708
min,100654.0,100200.0,1002.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,-3.0,,-14.322636,-170.742774,-2.0,-2.0,-2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,22.0,0.0,0.0,244.0,330.0,283.0,400.0,200.0,360.0,300.0,370.0,280.0,6.0,11.0,6.0,11.0,6.0,11.0,2.0,6.0,9.0,9.0,9.0,4.0,785.0,785.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,0.0,,0.0,-1973.0,-1338.0,,,-3088.0,-2563.0,805.0,-2558.0,650.0,-3260.0,-3395.0,451.0,3800.0,5923.0,,,,,,,,,,,-3001.0,-3335.0,,,-1765.0,-610.0,-2558.0,3800.0,,,,,1.0,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,3990.0,1480.0,480.0,480.0,299.0,0.0,0.0,0.0,0.0,0.0,0.0009,0.0,0.0,0.0,0.0,0.0,0.0004,,,,,,,,,,1.0,0.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,1.0,1.0,404.0,525.0,395.0,50.0,263.0,530.0,404.0,525.0,395.0,50.0,263.0,530.0,0.0,0.0,1.0,1.0,0.0,2.0,0.0
25%,174031.5,311950.0,3109.25,1.0,0.0,1.0,1.0,1.0,1.0,1.0,13.0,3.0,12.0,,33.971442,-97.408884,-2.0,-2.0,-2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,30.0,0.552575,0.5627,470.0,570.0,470.0,560.0,410.0,520.0,525.0,515.0,464.75,18.0,23.0,17.0,23.0,17.0,23.0,6.0,8.0,21.0,20.0,20.0,7.0,1058.0,1062.0,0.0,105.0,,0.2524,0.0356,0.0363,0.0024,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,,,0.0,,1.0,6127.5,13797.0,,,5148.0,5722.0,7761.0,10110.5,11239.5,12607.0,13844.25,15902.0,18862.25,20328.0,,,,,,,,,,,5317.5,12777.75,,,6615.75,14599.5,10301.0,19263.0,,,,,101.25,17.0,,,49.0,16.0,11.0,2.0,0.0,11.0,1.0,0.0,0.0,0.0,,,,,,,,,,,14055.5,15578.5,5252.0,8869.0,12166.0,4836.75,3807.25,5200.75,0.3427,0.3098,0.5,0.64725,0.5779,0.25,0.389525,0.2277,0.194875,,,,,,,,,,1.0,0.1398,0.5276,163.0,1.0,29.0,106.0,0.6358,0.5909,0.3121,0.404575,49.0,44.0,1.0,24.0,2.0,2.0,1.0,1.0,13182.0,7722.75,5650.0,5444.75,5271.5,5153.0,9210.0,6995.0,5100.0,4801.0,4627.0,4439.25,0.4,0.25,176.0,143.0,30.0,2.0,66.0
50%,228209.5,1019812.0,10198.0,2.0,0.0,1.0,1.0,2.0,2.0,2.0,29.0,5.0,21.0,,38.832183,-86.267098,9.0,2.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,54.0,0.7027,0.7003,510.0,610.0,500.0,598.0,441.5,557.5,556.0,549.5,500.0,20.0,26.0,19.0,25.0,18.0,25.0,6.0,8.0,23.0,23.0,22.0,7.0,1123.0,1130.0,0.0,438.0,,0.5321,0.0959,0.091,0.0144,0.0023,0.0003,0.025,0.0,0.0133,,,,,,,,,,,,,0.1256,,1.0,8937.5,18669.0,,,7503.0,8046.0,10533.0,12969.0,14122.5,16672.0,17813.5,19953.0,22656.0,24898.5,,,,,,,,,,,7754.0,16871.0,,,9142.5,18669.5,13173.0,23542.0,,,,,270.0,46.0,,,130.5,49.0,37.0,17.0,9.0,28.0,5.0,3.0,1.0,0.0,,,,,,,,,,,22581.0,19589.0,11207.0,15275.0,15300.0,9231.5,6056.0,6574.0,0.5696,0.45295,0.7319,0.74825,0.69315,0.4545,0.5,0.5149,0.3581,,,,,,,,,,2.0,0.3706,0.6276,602.0,1.0,187.0,424.0,0.7436,0.6982,0.4587,0.50605,481.0,95.0,11.0,61.0,2.0,4.0,2.0,1.0,16500.0,12150.0,10177.0,9987.5,10470.0,10635.0,11304.0,10112.0,9100.0,8735.0,8716.0,9014.0,0.5678,0.5949,716.5,573.5,137.0,2.0,272.0
75%,452758.5,3034350.0,30273.75,3.0,0.0,1.0,2.0,3.0,4.0,3.0,42.0,6.0,22.0,,41.33294,-78.788784,20.0,10.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,71.0,0.844125,0.8442,550.0,650.0,540.0,640.0,500.0,610.0,600.0,590.0,555.0,22.0,28.0,22.0,29.0,21.0,27.0,7.0,9.0,25.0,26.0,24.0,9.0,1199.0,1211.0,0.0,2117.0,,0.7231,0.239,0.2353,0.0373,0.0067,0.0026,0.0418,0.0173,0.0392,,,,,,,,,,,,,0.4027,,1.0,13483.75,23755.5,,,10747.0,11584.5,14125.0,17333.5,18627.5,21434.0,22443.0,24469.0,26948.75,30657.0,,,,,,,,,,,11052.0,21632.0,,,12875.75,23261.75,17759.5,28892.25,,,,,690.0,169.0,,,301.0,124.0,103.0,65.0,52.0,64.0,24.0,20.0,13.0,12.0,,,,,,,,,,,35765.5,24066.5,20550.0,26079.0,17700.0,14052.0,9449.25,8198.5,0.88215,0.628675,0.9787,0.833525,0.8182,0.6636,0.75,0.68025,0.5455,,,,,,,,,,3.0,0.4706,0.8571,2635.75,2.0,830.0,1416.0,0.8235,0.807,0.6213,0.731425,1313.75,405.0,40.0,347.0,2.0,4.0,3.0,1.0,19812.0,16774.75,15740.0,16315.0,16414.0,16987.5,13793.0,12954.0,12458.0,12861.25,13000.0,13242.75,0.75,0.793025,3319.0,1940.25,472.0,2.0,937.25
max,49146400.0,82098880.0,42788.0,3.0,1.0,1.0,74.0,4.0,4.0,3.0,78.0,9.0,43.0,,71.324702,171.378129,33.0,15.0,18.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,108.0,1.0,1.0,740.0,780.0,790.0,800.0,730.0,800.0,760.0,795.0,765.0,35.0,36.0,35.0,36.0,35.0,36.0,11.0,12.0,36.0,36.0,36.0,12.0,1566.0,1566.0,1.0,88921.0,,1.0,1.0,1.0,1.0,1.0,0.9973,0.6316,1.0,1.0,,,,,,,,,,,,,1.0,,1.0,44661.0,111408.0,,,41496.0,32114.0,31339.0,32589.0,47826.0,109313.0,109704.0,113261.0,114298.0,113314.0,,,,,,,,,,,41496.0,109425.0,,,31883.0,111737.0,47826.0,113642.0,,,,,6383.0,6610.0,,,4749.0,1172.0,650.0,838.0,1279.0,6259.0,637.0,391.0,400.0,981.0,,,,,,,,,,,96375.0,116377.0,74514.0,74514.0,117450.0,455440.0,542922.0,20484.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,3.0,1.0,1.0,80898.0,2.0,14425.0,42336.0,1.0,1.0,1.0,1.0,19054.0,12877.0,4987.0,12615.0,4.0,4.0,3.0,7.0,118250.0,118250.0,119200.0,99995.0,74995.0,86339.0,91125.0,77805.0,46968.0,60000.0,29179.0,37358.0,1.0,1.0,162762.0,68457.0,25695.0,4.0,49860.0


In [40]:
# Remove demographic classification columns that are outdated and no longer used
df = df.drop(columns = ['UG', 'UGDS_WHITENH', 'UGDS_BLACKNH', 'UGDS_API', 'UGDS_AIANOLD', 'UGDS_HISPOLD', 'UG_NRA', 'UG_UNKN', 'UG_WHITENH', 'UG_BLACKNH', 'UG_API', 'UG_AIANOLD', 'UG_HISPOLD'])

In [41]:
# Check new size
df.shape

(6806, 301)

In [42]:
# Check new output
df.head()

Unnamed: 0,UNITID,OPEID,OPEID6,INSTNM,CITY,STABBR,ZIP,ACCREDAGENCY,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,PPTUG_EF2,CURROPER,NPT4_PUB,NPT4_PRIV,NPT4_PROG,NPT4_OTHER,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT41_PROG,NPT42_PROG,NPT43_PROG,NPT44_PROG,NPT45_PROG,NPT41_OTHER,NPT42_OTHER,NPT43_OTHER,NPT44_OTHER,NPT45_OTHER,NPT4_048_PUB,NPT4_048_PRIV,NPT4_048_PROG,NPT4_048_OTHER,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NPT4_3075_PROG,NPT4_3075_OTHER,NPT4_75UP_PROG,NPT4_75UP_OTHER,NUM4_PUB,NUM4_PRIV,NUM4_PROG,NUM4_OTHER,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,NUM41_PROG,NUM42_PROG,NUM43_PROG,NUM44_PROG,NUM45_PROG,NUM41_OTHER,NUM42_OTHER,NUM43_OTHER,NUM44_OTHER,NUM45_OTHER,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGE_ENTRY_SQ,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,LNFAMINC,LNFAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,FSEND_COUNT,FSEND_1,FSEND_2,FSEND_3,FSEND_4,FSEND_5,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.783368,-86.568502,18.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8986,0.8986,430.0,520.0,420.0,510.0,370.0,457.0,475.0,465.0,414.0,16.0,19.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,957.0,957.0,0.0,4990.0,0.0186,0.912,0.0088,0.0018,0.0022,0.0016,0.0118,0.007,0.0361,0.0587,,1,14444.0,,,,13893.0,13976.0,15995.0,18957.0,17140.0,,,,,,,,,,,,,,,,13913.0,,,,14684.0,,18281.0,,,,,,592.0,,,,375.0,113.0,61.0,27.0,16.0,,,,,,,,,,,,,,,,22489.0,,9744.0,18354.0,,7413.0,5384.0,7101.0,0.7411,0.7067,0.8987,0.6087,,1.0,,0.7503,0.0758,0.6020087884,0.0988700565,0.5691396726,0.9015873016,0.3658280922,0.1898932831,0.1051475204,0.0621468927,0.0408035154,0.2034134448,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0666666667,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0164220825,0.3494060098,0.6341719078,0.7291274325,0.5668549906,0.4579409918,0.3631512869,34779.085684,10340.346032,15500,33375,10250,15500,16000,14518,15000,19000,17500,10250,17500,14250,15000,16421,3606,1076,2530,2185,1034,387,3191,415,3162,444,2074,1532,2895,711,346.376038474076,3085,47750,32208,5500,3381,3186,2871,315,3186,2862,3186,0.8860640301,0.8527934714,20.283741368,,0.07999999821186,0.5640301318,0.0091023227,0.9011299435,0.003138732,0.3658280922,32362.826114,23553.0,10340.346032,,,46.8400001525878,47.9799995422363,1.48000001907348,3.78999996185302,13.0,6.8600001335144,94.7399978637695,49720.22,14.8800001144409,4.84000015258789,10.75,,,,,,,15500,33375,346.376038474076,AAMU,1,0.4076,0.5924,12/12/1965,5039.0,2.0,153.0,963.0,SACSCC,0.5978,,0.25,,2698.0,,44.0,,2.0,2.0,0.5978,,0.25,,1.0,1,,,,,,,,,,,,,0.7057,0.7143,5343.0,1165.0,1288.0,2.0,0.7083,0.7287,2698.0,31374,922456254,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,33.505697,-86.799345,15.0,9.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9211,0.9211,490.0,620.0,490.0,620.0,,,555.0,555.0,,21.0,29.0,22.0,31.0,19.0,26.0,,,25.0,27.0,23.0,,1220.0,1220.0,0.0,13186.0,0.5717,0.2553,0.0334,0.0633,0.0034,0.0002,0.0457,0.0213,0.0058,0.2425,,1,17005.0,,,,14550.0,15379.0,17892.0,19978.0,20110.0,,,,,,,,,,,,,,,,14830.0,,,,16587.0,,20050.0,,,,,,1229.0,,,,421.0,214.0,198.0,180.0,216.0,,,,,,,,,,,,,,,,24347.0,,8568.0,19704.0,,13177.0,16454.0,10717.0,0.7766,0.3632,0.6009,0.8186,,0.4648,,0.5127,0.2296,0.4276131917,0.3214086082,0.3487095003,0.5942028986,0.341223671,0.1798024967,0.1423514067,0.114589156,0.1356437488,0.1699615596,0.1537616694,0.142778693,0.1847885777,0.2005797101,0.1182608696,0.0550724638,0.031884058,0.0222668004,0.3189568706,0.658776329,0.5135084777,0.2634618968,0.1652692379,0.1076951742,61110.800384,30607.18029,15000,22500,9500,16226,15250,14000,15000,16000,17500,12500,15000,15000,15104,15000,7504,3730,3774,3168,2281,2055,5123,2381,4714,2790,4804,2700,5286,2218,233.511936049938,6302,37540,26082,6250,3500,5367,3642,1725,5367,4985,5367,0.8574622694,0.6249301286,23.60797466,,0.25999999046325,0.6390907397,0.1050866406,0.6785913918,0.0031675051,0.341223671,51306.674306,34489.0,30607.18029,,,69.0199966430664,27.7600002288818,1.10000002384185,2.02999997138977,15.9300003051757,8.55000019073486,96.5,55735.22,10.9099998474121,3.45000004768371,10.8599996566772,,,,,,,15000,22500,233.511936049938,,1,0.393,0.607,12/1/1965,13134.0,2.0,650.0,8087.0,SACSCC,0.8303,,0.4514,,4130.0,,144.0,,2.0,2.0,0.8303,,0.4514,,1.0,1,,,,,,,,,,,,,0.3788,0.535,14445.0,10498.0,2228.0,2.0,0.3891,0.5414,4176.0,56997,1720042015,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,2,1,5,12.0,,32.362609,-86.17401,20.0,5.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,74.0,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,351.0,0.2393,0.7151,0.0171,0.0057,0.0057,0.0,0.0,0.0,0.0171,0.5014,,1,,15322.0,,,,,,,,15322.0,,,,,,,,,,,,,,,,15322.0,,,,,,,,,,,,5.0,,,,,,,,5.0,0.0,0.0,0.0,0.0,,,,,,,,,,,17680.0,,6900.0,6900.0,,14273.0,4206.0,4292.0,1.0,0.7673,0.0035,,,,,0.8962,0.8302,0.7736486486,0.8952702703,PrivacySuppressed,PrivacySuppressed,0.5125,0.1148648649,0.0641891892,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.05,0.4625,0.4875,0.5945945946,0.3378378378,0.2432432432,0.1587837838,25211.032258,20596.158491,10500,27334,9500,9500,19000,25000,7646,12038,9500,15509,9500,17025,11500,9500,514,92,422,397,91,26,60,454,464,50,327,187,458,56,283.680678221734,398,38455,24250,4750,3166,296,31,265,296,240,296,0.9560810811,0.8648648649,33.672297297,,0.82999998331069,0.6486486486,0.2364864865,0.1047297297,0.0405405405,0.5125,21079.472973,15033.5,20596.158491,,,70.8799972534179,22.5300006866455,1.28999996185302,6.94000005722046,13.2299995422363,7.01000022888183,94.0899963378906,53683.7,10.6499996185302,3.59999990463256,10.8400001525878,,,,,,,10500,27334,283.680678221734,Southern Christian University Regions University,1,0.3191,0.6809,3/26/1987,318.0,1.0,,404.0,SACSCC,0.2143,,0.1429,,14.0,,14.0,,4.0,4.0,PrivacySuppressed,,PrivacySuppressed,,2.0,1,,,,,,,,,,,,,1.0,1.0,440.0,527.0,5.0,4.0,PrivacySuppressed,PrivacySuppressed,24.0,4463,174222020,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.724557,-86.640449,16.0,15.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8087,0.8087,560.0,700.0,450.0,680.0,,,630.0,565.0,,25.0,31.0,25.0,34.0,24.0,30.0,,,28.0,30.0,27.0,,1314.0,1314.0,0.0,7458.0,0.7167,0.0969,0.0528,0.0381,0.0095,0.0008,0.0296,0.0223,0.0333,0.1443,,1,20909.0,,,,17561.0,18991.0,21396.0,23204.0,23406.0,,,,,,,,,,,,,,,,18147.0,,,,20356.0,,23315.0,,,,,,585.0,,,,134.0,93.0,122.0,107.0,129.0,,,,,,,,,,,,,,,,23441.0,,10714.0,22362.0,,8677.0,9242.0,9442.0,0.6544,0.2698,0.6176,0.8288,,0.0909,,0.4192,0.1842,0.374633738,0.2515696944,0.26901566,0.6888519135,0.3101321586,0.1377145249,0.1469233989,0.1506906656,0.1900376727,0.1448545861,0.1605145414,0.1817673378,0.2438478747,0.1164725458,0.1064891847,0.0582362729,0.0299500832,0.0198237885,0.29030837,0.6898678414,0.5290916702,0.2737547091,0.1573880285,0.1025533696,72240.892617,27941.821963,14476,21607,9000,16250,14750,12500,12750,18569,17014,11899,15250,13333,14943,13102,3021,1374,1647,1168,827,1026,2067,954,1808,1213,1375,1646,1997,1024,224.244106765823,2626,36250,26750,5500,3472,2389,1788,601,2389,2270,2389,0.8652155714,0.5571368774,22.727919632,,0.28999999165534,0.4763499372,0.1004604437,0.7484303056,PrivacySuppressed,0.3101321586,61096.588949,44787.0,27941.821963,,,76.3799972534179,18.9799995422363,1.41999995708465,2.54999995231628,17.6700000762939,8.90999984741211,95.2699966430664,58688.62,9.36999988555908,3.64000010490417,10.9300003051757,,,,,,,14476,21607,224.244106765823,UAH University of Alabama Huntsville,1,0.5796,0.4204,12/1/1965,7090.0,2.0,213.0,2065.0,SACSCC,0.8269,,0.35,,2531.0,,40.0,,2.0,4.0,0.8269,,0.35,,1.0,1,,,,,,,,,,,,,0.2707,0.4556,8145.0,2443.0,1341.0,2.0,0.2378,0.4402,2544.0,19702,407184805,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,32.364317,-86.295677,19.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9774,0.9774,440.0,520.0,420.0,510.0,,,480.0,465.0,,16.0,20.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,972.0,972.0,0.0,3903.0,0.0167,0.9352,0.0095,0.0041,0.0013,0.0005,0.0102,0.0102,0.0123,0.0666,,1,13043.0,,,,11344.0,14855.0,18390.0,18863.0,14833.0,,,,,,,,,,,,,,,,12113.0,,,,16104.0,,17819.0,,,,,,523.0,,,,346.0,97.0,53.0,20.0,7.0,,,,,,,,,,,,,,,,21476.0,,11068.0,19396.0,,10160.0,8527.0,7754.0,0.5826,0.7448,0.865,0.5868,,0.125,,0.7845,0.0848,0.6146166134,0.107428115,0.5776286353,0.9219330855,0.3434343434,0.178514377,0.1126198083,0.052715655,0.0415335463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0188246097,0.3246097337,0.6565656566,0.6625399361,0.4972044728,0.3841853035,0.2903354633,34468.571812,8551.802974,18679,32000,11161,18750,18500,18246,17500,23925,19056,12000,19500,15525,19000,17500,3609,1149,2460,2299,965,345,3162,447,3237,372,2276,1333,2899,710,332.105864604357,3486,45000,32263,5784,3500,2504,2235,269,2504,2178,2504,0.8889776358,0.874600639,20.130990415,,0.10999999940395,0.6134185304,0.0079872204,0.892571885,PrivacySuppressed,0.3434343434,31684.382188,22080.5,8551.802974,,,42.6899986267089,52.3199996948242,1.40999996662139,4.09000015258789,11.8100004196167,6.76000022888183,94.5299987792968,46065.2,16.9599990844726,4.80999994277954,10.6700000762939,,,,,,,18679,32000,332.105864604357,,1,0.371,0.629,12/1/1965,4208.0,2.0,,510.0,SACSCC,0.5898,,0.25,,2094.0,,36.0,,2.0,2.0,0.5898,,0.25,,1.0,1,,,,,,,,,,,,,0.7792,0.7539,4732.0,642.0,951.0,2.0,0.7684,0.7464,2094.0,34246,947070736,1005


In [43]:
# Check new descriptive stats
df.describe()

Unnamed: 0,UNITID,OPEID,OPEID6,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,PPTUG_EF2,CURROPER,NPT4_PUB,NPT4_PRIV,NPT4_PROG,NPT4_OTHER,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT41_PROG,NPT42_PROG,NPT43_PROG,NPT44_PROG,NPT45_PROG,NPT41_OTHER,NPT42_OTHER,NPT43_OTHER,NPT44_OTHER,NPT45_OTHER,NPT4_048_PUB,NPT4_048_PRIV,NPT4_048_PROG,NPT4_048_OTHER,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NPT4_3075_PROG,NPT4_3075_OTHER,NPT4_75UP_PROG,NPT4_75UP_OTHER,NUM4_PUB,NUM4_PRIV,NUM4_PROG,NUM4_OTHER,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,NUM41_PROG,NUM42_PROG,NUM43_PROG,NUM44_PROG,NUM45_PROG,NUM41_OTHER,NUM42_OTHER,NUM43_OTHER,NUM44_OTHER,NUM45_OTHER,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,AGE_ENTRY_SQ,LNFAMINC,LNFAMINC_IND,FSEND_COUNT,FSEND_1,FSEND_2,FSEND_3,FSEND_4,FSEND_5,ICLEVEL,UGDS_MEN,UGDS_WOMEN,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,SCUGFFN_POOLED
count,6806.0,6806.0,6806.0,6524.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6331.0,0.0,6331.0,6331.0,6331.0,6331.0,6331.0,6323.0,6323.0,6323.0,6323.0,6323.0,6323.0,6323.0,6331.0,6331.0,911.0,2006.0,2242.0,1239.0,1239.0,1242.0,1242.0,732.0,732.0,1239.0,1242.0,732.0,1273.0,1273.0,1199.0,1199.0,1199.0,1199.0,325.0,325.0,1273.0,1199.0,1199.0,325.0,1298.0,1426.0,6331.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6013.0,0.0,6806.0,1878.0,3727.0,0.0,0.0,1869.0,1795.0,1745.0,1559.0,1338.0,3661.0,2944.0,2669.0,2172.0,1814.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1875.0,3698.0,0.0,0.0,1818.0,3082.0,1587.0,2326.0,0.0,0.0,0.0,0.0,1878.0,3728.0,0.0,0.0,1878.0,1878.0,1878.0,1878.0,1878.0,3727.0,3727.0,3727.0,3727.0,3727.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3431.0,2175.0,3865.0,3621.0,2361.0,6304.0,6304.0,4012.0,3623.0,6014.0,5705.0,2098.0,3194.0,1309.0,1798.0,6014.0,5872.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6806.0,6041.0,6041.0,6014.0,5880.0,2867.0,2073.0,2201.0,3253.0,1615.0,1936.0,2418.0,3293.0,2001.0,2019.0,5711.0,4020.0,6425.0,6806.0,2403.0,1908.0,1513.0,1158.0,839.0,638.0,2403.0,1908.0,1513.0,1158.0,839.0,638.0,5740.0,5740.0,6030.0,2072.0,6024.0,6032.0,6032.0
mean,2126810.0,1784672.0,16671.262269,1.938228,0.007934,0.785336,3.523509,1.833823,2.222892,2.08757,29.032912,4.613135,19.884378,,37.374743,-90.314421,9.922287,3.684568,4.520771,0.015815,0.015973,0.005693,0.005535,0.025621,0.072908,0.004428,0.009635,0.005528,55.613611,0.678958,0.681198,516.617433,613.322034,510.353462,609.377617,463.353825,569.61612,565.009685,559.904992,516.523224,20.609584,25.958366,19.718098,26.309425,19.367807,25.386155,6.581538,8.390769,23.535742,23.264387,22.643036,7.698462,1141.174114,1147.656381,0.008214,2522.160735,0.49179,0.179735,0.181379,0.037811,0.013504,0.004573,0.03077,0.021385,0.035911,0.228367,,0.950485,10010.15229,19153.949826,,,8192.315677,8887.431198,11253.812607,13787.00449,15273.18012,17300.208959,18373.194293,20440.384039,23315.191068,26398.55237,,,,,,,,,,,8435.453867,17485.478908,,,9982.357536,19155.016223,14193.072464,24612.271281,,,,,525.988818,141.060622,,,228.787007,92.435037,77.924388,57.394569,69.447817,60.220016,18.163671,17.48323,16.382345,28.848135,,,,,,,,,,,26956.896823,20229.456092,15476.787322,18906.769125,15733.626853,11099.011104,8477.335343,6858.799103,0.593839,0.471843,0.694014,0.727493,0.691617,0.453604,0.550197,0.462107,0.381475,,,,,,,,,,1.815898,0.352605,0.64425,2925.16445,1.354252,680.179281,1486.300531,0.718455,0.693193,0.463474,0.555272,1298.507031,447.711206,54.583208,380.435859,2.466468,3.178607,2.055409,1.035557,17189.837703,13769.241614,12338.627231,12947.160622,13358.454112,13505.871473,11579.242613,10311.824423,9341.637806,9267.105354,9177.20143,9241.785266,0.570178,0.526082,3788.561526,1886.294884,452.09595,2.306034,901.83687
std,7640544.0,2739965.0,14847.499904,0.900211,0.088726,0.410619,8.75141,1.070275,1.362394,0.835281,16.769898,2.179201,9.614376,,5.851418,17.979595,11.066478,5.808817,6.424307,0.12477,0.125382,0.075246,0.0742,0.158014,0.260007,0.066403,0.097692,0.074153,21.578581,0.217596,0.213015,65.9955,59.956409,70.706483,72.226097,82.233472,81.296986,61.946404,70.163575,80.596669,3.971297,3.725738,4.494545,4.438807,3.681928,3.615055,1.195528,0.921908,3.801546,4.376404,3.577571,1.034064,125.516704,125.000305,0.090263,5657.459316,0.283737,0.217884,0.227826,0.079448,0.071663,0.031879,0.038606,0.06313,0.072023,0.255692,,0.216957,5289.529286,8034.427512,,,4445.243251,4441.244657,4638.79014,4953.010675,5513.770411,7335.639646,7468.678637,7452.874567,7266.69814,9000.447445,,,,,,,,,,,4483.830171,7361.061127,,,4627.898333,7501.934667,5407.004051,8284.018676,,,,,655.80164,264.21544,,,298.260338,117.326822,102.589175,95.948682,152.780283,153.150652,33.249969,34.010776,35.9908,81.71666,,,,,,,,,,,15831.620491,6873.577043,13333.765877,12621.628174,8127.867242,12995.482144,14025.056252,2534.714614,0.290545,0.217235,0.272367,0.169951,0.18127,0.305215,0.25166,0.279112,0.236839,,,,,,,,,,0.834446,0.242507,0.244392,6115.386037,0.478327,1260.876649,3102.072006,0.163226,0.159387,0.253207,0.221719,2285.935515,924.771122,206.174696,846.201554,0.845854,0.984043,0.836425,0.339294,8662.22446,9743.432766,9639.341214,11254.483046,11487.770831,11630.885604,4954.846521,5202.005336,5050.927486,5394.351573,5285.5678,5494.356963,0.239364,0.320575,8322.875304,4045.939627,925.426065,0.720068,1829.955708
min,100654.0,100200.0,1002.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,-3.0,,-14.322636,-170.742774,-2.0,-2.0,-2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,22.0,0.0,0.0,244.0,330.0,283.0,400.0,200.0,360.0,300.0,370.0,280.0,6.0,11.0,6.0,11.0,6.0,11.0,2.0,6.0,9.0,9.0,9.0,4.0,785.0,785.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,-1973.0,-1338.0,,,-3088.0,-2563.0,805.0,-2558.0,650.0,-3260.0,-3395.0,451.0,3800.0,5923.0,,,,,,,,,,,-3001.0,-3335.0,,,-1765.0,-610.0,-2558.0,3800.0,,,,,1.0,1.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,,,,,,,,,3990.0,1480.0,480.0,480.0,299.0,0.0,0.0,0.0,0.0,0.0,0.0009,0.0,0.0,0.0,0.0,0.0,0.0004,,,,,,,,,,1.0,0.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,1.0,1.0,404.0,525.0,395.0,50.0,263.0,530.0,404.0,525.0,395.0,50.0,263.0,530.0,0.0,0.0,1.0,1.0,0.0,2.0,0.0
25%,174031.5,311950.0,3109.25,1.0,0.0,1.0,1.0,1.0,1.0,1.0,13.0,3.0,12.0,,33.971442,-97.408884,-2.0,-2.0,-2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,30.0,0.552575,0.5627,470.0,570.0,470.0,560.0,410.0,520.0,525.0,515.0,464.75,18.0,23.0,17.0,23.0,17.0,23.0,6.0,8.0,21.0,20.0,20.0,7.0,1058.0,1062.0,0.0,105.0,0.2524,0.0356,0.0363,0.0024,0.0,0.0,0.0,0.0,0.0,0.0,,1.0,6127.5,13797.0,,,5148.0,5722.0,7761.0,10110.5,11239.5,12607.0,13844.25,15902.0,18862.25,20328.0,,,,,,,,,,,5317.5,12777.75,,,6615.75,14599.5,10301.0,19263.0,,,,,101.25,17.0,,,49.0,16.0,11.0,2.0,0.0,11.0,1.0,0.0,0.0,0.0,,,,,,,,,,,14055.5,15578.5,5252.0,8869.0,12166.0,4836.75,3807.25,5200.75,0.3427,0.3098,0.5,0.64725,0.5779,0.25,0.389525,0.2277,0.194875,,,,,,,,,,1.0,0.1398,0.5276,163.0,1.0,29.0,106.0,0.6358,0.5909,0.3121,0.404575,49.0,44.0,1.0,24.0,2.0,2.0,1.0,1.0,13182.0,7722.75,5650.0,5444.75,5271.5,5153.0,9210.0,6995.0,5100.0,4801.0,4627.0,4439.25,0.4,0.25,176.0,143.0,30.0,2.0,66.0
50%,228209.5,1019812.0,10198.0,2.0,0.0,1.0,1.0,2.0,2.0,2.0,29.0,5.0,21.0,,38.832183,-86.267098,9.0,2.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,54.0,0.7027,0.7003,510.0,610.0,500.0,598.0,441.5,557.5,556.0,549.5,500.0,20.0,26.0,19.0,25.0,18.0,25.0,6.0,8.0,23.0,23.0,22.0,7.0,1123.0,1130.0,0.0,438.0,0.5321,0.0959,0.091,0.0144,0.0023,0.0003,0.025,0.0,0.0133,0.1256,,1.0,8937.5,18669.0,,,7503.0,8046.0,10533.0,12969.0,14122.5,16672.0,17813.5,19953.0,22656.0,24898.5,,,,,,,,,,,7754.0,16871.0,,,9142.5,18669.5,13173.0,23542.0,,,,,270.0,46.0,,,130.5,49.0,37.0,17.0,9.0,28.0,5.0,3.0,1.0,0.0,,,,,,,,,,,22581.0,19589.0,11207.0,15275.0,15300.0,9231.5,6056.0,6574.0,0.5696,0.45295,0.7319,0.74825,0.69315,0.4545,0.5,0.5149,0.3581,,,,,,,,,,2.0,0.3706,0.6276,602.0,1.0,187.0,424.0,0.7436,0.6982,0.4587,0.50605,481.0,95.0,11.0,61.0,2.0,4.0,2.0,1.0,16500.0,12150.0,10177.0,9987.5,10470.0,10635.0,11304.0,10112.0,9100.0,8735.0,8716.0,9014.0,0.5678,0.5949,716.5,573.5,137.0,2.0,272.0
75%,452758.5,3034350.0,30273.75,3.0,0.0,1.0,2.0,3.0,4.0,3.0,42.0,6.0,22.0,,41.33294,-78.788784,20.0,10.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,71.0,0.844125,0.8442,550.0,650.0,540.0,640.0,500.0,610.0,600.0,590.0,555.0,22.0,28.0,22.0,29.0,21.0,27.0,7.0,9.0,25.0,26.0,24.0,9.0,1199.0,1211.0,0.0,2117.0,0.7231,0.239,0.2353,0.0373,0.0067,0.0026,0.0418,0.0173,0.0392,0.4027,,1.0,13483.75,23755.5,,,10747.0,11584.5,14125.0,17333.5,18627.5,21434.0,22443.0,24469.0,26948.75,30657.0,,,,,,,,,,,11052.0,21632.0,,,12875.75,23261.75,17759.5,28892.25,,,,,690.0,169.0,,,301.0,124.0,103.0,65.0,52.0,64.0,24.0,20.0,13.0,12.0,,,,,,,,,,,35765.5,24066.5,20550.0,26079.0,17700.0,14052.0,9449.25,8198.5,0.88215,0.628675,0.9787,0.833525,0.8182,0.6636,0.75,0.68025,0.5455,,,,,,,,,,3.0,0.4706,0.8571,2635.75,2.0,830.0,1416.0,0.8235,0.807,0.6213,0.731425,1313.75,405.0,40.0,347.0,2.0,4.0,3.0,1.0,19812.0,16774.75,15740.0,16315.0,16414.0,16987.5,13793.0,12954.0,12458.0,12861.25,13000.0,13242.75,0.75,0.793025,3319.0,1940.25,472.0,2.0,937.25
max,49146400.0,82098880.0,42788.0,3.0,1.0,1.0,74.0,4.0,4.0,3.0,78.0,9.0,43.0,,71.324702,171.378129,33.0,15.0,18.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,108.0,1.0,1.0,740.0,780.0,790.0,800.0,730.0,800.0,760.0,795.0,765.0,35.0,36.0,35.0,36.0,35.0,36.0,11.0,12.0,36.0,36.0,36.0,12.0,1566.0,1566.0,1.0,88921.0,1.0,1.0,1.0,1.0,1.0,0.9973,0.6316,1.0,1.0,1.0,,1.0,44661.0,111408.0,,,41496.0,32114.0,31339.0,32589.0,47826.0,109313.0,109704.0,113261.0,114298.0,113314.0,,,,,,,,,,,41496.0,109425.0,,,31883.0,111737.0,47826.0,113642.0,,,,,6383.0,6610.0,,,4749.0,1172.0,650.0,838.0,1279.0,6259.0,637.0,391.0,400.0,981.0,,,,,,,,,,,96375.0,116377.0,74514.0,74514.0,117450.0,455440.0,542922.0,20484.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,3.0,1.0,1.0,80898.0,2.0,14425.0,42336.0,1.0,1.0,1.0,1.0,19054.0,12877.0,4987.0,12615.0,4.0,4.0,3.0,7.0,118250.0,118250.0,119200.0,99995.0,74995.0,86339.0,91125.0,77805.0,46968.0,60000.0,29179.0,37358.0,1.0,1.0,162762.0,68457.0,25695.0,4.0,49860.0


In [44]:
# Remove column only relevant to 2000-01 academic year
df = df.drop(columns = ['PPTUG_EF2'])

In [45]:
# In order to remove columns involving missing cost elements for 'program-year institutions', create list of just columns with PROG
prog_col = [col for col in df if 'PROG' in col]

In [46]:
# Check output
prog_col

['NPT4_PROG',
 'NPT41_PROG',
 'NPT42_PROG',
 'NPT43_PROG',
 'NPT44_PROG',
 'NPT45_PROG',
 'NPT4_048_PROG',
 'NPT4_3075_PROG',
 'NPT4_75UP_PROG',
 'NUM4_PROG',
 'NUM41_PROG',
 'NUM42_PROG',
 'NUM43_PROG',
 'NUM44_PROG',
 'NUM45_PROG',
 'TUITIONFEE_PROG']

In [47]:
# Remove TUITIONFEE_PROG from list
prog_col.remove('TUITIONFEE_PROG')

In [48]:
# Check output
prog_col

['NPT4_PROG',
 'NPT41_PROG',
 'NPT42_PROG',
 'NPT43_PROG',
 'NPT44_PROG',
 'NPT45_PROG',
 'NPT4_048_PROG',
 'NPT4_3075_PROG',
 'NPT4_75UP_PROG',
 'NUM4_PROG',
 'NUM41_PROG',
 'NUM42_PROG',
 'NUM43_PROG',
 'NUM44_PROG',
 'NUM45_PROG']

In [49]:
# Drop columns from dataframe that are in list
df.drop(columns = prog_col, inplace = True)

In [50]:
# Check new size
df.shape

(6806, 285)

In [51]:
# Check new output
df.head()

Unnamed: 0,UNITID,OPEID,OPEID6,INSTNM,CITY,STABBR,ZIP,ACCREDAGENCY,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,CURROPER,NPT4_PUB,NPT4_PRIV,NPT4_OTHER,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT41_OTHER,NPT42_OTHER,NPT43_OTHER,NPT44_OTHER,NPT45_OTHER,NPT4_048_PUB,NPT4_048_PRIV,NPT4_048_OTHER,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NPT4_3075_OTHER,NPT4_75UP_OTHER,NUM4_PUB,NUM4_PRIV,NUM4_OTHER,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,NUM41_OTHER,NUM42_OTHER,NUM43_OTHER,NUM44_OTHER,NUM45_OTHER,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGE_ENTRY_SQ,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,LNFAMINC,LNFAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,FSEND_COUNT,FSEND_1,FSEND_2,FSEND_3,FSEND_4,FSEND_5,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.783368,-86.568502,18.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8986,0.8986,430.0,520.0,420.0,510.0,370.0,457.0,475.0,465.0,414.0,16.0,19.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,957.0,957.0,0.0,4990.0,0.0186,0.912,0.0088,0.0018,0.0022,0.0016,0.0118,0.007,0.0361,0.0587,1,14444.0,,,13893.0,13976.0,15995.0,18957.0,17140.0,,,,,,,,,,,13913.0,,,14684.0,,18281.0,,,,592.0,,,375.0,113.0,61.0,27.0,16.0,,,,,,,,,,,22489.0,,9744.0,18354.0,,7413.0,5384.0,7101.0,0.7411,0.7067,0.8987,0.6087,,1.0,,0.7503,0.0758,0.6020087884,0.0988700565,0.5691396726,0.9015873016,0.3658280922,0.1898932831,0.1051475204,0.0621468927,0.0408035154,0.2034134448,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0666666667,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0164220825,0.3494060098,0.6341719078,0.7291274325,0.5668549906,0.4579409918,0.3631512869,34779.085684,10340.346032,15500,33375,10250,15500,16000,14518,15000,19000,17500,10250,17500,14250,15000,16421,3606,1076,2530,2185,1034,387,3191,415,3162,444,2074,1532,2895,711,346.376038474076,3085,47750,32208,5500,3381,3186,2871,315,3186,2862,3186,0.8860640301,0.8527934714,20.283741368,,0.07999999821186,0.5640301318,0.0091023227,0.9011299435,0.003138732,0.3658280922,32362.826114,23553.0,10340.346032,,,46.8400001525878,47.9799995422363,1.48000001907348,3.78999996185302,13.0,6.8600001335144,94.7399978637695,49720.22,14.8800001144409,4.84000015258789,10.75,,,,,,,15500,33375,346.376038474076,AAMU,1,0.4076,0.5924,12/12/1965,5039.0,2.0,153.0,963.0,SACSCC,0.5978,,0.25,,2698.0,,44.0,,2.0,2.0,0.5978,,0.25,,1.0,1,,,,,,,,,,,,,0.7057,0.7143,5343.0,1165.0,1288.0,2.0,0.7083,0.7287,2698.0,31374,922456254,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,33.505697,-86.799345,15.0,9.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9211,0.9211,490.0,620.0,490.0,620.0,,,555.0,555.0,,21.0,29.0,22.0,31.0,19.0,26.0,,,25.0,27.0,23.0,,1220.0,1220.0,0.0,13186.0,0.5717,0.2553,0.0334,0.0633,0.0034,0.0002,0.0457,0.0213,0.0058,0.2425,1,17005.0,,,14550.0,15379.0,17892.0,19978.0,20110.0,,,,,,,,,,,14830.0,,,16587.0,,20050.0,,,,1229.0,,,421.0,214.0,198.0,180.0,216.0,,,,,,,,,,,24347.0,,8568.0,19704.0,,13177.0,16454.0,10717.0,0.7766,0.3632,0.6009,0.8186,,0.4648,,0.5127,0.2296,0.4276131917,0.3214086082,0.3487095003,0.5942028986,0.341223671,0.1798024967,0.1423514067,0.114589156,0.1356437488,0.1699615596,0.1537616694,0.142778693,0.1847885777,0.2005797101,0.1182608696,0.0550724638,0.031884058,0.0222668004,0.3189568706,0.658776329,0.5135084777,0.2634618968,0.1652692379,0.1076951742,61110.800384,30607.18029,15000,22500,9500,16226,15250,14000,15000,16000,17500,12500,15000,15000,15104,15000,7504,3730,3774,3168,2281,2055,5123,2381,4714,2790,4804,2700,5286,2218,233.511936049938,6302,37540,26082,6250,3500,5367,3642,1725,5367,4985,5367,0.8574622694,0.6249301286,23.60797466,,0.25999999046325,0.6390907397,0.1050866406,0.6785913918,0.0031675051,0.341223671,51306.674306,34489.0,30607.18029,,,69.0199966430664,27.7600002288818,1.10000002384185,2.02999997138977,15.9300003051757,8.55000019073486,96.5,55735.22,10.9099998474121,3.45000004768371,10.8599996566772,,,,,,,15000,22500,233.511936049938,,1,0.393,0.607,12/1/1965,13134.0,2.0,650.0,8087.0,SACSCC,0.8303,,0.4514,,4130.0,,144.0,,2.0,2.0,0.8303,,0.4514,,1.0,1,,,,,,,,,,,,,0.3788,0.535,14445.0,10498.0,2228.0,2.0,0.3891,0.5414,4176.0,56997,1720042015,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,2,1,5,12.0,,32.362609,-86.17401,20.0,5.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,74.0,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,351.0,0.2393,0.7151,0.0171,0.0057,0.0057,0.0,0.0,0.0,0.0171,0.5014,1,,15322.0,,,,,,,15322.0,,,,,,,,,,,15322.0,,,,,,,,,5.0,,,,,,,5.0,0.0,0.0,0.0,0.0,,,,,,17680.0,,6900.0,6900.0,,14273.0,4206.0,4292.0,1.0,0.7673,0.0035,,,,,0.8962,0.8302,0.7736486486,0.8952702703,PrivacySuppressed,PrivacySuppressed,0.5125,0.1148648649,0.0641891892,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.05,0.4625,0.4875,0.5945945946,0.3378378378,0.2432432432,0.1587837838,25211.032258,20596.158491,10500,27334,9500,9500,19000,25000,7646,12038,9500,15509,9500,17025,11500,9500,514,92,422,397,91,26,60,454,464,50,327,187,458,56,283.680678221734,398,38455,24250,4750,3166,296,31,265,296,240,296,0.9560810811,0.8648648649,33.672297297,,0.82999998331069,0.6486486486,0.2364864865,0.1047297297,0.0405405405,0.5125,21079.472973,15033.5,20596.158491,,,70.8799972534179,22.5300006866455,1.28999996185302,6.94000005722046,13.2299995422363,7.01000022888183,94.0899963378906,53683.7,10.6499996185302,3.59999990463256,10.8400001525878,,,,,,,10500,27334,283.680678221734,Southern Christian University Regions University,1,0.3191,0.6809,3/26/1987,318.0,1.0,,404.0,SACSCC,0.2143,,0.1429,,14.0,,14.0,,4.0,4.0,PrivacySuppressed,,PrivacySuppressed,,2.0,1,,,,,,,,,,,,,1.0,1.0,440.0,527.0,5.0,4.0,PrivacySuppressed,PrivacySuppressed,24.0,4463,174222020,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.724557,-86.640449,16.0,15.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8087,0.8087,560.0,700.0,450.0,680.0,,,630.0,565.0,,25.0,31.0,25.0,34.0,24.0,30.0,,,28.0,30.0,27.0,,1314.0,1314.0,0.0,7458.0,0.7167,0.0969,0.0528,0.0381,0.0095,0.0008,0.0296,0.0223,0.0333,0.1443,1,20909.0,,,17561.0,18991.0,21396.0,23204.0,23406.0,,,,,,,,,,,18147.0,,,20356.0,,23315.0,,,,585.0,,,134.0,93.0,122.0,107.0,129.0,,,,,,,,,,,23441.0,,10714.0,22362.0,,8677.0,9242.0,9442.0,0.6544,0.2698,0.6176,0.8288,,0.0909,,0.4192,0.1842,0.374633738,0.2515696944,0.26901566,0.6888519135,0.3101321586,0.1377145249,0.1469233989,0.1506906656,0.1900376727,0.1448545861,0.1605145414,0.1817673378,0.2438478747,0.1164725458,0.1064891847,0.0582362729,0.0299500832,0.0198237885,0.29030837,0.6898678414,0.5290916702,0.2737547091,0.1573880285,0.1025533696,72240.892617,27941.821963,14476,21607,9000,16250,14750,12500,12750,18569,17014,11899,15250,13333,14943,13102,3021,1374,1647,1168,827,1026,2067,954,1808,1213,1375,1646,1997,1024,224.244106765823,2626,36250,26750,5500,3472,2389,1788,601,2389,2270,2389,0.8652155714,0.5571368774,22.727919632,,0.28999999165534,0.4763499372,0.1004604437,0.7484303056,PrivacySuppressed,0.3101321586,61096.588949,44787.0,27941.821963,,,76.3799972534179,18.9799995422363,1.41999995708465,2.54999995231628,17.6700000762939,8.90999984741211,95.2699966430664,58688.62,9.36999988555908,3.64000010490417,10.9300003051757,,,,,,,14476,21607,224.244106765823,UAH University of Alabama Huntsville,1,0.5796,0.4204,12/1/1965,7090.0,2.0,213.0,2065.0,SACSCC,0.8269,,0.35,,2531.0,,40.0,,2.0,4.0,0.8269,,0.35,,1.0,1,,,,,,,,,,,,,0.2707,0.4556,8145.0,2443.0,1341.0,2.0,0.2378,0.4402,2544.0,19702,407184805,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,32.364317,-86.295677,19.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9774,0.9774,440.0,520.0,420.0,510.0,,,480.0,465.0,,16.0,20.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,972.0,972.0,0.0,3903.0,0.0167,0.9352,0.0095,0.0041,0.0013,0.0005,0.0102,0.0102,0.0123,0.0666,1,13043.0,,,11344.0,14855.0,18390.0,18863.0,14833.0,,,,,,,,,,,12113.0,,,16104.0,,17819.0,,,,523.0,,,346.0,97.0,53.0,20.0,7.0,,,,,,,,,,,21476.0,,11068.0,19396.0,,10160.0,8527.0,7754.0,0.5826,0.7448,0.865,0.5868,,0.125,,0.7845,0.0848,0.6146166134,0.107428115,0.5776286353,0.9219330855,0.3434343434,0.178514377,0.1126198083,0.052715655,0.0415335463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0188246097,0.3246097337,0.6565656566,0.6625399361,0.4972044728,0.3841853035,0.2903354633,34468.571812,8551.802974,18679,32000,11161,18750,18500,18246,17500,23925,19056,12000,19500,15525,19000,17500,3609,1149,2460,2299,965,345,3162,447,3237,372,2276,1333,2899,710,332.105864604357,3486,45000,32263,5784,3500,2504,2235,269,2504,2178,2504,0.8889776358,0.874600639,20.130990415,,0.10999999940395,0.6134185304,0.0079872204,0.892571885,PrivacySuppressed,0.3434343434,31684.382188,22080.5,8551.802974,,,42.6899986267089,52.3199996948242,1.40999996662139,4.09000015258789,11.8100004196167,6.76000022888183,94.5299987792968,46065.2,16.9599990844726,4.80999994277954,10.6700000762939,,,,,,,18679,32000,332.105864604357,,1,0.371,0.629,12/1/1965,4208.0,2.0,,510.0,SACSCC,0.5898,,0.25,,2094.0,,36.0,,2.0,2.0,0.5898,,0.25,,1.0,1,,,,,,,,,,,,,0.7792,0.7539,4732.0,642.0,951.0,2.0,0.7684,0.7464,2094.0,34246,947070736,1005


In [52]:
# In order to remove columns involving missing cost elements for 'other academic year institutions', create list of just columns with OTHER
other_col = [col for col in df if 'OTHER' in col]


In [53]:
# Check output
other_col

['NPT4_OTHER',
 'NPT41_OTHER',
 'NPT42_OTHER',
 'NPT43_OTHER',
 'NPT44_OTHER',
 'NPT45_OTHER',
 'NPT4_048_OTHER',
 'NPT4_3075_OTHER',
 'NPT4_75UP_OTHER',
 'NUM4_OTHER',
 'NUM41_OTHER',
 'NUM42_OTHER',
 'NUM43_OTHER',
 'NUM44_OTHER',
 'NUM45_OTHER']

In [54]:
# Drop columns from dataframe that are in list
df.drop(columns = other_col, inplace = True)

In [55]:
# Check new size
df.shape

(6806, 270)

In [56]:
# Check new output
df.head()

Unnamed: 0,UNITID,OPEID,OPEID6,INSTNM,CITY,STABBR,ZIP,ACCREDAGENCY,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,CURROPER,NPT4_PUB,NPT4_PRIV,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT4_048_PUB,NPT4_048_PRIV,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NUM4_PUB,NUM4_PRIV,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGE_ENTRY_SQ,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,LNFAMINC,LNFAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,FSEND_COUNT,FSEND_1,FSEND_2,FSEND_3,FSEND_4,FSEND_5,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.783368,-86.568502,18.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8986,0.8986,430.0,520.0,420.0,510.0,370.0,457.0,475.0,465.0,414.0,16.0,19.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,957.0,957.0,0.0,4990.0,0.0186,0.912,0.0088,0.0018,0.0022,0.0016,0.0118,0.007,0.0361,0.0587,1,14444.0,,13893.0,13976.0,15995.0,18957.0,17140.0,,,,,,13913.0,,14684.0,,18281.0,,592.0,,375.0,113.0,61.0,27.0,16.0,,,,,,22489.0,,9744.0,18354.0,,7413.0,5384.0,7101.0,0.7411,0.7067,0.8987,0.6087,,1.0,,0.7503,0.0758,0.6020087884,0.0988700565,0.5691396726,0.9015873016,0.3658280922,0.1898932831,0.1051475204,0.0621468927,0.0408035154,0.2034134448,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0666666667,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0164220825,0.3494060098,0.6341719078,0.7291274325,0.5668549906,0.4579409918,0.3631512869,34779.085684,10340.346032,15500,33375,10250,15500,16000,14518,15000,19000,17500,10250,17500,14250,15000,16421,3606,1076,2530,2185,1034,387,3191,415,3162,444,2074,1532,2895,711,346.376038474076,3085,47750,32208,5500,3381,3186,2871,315,3186,2862,3186,0.8860640301,0.8527934714,20.283741368,,0.07999999821186,0.5640301318,0.0091023227,0.9011299435,0.003138732,0.3658280922,32362.826114,23553.0,10340.346032,,,46.8400001525878,47.9799995422363,1.48000001907348,3.78999996185302,13.0,6.8600001335144,94.7399978637695,49720.22,14.8800001144409,4.84000015258789,10.75,,,,,,,15500,33375,346.376038474076,AAMU,1,0.4076,0.5924,12/12/1965,5039.0,2.0,153.0,963.0,SACSCC,0.5978,,0.25,,2698.0,,44.0,,2.0,2.0,0.5978,,0.25,,1.0,1,,,,,,,,,,,,,0.7057,0.7143,5343.0,1165.0,1288.0,2.0,0.7083,0.7287,2698.0,31374,922456254,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,33.505697,-86.799345,15.0,9.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9211,0.9211,490.0,620.0,490.0,620.0,,,555.0,555.0,,21.0,29.0,22.0,31.0,19.0,26.0,,,25.0,27.0,23.0,,1220.0,1220.0,0.0,13186.0,0.5717,0.2553,0.0334,0.0633,0.0034,0.0002,0.0457,0.0213,0.0058,0.2425,1,17005.0,,14550.0,15379.0,17892.0,19978.0,20110.0,,,,,,14830.0,,16587.0,,20050.0,,1229.0,,421.0,214.0,198.0,180.0,216.0,,,,,,24347.0,,8568.0,19704.0,,13177.0,16454.0,10717.0,0.7766,0.3632,0.6009,0.8186,,0.4648,,0.5127,0.2296,0.4276131917,0.3214086082,0.3487095003,0.5942028986,0.341223671,0.1798024967,0.1423514067,0.114589156,0.1356437488,0.1699615596,0.1537616694,0.142778693,0.1847885777,0.2005797101,0.1182608696,0.0550724638,0.031884058,0.0222668004,0.3189568706,0.658776329,0.5135084777,0.2634618968,0.1652692379,0.1076951742,61110.800384,30607.18029,15000,22500,9500,16226,15250,14000,15000,16000,17500,12500,15000,15000,15104,15000,7504,3730,3774,3168,2281,2055,5123,2381,4714,2790,4804,2700,5286,2218,233.511936049938,6302,37540,26082,6250,3500,5367,3642,1725,5367,4985,5367,0.8574622694,0.6249301286,23.60797466,,0.25999999046325,0.6390907397,0.1050866406,0.6785913918,0.0031675051,0.341223671,51306.674306,34489.0,30607.18029,,,69.0199966430664,27.7600002288818,1.10000002384185,2.02999997138977,15.9300003051757,8.55000019073486,96.5,55735.22,10.9099998474121,3.45000004768371,10.8599996566772,,,,,,,15000,22500,233.511936049938,,1,0.393,0.607,12/1/1965,13134.0,2.0,650.0,8087.0,SACSCC,0.8303,,0.4514,,4130.0,,144.0,,2.0,2.0,0.8303,,0.4514,,1.0,1,,,,,,,,,,,,,0.3788,0.535,14445.0,10498.0,2228.0,2.0,0.3891,0.5414,4176.0,56997,1720042015,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,2,1,5,12.0,,32.362609,-86.17401,20.0,5.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,74.0,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,351.0,0.2393,0.7151,0.0171,0.0057,0.0057,0.0,0.0,0.0,0.0171,0.5014,1,,15322.0,,,,,,15322.0,,,,,,15322.0,,,,,,5.0,,,,,,5.0,0.0,0.0,0.0,0.0,17680.0,,6900.0,6900.0,,14273.0,4206.0,4292.0,1.0,0.7673,0.0035,,,,,0.8962,0.8302,0.7736486486,0.8952702703,PrivacySuppressed,PrivacySuppressed,0.5125,0.1148648649,0.0641891892,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.05,0.4625,0.4875,0.5945945946,0.3378378378,0.2432432432,0.1587837838,25211.032258,20596.158491,10500,27334,9500,9500,19000,25000,7646,12038,9500,15509,9500,17025,11500,9500,514,92,422,397,91,26,60,454,464,50,327,187,458,56,283.680678221734,398,38455,24250,4750,3166,296,31,265,296,240,296,0.9560810811,0.8648648649,33.672297297,,0.82999998331069,0.6486486486,0.2364864865,0.1047297297,0.0405405405,0.5125,21079.472973,15033.5,20596.158491,,,70.8799972534179,22.5300006866455,1.28999996185302,6.94000005722046,13.2299995422363,7.01000022888183,94.0899963378906,53683.7,10.6499996185302,3.59999990463256,10.8400001525878,,,,,,,10500,27334,283.680678221734,Southern Christian University Regions University,1,0.3191,0.6809,3/26/1987,318.0,1.0,,404.0,SACSCC,0.2143,,0.1429,,14.0,,14.0,,4.0,4.0,PrivacySuppressed,,PrivacySuppressed,,2.0,1,,,,,,,,,,,,,1.0,1.0,440.0,527.0,5.0,4.0,PrivacySuppressed,PrivacySuppressed,24.0,4463,174222020,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.724557,-86.640449,16.0,15.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8087,0.8087,560.0,700.0,450.0,680.0,,,630.0,565.0,,25.0,31.0,25.0,34.0,24.0,30.0,,,28.0,30.0,27.0,,1314.0,1314.0,0.0,7458.0,0.7167,0.0969,0.0528,0.0381,0.0095,0.0008,0.0296,0.0223,0.0333,0.1443,1,20909.0,,17561.0,18991.0,21396.0,23204.0,23406.0,,,,,,18147.0,,20356.0,,23315.0,,585.0,,134.0,93.0,122.0,107.0,129.0,,,,,,23441.0,,10714.0,22362.0,,8677.0,9242.0,9442.0,0.6544,0.2698,0.6176,0.8288,,0.0909,,0.4192,0.1842,0.374633738,0.2515696944,0.26901566,0.6888519135,0.3101321586,0.1377145249,0.1469233989,0.1506906656,0.1900376727,0.1448545861,0.1605145414,0.1817673378,0.2438478747,0.1164725458,0.1064891847,0.0582362729,0.0299500832,0.0198237885,0.29030837,0.6898678414,0.5290916702,0.2737547091,0.1573880285,0.1025533696,72240.892617,27941.821963,14476,21607,9000,16250,14750,12500,12750,18569,17014,11899,15250,13333,14943,13102,3021,1374,1647,1168,827,1026,2067,954,1808,1213,1375,1646,1997,1024,224.244106765823,2626,36250,26750,5500,3472,2389,1788,601,2389,2270,2389,0.8652155714,0.5571368774,22.727919632,,0.28999999165534,0.4763499372,0.1004604437,0.7484303056,PrivacySuppressed,0.3101321586,61096.588949,44787.0,27941.821963,,,76.3799972534179,18.9799995422363,1.41999995708465,2.54999995231628,17.6700000762939,8.90999984741211,95.2699966430664,58688.62,9.36999988555908,3.64000010490417,10.9300003051757,,,,,,,14476,21607,224.244106765823,UAH University of Alabama Huntsville,1,0.5796,0.4204,12/1/1965,7090.0,2.0,213.0,2065.0,SACSCC,0.8269,,0.35,,2531.0,,40.0,,2.0,4.0,0.8269,,0.35,,1.0,1,,,,,,,,,,,,,0.2707,0.4556,8145.0,2443.0,1341.0,2.0,0.2378,0.4402,2544.0,19702,407184805,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,32.364317,-86.295677,19.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9774,0.9774,440.0,520.0,420.0,510.0,,,480.0,465.0,,16.0,20.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,972.0,972.0,0.0,3903.0,0.0167,0.9352,0.0095,0.0041,0.0013,0.0005,0.0102,0.0102,0.0123,0.0666,1,13043.0,,11344.0,14855.0,18390.0,18863.0,14833.0,,,,,,12113.0,,16104.0,,17819.0,,523.0,,346.0,97.0,53.0,20.0,7.0,,,,,,21476.0,,11068.0,19396.0,,10160.0,8527.0,7754.0,0.5826,0.7448,0.865,0.5868,,0.125,,0.7845,0.0848,0.6146166134,0.107428115,0.5776286353,0.9219330855,0.3434343434,0.178514377,0.1126198083,0.052715655,0.0415335463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0188246097,0.3246097337,0.6565656566,0.6625399361,0.4972044728,0.3841853035,0.2903354633,34468.571812,8551.802974,18679,32000,11161,18750,18500,18246,17500,23925,19056,12000,19500,15525,19000,17500,3609,1149,2460,2299,965,345,3162,447,3237,372,2276,1333,2899,710,332.105864604357,3486,45000,32263,5784,3500,2504,2235,269,2504,2178,2504,0.8889776358,0.874600639,20.130990415,,0.10999999940395,0.6134185304,0.0079872204,0.892571885,PrivacySuppressed,0.3434343434,31684.382188,22080.5,8551.802974,,,42.6899986267089,52.3199996948242,1.40999996662139,4.09000015258789,11.8100004196167,6.76000022888183,94.5299987792968,46065.2,16.9599990844726,4.80999994277954,10.6700000762939,,,,,,,18679,32000,332.105864604357,,1,0.371,0.629,12/1/1965,4208.0,2.0,,510.0,SACSCC,0.5898,,0.25,,2094.0,,36.0,,2.0,2.0,0.5898,,0.25,,1.0,1,,,,,,,,,,,,,0.7792,0.7539,4732.0,642.0,951.0,2.0,0.7684,0.7464,2094.0,34246,947070736,1005


In [57]:
# Remove weird missing squares and average of logarithm columns, as well as missing number of FAFSAs sent and no longer provided
df = df.drop(columns = ['AGE_ENTRY_SQ', 'LNFAMINC', 'LNFAMINC_IND', 'FSEND_COUNT', 'FSEND_1', 'FSEND_2', 'FSEND_3', 'FSEND_4', 'FSEND_5'])

In [58]:
# Check new size
df.shape

(6806, 261)

In [59]:
# Check new output
df.head()

Unnamed: 0,UNITID,OPEID,OPEID6,INSTNM,CITY,STABBR,ZIP,ACCREDAGENCY,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,CURROPER,NPT4_PUB,NPT4_PRIV,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT4_048_PUB,NPT4_048_PRIV,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NUM4_PUB,NUM4_PRIV,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.783368,-86.568502,18.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8986,0.8986,430.0,520.0,420.0,510.0,370.0,457.0,475.0,465.0,414.0,16.0,19.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,957.0,957.0,0.0,4990.0,0.0186,0.912,0.0088,0.0018,0.0022,0.0016,0.0118,0.007,0.0361,0.0587,1,14444.0,,13893.0,13976.0,15995.0,18957.0,17140.0,,,,,,13913.0,,14684.0,,18281.0,,592.0,,375.0,113.0,61.0,27.0,16.0,,,,,,22489.0,,9744.0,18354.0,,7413.0,5384.0,7101.0,0.7411,0.7067,0.8987,0.6087,,1.0,,0.7503,0.0758,0.6020087884,0.0988700565,0.5691396726,0.9015873016,0.3658280922,0.1898932831,0.1051475204,0.0621468927,0.0408035154,0.2034134448,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0666666667,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0164220825,0.3494060098,0.6341719078,0.7291274325,0.5668549906,0.4579409918,0.3631512869,34779.085684,10340.346032,15500,33375,10250,15500,16000,14518,15000,19000,17500,10250,17500,14250,15000,16421,3606,1076,2530,2185,1034,387,3191,415,3162,444,2074,1532,2895,711,346.376038474076,3085,47750,32208,5500,3381,3186,2871,315,3186,2862,3186,0.8860640301,0.8527934714,20.283741368,0.07999999821186,0.5640301318,0.0091023227,0.9011299435,0.003138732,0.3658280922,32362.826114,23553.0,10340.346032,46.8400001525878,47.9799995422363,1.48000001907348,3.78999996185302,13.0,6.8600001335144,94.7399978637695,49720.22,14.8800001144409,4.84000015258789,10.75,15500,33375,346.376038474076,AAMU,1,0.4076,0.5924,12/12/1965,5039.0,2.0,153.0,963.0,SACSCC,0.5978,,0.25,,2698.0,,44.0,,2.0,2.0,0.5978,,0.25,,1.0,1,,,,,,,,,,,,,0.7057,0.7143,5343.0,1165.0,1288.0,2.0,0.7083,0.7287,2698.0,31374,922456254,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,33.505697,-86.799345,15.0,9.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9211,0.9211,490.0,620.0,490.0,620.0,,,555.0,555.0,,21.0,29.0,22.0,31.0,19.0,26.0,,,25.0,27.0,23.0,,1220.0,1220.0,0.0,13186.0,0.5717,0.2553,0.0334,0.0633,0.0034,0.0002,0.0457,0.0213,0.0058,0.2425,1,17005.0,,14550.0,15379.0,17892.0,19978.0,20110.0,,,,,,14830.0,,16587.0,,20050.0,,1229.0,,421.0,214.0,198.0,180.0,216.0,,,,,,24347.0,,8568.0,19704.0,,13177.0,16454.0,10717.0,0.7766,0.3632,0.6009,0.8186,,0.4648,,0.5127,0.2296,0.4276131917,0.3214086082,0.3487095003,0.5942028986,0.341223671,0.1798024967,0.1423514067,0.114589156,0.1356437488,0.1699615596,0.1537616694,0.142778693,0.1847885777,0.2005797101,0.1182608696,0.0550724638,0.031884058,0.0222668004,0.3189568706,0.658776329,0.5135084777,0.2634618968,0.1652692379,0.1076951742,61110.800384,30607.18029,15000,22500,9500,16226,15250,14000,15000,16000,17500,12500,15000,15000,15104,15000,7504,3730,3774,3168,2281,2055,5123,2381,4714,2790,4804,2700,5286,2218,233.511936049938,6302,37540,26082,6250,3500,5367,3642,1725,5367,4985,5367,0.8574622694,0.6249301286,23.60797466,0.25999999046325,0.6390907397,0.1050866406,0.6785913918,0.0031675051,0.341223671,51306.674306,34489.0,30607.18029,69.0199966430664,27.7600002288818,1.10000002384185,2.02999997138977,15.9300003051757,8.55000019073486,96.5,55735.22,10.9099998474121,3.45000004768371,10.8599996566772,15000,22500,233.511936049938,,1,0.393,0.607,12/1/1965,13134.0,2.0,650.0,8087.0,SACSCC,0.8303,,0.4514,,4130.0,,144.0,,2.0,2.0,0.8303,,0.4514,,1.0,1,,,,,,,,,,,,,0.3788,0.535,14445.0,10498.0,2228.0,2.0,0.3891,0.5414,4176.0,56997,1720042015,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,2,1,5,12.0,,32.362609,-86.17401,20.0,5.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,74.0,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,351.0,0.2393,0.7151,0.0171,0.0057,0.0057,0.0,0.0,0.0,0.0171,0.5014,1,,15322.0,,,,,,15322.0,,,,,,15322.0,,,,,,5.0,,,,,,5.0,0.0,0.0,0.0,0.0,17680.0,,6900.0,6900.0,,14273.0,4206.0,4292.0,1.0,0.7673,0.0035,,,,,0.8962,0.8302,0.7736486486,0.8952702703,PrivacySuppressed,PrivacySuppressed,0.5125,0.1148648649,0.0641891892,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.05,0.4625,0.4875,0.5945945946,0.3378378378,0.2432432432,0.1587837838,25211.032258,20596.158491,10500,27334,9500,9500,19000,25000,7646,12038,9500,15509,9500,17025,11500,9500,514,92,422,397,91,26,60,454,464,50,327,187,458,56,283.680678221734,398,38455,24250,4750,3166,296,31,265,296,240,296,0.9560810811,0.8648648649,33.672297297,0.82999998331069,0.6486486486,0.2364864865,0.1047297297,0.0405405405,0.5125,21079.472973,15033.5,20596.158491,70.8799972534179,22.5300006866455,1.28999996185302,6.94000005722046,13.2299995422363,7.01000022888183,94.0899963378906,53683.7,10.6499996185302,3.59999990463256,10.8400001525878,10500,27334,283.680678221734,Southern Christian University Regions University,1,0.3191,0.6809,3/26/1987,318.0,1.0,,404.0,SACSCC,0.2143,,0.1429,,14.0,,14.0,,4.0,4.0,PrivacySuppressed,,PrivacySuppressed,,2.0,1,,,,,,,,,,,,,1.0,1.0,440.0,527.0,5.0,4.0,PrivacySuppressed,PrivacySuppressed,24.0,4463,174222020,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.724557,-86.640449,16.0,15.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8087,0.8087,560.0,700.0,450.0,680.0,,,630.0,565.0,,25.0,31.0,25.0,34.0,24.0,30.0,,,28.0,30.0,27.0,,1314.0,1314.0,0.0,7458.0,0.7167,0.0969,0.0528,0.0381,0.0095,0.0008,0.0296,0.0223,0.0333,0.1443,1,20909.0,,17561.0,18991.0,21396.0,23204.0,23406.0,,,,,,18147.0,,20356.0,,23315.0,,585.0,,134.0,93.0,122.0,107.0,129.0,,,,,,23441.0,,10714.0,22362.0,,8677.0,9242.0,9442.0,0.6544,0.2698,0.6176,0.8288,,0.0909,,0.4192,0.1842,0.374633738,0.2515696944,0.26901566,0.6888519135,0.3101321586,0.1377145249,0.1469233989,0.1506906656,0.1900376727,0.1448545861,0.1605145414,0.1817673378,0.2438478747,0.1164725458,0.1064891847,0.0582362729,0.0299500832,0.0198237885,0.29030837,0.6898678414,0.5290916702,0.2737547091,0.1573880285,0.1025533696,72240.892617,27941.821963,14476,21607,9000,16250,14750,12500,12750,18569,17014,11899,15250,13333,14943,13102,3021,1374,1647,1168,827,1026,2067,954,1808,1213,1375,1646,1997,1024,224.244106765823,2626,36250,26750,5500,3472,2389,1788,601,2389,2270,2389,0.8652155714,0.5571368774,22.727919632,0.28999999165534,0.4763499372,0.1004604437,0.7484303056,PrivacySuppressed,0.3101321586,61096.588949,44787.0,27941.821963,76.3799972534179,18.9799995422363,1.41999995708465,2.54999995231628,17.6700000762939,8.90999984741211,95.2699966430664,58688.62,9.36999988555908,3.64000010490417,10.9300003051757,14476,21607,224.244106765823,UAH University of Alabama Huntsville,1,0.5796,0.4204,12/1/1965,7090.0,2.0,213.0,2065.0,SACSCC,0.8269,,0.35,,2531.0,,40.0,,2.0,4.0,0.8269,,0.35,,1.0,1,,,,,,,,,,,,,0.2707,0.4556,8145.0,2443.0,1341.0,2.0,0.2378,0.4402,2544.0,19702,407184805,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,32.364317,-86.295677,19.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9774,0.9774,440.0,520.0,420.0,510.0,,,480.0,465.0,,16.0,20.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,972.0,972.0,0.0,3903.0,0.0167,0.9352,0.0095,0.0041,0.0013,0.0005,0.0102,0.0102,0.0123,0.0666,1,13043.0,,11344.0,14855.0,18390.0,18863.0,14833.0,,,,,,12113.0,,16104.0,,17819.0,,523.0,,346.0,97.0,53.0,20.0,7.0,,,,,,21476.0,,11068.0,19396.0,,10160.0,8527.0,7754.0,0.5826,0.7448,0.865,0.5868,,0.125,,0.7845,0.0848,0.6146166134,0.107428115,0.5776286353,0.9219330855,0.3434343434,0.178514377,0.1126198083,0.052715655,0.0415335463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0188246097,0.3246097337,0.6565656566,0.6625399361,0.4972044728,0.3841853035,0.2903354633,34468.571812,8551.802974,18679,32000,11161,18750,18500,18246,17500,23925,19056,12000,19500,15525,19000,17500,3609,1149,2460,2299,965,345,3162,447,3237,372,2276,1333,2899,710,332.105864604357,3486,45000,32263,5784,3500,2504,2235,269,2504,2178,2504,0.8889776358,0.874600639,20.130990415,0.10999999940395,0.6134185304,0.0079872204,0.892571885,PrivacySuppressed,0.3434343434,31684.382188,22080.5,8551.802974,42.6899986267089,52.3199996948242,1.40999996662139,4.09000015258789,11.8100004196167,6.76000022888183,94.5299987792968,46065.2,16.9599990844726,4.80999994277954,10.6700000762939,18679,32000,332.105864604357,,1,0.371,0.629,12/1/1965,4208.0,2.0,,510.0,SACSCC,0.5898,,0.25,,2094.0,,36.0,,2.0,2.0,0.5898,,0.25,,1.0,1,,,,,,,,,,,,,0.7792,0.7539,4732.0,642.0,951.0,2.0,0.7684,0.7464,2094.0,34246,947070736,1005


## 02. Renaming columns

In [60]:
# Rename INSTNM column to NAME and STABBR column to STATE
df.rename(columns = {'INSTNM' : 'NAME', 'STABBR' : 'STATE'}, inplace = True)

In [61]:
# Check output
df.head()

Unnamed: 0,UNITID,OPEID,OPEID6,NAME,CITY,STATE,ZIP,ACCREDAGENCY,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LOCALE2,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,CURROPER,NPT4_PUB,NPT4_PRIV,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT4_048_PUB,NPT4_048_PRIV,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NUM4_PUB,NUM4_PRIV,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT,FEDSCHCD
0,100654,100200,1002,Alabama A & M University,Normal,AL,35762,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.783368,-86.568502,18.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8986,0.8986,430.0,520.0,420.0,510.0,370.0,457.0,475.0,465.0,414.0,16.0,19.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,957.0,957.0,0.0,4990.0,0.0186,0.912,0.0088,0.0018,0.0022,0.0016,0.0118,0.007,0.0361,0.0587,1,14444.0,,13893.0,13976.0,15995.0,18957.0,17140.0,,,,,,13913.0,,14684.0,,18281.0,,592.0,,375.0,113.0,61.0,27.0,16.0,,,,,,22489.0,,9744.0,18354.0,,7413.0,5384.0,7101.0,0.7411,0.7067,0.8987,0.6087,,1.0,,0.7503,0.0758,0.6020087884,0.0988700565,0.5691396726,0.9015873016,0.3658280922,0.1898932831,0.1051475204,0.0621468927,0.0408035154,0.2034134448,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0666666667,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0164220825,0.3494060098,0.6341719078,0.7291274325,0.5668549906,0.4579409918,0.3631512869,34779.085684,10340.346032,15500,33375,10250,15500,16000,14518,15000,19000,17500,10250,17500,14250,15000,16421,3606,1076,2530,2185,1034,387,3191,415,3162,444,2074,1532,2895,711,346.376038474076,3085,47750,32208,5500,3381,3186,2871,315,3186,2862,3186,0.8860640301,0.8527934714,20.283741368,0.07999999821186,0.5640301318,0.0091023227,0.9011299435,0.003138732,0.3658280922,32362.826114,23553.0,10340.346032,46.8400001525878,47.9799995422363,1.48000001907348,3.78999996185302,13.0,6.8600001335144,94.7399978637695,49720.22,14.8800001144409,4.84000015258789,10.75,15500,33375,346.376038474076,AAMU,1,0.4076,0.5924,12/12/1965,5039.0,2.0,153.0,963.0,SACSCC,0.5978,,0.25,,2698.0,,44.0,,2.0,2.0,0.5978,,0.25,,1.0,1,,,,,,,,,,,,,0.7057,0.7143,5343.0,1165.0,1288.0,2.0,0.7083,0.7287,2698.0,31374,922456254,1002
1,100663,105200,1052,University of Alabama at Birmingham,Birmingham,AL,35294-0110,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,33.505697,-86.799345,15.0,9.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9211,0.9211,490.0,620.0,490.0,620.0,,,555.0,555.0,,21.0,29.0,22.0,31.0,19.0,26.0,,,25.0,27.0,23.0,,1220.0,1220.0,0.0,13186.0,0.5717,0.2553,0.0334,0.0633,0.0034,0.0002,0.0457,0.0213,0.0058,0.2425,1,17005.0,,14550.0,15379.0,17892.0,19978.0,20110.0,,,,,,14830.0,,16587.0,,20050.0,,1229.0,,421.0,214.0,198.0,180.0,216.0,,,,,,24347.0,,8568.0,19704.0,,13177.0,16454.0,10717.0,0.7766,0.3632,0.6009,0.8186,,0.4648,,0.5127,0.2296,0.4276131917,0.3214086082,0.3487095003,0.5942028986,0.341223671,0.1798024967,0.1423514067,0.114589156,0.1356437488,0.1699615596,0.1537616694,0.142778693,0.1847885777,0.2005797101,0.1182608696,0.0550724638,0.031884058,0.0222668004,0.3189568706,0.658776329,0.5135084777,0.2634618968,0.1652692379,0.1076951742,61110.800384,30607.18029,15000,22500,9500,16226,15250,14000,15000,16000,17500,12500,15000,15000,15104,15000,7504,3730,3774,3168,2281,2055,5123,2381,4714,2790,4804,2700,5286,2218,233.511936049938,6302,37540,26082,6250,3500,5367,3642,1725,5367,4985,5367,0.8574622694,0.6249301286,23.60797466,0.25999999046325,0.6390907397,0.1050866406,0.6785913918,0.0031675051,0.341223671,51306.674306,34489.0,30607.18029,69.0199966430664,27.7600002288818,1.10000002384185,2.02999997138977,15.9300003051757,8.55000019073486,96.5,55735.22,10.9099998474121,3.45000004768371,10.8599996566772,15000,22500,233.511936049938,,1,0.393,0.607,12/1/1965,13134.0,2.0,650.0,8087.0,SACSCC,0.8303,,0.4514,,4130.0,,144.0,,2.0,2.0,0.8303,,0.4514,,1.0,1,,,,,,,,,,,,,0.3788,0.535,14445.0,10498.0,2228.0,2.0,0.3891,0.5414,4176.0,56997,1720042015,1052
2,100690,2503400,25034,Amridge University,Montgomery,AL,36117-3553,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,2,1,5,12.0,,32.362609,-86.17401,20.0,5.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,74.0,,,,,,,,,,,,,,,,,,,,,,,,,,1.0,351.0,0.2393,0.7151,0.0171,0.0057,0.0057,0.0,0.0,0.0,0.0171,0.5014,1,,15322.0,,,,,,15322.0,,,,,,15322.0,,,,,,5.0,,,,,,5.0,0.0,0.0,0.0,0.0,17680.0,,6900.0,6900.0,,14273.0,4206.0,4292.0,1.0,0.7673,0.0035,,,,,0.8962,0.8302,0.7736486486,0.8952702703,PrivacySuppressed,PrivacySuppressed,0.5125,0.1148648649,0.0641891892,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.05,0.4625,0.4875,0.5945945946,0.3378378378,0.2432432432,0.1587837838,25211.032258,20596.158491,10500,27334,9500,9500,19000,25000,7646,12038,9500,15509,9500,17025,11500,9500,514,92,422,397,91,26,60,454,464,50,327,187,458,56,283.680678221734,398,38455,24250,4750,3166,296,31,265,296,240,296,0.9560810811,0.8648648649,33.672297297,0.82999998331069,0.6486486486,0.2364864865,0.1047297297,0.0405405405,0.5125,21079.472973,15033.5,20596.158491,70.8799972534179,22.5300006866455,1.28999996185302,6.94000005722046,13.2299995422363,7.01000022888183,94.0899963378906,53683.7,10.6499996185302,3.59999990463256,10.8400001525878,10500,27334,283.680678221734,Southern Christian University Regions University,1,0.3191,0.6809,3/26/1987,318.0,1.0,,404.0,SACSCC,0.2143,,0.1429,,14.0,,14.0,,4.0,4.0,PrivacySuppressed,,PrivacySuppressed,,2.0,1,,,,,,,,,,,,,1.0,1.0,440.0,527.0,5.0,4.0,PrivacySuppressed,PrivacySuppressed,24.0,4463,174222020,16885
3,100706,105500,1055,University of Alabama in Huntsville,Huntsville,AL,35899,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,34.724557,-86.640449,16.0,15.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.8087,0.8087,560.0,700.0,450.0,680.0,,,630.0,565.0,,25.0,31.0,25.0,34.0,24.0,30.0,,,28.0,30.0,27.0,,1314.0,1314.0,0.0,7458.0,0.7167,0.0969,0.0528,0.0381,0.0095,0.0008,0.0296,0.0223,0.0333,0.1443,1,20909.0,,17561.0,18991.0,21396.0,23204.0,23406.0,,,,,,18147.0,,20356.0,,23315.0,,585.0,,134.0,93.0,122.0,107.0,129.0,,,,,,23441.0,,10714.0,22362.0,,8677.0,9242.0,9442.0,0.6544,0.2698,0.6176,0.8288,,0.0909,,0.4192,0.1842,0.374633738,0.2515696944,0.26901566,0.6888519135,0.3101321586,0.1377145249,0.1469233989,0.1506906656,0.1900376727,0.1448545861,0.1605145414,0.1817673378,0.2438478747,0.1164725458,0.1064891847,0.0582362729,0.0299500832,0.0198237885,0.29030837,0.6898678414,0.5290916702,0.2737547091,0.1573880285,0.1025533696,72240.892617,27941.821963,14476,21607,9000,16250,14750,12500,12750,18569,17014,11899,15250,13333,14943,13102,3021,1374,1647,1168,827,1026,2067,954,1808,1213,1375,1646,1997,1024,224.244106765823,2626,36250,26750,5500,3472,2389,1788,601,2389,2270,2389,0.8652155714,0.5571368774,22.727919632,0.28999999165534,0.4763499372,0.1004604437,0.7484303056,PrivacySuppressed,0.3101321586,61096.588949,44787.0,27941.821963,76.3799972534179,18.9799995422363,1.41999995708465,2.54999995231628,17.6700000762939,8.90999984741211,95.2699966430664,58688.62,9.36999988555908,3.64000010490417,10.9300003051757,14476,21607,224.244106765823,UAH University of Alabama Huntsville,1,0.5796,0.4204,12/1/1965,7090.0,2.0,213.0,2065.0,SACSCC,0.8269,,0.35,,2531.0,,40.0,,2.0,4.0,0.8269,,0.35,,1.0,1,,,,,,,,,,,,,0.2707,0.4556,8145.0,2443.0,1341.0,2.0,0.2378,0.4402,2544.0,19702,407184805,1055
4,100724,100500,1005,Alabama State University,Montgomery,AL,36104-0271,Southern Association of Colleges and Schools C...,3.0,0,1,1,3,4,1,1,5,12.0,,32.364317,-86.295677,19.0,10.0,14.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.9774,0.9774,440.0,520.0,420.0,510.0,,,480.0,465.0,,16.0,20.0,14.0,20.0,15.0,18.0,,,18.0,17.0,17.0,,972.0,972.0,0.0,3903.0,0.0167,0.9352,0.0095,0.0041,0.0013,0.0005,0.0102,0.0102,0.0123,0.0666,1,13043.0,,11344.0,14855.0,18390.0,18863.0,14833.0,,,,,,12113.0,,16104.0,,17819.0,,523.0,,346.0,97.0,53.0,20.0,7.0,,,,,,21476.0,,11068.0,19396.0,,10160.0,8527.0,7754.0,0.5826,0.7448,0.865,0.5868,,0.125,,0.7845,0.0848,0.6146166134,0.107428115,0.5776286353,0.9219330855,0.3434343434,0.178514377,0.1126198083,0.052715655,0.0415335463,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,PrivacySuppressed,0.0188246097,0.3246097337,0.6565656566,0.6625399361,0.4972044728,0.3841853035,0.2903354633,34468.571812,8551.802974,18679,32000,11161,18750,18500,18246,17500,23925,19056,12000,19500,15525,19000,17500,3609,1149,2460,2299,965,345,3162,447,3237,372,2276,1333,2899,710,332.105864604357,3486,45000,32263,5784,3500,2504,2235,269,2504,2178,2504,0.8889776358,0.874600639,20.130990415,0.10999999940395,0.6134185304,0.0079872204,0.892571885,PrivacySuppressed,0.3434343434,31684.382188,22080.5,8551.802974,42.6899986267089,52.3199996948242,1.40999996662139,4.09000015258789,11.8100004196167,6.76000022888183,94.5299987792968,46065.2,16.9599990844726,4.80999994277954,10.6700000762939,18679,32000,332.105864604357,,1,0.371,0.629,12/1/1965,4208.0,2.0,,510.0,SACSCC,0.5898,,0.25,,2094.0,,36.0,,2.0,2.0,0.5898,,0.25,,1.0,1,,,,,,,,,,,,,0.7792,0.7539,4732.0,642.0,951.0,2.0,0.7684,0.7464,2094.0,34246,947070736,1005


## 03. Mixed-type columns

In [62]:
# Check for mixed types
for col in df.columns.tolist():
    weird = (df[[col]].applymap(type) != df[[col]].iloc[0].apply(type)).any(axis = 1)
    if len (df[weird]) > 0:
        print(col)

ACCREDAGENCY
INC_PCT_LO
DEP_STAT_PCT_IND
DEP_INC_PCT_LO
IND_INC_PCT_LO
PAR_ED_PCT_1STGEN
INC_PCT_M1
INC_PCT_M2
INC_PCT_H1
INC_PCT_H2
DEP_INC_PCT_M1
DEP_INC_PCT_M2
DEP_INC_PCT_H1
DEP_INC_PCT_H2
IND_INC_PCT_M1
IND_INC_PCT_M2
IND_INC_PCT_H1
IND_INC_PCT_H2
PAR_ED_PCT_MS
PAR_ED_PCT_HS
PAR_ED_PCT_PS
APPL_SCH_PCT_GE2
APPL_SCH_PCT_GE3
APPL_SCH_PCT_GE4
APPL_SCH_PCT_GE5
DEP_INC_AVG
IND_INC_AVG
DEBT_MDN
GRAD_DEBT_MDN
WDRAW_DEBT_MDN
LO_INC_DEBT_MDN
MD_INC_DEBT_MDN
HI_INC_DEBT_MDN
DEP_DEBT_MDN
IND_DEBT_MDN
PELL_DEBT_MDN
NOPELL_DEBT_MDN
FEMALE_DEBT_MDN
MALE_DEBT_MDN
FIRSTGEN_DEBT_MDN
NOTFIRSTGEN_DEBT_MDN
DEBT_N
GRAD_DEBT_N
WDRAW_DEBT_N
LO_INC_DEBT_N
MD_INC_DEBT_N
HI_INC_DEBT_N
DEP_DEBT_N
IND_DEBT_N
PELL_DEBT_N
NOPELL_DEBT_N
FEMALE_DEBT_N
MALE_DEBT_N
FIRSTGEN_DEBT_N
NOTFIRSTGEN_DEBT_N
GRAD_DEBT_MDN10YR
CUML_DEBT_N
CUML_DEBT_P90
CUML_DEBT_P75
CUML_DEBT_P25
CUML_DEBT_P10
INC_N
DEP_INC_N
IND_INC_N
DEP_STAT_N
PAR_ED_N
APPL_SCH_N
LOAN_EVER
PELL_EVER
AGE_ENTRY
AGEGE24
FEMALE
MARRIED
DEPENDENT
VETERAN
FIRST

In [63]:
# Replace PrivacySuppressed with NaN
df = df.replace(to_replace = 'PrivacySuppressed', value = np.nan)

In [64]:
# Fix columns with string data types
df[['ACCREDAGENCY', 'ALIAS', 'T4APPROVALDATE', 'ACCREDCODE', 'FEDSCHCD']] = df[['ACCREDAGENCY', 'ALIAS', 'T4APPROVALDATE', 'ACCREDCODE', 'FEDSCHCD']].astype('str')

In [66]:
# Check data types were changed
df[['ACCREDAGENCY', 'ALIAS', 'T4APPROVALDATE', 'ACCREDCODE', 'FEDSCHCD']].dtypes

ACCREDAGENCY      object
ALIAS             object
T4APPROVALDATE    object
ACCREDCODE        object
FEDSCHCD          object
dtype: object

In [70]:
# Fix some columns with float data types
df[['INC_PCT_LO', 'DEP_STAT_PCT_IND', 'DEP_INC_PCT_LO', 'IND_INC_PCT_LO', 'PAR_ED_PCT_1STGEN']] = df[['INC_PCT_LO', 'DEP_STAT_PCT_IND', 'DEP_INC_PCT_LO', 'IND_INC_PCT_LO', 'PAR_ED_PCT_1STGEN']].astype(float)

In [71]:
# Check data types were changed
df[['INC_PCT_LO', 'DEP_STAT_PCT_IND', 'DEP_INC_PCT_LO', 'IND_INC_PCT_LO', 'PAR_ED_PCT_1STGEN']].dtypes

INC_PCT_LO           float64
DEP_STAT_PCT_IND     float64
DEP_INC_PCT_LO       float64
IND_INC_PCT_LO       float64
PAR_ED_PCT_1STGEN    float64
dtype: object

In [72]:
# Fix some columns with float data types
df[['INC_PCT_M1', 'INC_PCT_M2', 'INC_PCT_H1', 'INC_PCT_H2', 'DEP_INC_PCT_M1', 'DEP_INC_PCT_M2']] = df[['INC_PCT_M1', 'INC_PCT_M2', 'INC_PCT_H1', 'INC_PCT_H2', 'DEP_INC_PCT_M1', 'DEP_INC_PCT_M2']].astype(float)

In [73]:
# Check data types were changed
df[['INC_PCT_M1', 'INC_PCT_M2', 'INC_PCT_H1', 'INC_PCT_H2', 'DEP_INC_PCT_M1', 'DEP_INC_PCT_M2']].dtypes

INC_PCT_M1        float64
INC_PCT_M2        float64
INC_PCT_H1        float64
INC_PCT_H2        float64
DEP_INC_PCT_M1    float64
DEP_INC_PCT_M2    float64
dtype: object

In [74]:
# Fix some columns with float data types
df[['DEP_INC_PCT_H1', 'DEP_INC_PCT_H2', 'IND_INC_PCT_M1', 'IND_INC_PCT_M2', 'IND_INC_PCT_H1', 'IND_INC_PCT_H2']] = df[['DEP_INC_PCT_H1', 'DEP_INC_PCT_H2', 'IND_INC_PCT_M1', 'IND_INC_PCT_M2', 'IND_INC_PCT_H1', 'IND_INC_PCT_H2']].astype(float)

In [75]:
# Check data types were changed
df[['DEP_INC_PCT_H1', 'DEP_INC_PCT_H2', 'IND_INC_PCT_M1', 'IND_INC_PCT_M2', 'IND_INC_PCT_H1', 'IND_INC_PCT_H2']].dtypes

DEP_INC_PCT_H1    float64
DEP_INC_PCT_H2    float64
IND_INC_PCT_M1    float64
IND_INC_PCT_M2    float64
IND_INC_PCT_H1    float64
IND_INC_PCT_H2    float64
dtype: object

In [76]:
# Fix some columns with float data types
df[['PAR_ED_PCT_MS', 'PAR_ED_PCT_HS', 'PAR_ED_PCT_PS', 'APPL_SCH_PCT_GE2', 'APPL_SCH_PCT_GE3']] = df[['PAR_ED_PCT_MS', 'PAR_ED_PCT_HS', 'PAR_ED_PCT_PS', 'APPL_SCH_PCT_GE2', 'APPL_SCH_PCT_GE3']].astype(float)

In [77]:
# Check data types were changed
df[['PAR_ED_PCT_MS', 'PAR_ED_PCT_HS', 'PAR_ED_PCT_PS', 'APPL_SCH_PCT_GE2', 'APPL_SCH_PCT_GE3']].dtypes

PAR_ED_PCT_MS       float64
PAR_ED_PCT_HS       float64
PAR_ED_PCT_PS       float64
APPL_SCH_PCT_GE2    float64
APPL_SCH_PCT_GE3    float64
dtype: object

In [78]:
# Fix some columns with float data types
df[['APPL_SCH_PCT_GE4', 'APPL_SCH_PCT_GE5', 'DEP_INC_AVG', 'IND_INC_AVG']] = df[['APPL_SCH_PCT_GE4', 'APPL_SCH_PCT_GE5', 'DEP_INC_AVG', 'IND_INC_AVG']].astype(float)

In [79]:
# Check data types were changed
df[['APPL_SCH_PCT_GE4', 'APPL_SCH_PCT_GE5', 'DEP_INC_AVG', 'IND_INC_AVG']].dtypes

APPL_SCH_PCT_GE4    float64
APPL_SCH_PCT_GE5    float64
DEP_INC_AVG         float64
IND_INC_AVG         float64
dtype: object

In [81]:
# Fix some columns with float data types
df[['DEBT_MDN', 'GRAD_DEBT_MDN', 'WDRAW_DEBT_MDN', 'LO_INC_DEBT_MDN', 'MD_INC_DEBT_MDN', 'HI_INC_DEBT_MDN']] = df[['DEBT_MDN', 'GRAD_DEBT_MDN', 'WDRAW_DEBT_MDN', 'LO_INC_DEBT_MDN', 'MD_INC_DEBT_MDN', 'HI_INC_DEBT_MDN']].astype(float)

In [82]:
# Check data types were changed
df[['DEBT_MDN', 'GRAD_DEBT_MDN', 'WDRAW_DEBT_MDN', 'LO_INC_DEBT_MDN', 'MD_INC_DEBT_MDN', 'HI_INC_DEBT_MDN']].dtypes

DEBT_MDN           float64
GRAD_DEBT_MDN      float64
WDRAW_DEBT_MDN     float64
LO_INC_DEBT_MDN    float64
MD_INC_DEBT_MDN    float64
HI_INC_DEBT_MDN    float64
dtype: object

In [84]:
# Fix some columns with float data types
df[['DEP_DEBT_MDN', 'IND_DEBT_MDN', 'PELL_DEBT_MDN', 'NOPELL_DEBT_MDN', 'FEMALE_DEBT_MDN']] = df[['DEP_DEBT_MDN', 'IND_DEBT_MDN', 'PELL_DEBT_MDN', 'NOPELL_DEBT_MDN', 'FEMALE_DEBT_MDN']].astype(float)

In [85]:
# Check data types were changed
df[['DEP_DEBT_MDN', 'IND_DEBT_MDN', 'PELL_DEBT_MDN', 'NOPELL_DEBT_MDN', 'FEMALE_DEBT_MDN']].dtypes

DEP_DEBT_MDN       float64
IND_DEBT_MDN       float64
PELL_DEBT_MDN      float64
NOPELL_DEBT_MDN    float64
FEMALE_DEBT_MDN    float64
dtype: object

In [86]:
# Fix some columns with float data types
df[['MALE_DEBT_MDN', 'FIRSTGEN_DEBT_MDN', 'NOTFIRSTGEN_DEBT_MDN', 'DEBT_N', 'GRAD_DEBT_N', 'WDRAW_DEBT_N']] = df[['MALE_DEBT_MDN', 'FIRSTGEN_DEBT_MDN', 'NOTFIRSTGEN_DEBT_MDN', 'DEBT_N', 'GRAD_DEBT_N', 'WDRAW_DEBT_N']].astype(float)

In [87]:
# Check data types were changed
df[['MALE_DEBT_MDN', 'FIRSTGEN_DEBT_MDN', 'NOTFIRSTGEN_DEBT_MDN', 'DEBT_N', 'GRAD_DEBT_N', 'WDRAW_DEBT_N']].dtypes

MALE_DEBT_MDN           float64
FIRSTGEN_DEBT_MDN       float64
NOTFIRSTGEN_DEBT_MDN    float64
DEBT_N                  float64
GRAD_DEBT_N             float64
WDRAW_DEBT_N            float64
dtype: object

In [88]:
# Fix some columns with float data types
df[['LO_INC_DEBT_N','MD_INC_DEBT_N', 'HI_INC_DEBT_N', 'DEP_DEBT_N', 'IND_DEBT_N', 'PELL_DEBT_N', 'NOPELL_DEBT_N']] = df[['LO_INC_DEBT_N','MD_INC_DEBT_N', 'HI_INC_DEBT_N', 'DEP_DEBT_N', 'IND_DEBT_N', 'PELL_DEBT_N', 'NOPELL_DEBT_N']].astype(float)

In [89]:
# Check data types were changed
df[['LO_INC_DEBT_N','MD_INC_DEBT_N', 'HI_INC_DEBT_N', 'DEP_DEBT_N', 'IND_DEBT_N', 'PELL_DEBT_N', 'NOPELL_DEBT_N']].dtypes

LO_INC_DEBT_N    float64
MD_INC_DEBT_N    float64
HI_INC_DEBT_N    float64
DEP_DEBT_N       float64
IND_DEBT_N       float64
PELL_DEBT_N      float64
NOPELL_DEBT_N    float64
dtype: object

In [90]:
# Fix some columns with float data types
df[['FEMALE_DEBT_N', 'MALE_DEBT_N', 'FIRSTGEN_DEBT_N', 'NOTFIRSTGEN_DEBT_N', 'GRAD_DEBT_MDN10YR']] = df[['FEMALE_DEBT_N', 'MALE_DEBT_N', 'FIRSTGEN_DEBT_N', 'NOTFIRSTGEN_DEBT_N', 'GRAD_DEBT_MDN10YR']].astype(float)

In [91]:
# Check data types were changed
df[['FEMALE_DEBT_N', 'MALE_DEBT_N', 'FIRSTGEN_DEBT_N', 'NOTFIRSTGEN_DEBT_N', 'GRAD_DEBT_MDN10YR']].dtypes

FEMALE_DEBT_N         float64
MALE_DEBT_N           float64
FIRSTGEN_DEBT_N       float64
NOTFIRSTGEN_DEBT_N    float64
GRAD_DEBT_MDN10YR     float64
dtype: object

In [92]:
# Fix some columns with float data types
df[['CUML_DEBT_N', 'CUML_DEBT_P90', 'CUML_DEBT_P75', 'CUML_DEBT_P25', 'CUML_DEBT_P10', 'INC_N', 'DEP_INC_N', 'IND_INC_N', 'DEP_STAT_N']] = df[['CUML_DEBT_N', 'CUML_DEBT_P90', 'CUML_DEBT_P75', 'CUML_DEBT_P25', 'CUML_DEBT_P10', 'INC_N', 'DEP_INC_N', 'IND_INC_N', 'DEP_STAT_N']].astype(float)

In [93]:
# Check data types were changed
df[['CUML_DEBT_N', 'CUML_DEBT_P90', 'CUML_DEBT_P75', 'CUML_DEBT_P25', 'CUML_DEBT_P10', 'INC_N', 'DEP_INC_N', 'IND_INC_N', 'DEP_STAT_N']].dtypes

CUML_DEBT_N      float64
CUML_DEBT_P90    float64
CUML_DEBT_P75    float64
CUML_DEBT_P25    float64
CUML_DEBT_P10    float64
INC_N            float64
DEP_INC_N        float64
IND_INC_N        float64
DEP_STAT_N       float64
dtype: object

In [94]:
# Fix some columns with float data types
df[['PAR_ED_N', 'APPL_SCH_N', 'LOAN_EVER', 'PELL_EVER', 'AGE_ENTRY', 'AGEGE24', 'FEMALE', 'MARRIED', 'DEPENDENT', 'VETERAN', 'FIRST_GEN']] = df[['PAR_ED_N', 'APPL_SCH_N', 'LOAN_EVER', 'PELL_EVER', 'AGE_ENTRY', 'AGEGE24', 'FEMALE', 'MARRIED', 'DEPENDENT', 'VETERAN', 'FIRST_GEN']].astype(float)

In [95]:
# Check data types were changed
df[['PAR_ED_N', 'APPL_SCH_N', 'LOAN_EVER', 'PELL_EVER', 'AGE_ENTRY', 'AGEGE24', 'FEMALE', 'MARRIED', 'DEPENDENT', 'VETERAN', 'FIRST_GEN']].dtypes

PAR_ED_N      float64
APPL_SCH_N    float64
LOAN_EVER     float64
PELL_EVER     float64
AGE_ENTRY     float64
AGEGE24       float64
FEMALE        float64
MARRIED       float64
DEPENDENT     float64
VETERAN       float64
FIRST_GEN     float64
dtype: object

In [96]:
# Fix some columns with float data types
df[['FAMINC', 'MD_FAMINC', 'FAMINC_IND', 'PCT_WHITE', 'PCT_BLACK', 'PCT_ASIAN', 'PCT_HISPANIC', 'PCT_BA']] = df[['FAMINC', 'MD_FAMINC', 'FAMINC_IND', 'PCT_WHITE', 'PCT_BLACK', 'PCT_ASIAN', 'PCT_HISPANIC', 'PCT_BA']].astype(float)

In [97]:
# Check data types were changed
df[['FAMINC', 'MD_FAMINC', 'FAMINC_IND', 'PCT_WHITE', 'PCT_BLACK', 'PCT_ASIAN', 'PCT_HISPANIC', 'PCT_BA']].dtypes

FAMINC          float64
MD_FAMINC       float64
FAMINC_IND      float64
PCT_WHITE       float64
PCT_BLACK       float64
PCT_ASIAN       float64
PCT_HISPANIC    float64
PCT_BA          float64
dtype: object

In [98]:
# Fix some columns with float data types
df[['PCT_GRAD_PROF', 'PCT_BORN_US', 'MEDIAN_HH_INC', 'POVERTY_RATE', 'UNEMP_RATE', 'LN_MEDIAN_HH_INC', 'DEBT_MDN_SUPP', 'GRAD_DEBT_MDN_SUPP']] = df[['PCT_GRAD_PROF', 'PCT_BORN_US', 'MEDIAN_HH_INC', 'POVERTY_RATE', 'UNEMP_RATE', 'LN_MEDIAN_HH_INC', 'DEBT_MDN_SUPP', 'GRAD_DEBT_MDN_SUPP']].astype(float)

In [99]:
# Check data types were changed
df[['PCT_GRAD_PROF', 'PCT_BORN_US', 'MEDIAN_HH_INC', 'POVERTY_RATE', 'UNEMP_RATE', 'LN_MEDIAN_HH_INC', 'DEBT_MDN_SUPP', 'GRAD_DEBT_MDN_SUPP']].dtypes

PCT_GRAD_PROF         float64
PCT_BORN_US           float64
MEDIAN_HH_INC         float64
POVERTY_RATE          float64
UNEMP_RATE            float64
LN_MEDIAN_HH_INC      float64
DEBT_MDN_SUPP         float64
GRAD_DEBT_MDN_SUPP    float64
dtype: object

In [100]:
# Fix some columns with float data types
df[['GRAD_DEBT_MDN10YR_SUPP', 'RET_FT4_POOLED_SUPP', 'RET_FTL4_POOLED_SUPP', 'RET_PT4_POOLED_SUPP']] = df[['GRAD_DEBT_MDN10YR_SUPP', 'RET_FT4_POOLED_SUPP', 'RET_FTL4_POOLED_SUPP', 'RET_PT4_POOLED_SUPP']].astype(float)

In [101]:
# Check data types were changed
df[['GRAD_DEBT_MDN10YR_SUPP', 'RET_FT4_POOLED_SUPP', 'RET_FTL4_POOLED_SUPP', 'RET_PT4_POOLED_SUPP']].dtypes

GRAD_DEBT_MDN10YR_SUPP    float64
RET_FT4_POOLED_SUPP       float64
RET_FTL4_POOLED_SUPP      float64
RET_PT4_POOLED_SUPP       float64
dtype: object

In [102]:
# Fix some columns with float data types
df[['RET_PTL4_POOLED_SUPP', 'FTFTPCTPELL_POOLED_SUPP', 'FTFTPCTFLOAN_POOLED_SUPP', 'LPSTAFFORD_CNT', 'LPSTAFFORD_AMT']] = df[['RET_PTL4_POOLED_SUPP', 'FTFTPCTPELL_POOLED_SUPP', 'FTFTPCTFLOAN_POOLED_SUPP', 'LPSTAFFORD_CNT', 'LPSTAFFORD_AMT']].astype(float)

In [103]:
# Check data types were changed
df[['RET_PTL4_POOLED_SUPP', 'FTFTPCTPELL_POOLED_SUPP', 'FTFTPCTFLOAN_POOLED_SUPP', 'LPSTAFFORD_CNT', 'LPSTAFFORD_AMT']].dtypes

RET_PTL4_POOLED_SUPP        float64
FTFTPCTPELL_POOLED_SUPP     float64
FTFTPCTFLOAN_POOLED_SUPP    float64
LPSTAFFORD_CNT              float64
LPSTAFFORD_AMT              float64
dtype: object

In [104]:
# Run mixed type check again
for col in df.columns.tolist():
    weird = (df[[col]].applymap(type) != df[[col]].iloc[0].apply(type)).any(axis = 1)
    if len (df[weird]) > 0:
        print(col)

## 04. Missing values

In [105]:
# Check for missing values
df.isnull().sum()

UNITID                         0
OPEID                          0
OPEID6                         0
NAME                           0
CITY                           0
                            ... 
FTFTPCTFLOAN_POOLED_SUPP    1353
SCUGFFN_POOLED               774
LPSTAFFORD_CNT               399
LPSTAFFORD_AMT               399
FEDSCHCD                       0
Length: 261, dtype: int64

In [106]:
# Change options to display all rows
pd.options.display.max_rows = None

In [107]:
# Check for missing values
df.isnull().sum()

UNITID                         0
OPEID                          0
OPEID6                         0
NAME                           0
CITY                           0
STATE                          0
ZIP                            0
ACCREDAGENCY                   0
SCH_DEG                      282
HCM2                           0
MAIN                           0
NUMBRANCH                      0
PREDDEG                        0
HIGHDEG                        0
CONTROL                        0
ST_FIPS                        0
REGION                         0
LOCALE                       475
LOCALE2                     6806
LATITUDE                     475
LONGITUDE                    475
CCBASIC                      475
CCUGPROF                     475
CCSIZSET                     475
HBCU                         483
PBI                          483
ANNHI                        483
TRIBAL                       483
AANAPII                      483
HSI                          483
NANTI     

In [137]:
# Drop LOCALE2 column
df = df.drop(columns = 'LOCALE2')

In [138]:
# Get total count of missing values
df.isnull().sum().sum()

668356

## 05. Duplicate values

In [139]:
# Search for full duplicates
df_dups = df[df.duplicated()]

In [140]:
# Check output
df_dups

Unnamed: 0,UNITID,OPEID,OPEID6,NAME,CITY,STATE,ZIP,ACCREDAGENCY,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,CURROPER,NPT4_PUB,NPT4_PRIV,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT4_048_PUB,NPT4_048_PRIV,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NUM4_PUB,NUM4_PRIV,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ALIAS,ICLEVEL,UGDS_MEN,UGDS_WOMEN,T4APPROVALDATE,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,ACCREDCODE,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT,FEDSCHCD


# 04. Get info about data set

In [141]:
# Get info about data set
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6806 entries, 0 to 6805
Columns: 260 entries, UNITID to FEDSCHCD
dtypes: float64(237), int64(14), object(9)
memory usage: 13.5+ MB


In [142]:
# Get descriptive stats
df.describe()

Unnamed: 0,UNITID,OPEID,OPEID6,SCH_DEG,HCM2,MAIN,NUMBRANCH,PREDDEG,HIGHDEG,CONTROL,ST_FIPS,REGION,LOCALE,LATITUDE,LONGITUDE,CCBASIC,CCUGPROF,CCSIZSET,HBCU,PBI,ANNHI,TRIBAL,AANAPII,HSI,NANTI,MENONLY,WOMENONLY,RELAFFIL,ADM_RATE,ADM_RATE_ALL,SATVR25,SATVR75,SATMT25,SATMT75,SATWR25,SATWR75,SATVRMID,SATMTMID,SATWRMID,ACTCM25,ACTCM75,ACTEN25,ACTEN75,ACTMT25,ACTMT75,ACTWR25,ACTWR75,ACTCMMID,ACTENMID,ACTMTMID,ACTWRMID,SAT_AVG,SAT_AVG_ALL,DISTANCEONLY,UGDS,UGDS_WHITE,UGDS_BLACK,UGDS_HISP,UGDS_ASIAN,UGDS_AIAN,UGDS_NHPI,UGDS_2MOR,UGDS_NRA,UGDS_UNKN,PPTUG_EF,CURROPER,NPT4_PUB,NPT4_PRIV,NPT41_PUB,NPT42_PUB,NPT43_PUB,NPT44_PUB,NPT45_PUB,NPT41_PRIV,NPT42_PRIV,NPT43_PRIV,NPT44_PRIV,NPT45_PRIV,NPT4_048_PUB,NPT4_048_PRIV,NPT4_3075_PUB,NPT4_3075_PRIV,NPT4_75UP_PUB,NPT4_75UP_PRIV,NUM4_PUB,NUM4_PRIV,NUM41_PUB,NUM42_PUB,NUM43_PUB,NUM44_PUB,NUM45_PUB,NUM41_PRIV,NUM42_PRIV,NUM43_PRIV,NUM44_PRIV,NUM45_PRIV,COSTT4_A,COSTT4_P,TUITIONFEE_IN,TUITIONFEE_OUT,TUITIONFEE_PROG,TUITFTE,INEXPFTE,AVGFACSAL,PFTFAC,PCTPELL,PFTFTUG1_EF,RET_FT4,RET_FTL4,RET_PT4,RET_PTL4,PCTFLOAN,UG25ABV,INC_PCT_LO,DEP_STAT_PCT_IND,DEP_INC_PCT_LO,IND_INC_PCT_LO,PAR_ED_PCT_1STGEN,INC_PCT_M1,INC_PCT_M2,INC_PCT_H1,INC_PCT_H2,DEP_INC_PCT_M1,DEP_INC_PCT_M2,DEP_INC_PCT_H1,DEP_INC_PCT_H2,IND_INC_PCT_M1,IND_INC_PCT_M2,IND_INC_PCT_H1,IND_INC_PCT_H2,PAR_ED_PCT_MS,PAR_ED_PCT_HS,PAR_ED_PCT_PS,APPL_SCH_PCT_GE2,APPL_SCH_PCT_GE3,APPL_SCH_PCT_GE4,APPL_SCH_PCT_GE5,DEP_INC_AVG,IND_INC_AVG,DEBT_MDN,GRAD_DEBT_MDN,WDRAW_DEBT_MDN,LO_INC_DEBT_MDN,MD_INC_DEBT_MDN,HI_INC_DEBT_MDN,DEP_DEBT_MDN,IND_DEBT_MDN,PELL_DEBT_MDN,NOPELL_DEBT_MDN,FEMALE_DEBT_MDN,MALE_DEBT_MDN,FIRSTGEN_DEBT_MDN,NOTFIRSTGEN_DEBT_MDN,DEBT_N,GRAD_DEBT_N,WDRAW_DEBT_N,LO_INC_DEBT_N,MD_INC_DEBT_N,HI_INC_DEBT_N,DEP_DEBT_N,IND_DEBT_N,PELL_DEBT_N,NOPELL_DEBT_N,FEMALE_DEBT_N,MALE_DEBT_N,FIRSTGEN_DEBT_N,NOTFIRSTGEN_DEBT_N,GRAD_DEBT_MDN10YR,CUML_DEBT_N,CUML_DEBT_P90,CUML_DEBT_P75,CUML_DEBT_P25,CUML_DEBT_P10,INC_N,DEP_INC_N,IND_INC_N,DEP_STAT_N,PAR_ED_N,APPL_SCH_N,LOAN_EVER,PELL_EVER,AGE_ENTRY,AGEGE24,FEMALE,MARRIED,DEPENDENT,VETERAN,FIRST_GEN,FAMINC,MD_FAMINC,FAMINC_IND,PCT_WHITE,PCT_BLACK,PCT_ASIAN,PCT_HISPANIC,PCT_BA,PCT_GRAD_PROF,PCT_BORN_US,MEDIAN_HH_INC,POVERTY_RATE,UNEMP_RATE,LN_MEDIAN_HH_INC,DEBT_MDN_SUPP,GRAD_DEBT_MDN_SUPP,GRAD_DEBT_MDN10YR_SUPP,ICLEVEL,UGDS_MEN,UGDS_WOMEN,D_PCTPELL_PCTFLOAN,OPENADMP,UGNONDS,GRADS,RET_FT4_POOLED,RET_FTL4_POOLED,RET_PT4_POOLED,RET_PTL4_POOLED,RET_FT_DEN4_POOLED,RET_FT_DENL4_POOLED,RET_PT_DEN4_POOLED,RET_PT_DENL4_POOLED,POOLYRSRET_FT,POOLYRSRET_PT,RET_FT4_POOLED_SUPP,RET_FTL4_POOLED_SUPP,RET_PT4_POOLED_SUPP,RET_PTL4_POOLED_SUPP,SCHTYPE,OPEFLAG,CIPTFBS1,CIPTFBS2,CIPTFBS3,CIPTFBS4,CIPTFBS5,CIPTFBS6,CIPTFBSANNUAL1,CIPTFBSANNUAL2,CIPTFBSANNUAL3,CIPTFBSANNUAL4,CIPTFBSANNUAL5,CIPTFBSANNUAL6,FTFTPCTPELL,FTFTPCTFLOAN,UG12MN,G12MN,SCUGFFN,POOLYRS_FTFTAIDPCT,FTFTPCTPELL_POOLED_SUPP,FTFTPCTFLOAN_POOLED_SUPP,SCUGFFN_POOLED,LPSTAFFORD_CNT,LPSTAFFORD_AMT
count,6806.0,6806.0,6806.0,6524.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6806.0,6331.0,6331.0,6331.0,6331.0,6331.0,6331.0,6323.0,6323.0,6323.0,6323.0,6323.0,6323.0,6323.0,6331.0,6331.0,911.0,2006.0,2242.0,1239.0,1239.0,1242.0,1242.0,732.0,732.0,1239.0,1242.0,732.0,1273.0,1273.0,1199.0,1199.0,1199.0,1199.0,325.0,325.0,1273.0,1199.0,1199.0,325.0,1298.0,1426.0,6331.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6041.0,6013.0,6806.0,1878.0,3727.0,1869.0,1795.0,1745.0,1559.0,1338.0,3661.0,2944.0,2669.0,2172.0,1814.0,1875.0,3698.0,1818.0,3082.0,1587.0,2326.0,1878.0,3728.0,1878.0,1878.0,1878.0,1878.0,1878.0,3727.0,3727.0,3727.0,3727.0,3727.0,3431.0,2175.0,3865.0,3621.0,2361.0,6304.0,6304.0,4012.0,3623.0,6014.0,5705.0,2098.0,3194.0,1309.0,1798.0,6014.0,5872.0,5893.0,5781.0,4713.0,4713.0,5477.0,5304.0,4755.0,4154.0,4125.0,3792.0,3013.0,1718.0,1703.0,3794.0,3013.0,1718.0,1703.0,4176.0,4185.0,5477.0,5355.0,4638.0,4165.0,4305.0,5800.0,5800.0,5740.0,5307.0,5156.0,5220.0,4446.0,4440.0,5044.0,5044.0,4846.0,4846.0,4602.0,4602.0,4743.0,4743.0,5855.0,5405.0,5405.0,5496.0,4858.0,4855.0,5394.0,5394.0,5198.0,5198.0,4911.0,4911.0,5131.0,5131.0,5307.0,5656.0,4895.0,5388.0,5388.0,4895.0,6180.0,5800.0,5800.0,6180.0,5504.0,6180.0,4936.0,5149.0,6180.0,4673.0,5314.0,5324.0,5781.0,2336.0,5477.0,6180.0,6180.0,5800.0,4670.0,4670.0,4670.0,4670.0,4634.0,4634.0,4634.0,4670.0,4670.0,4670.0,4670.0,5615.0,5186.0,5186.0,6806.0,6041.0,6041.0,6014.0,5880.0,2867.0,2073.0,2201.0,3253.0,1615.0,1936.0,2418.0,3293.0,2001.0,2019.0,5711.0,4020.0,1962.0,2943.0,675.0,1442.0,6425.0,6806.0,2403.0,1908.0,1513.0,1158.0,839.0,638.0,2403.0,1908.0,1513.0,1158.0,839.0,638.0,5740.0,5740.0,6030.0,2072.0,6024.0,6032.0,5453.0,5453.0,6032.0,6407.0,6407.0
mean,2126810.0,1784672.0,16671.262269,1.938228,0.007934,0.785336,3.523509,1.833823,2.222892,2.08757,29.032912,4.613135,19.884378,37.374743,-90.314421,9.922287,3.684568,4.520771,0.015815,0.015973,0.005693,0.005535,0.025621,0.072908,0.004428,0.009635,0.005528,55.613611,0.678958,0.681198,516.617433,613.322034,510.353462,609.377617,463.353825,569.61612,565.009685,559.904992,516.523224,20.609584,25.958366,19.718098,26.309425,19.367807,25.386155,6.581538,8.390769,23.535742,23.264387,22.643036,7.698462,1141.174114,1147.656381,0.008214,2522.160735,0.49179,0.179735,0.181379,0.037811,0.013504,0.004573,0.03077,0.021385,0.035911,0.228367,0.950485,10010.15229,19153.949826,8192.315677,8887.431198,11253.812607,13787.00449,15273.18012,17300.208959,18373.194293,20440.384039,23315.191068,26398.55237,8435.453867,17485.478908,9982.357536,19155.016223,14193.072464,24612.271281,525.988818,141.060622,228.787007,92.435037,77.924388,57.394569,69.447817,60.220016,18.163671,17.48323,16.382345,28.848135,26956.896823,20229.456092,15476.787322,18906.769125,15733.626853,11099.011104,8477.335343,6858.799103,0.593839,0.471843,0.694014,0.727493,0.691617,0.453604,0.550197,0.462107,0.381475,0.565182,0.498729,0.438762,0.737699,0.449684,0.155762,0.124082,0.097187,0.115975,0.179304,0.154415,0.125437,0.142775,0.14067,0.087905,0.046462,0.024397,0.059043,0.400104,0.550316,0.457171,0.270337,0.19783,0.14713,50443.632947,21104.523972,11325.35331,16255.580366,6825.797905,11485.34636,12469.853351,12025.300225,9968.705194,12720.643933,12378.749071,11055.253405,12254.671664,11547.165363,11972.071052,11930.743411,3466.137148,1587.941166,2162.555967,2025.279658,1096.82359,783.286303,1540.181498,2213.390063,2867.485956,1028.674683,2782.56404,1330.736103,3176.124147,771.152017,168.705424,3664.573197,25213.216343,17925.435969,5781.862565,3263.280899,3019.21521,1362.447069,1847.285517,3019.21521,2833.81577,3019.21521,0.7688,0.722888,25.846444,0.414783,0.636853,0.161643,0.501271,0.014872,0.449684,39440.00824,28912.429126,21104.523972,75.971861,12.535807,3.02536,13.037589,14.388347,7.920423,88.896543,57992.621585,10.742944,3.835178,10.899752,11367.727872,16344.567875,169.628964,1.815898,0.352605,0.64425,2925.16445,1.354252,680.179281,1486.300531,0.718455,0.693193,0.463474,0.555272,1298.507031,447.711206,54.583208,380.435859,2.466468,3.178607,0.730958,0.685279,0.467003,0.517901,2.055409,1.035557,17189.837703,13769.241614,12338.627231,12947.160622,13358.454112,13505.871473,11579.242613,10311.824423,9341.637806,9267.105354,9177.20143,9241.785266,0.570178,0.526082,3788.561526,1886.294884,452.09595,2.306034,0.565577,0.529327,901.83687,26105.91,597540800.0
std,7640544.0,2739965.0,14847.499904,0.900211,0.088726,0.410619,8.75141,1.070275,1.362394,0.835281,16.769898,2.179201,9.614376,5.851418,17.979595,11.066478,5.808817,6.424307,0.12477,0.125382,0.075246,0.0742,0.158014,0.260007,0.066403,0.097692,0.074153,21.578581,0.217596,0.213015,65.9955,59.956409,70.706483,72.226097,82.233472,81.296986,61.946404,70.163575,80.596669,3.971297,3.725738,4.494545,4.438807,3.681928,3.615055,1.195528,0.921908,3.801546,4.376404,3.577571,1.034064,125.516704,125.000305,0.090263,5657.459316,0.283737,0.217884,0.227826,0.079448,0.071663,0.031879,0.038606,0.06313,0.072023,0.255692,0.216957,5289.529286,8034.427512,4445.243251,4441.244657,4638.79014,4953.010675,5513.770411,7335.639646,7468.678637,7452.874567,7266.69814,9000.447445,4483.830171,7361.061127,4627.898333,7501.934667,5407.004051,8284.018676,655.80164,264.21544,298.260338,117.326822,102.589175,95.948682,152.780283,153.150652,33.249969,34.010776,35.9908,81.71666,15831.620491,6873.577043,13333.765877,12621.628174,8127.867242,12995.482144,14025.056252,2534.714614,0.290545,0.217235,0.272367,0.169951,0.18127,0.305215,0.25166,0.279112,0.236839,0.190112,0.246947,0.169211,0.114108,0.127526,0.037808,0.041991,0.056561,0.113601,0.040513,0.037185,0.05717,0.103365,0.043435,0.041079,0.032528,0.022505,0.04504,0.095498,0.127526,0.161834,0.173939,0.166133,0.151109,23946.854637,8407.579719,5267.400384,8111.9544,2723.206374,5223.303729,5699.638575,5736.113804,5373.693526,5675.505407,5721.244558,5016.769062,5454.178943,5316.241077,5368.098275,5381.810006,8371.533331,3572.988937,5535.828189,5366.624669,2436.345845,1776.241622,3116.178437,7106.841599,7044.598975,2234.121372,6434.466135,2823.373772,7465.20147,1632.899529,84.188363,10801.986423,11207.609234,8355.168694,2587.657499,1259.016675,6549.330822,2589.826452,5393.326775,6549.330822,5720.32681,6549.330822,0.226925,0.172757,3.977495,0.235184,0.186048,0.100722,0.246947,0.022536,0.127526,23501.428097,19593.230647,8407.579719,16.001689,12.779219,4.101095,19.054551,4.165254,2.925431,10.449878,13096.119296,7.071622,1.2432,0.251125,5261.221354,8102.483101,84.090067,0.834446,0.242507,0.244392,6115.386037,0.478327,1260.876649,3102.072006,0.163226,0.159387,0.253207,0.221719,2285.935515,924.771122,206.174696,846.201554,0.845854,0.984043,0.139367,0.15213,0.169448,0.189837,0.836425,0.339294,8662.22446,9743.432766,9639.341214,11254.483046,11487.770831,11630.885604,4954.846521,5202.005336,5050.927486,5394.351573,5285.5678,5494.356963,0.239364,0.320575,8322.875304,4045.939627,925.426065,0.720068,0.2232,0.307368,1829.955708,91908.28,2458995000.0
min,100654.0,100200.0,1002.0,1.0,0.0,0.0,1.0,0.0,0.0,1.0,1.0,0.0,-3.0,-14.322636,-170.742774,-2.0,-2.0,-2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,22.0,0.0,0.0,244.0,330.0,283.0,400.0,200.0,360.0,300.0,370.0,280.0,6.0,11.0,6.0,11.0,6.0,11.0,2.0,6.0,9.0,9.0,9.0,4.0,785.0,785.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-1973.0,-1338.0,-3088.0,-2563.0,805.0,-2558.0,650.0,-3260.0,-3395.0,451.0,3800.0,5923.0,-3001.0,-3335.0,-1765.0,-610.0,-2558.0,3800.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3990.0,1480.0,480.0,480.0,299.0,0.0,0.0,0.0,0.0,0.0,0.0009,0.0,0.0,0.0,0.0,0.0,0.0004,0.086801,0.01088,0.078014,0.297619,0.08867,0.037422,0.010695,0.004942,0.001318,0.058333,0.033937,0.010915,0.005962,0.01728,0.013691,0.004608,0.002206,0.002952,0.085406,0.042735,0.026539,0.021449,0.005071,0.002056,2160.666667,0.0,1834.0,2020.0,1388.0,1700.0,2600.0,2750.0,1960.0,2013.0,2443.0,2996.0,1933.0,1981.0,2400.0,2312.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,10.0,12.0,10.0,20.964183,10.0,3381.0,2147.0,928.0,450.0,10.0,10.0,10.0,10.0,11.0,10.0,0.009852,0.114961,17.427711,0.0,0.016129,0.002738,0.028061,0.001021,0.08867,321.385321,0.0,0.0,5.34,0.02,0.06,0.41,3.0,0.6,28.92,15429.01,3.01,1.85,9.64,1834.0,2020.0,20.964183,1.0,0.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,0.0946,0.0363,0.0286,0.0124,1.0,1.0,404.0,525.0,395.0,50.0,263.0,530.0,404.0,525.0,395.0,50.0,263.0,530.0,0.0,0.0,1.0,1.0,0.0,2.0,0.0,0.0,0.0,10.0,28087.0
25%,174031.5,311950.0,3109.25,1.0,0.0,1.0,1.0,1.0,1.0,1.0,13.0,3.0,12.0,33.971442,-97.408884,-2.0,-2.0,-2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,30.0,0.552575,0.5627,470.0,570.0,470.0,560.0,410.0,520.0,525.0,515.0,464.75,18.0,23.0,17.0,23.0,17.0,23.0,6.0,8.0,21.0,20.0,20.0,7.0,1058.0,1062.0,0.0,105.0,0.2524,0.0356,0.0363,0.0024,0.0,0.0,0.0,0.0,0.0,0.0,1.0,6127.5,13797.0,5148.0,5722.0,7761.0,10110.5,11239.5,12607.0,13844.25,15902.0,18862.25,20328.0,5317.5,12777.75,6615.75,14599.5,10301.0,19263.0,101.25,17.0,49.0,16.0,11.0,2.0,0.0,11.0,1.0,0.0,0.0,0.0,14055.5,15578.5,5252.0,8869.0,12166.0,4836.75,3807.25,5200.75,0.3427,0.3098,0.5,0.64725,0.5779,0.25,0.389525,0.2277,0.194875,0.424324,0.30465,0.306452,0.675687,0.368254,0.129999,0.093008,0.049125,0.031532,0.151163,0.132075,0.083746,0.064598,0.109821,0.058363,0.025758,0.010313,0.030246,0.347926,0.462145,0.345374,0.147036,0.082687,0.048885,32317.854839,15661.141553,7234.0,9500.0,4750.0,7600.0,7667.0,6485.0,5500.0,8731.5,7917.0,6411.75,7917.0,7026.0,7735.0,7394.5,194.0,140.0,98.0,129.0,107.0,54.0,100.0,101.0,228.0,69.0,247.0,94.0,268.0,58.0,98.593929,212.0,15720.0,10139.25,4067.875,2400.0,212.0,97.0,104.0,212.0,287.0,212.0,0.721934,0.608696,22.982419,0.22,0.548387,0.092642,0.3,0.006358,0.368254,23187.831075,16563.75,15661.141553,67.592497,3.9825,0.87,2.6325,11.3725,5.84,85.232502,49478.5,6.89,3.07,10.78,7304.5,9500.0,98.593929,1.0,0.1398,0.5276,163.0,1.0,29.0,106.0,0.6358,0.5909,0.3121,0.404575,49.0,44.0,1.0,24.0,2.0,2.0,0.653125,0.5884,0.35,0.391975,1.0,1.0,13182.0,7722.75,5650.0,5444.75,5271.5,5153.0,9210.0,6995.0,5100.0,4801.0,4627.0,4439.25,0.4,0.25,176.0,143.0,30.0,2.0,0.4045,0.2817,66.0,945.5,9599686.0
50%,228209.5,1019812.0,10198.0,2.0,0.0,1.0,1.0,2.0,2.0,2.0,29.0,5.0,21.0,38.832183,-86.267098,9.0,2.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,54.0,0.7027,0.7003,510.0,610.0,500.0,598.0,441.5,557.5,556.0,549.5,500.0,20.0,26.0,19.0,25.0,18.0,25.0,6.0,8.0,23.0,23.0,22.0,7.0,1123.0,1130.0,0.0,438.0,0.5321,0.0959,0.091,0.0144,0.0023,0.0003,0.025,0.0,0.0133,0.1256,1.0,8937.5,18669.0,7503.0,8046.0,10533.0,12969.0,14122.5,16672.0,17813.5,19953.0,22656.0,24898.5,7754.0,16871.0,9142.5,18669.5,13173.0,23542.0,270.0,46.0,130.5,49.0,37.0,17.0,9.0,28.0,5.0,3.0,1.0,0.0,22581.0,19589.0,11207.0,15275.0,15300.0,9231.5,6056.0,6574.0,0.5696,0.45295,0.7319,0.74825,0.69315,0.4545,0.5,0.5149,0.3581,0.595004,0.520447,0.434783,0.749164,0.471415,0.156748,0.126214,0.088442,0.072868,0.179245,0.15774,0.124297,0.110858,0.139888,0.081325,0.037234,0.015834,0.049222,0.414674,0.528585,0.428058,0.207067,0.132666,0.086785,46257.574359,20183.45414,9500.0,13700.0,6069.5,9500.0,11996.0,11645.0,8388.5,10926.5,10500.0,10270.0,11000.0,10500.0,10506.0,11000.0,766.0,423.0,423.0,373.5,303.5,198.0,509.0,324.0,647.5,250.0,674.0,362.0,761.0,198.0,142.182823,807.5,25000.0,16007.5,5500.0,3167.0,799.0,507.0,327.5,799.0,881.5,799.0,0.863212,0.76189,25.593387,0.42,0.623674,0.147102,0.479553,0.00951,0.471415,32228.572691,22593.25,20183.45414,79.540001,7.905,1.74,5.68,14.09,7.38,92.739998,57722.875,8.85,3.53,10.92,9500.0,13894.0,144.196215,2.0,0.3706,0.6276,602.0,1.0,187.0,424.0,0.7436,0.6982,0.4587,0.50605,481.0,95.0,11.0,61.0,2.0,4.0,0.74855,0.6901,0.4514,0.47355,2.0,1.0,16500.0,12150.0,10177.0,9987.5,10470.0,10635.0,11304.0,10112.0,9100.0,8735.0,8716.0,9014.0,0.5678,0.5949,716.5,573.5,137.0,2.0,0.5635,0.6049,272.0,4779.0,65992650.0
75%,452758.5,3034350.0,30273.75,3.0,0.0,1.0,2.0,3.0,4.0,3.0,42.0,6.0,22.0,41.33294,-78.788784,20.0,10.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,71.0,0.844125,0.8442,550.0,650.0,540.0,640.0,500.0,610.0,600.0,590.0,555.0,22.0,28.0,22.0,29.0,21.0,27.0,7.0,9.0,25.0,26.0,24.0,9.0,1199.0,1211.0,0.0,2117.0,0.7231,0.239,0.2353,0.0373,0.0067,0.0026,0.0418,0.0173,0.0392,0.4027,1.0,13483.75,23755.5,10747.0,11584.5,14125.0,17333.5,18627.5,21434.0,22443.0,24469.0,26948.75,30657.0,11052.0,21632.0,12875.75,23261.75,17759.5,28892.25,690.0,169.0,301.0,124.0,103.0,65.0,52.0,64.0,24.0,20.0,13.0,12.0,35765.5,24066.5,20550.0,26079.0,17700.0,14052.0,9449.25,8198.5,0.88215,0.628675,0.9787,0.833525,0.8182,0.6636,0.75,0.68025,0.5455,0.714222,0.7,0.559322,0.81987,0.537855,0.179588,0.153348,0.142857,0.168589,0.203083,0.178571,0.168596,0.207681,0.171159,0.111801,0.059372,0.02999,0.071942,0.4635,0.631746,0.55665,0.35292,0.260316,0.18476,64652.046245,25363.174251,14800.0,23250.0,8750.0,14888.25,16687.0,16154.0,13473.25,16624.25,16651.0,14192.25,16248.0,15000.0,15579.0,15500.0,2448.0,1310.0,1513.0,1420.0,919.0,687.0,1532.25,1125.0,2082.5,849.0,2100.5,1218.0,2406.0,656.5,241.295667,2518.0,33863.0,26250.0,6744.0,4000.0,2596.5,1498.25,1172.5,2596.5,2509.25,2596.5,0.910887,0.861921,28.283893,0.59,0.758221,0.216281,0.69535,0.014947,0.537855,49591.912657,35266.0,25363.174251,88.400002,16.5475,3.45,14.9275,17.1,9.46,96.239998,66273.98,12.13,4.21,11.06,14941.0,23250.0,241.295667,3.0,0.4706,0.8571,2635.75,2.0,830.0,1416.0,0.8235,0.807,0.6213,0.731425,1313.75,405.0,40.0,347.0,2.0,4.0,0.824675,0.7955,0.57225,0.646825,3.0,1.0,19812.0,16774.75,15740.0,16315.0,16414.0,16987.5,13793.0,12954.0,12458.0,12861.25,13000.0,13242.75,0.75,0.793025,3319.0,1940.25,472.0,2.0,0.7353,0.784,937.25,17023.0,291954400.0
max,49146400.0,82098880.0,42788.0,3.0,1.0,1.0,74.0,4.0,4.0,3.0,78.0,9.0,43.0,71.324702,171.378129,33.0,15.0,18.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,108.0,1.0,1.0,740.0,780.0,790.0,800.0,730.0,800.0,760.0,795.0,765.0,35.0,36.0,35.0,36.0,35.0,36.0,11.0,12.0,36.0,36.0,36.0,12.0,1566.0,1566.0,1.0,88921.0,1.0,1.0,1.0,1.0,1.0,0.9973,0.6316,1.0,1.0,1.0,1.0,44661.0,111408.0,41496.0,32114.0,31339.0,32589.0,47826.0,109313.0,109704.0,113261.0,114298.0,113314.0,41496.0,109425.0,31883.0,111737.0,47826.0,113642.0,6383.0,6610.0,4749.0,1172.0,650.0,838.0,1279.0,6259.0,637.0,391.0,400.0,981.0,96375.0,116377.0,74514.0,74514.0,117450.0,455440.0,542922.0,20484.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.976879,0.971939,0.932238,0.977273,0.957265,0.434783,0.31891,0.37931,0.606421,0.40625,0.294737,0.5,0.559146,0.344,0.309735,0.315789,0.157534,0.434783,0.773364,0.91133,0.950134,0.921935,0.896705,0.853963,152068.92308,67438.15,39375.0,45881.0,24208.0,38625.0,35375.0,36000.0,31314.0,43737.0,35629.0,40000.0,35000.0,38750.0,32800.0,35882.0,93095.0,41062.0,52033.0,60282.0,25535.0,16039.0,28633.0,85050.0,80219.0,23270.0,67104.0,25991.0,81286.0,12621.0,476.167162,151086.0,57500.0,53250.0,22000.0,14617.0,61975.0,22902.0,56938.0,61975.0,50030.0,61975.0,0.985612,0.99674,51.6,1.0,0.979567,0.815385,0.98912,0.346939,0.957265,174263.25,179864.0,67438.15,98.980003,85.82,51.720001,99.349998,30.700001,24.360001,100.0,100870.75,55.279999,15.36,11.49,39375.0,45222.0,469.327857,3.0,1.0,1.0,80898.0,2.0,14425.0,42336.0,1.0,1.0,1.0,1.0,19054.0,12877.0,4987.0,12615.0,4.0,4.0,0.994,1.0,0.9565,1.0,3.0,7.0,118250.0,118250.0,119200.0,99995.0,74995.0,86339.0,91125.0,77805.0,46968.0,60000.0,29179.0,37358.0,1.0,1.0,162762.0,68457.0,25695.0,4.0,1.0,1.0,49860.0,1429109.0,37427770000.0


In [143]:
# Change options to display all rows
pd.options.display.max_rows = None

In [144]:
# Show all column names
df.dtypes

UNITID                        int64
OPEID                         int64
OPEID6                        int64
NAME                         object
CITY                         object
STATE                        object
ZIP                          object
ACCREDAGENCY                 object
SCH_DEG                     float64
HCM2                          int64
MAIN                          int64
NUMBRANCH                     int64
PREDDEG                       int64
HIGHDEG                       int64
CONTROL                       int64
ST_FIPS                       int64
REGION                        int64
LOCALE                      float64
LATITUDE                    float64
LONGITUDE                   float64
CCBASIC                     float64
CCUGPROF                    float64
CCSIZSET                    float64
HBCU                        float64
PBI                         float64
ANNHI                       float64
TRIBAL                      float64
AANAPII                     

In [145]:
# Reset display max rows option
pd.reset_option('display.max_rows')

In [146]:
# Get value counts of UNITID
df['UNITID'].value_counts(dropna = False)

149505      1
490258      1
21429002    1
240392      1
203526      1
           ..
423412      1
230898      1
431600      1
158787      1
42799102    1
Name: UNITID, Length: 6806, dtype: int64

In [147]:
# Get value counts of NAME
df['NAME'].value_counts(dropna = False)

Stevens-Henager College                                7
Columbia College                                       5
Brittany Beauty Academy                                4
Unitek College                                         4
Southwestern College                                   3
                                                      ..
Henderson Community College                            1
Tennessee College of Applied Technology-McMinnville    1
Troy University-Support Sites                          1
Washington County Community College                    1
Ave Maria University                                   1
Name: NAME, Length: 6678, dtype: int64

In [148]:
# Get value counts of CITY
df['CITY'].value_counts(dropna = False)

New York       83
Chicago        69
Houston        66
Los Angeles    52
Miami          48
               ..
Torrington      1
Center City     1
Westport        1
Paso Robles     1
Ellensburg      1
Name: CITY, Length: 2456, dtype: int64

In [149]:
# Get value counts of STATE
df['STATE'].value_counts(dropna = False)

CA    702
NY    450
TX    434
FL    387
PA    359
OH    298
IL    263
MI    191
NC    183
GA    177
NJ    167
VA    167
MO    164
MA    163
TN    159
PR    142
IN    137
LA    126
AZ    117
MN    117
OK    110
CO    109
WA    108
WI    100
SC     99
KY     94
AR     92
AL     87
MD     87
IA     86
KS     81
CT     80
OR     79
WV     74
UT     72
MS     60
NM     49
NE     46
ME     40
NV     39
ID     38
NH     38
MT     33
SD     29
ND     28
VT     25
RI     24
DC     23
HI     23
DE     21
WY     10
AK      9
GU      3
VI      2
MH      1
FM      1
AS      1
PW      1
MP      1
Name: STATE, dtype: int64

In [150]:
# Get value counts of ZIP
df['ZIP'].value_counts(dropna = False)

00961         8
33144         6
23462         6
92626         5
78229         5
             ..
46962         1
36756-3207    1
735013025     1
94551-7650    1
30582         1
Name: ZIP, Length: 6043, dtype: int64

In [151]:
# Get value counts of ACCREDAGENCY
df['ACCREDAGENCY'].value_counts(dropna = False)

Higher Learning Commission                                                                                                                            1186
National Accrediting Commission of Career Arts and Sciences                                                                                            964
Southern Association of Colleges and Schools Commission on Colleges                                                                                    875
Middle States Commission on Higher Education                                                                                                           679
Accrediting Commission of Career Schools and Colleges                                                                                                  548
Council on Occupational Education                                                                                                                      522
nan                                                                   

In [152]:
# Get value counts of SCH_DEG
df['SCH_DEG'].value_counts(dropna = False)

1.0    2857
3.0    2454
2.0    1213
NaN     282
Name: SCH_DEG, dtype: int64

In [153]:
# Get value counts of HCM2
df['HCM2'].value_counts(dropna = False)

0    6752
1      54
Name: HCM2, dtype: int64

In [154]:
# Get value counts of MAIN
df['MAIN'].value_counts(dropna = False)

1    5345
0    1461
Name: MAIN, dtype: int64

In [155]:
# Get value counts of NUMBRANCH
df['NUMBRANCH'].value_counts(dropna = False)

1     4846
2      616
3      243
4      163
7       91
6       90
5       81
74      76
14      57
10      50
12      48
8       48
15      46
11      44
13      40
19      38
9       36
17      34
33      33
24      24
23      24
22      22
21      21
18      19
16      16
Name: NUMBRANCH, dtype: int64

In [156]:
# Get value counts of PREDDEG
df['PREDDEG'].value_counts(dropna = False)

1    2829
3    2058
2    1145
0     477
4     297
Name: PREDDEG, dtype: int64

In [157]:
# Get value counts of HIGHDEG
df['HIGHDEG'].value_counts(dropna = False)

1    2192
4    2004
2    1379
3     721
0     510
Name: HIGHDEG, dtype: int64

In [158]:
# Get value counts of CONTROL
df['CONTROL'].value_counts(dropna = False)

3    2698
1    2102
2    2006
Name: CONTROL, dtype: int64

In [159]:
# Get value counts of REGION
df['REGION'].value_counts(dropna = False)

5    1705
2    1104
3     988
8     959
6     710
4     551
1     369
7     261
9     152
0       7
Name: REGION, dtype: int64

In [160]:
# Get value counts of LOCALE
df['LOCALE'].value_counts(dropna = False)

 21.0    1567
 11.0    1479
 13.0     835
 12.0     727
 NaN      475
 32.0     433
 41.0     346
 33.0     323
 22.0     188
 23.0     129
 31.0     124
 42.0     117
 43.0      60
-3.0        3
Name: LOCALE, dtype: int64

In [161]:
# Get value counts of CCBASIC
df['CCBASIC'].value_counts(dropna = False)

-2.0     2275
 NaN      475
 18.0     349
 22.0     310
 24.0     297
 26.0     251
 21.0     238
 10.0     223
 19.0     193
 17.0     146
 16.0     135
 23.0     135
 20.0     131
 15.0     131
 4.0      123
 1.0      122
 2.0      118
 7.0      118
 6.0      110
 14.0     106
 5.0      106
 30.0      93
 8.0       91
 9.0       85
 3.0       82
 29.0      66
 11.0      57
 25.0      56
 13.0      38
 32.0      35
 33.0      34
 31.0      32
 12.0      26
 28.0      12
 27.0       7
Name: CCBASIC, dtype: int64

In [162]:
# Get value counts of CCUGPROF
df['CCUGPROF'].value_counts(dropna = False)

-2.0     2275
 1.0      542
 NaN      475
 11.0     432
 5.0      400
 13.0     332
 2.0      329
 0.0      305
 14.0     294
 4.0      289
 7.0      248
 10.0     217
 12.0     211
 3.0      152
 9.0      136
 15.0     133
 6.0       32
 8.0        4
Name: CCUGPROF, dtype: int64

In [163]:
# Get value counts of CCSIZSET
df['CCSIZSET'].value_counts(dropna = False)

-2.0     2275
 6.0      541
 NaN      475
 2.0      424
 1.0      383
 11.0     376
 3.0      302
 18.0     278
 8.0      272
 12.0     197
 9.0      179
 13.0     174
 14.0     166
 10.0     159
 4.0      144
 15.0     133
 16.0     128
 7.0       93
 5.0       64
 17.0      43
Name: CCSIZSET, dtype: int64

In [164]:
# Get value counts of HBCU
df['HBCU'].value_counts(dropna = False)

0.0    6223
NaN     483
1.0     100
Name: HBCU, dtype: int64

In [165]:
# Get value counts of PBI
df['PBI'].value_counts(dropna = False)

0.0    6222
NaN     483
1.0     101
Name: PBI, dtype: int64

In [166]:
# Get value counts of MENONLY
df['MENONLY'].value_counts(dropna = False)

0.0    6270
NaN     475
1.0      61
Name: MENONLY, dtype: int64

In [167]:
# Get value counts of WOMENONLY
df['WOMENONLY'].value_counts(dropna = False)

0.0    6296
NaN     475
1.0      35
Name: WOMENONLY, dtype: int64

In [168]:
# Get value counts of RELAFFIL
df['RELAFFIL'].value_counts(dropna = False)

NaN      5895
30.0      246
71.0       92
54.0       64
66.0       55
         ... 
107.0       1
22.0        1
92.0        1
45.0        1
100.0       1
Name: RELAFFIL, Length: 63, dtype: int64

In [170]:
# Get value counts of DISTANCEONLY
df['DISTANCEONLY'].value_counts(dropna = False)

0.0    6279
NaN     475
1.0      52
Name: DISTANCEONLY, dtype: int64

In [171]:
# Get value counts of CURROPER
df['CURROPER'].value_counts(dropna = False)

1    6469
0     337
Name: CURROPER, dtype: int64

In [172]:
# Get value counts of TUITFTE
df['TUITFTE'].value_counts(dropna = False)

NaN         502
0.0          14
1606.0        4
3478.0        4
5195.0        4
           ... 
1052.0        1
170220.0      1
4253.0        1
18575.0       1
8077.0        1
Name: TUITFTE, Length: 5482, dtype: int64

In [173]:
# Get value counts of ADM_RATE
df['ADM_RATE'].value_counts(dropna = False)

NaN       4800
1.0000      87
0.5000      15
0.6667      10
0.3333      10
          ... 
0.9400       1
0.9163       1
0.3437       1
0.8807       1
0.7970       1
Name: ADM_RATE, Length: 1596, dtype: int64

In [174]:
# Get value counts of SAT_AVG
df['SAT_AVG'].value_counts(dropna = False)

NaN       5508
1120.0      20
1105.0      14
1133.0      12
1129.0      11
          ... 
1415.0       1
1407.0       1
993.0        1
1151.0       1
1456.0       1
Name: SAT_AVG, Length: 450, dtype: int64

In [175]:
# Get value counts of PCTPELL
df['PCTPELL'].value_counts(dropna = False)

NaN       792
0.0000     66
1.0000     35
0.5000     28
0.6667     19
         ... 
0.1878      1
0.4212      1
0.3459      1
0.1389      1
0.7565      1
Name: PCTPELL, Length: 3935, dtype: int64

In [176]:
# Get value counts of DEBT_MDN
df['DEBT_MDN'].value_counts(dropna = False)

NaN        1066
9500.0      559
5500.0      296
6333.0      164
12000.0     149
           ... 
6074.0        1
6925.0        1
5454.0        1
7497.0        1
12039.0       1
Name: DEBT_MDN, Length: 1849, dtype: int64

In [177]:
# Get value counts of NPT4_PUB
df['NPT4_PUB'].value_counts(dropna = False)

NaN        4928
5906.0        3
8262.0        2
12001.0       2
9593.0        2
           ... 
9880.0        1
15620.0       1
4883.0        1
2999.0        1
7692.0        1
Name: NPT4_PUB, Length: 1776, dtype: int64

In [178]:
# Get value counts of NPT4_PRIV
df['NPT4_PRIV'].value_counts(dropna = False)

NaN        3079
28568.0       3
10797.0       3
24345.0       3
9600.0        3
           ... 
18722.0       1
31109.0       1
10856.0       1
7977.0        1
16405.0       1
Name: NPT4_PRIV, Length: 3477, dtype: int64

In [180]:
# Get value counts of NUM4_PUB
df['NUM4_PUB'].value_counts(dropna = False)

NaN       4928
1.0         17
5.0         14
9.0         14
8.0         14
          ... 
338.0        1
1451.0       1
384.0        1
576.0        1
1202.0       1
Name: NUM4_PUB, Length: 943, dtype: int64

In [181]:
# Get value counts of NUM4_PRIV
df['NUM4_PRIV'].value_counts(dropna = False)

NaN       3078
1.0         90
5.0         80
3.0         80
8.0         62
          ... 
499.0        1
933.0        1
549.0        1
813.0        1
1014.0       1
Name: NUM4_PRIV, Length: 630, dtype: int64

In [182]:
# Get value counts of COSTT4_A
df['COSTT4_A'].value_counts(dropna = False)

NaN        3375
27879.0       9
29195.0       4
26535.0       4
19100.0       3
           ... 
17824.0       1
17099.0       1
12691.0       1
16030.0       1
20652.0       1
Name: COSTT4_A, Length: 3248, dtype: int64

In [184]:
# Get value counts of INEXPFTE
df['INEXPFTE'].value_counts(dropna = False)

NaN        502
0.0          7
2840.0       5
5401.0       5
4693.0       5
          ... 
3483.0       1
4803.0       1
4764.0       1
11495.0      1
6893.0       1
Name: INEXPFTE, Length: 5092, dtype: int64

# 05. Export data

In [183]:
# Export data set
df.to_pickle(os.path.join(path, '02 Data', 'Prepared Data', 'scorecard_data_cleaned.pkl'))