In [2]:
import numpy as np
import pandas as pd

In [3]:
# read in census api
import census

In [4]:
# Set display options
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.options.display.float_format = '{:.2f}'.format  # Avoid scientific notation

# Set API Key
api_key = "64cf38e923af4727b9aafdd762ffa44d37aed7f5"
c = census.Census(api_key)

In [5]:
# Chicago-specific settings
city_name = 'Chicago'
state = '17'
FIPS = ['031', '043', '089', '093', '097', '111', '197']
sql_query = 'state:{} county:*'.format(state)

# Function to filter FIPS codes
def filter_FIPS(df):
    return df[df['county'].isin(FIPS)]


In [6]:
# Variables to fetch from ACS 2023
variables_2023 = ['B01003_001E', # total population
                    'B02001_002E', # white population
                    'B11001_001E', # total households
                    'B19013_001E', # median household income in 2023 inflation adjusted dollars
                    'B25077_001E', # median home value in 2023
                    'B25064_001E', # median gross rent in 2023
                    'B25003_002E', # owner occupied housing units
                    'B25003_003E', # renter occupied housing units
                    'B15003_022E', # total number of people with bachelor's degree over age 25
                    'B15003_023E', # total number of people with master's degree over age 25
                    'B15003_024E', # total number of people with professional degree over age 25
                    'B15003_025E', # total number of people with doctorate degree over age 25
                    'B25034_001E', # total number of housing units
                    'B25034_010E', # units built 1940-1949
                    'B25034_011E', # units built 11939 or earlier
                    'B07010_025E', # total number of people who move within the same county with income
                    'B07010_026E', # Total number of people who moved within same county with income $1 to $9,999 or loss
                    'B07010_027E', # Total number of people who moved within same county with income $10,000 to $14,999
                    'B07010_028E', # Total number of people who moved within same county with income $15,000 to $24,999
                    'B07010_029E', # Total number of people who moved within same county with income $25,000 to $34,999
                    'B07010_030E', # Total number of people who moved within same county with income $35,000 to $49,999
                    'B07010_031E', # Total number of people who moved within same county with income $50,000 to $64,999
                    'B07010_032E', # Total number of people who moved within same county with income $65,000 to $74,999
                    'B07010_033E', # Total number of people who moved within same county with income $75,000 more 
                    'B07010_036E', # Total number of people who moved from different county with income
                    'B07010_037E', # Total number of people who moved from different county with income $1 to $9,999 or loss
                    'B07010_038E', # Total number of people who moved from different county with income $10,000 to $14,999
                    'B07010_039E', # Total number of people who moved from different county with income $15,000 to $24,999
                    'B07010_040E', # Total number of people who moved from different county with income $25,000 to $34,999
                    'B07010_041E', # Total number of people who moved from different county with income $35,000 to $49,999
                    'B07010_042E', # Total number of people who moved from different county with income $50,000 to $64,999
                    'B07010_043E', # Total number of people who moved from different county with income $65,000 to $74,999
                    'B07010_044E', # Total number of people who moved from different county with income $76,000 or more
                    'B07010_047E', # Total number of people who moved from different state with income
                    'B07010_048E', # Total number of people who moved from different state with income $1 to $9,999 or loss
                    'B07010_049E', # Total number of people who moved from different state with income $10,000 to $14,999
                    'B07010_050E', # Total number of people who moved from different state with income $15,000 to $24,999
                    'B07010_051E', # Total number of people who moved from different state with income $25,000 to $34,999
                    'B07010_052E', # Total number of people who moved from different state with income $35,000 to $49,999
                    'B07010_053E', # Total number of people who moved from different state with income $50,000 to $64,999
                    'B07010_054E', # Total number of people who moved from different state with income $65,000 to $74,999
                    'B07010_055E', # Total number of people who moved from different state with income $76,000 or more
                    'B07010_058E', # Total number of people who moved from abroad with income
                    'B07010_059E', # Total number of people who moved from abroad with income $1 to $9,999 or loss
                    'B07010_060E', # Total number of people who moved from abroad with income $10,000 to $14,999
                    'B07010_061E', # Total number of people who moved from abroad with income $15,000 to $24,999
                    'B07010_062E', # Total number of people who moved from abroad with income $25,000 to $34,999
                    'B07010_063E', # Total number of people who moved from abroad with income $35,000 to $49,999
                    'B07010_064E', # Total number of people who moved from abroad with income $50,000 to $64,999
                    'B07010_065E', # Total number of people who moved from abroad with income $65,000 to $74,999
                    'B07010_066E', # Total number of people who moved from abroad with income $76,000 or more
                    'B06011_001E', # Median income in the past 12 months (in 2023 inflation-adjusted dollars) for the population 15 years and over 
                    ]

In [7]:
# Income categories
income_vars = ['B19001_' + str(i).zfill(3) + 'E' for i in range(1, 18)]
variables_2023.extend(income_vars)

# Run API query
var_dict_acs5 = c.acs5.get(variables_2023, geo={'for': 'tract:*', 'in': sql_query}, year=2023)


In [8]:
# Convert to DataFrame and filter by FIPS
df_2023 = pd.DataFrame.from_dict(var_dict_acs5)
df_2023['FIPS'] = df_2023['state'] + df_2023['county'] + df_2023['tract']
df_2023 = filter_FIPS(df_2023)
df_2023.head(10)

Unnamed: 0,B01003_001E,B02001_002E,B11001_001E,B19013_001E,B25077_001E,B25064_001E,B25003_002E,B25003_003E,B15003_022E,B15003_023E,B15003_024E,B15003_025E,B25034_001E,B25034_010E,B25034_011E,B07010_025E,B07010_026E,B07010_027E,B07010_028E,B07010_029E,B07010_030E,B07010_031E,B07010_032E,B07010_033E,B07010_036E,B07010_037E,B07010_038E,B07010_039E,B07010_040E,B07010_041E,B07010_042E,B07010_043E,B07010_044E,B07010_047E,B07010_048E,B07010_049E,B07010_050E,B07010_051E,B07010_052E,B07010_053E,B07010_054E,B07010_055E,B07010_058E,B07010_059E,B07010_060E,B07010_061E,B07010_062E,B07010_063E,B07010_064E,GEO_ID,state,county,tract,B07010_065E,B07010_066E,B06011_001E,B19001_001E,B19001_002E,B19001_003E,B19001_004E,B19001_005E,B19001_006E,B19001_007E,B19001_008E,B19001_009E,B19001_010E,B19001_011E,B19001_012E,B19001_013E,B19001_014E,B19001_015E,B19001_016E,B19001_017E,FIPS
150,3726.0,1475.0,2190.0,69460.0,296600.0,1252.0,689.0,1501.0,775.0,385.0,54.0,132.0,2841.0,289.0,1760.0,196.0,80.0,24.0,53.0,0.0,23.0,0.0,0.0,16.0,15.0,5.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,41.0,0.0,0.0,0.0,0.0,0.0,21.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010100,17,31,10100,0.0,0.0,37386.0,2190.0,125.0,109.0,41.0,148.0,118.0,191.0,51.0,45.0,96.0,102.0,299.0,418.0,82.0,118.0,124.0,123.0,17031010100
151,7588.0,1883.0,3038.0,49639.0,239100.0,1333.0,823.0,2215.0,684.0,647.0,135.0,106.0,3276.0,196.0,1586.0,564.0,84.0,176.0,37.0,33.0,80.0,0.0,51.0,103.0,8.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,198.0,0.0,9.0,16.0,109.0,43.0,0.0,0.0,21.0,25.0,0.0,0.0,0.0,25.0,0.0,0.0,1400000US17031010201,17,31,10201,0.0,0.0,39311.0,3038.0,223.0,61.0,153.0,0.0,92.0,172.0,355.0,243.0,233.0,49.0,192.0,576.0,220.0,201.0,161.0,107.0,17031010201
152,2609.0,987.0,1130.0,55119.0,231900.0,1292.0,270.0,860.0,656.0,232.0,52.0,42.0,1303.0,76.0,512.0,209.0,41.0,1.0,33.0,24.0,25.0,26.0,25.0,34.0,56.0,35.0,0.0,0.0,10.0,11.0,0.0,0.0,0.0,129.0,28.0,0.0,7.0,0.0,32.0,0.0,24.0,38.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010202,17,31,10202,0.0,0.0,34938.0,1130.0,100.0,79.0,12.0,12.0,40.0,52.0,20.0,94.0,103.0,104.0,36.0,236.0,99.0,31.0,66.0,46.0,17031010202
153,6311.0,3558.0,3185.0,65871.0,305000.0,1257.0,859.0,2326.0,1585.0,644.0,121.0,149.0,3377.0,292.0,1655.0,1072.0,191.0,187.0,133.0,105.0,99.0,121.0,93.0,143.0,65.0,10.0,5.0,0.0,0.0,3.0,30.0,0.0,17.0,166.0,0.0,25.0,89.0,23.0,0.0,0.0,29.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010300,17,31,10300,0.0,0.0,38532.0,3185.0,44.0,231.0,98.0,259.0,225.0,45.0,69.0,100.0,81.0,293.0,422.0,436.0,242.0,245.0,166.0,229.0,17031010300
154,4282.0,3349.0,2058.0,49017.0,229400.0,1248.0,513.0,1545.0,999.0,400.0,128.0,70.0,2460.0,216.0,1216.0,616.0,121.0,19.0,0.0,51.0,201.0,50.0,18.0,156.0,140.0,72.0,0.0,41.0,0.0,0.0,0.0,0.0,27.0,310.0,245.0,0.0,33.0,22.0,0.0,10.0,0.0,0.0,21.0,12.0,9.0,0.0,0.0,0.0,0.0,1400000US17031010400,17,31,10400,0.0,0.0,33561.0,2058.0,141.0,131.0,298.0,81.0,59.0,41.0,56.0,33.0,268.0,101.0,180.0,218.0,99.0,129.0,85.0,138.0,17031010400
155,3519.0,2298.0,2379.0,48250.0,196600.0,1176.0,341.0,2038.0,1157.0,573.0,0.0,206.0,2705.0,262.0,1198.0,383.0,0.0,0.0,19.0,38.0,156.0,77.0,16.0,77.0,47.0,0.0,0.0,0.0,20.0,27.0,0.0,0.0,0.0,110.0,57.0,0.0,16.0,0.0,0.0,0.0,0.0,37.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010501,17,31,10501,0.0,0.0,36258.0,2379.0,171.0,127.0,223.0,152.0,76.0,100.0,57.0,137.0,171.0,231.0,235.0,234.0,191.0,122.0,85.0,67.0,17031010501
156,3329.0,2171.0,1637.0,61367.0,282200.0,1311.0,469.0,1168.0,770.0,550.0,38.0,156.0,1807.0,164.0,1004.0,454.0,156.0,38.0,36.0,54.0,53.0,24.0,27.0,66.0,26.0,13.0,0.0,13.0,0.0,0.0,0.0,0.0,0.0,222.0,88.0,42.0,29.0,11.0,23.0,9.0,0.0,20.0,12.0,0.0,12.0,0.0,0.0,0.0,0.0,1400000US17031010502,17,31,10502,0.0,0.0,36926.0,1637.0,99.0,118.0,152.0,82.0,61.0,32.0,58.0,37.0,60.0,102.0,153.0,290.0,147.0,57.0,32.0,157.0,17031010502
157,2844.0,1806.0,1477.0,21924.0,470500.0,1122.0,177.0,1300.0,350.0,256.0,38.0,111.0,1570.0,109.0,510.0,591.0,329.0,88.0,53.0,60.0,22.0,36.0,0.0,3.0,75.0,23.0,18.0,0.0,0.0,0.0,34.0,0.0,0.0,78.0,69.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,66.0,35.0,20.0,0.0,0.0,11.0,0.0,1400000US17031010503,17,31,10503,0.0,0.0,13289.0,1477.0,298.0,249.0,103.0,133.0,46.0,44.0,49.0,13.0,37.0,97.0,92.0,125.0,65.0,48.0,45.0,33.0,17031010503
158,6708.0,3804.0,3066.0,71920.0,254500.0,1276.0,1094.0,1972.0,1843.0,760.0,136.0,267.0,3176.0,69.0,1683.0,797.0,45.0,6.0,78.0,249.0,191.0,138.0,59.0,31.0,36.0,0.0,0.0,0.0,0.0,34.0,0.0,0.0,2.0,209.0,26.0,46.0,36.0,50.0,33.0,18.0,0.0,0.0,88.0,0.0,0.0,0.0,0.0,0.0,88.0,1400000US17031010600,17,31,10600,0.0,0.0,38090.0,3066.0,81.0,152.0,49.0,45.0,209.0,130.0,172.0,134.0,28.0,169.0,464.0,374.0,280.0,312.0,176.0,291.0,17031010600
159,3573.0,1431.0,1652.0,74208.0,345400.0,1338.0,820.0,832.0,1047.0,382.0,41.0,41.0,1753.0,123.0,847.0,296.0,72.0,0.0,52.0,37.0,34.0,31.0,8.0,62.0,35.0,0.0,0.0,0.0,35.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010701,17,31,10701,0.0,0.0,43372.0,1652.0,31.0,51.0,50.0,40.0,51.0,169.0,54.0,49.0,57.0,113.0,193.0,255.0,161.0,92.0,126.0,160.0,17031010701


In [9]:
# Rename variables
# Rename columns
df_2023 = df_2023.rename(columns={  'B01003_001E': 'pop',
                                    'B02001_002E': 'white',
                                    'B11001_001E': 'hh',
                                    'B19013_001E': 'medhinc', 
                                    'B25077_001E': 'mhval',
                                    'B25064_001E': 'mrent',
                                    'B25003_002E': 'ohu',
                                    'B25003_003E': 'rhu',
                                    'B25105_001E': 'mmhcosts',
                                    'B15003_001E': 'total_25',
                                    'B15003_022E': 'total_bd',
                                    'B15003_023E': 'total_md',
                                    'B15003_024E': 'total_pd',
                                    'B15003_025E': 'total_phd',
                                    'B25034_001E': 'tot_units_built',
                                    'B25034_010E': 'units_40_49',
                                    'B25034_011E': 'units_39_earlier',
                                    'B07010_025E':'mov_wc_w_income',
                                    'B07010_026E':'mov_wc_9000',
                                    'B07010_027E':'mov_wc_15000',
                                    'B07010_028E':'mov_wc_25000',
                                    'B07010_029E':'mov_wc_35000',
                                    'B07010_030E':'mov_wc_50000',
                                    'B07010_031E':'mov_wc_65000',
                                    'B07010_032E':'mov_wc_75000',
                                    'B07010_033E':'mov_wc_76000_more',
                                    'B07010_036E':'mov_oc_w_income',
                                    'B07010_037E':'mov_oc_9000',
                                    'B07010_038E':'mov_oc_15000',
                                    'B07010_039E':'mov_oc_25000',
                                    'B07010_040E':'mov_oc_35000',
                                    'B07010_041E':'mov_oc_50000',
                                    'B07010_042E':'mov_oc_65000',
                                    'B07010_043E':'mov_oc_75000',
                                    'B07010_044E':'mov_oc_76000_more',
                                    'B07010_047E':'mov_os_w_income',
                                    'B07010_048E':'mov_os_9000',
                                    'B07010_049E':'mov_os_15000',
                                    'B07010_050E':'mov_os_25000',
                                    'B07010_051E':'mov_os_35000',
                                    'B07010_052E':'mov_os_50000',
                                    'B07010_053E':'mov_os_65000',
                                    'B07010_054E':'mov_os_75000',
                                    'B07010_055E':'mov_os_76000_more',
                                    'B07010_058E':'mov_fa_w_income',
                                    'B07010_059E':'mov_fa_9000',
                                    'B07010_060E':'mov_fa_15000',
                                    'B07010_061E':'mov_fa_25000',
                                    'B07010_062E':'mov_fa_35000',
                                    'B07010_063E':'mov_fa_50000',
                                    'B07010_064E':'mov_fa_65000',
                                    'B07010_065E':'mov_fa_75000',
                                    'B07010_066E':'mov_fa_76000_more',
                                    'B06011_001E':'iinc',
                                    'B19001_001E':'hinc', # number of household who reported household income in the past 12 months
                                    'B19001_002E':'I_10000', # these variables are on the household level
                                    'B19001_003E':'I_15000',
                                    'B19001_004E':'I_20000',
                                    'B19001_005E':'I_25000',
                                    'B19001_006E':'I_30000',
                                    'B19001_007E':'I_35000',
                                    'B19001_008E':'I_40000',
                                    'B19001_009E':'I_45000',
                                    'B19001_010E':'I_50000',
                                    'B19001_011E':'I_60000',
                                    'B19001_012E':'I_75000',
                                    'B19001_013E':'I_100000',
                                    'B19001_014E':'I_125000',
                                    'B19001_015E':'I_150000',
                                    'B19001_016E':'I_200000',
                                    'B19001_017E':'I_201000'})

In [10]:
df_2023.head(10)

Unnamed: 0,pop,white,hh,medhinc,mhval,mrent,ohu,rhu,total_bd,total_md,total_pd,total_phd,tot_units_built,units_40_49,units_39_earlier,mov_wc_w_income,mov_wc_9000,mov_wc_15000,mov_wc_25000,mov_wc_35000,mov_wc_50000,mov_wc_65000,mov_wc_75000,mov_wc_76000_more,mov_oc_w_income,mov_oc_9000,mov_oc_15000,mov_oc_25000,mov_oc_35000,mov_oc_50000,mov_oc_65000,mov_oc_75000,mov_oc_76000_more,mov_os_w_income,mov_os_9000,mov_os_15000,mov_os_25000,mov_os_35000,mov_os_50000,mov_os_65000,mov_os_75000,mov_os_76000_more,mov_fa_w_income,mov_fa_9000,mov_fa_15000,mov_fa_25000,mov_fa_35000,mov_fa_50000,mov_fa_65000,GEO_ID,state,county,tract,mov_fa_75000,mov_fa_76000_more,iinc,hinc,I_10000,I_15000,I_20000,I_25000,I_30000,I_35000,I_40000,I_45000,I_50000,I_60000,I_75000,I_100000,I_125000,I_150000,I_200000,I_201000,FIPS
150,3726.0,1475.0,2190.0,69460.0,296600.0,1252.0,689.0,1501.0,775.0,385.0,54.0,132.0,2841.0,289.0,1760.0,196.0,80.0,24.0,53.0,0.0,23.0,0.0,0.0,16.0,15.0,5.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,41.0,0.0,0.0,0.0,0.0,0.0,21.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010100,17,31,10100,0.0,0.0,37386.0,2190.0,125.0,109.0,41.0,148.0,118.0,191.0,51.0,45.0,96.0,102.0,299.0,418.0,82.0,118.0,124.0,123.0,17031010100
151,7588.0,1883.0,3038.0,49639.0,239100.0,1333.0,823.0,2215.0,684.0,647.0,135.0,106.0,3276.0,196.0,1586.0,564.0,84.0,176.0,37.0,33.0,80.0,0.0,51.0,103.0,8.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,198.0,0.0,9.0,16.0,109.0,43.0,0.0,0.0,21.0,25.0,0.0,0.0,0.0,25.0,0.0,0.0,1400000US17031010201,17,31,10201,0.0,0.0,39311.0,3038.0,223.0,61.0,153.0,0.0,92.0,172.0,355.0,243.0,233.0,49.0,192.0,576.0,220.0,201.0,161.0,107.0,17031010201
152,2609.0,987.0,1130.0,55119.0,231900.0,1292.0,270.0,860.0,656.0,232.0,52.0,42.0,1303.0,76.0,512.0,209.0,41.0,1.0,33.0,24.0,25.0,26.0,25.0,34.0,56.0,35.0,0.0,0.0,10.0,11.0,0.0,0.0,0.0,129.0,28.0,0.0,7.0,0.0,32.0,0.0,24.0,38.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010202,17,31,10202,0.0,0.0,34938.0,1130.0,100.0,79.0,12.0,12.0,40.0,52.0,20.0,94.0,103.0,104.0,36.0,236.0,99.0,31.0,66.0,46.0,17031010202
153,6311.0,3558.0,3185.0,65871.0,305000.0,1257.0,859.0,2326.0,1585.0,644.0,121.0,149.0,3377.0,292.0,1655.0,1072.0,191.0,187.0,133.0,105.0,99.0,121.0,93.0,143.0,65.0,10.0,5.0,0.0,0.0,3.0,30.0,0.0,17.0,166.0,0.0,25.0,89.0,23.0,0.0,0.0,29.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010300,17,31,10300,0.0,0.0,38532.0,3185.0,44.0,231.0,98.0,259.0,225.0,45.0,69.0,100.0,81.0,293.0,422.0,436.0,242.0,245.0,166.0,229.0,17031010300
154,4282.0,3349.0,2058.0,49017.0,229400.0,1248.0,513.0,1545.0,999.0,400.0,128.0,70.0,2460.0,216.0,1216.0,616.0,121.0,19.0,0.0,51.0,201.0,50.0,18.0,156.0,140.0,72.0,0.0,41.0,0.0,0.0,0.0,0.0,27.0,310.0,245.0,0.0,33.0,22.0,0.0,10.0,0.0,0.0,21.0,12.0,9.0,0.0,0.0,0.0,0.0,1400000US17031010400,17,31,10400,0.0,0.0,33561.0,2058.0,141.0,131.0,298.0,81.0,59.0,41.0,56.0,33.0,268.0,101.0,180.0,218.0,99.0,129.0,85.0,138.0,17031010400
155,3519.0,2298.0,2379.0,48250.0,196600.0,1176.0,341.0,2038.0,1157.0,573.0,0.0,206.0,2705.0,262.0,1198.0,383.0,0.0,0.0,19.0,38.0,156.0,77.0,16.0,77.0,47.0,0.0,0.0,0.0,20.0,27.0,0.0,0.0,0.0,110.0,57.0,0.0,16.0,0.0,0.0,0.0,0.0,37.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010501,17,31,10501,0.0,0.0,36258.0,2379.0,171.0,127.0,223.0,152.0,76.0,100.0,57.0,137.0,171.0,231.0,235.0,234.0,191.0,122.0,85.0,67.0,17031010501
156,3329.0,2171.0,1637.0,61367.0,282200.0,1311.0,469.0,1168.0,770.0,550.0,38.0,156.0,1807.0,164.0,1004.0,454.0,156.0,38.0,36.0,54.0,53.0,24.0,27.0,66.0,26.0,13.0,0.0,13.0,0.0,0.0,0.0,0.0,0.0,222.0,88.0,42.0,29.0,11.0,23.0,9.0,0.0,20.0,12.0,0.0,12.0,0.0,0.0,0.0,0.0,1400000US17031010502,17,31,10502,0.0,0.0,36926.0,1637.0,99.0,118.0,152.0,82.0,61.0,32.0,58.0,37.0,60.0,102.0,153.0,290.0,147.0,57.0,32.0,157.0,17031010502
157,2844.0,1806.0,1477.0,21924.0,470500.0,1122.0,177.0,1300.0,350.0,256.0,38.0,111.0,1570.0,109.0,510.0,591.0,329.0,88.0,53.0,60.0,22.0,36.0,0.0,3.0,75.0,23.0,18.0,0.0,0.0,0.0,34.0,0.0,0.0,78.0,69.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,66.0,35.0,20.0,0.0,0.0,11.0,0.0,1400000US17031010503,17,31,10503,0.0,0.0,13289.0,1477.0,298.0,249.0,103.0,133.0,46.0,44.0,49.0,13.0,37.0,97.0,92.0,125.0,65.0,48.0,45.0,33.0,17031010503
158,6708.0,3804.0,3066.0,71920.0,254500.0,1276.0,1094.0,1972.0,1843.0,760.0,136.0,267.0,3176.0,69.0,1683.0,797.0,45.0,6.0,78.0,249.0,191.0,138.0,59.0,31.0,36.0,0.0,0.0,0.0,0.0,34.0,0.0,0.0,2.0,209.0,26.0,46.0,36.0,50.0,33.0,18.0,0.0,0.0,88.0,0.0,0.0,0.0,0.0,0.0,88.0,1400000US17031010600,17,31,10600,0.0,0.0,38090.0,3066.0,81.0,152.0,49.0,45.0,209.0,130.0,172.0,134.0,28.0,169.0,464.0,374.0,280.0,312.0,176.0,291.0,17031010600
159,3573.0,1431.0,1652.0,74208.0,345400.0,1338.0,820.0,832.0,1047.0,382.0,41.0,41.0,1753.0,123.0,847.0,296.0,72.0,0.0,52.0,37.0,34.0,31.0,8.0,62.0,35.0,0.0,0.0,0.0,35.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400000US17031010701,17,31,10701,0.0,0.0,43372.0,1652.0,31.0,51.0,50.0,40.0,51.0,169.0,54.0,49.0,57.0,113.0,193.0,255.0,161.0,92.0,126.0,160.0,17031010701


In [11]:
# add features to match with the 2018 data
df_2023['typology'] = None
df_2023['year'] = 2023
df_2023['typ_cat'] = None
df_2023.drop(columns=['GEO_ID'], inplace=True)

In [12]:
df_2023.head(10)

Unnamed: 0,pop,white,hh,medhinc,mhval,mrent,ohu,rhu,total_bd,total_md,total_pd,total_phd,tot_units_built,units_40_49,units_39_earlier,mov_wc_w_income,mov_wc_9000,mov_wc_15000,mov_wc_25000,mov_wc_35000,mov_wc_50000,mov_wc_65000,mov_wc_75000,mov_wc_76000_more,mov_oc_w_income,mov_oc_9000,mov_oc_15000,mov_oc_25000,mov_oc_35000,mov_oc_50000,mov_oc_65000,mov_oc_75000,mov_oc_76000_more,mov_os_w_income,mov_os_9000,mov_os_15000,mov_os_25000,mov_os_35000,mov_os_50000,mov_os_65000,mov_os_75000,mov_os_76000_more,mov_fa_w_income,mov_fa_9000,mov_fa_15000,mov_fa_25000,mov_fa_35000,mov_fa_50000,mov_fa_65000,state,county,tract,mov_fa_75000,mov_fa_76000_more,iinc,hinc,I_10000,I_15000,I_20000,I_25000,I_30000,I_35000,I_40000,I_45000,I_50000,I_60000,I_75000,I_100000,I_125000,I_150000,I_200000,I_201000,FIPS,typology,year,typ_cat
150,3726.0,1475.0,2190.0,69460.0,296600.0,1252.0,689.0,1501.0,775.0,385.0,54.0,132.0,2841.0,289.0,1760.0,196.0,80.0,24.0,53.0,0.0,23.0,0.0,0.0,16.0,15.0,5.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,41.0,0.0,0.0,0.0,0.0,0.0,21.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10100,0.0,0.0,37386.0,2190.0,125.0,109.0,41.0,148.0,118.0,191.0,51.0,45.0,96.0,102.0,299.0,418.0,82.0,118.0,124.0,123.0,17031010100,,2023,
151,7588.0,1883.0,3038.0,49639.0,239100.0,1333.0,823.0,2215.0,684.0,647.0,135.0,106.0,3276.0,196.0,1586.0,564.0,84.0,176.0,37.0,33.0,80.0,0.0,51.0,103.0,8.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,198.0,0.0,9.0,16.0,109.0,43.0,0.0,0.0,21.0,25.0,0.0,0.0,0.0,25.0,0.0,0.0,17,31,10201,0.0,0.0,39311.0,3038.0,223.0,61.0,153.0,0.0,92.0,172.0,355.0,243.0,233.0,49.0,192.0,576.0,220.0,201.0,161.0,107.0,17031010201,,2023,
152,2609.0,987.0,1130.0,55119.0,231900.0,1292.0,270.0,860.0,656.0,232.0,52.0,42.0,1303.0,76.0,512.0,209.0,41.0,1.0,33.0,24.0,25.0,26.0,25.0,34.0,56.0,35.0,0.0,0.0,10.0,11.0,0.0,0.0,0.0,129.0,28.0,0.0,7.0,0.0,32.0,0.0,24.0,38.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10202,0.0,0.0,34938.0,1130.0,100.0,79.0,12.0,12.0,40.0,52.0,20.0,94.0,103.0,104.0,36.0,236.0,99.0,31.0,66.0,46.0,17031010202,,2023,
153,6311.0,3558.0,3185.0,65871.0,305000.0,1257.0,859.0,2326.0,1585.0,644.0,121.0,149.0,3377.0,292.0,1655.0,1072.0,191.0,187.0,133.0,105.0,99.0,121.0,93.0,143.0,65.0,10.0,5.0,0.0,0.0,3.0,30.0,0.0,17.0,166.0,0.0,25.0,89.0,23.0,0.0,0.0,29.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10300,0.0,0.0,38532.0,3185.0,44.0,231.0,98.0,259.0,225.0,45.0,69.0,100.0,81.0,293.0,422.0,436.0,242.0,245.0,166.0,229.0,17031010300,,2023,
154,4282.0,3349.0,2058.0,49017.0,229400.0,1248.0,513.0,1545.0,999.0,400.0,128.0,70.0,2460.0,216.0,1216.0,616.0,121.0,19.0,0.0,51.0,201.0,50.0,18.0,156.0,140.0,72.0,0.0,41.0,0.0,0.0,0.0,0.0,27.0,310.0,245.0,0.0,33.0,22.0,0.0,10.0,0.0,0.0,21.0,12.0,9.0,0.0,0.0,0.0,0.0,17,31,10400,0.0,0.0,33561.0,2058.0,141.0,131.0,298.0,81.0,59.0,41.0,56.0,33.0,268.0,101.0,180.0,218.0,99.0,129.0,85.0,138.0,17031010400,,2023,
155,3519.0,2298.0,2379.0,48250.0,196600.0,1176.0,341.0,2038.0,1157.0,573.0,0.0,206.0,2705.0,262.0,1198.0,383.0,0.0,0.0,19.0,38.0,156.0,77.0,16.0,77.0,47.0,0.0,0.0,0.0,20.0,27.0,0.0,0.0,0.0,110.0,57.0,0.0,16.0,0.0,0.0,0.0,0.0,37.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10501,0.0,0.0,36258.0,2379.0,171.0,127.0,223.0,152.0,76.0,100.0,57.0,137.0,171.0,231.0,235.0,234.0,191.0,122.0,85.0,67.0,17031010501,,2023,
156,3329.0,2171.0,1637.0,61367.0,282200.0,1311.0,469.0,1168.0,770.0,550.0,38.0,156.0,1807.0,164.0,1004.0,454.0,156.0,38.0,36.0,54.0,53.0,24.0,27.0,66.0,26.0,13.0,0.0,13.0,0.0,0.0,0.0,0.0,0.0,222.0,88.0,42.0,29.0,11.0,23.0,9.0,0.0,20.0,12.0,0.0,12.0,0.0,0.0,0.0,0.0,17,31,10502,0.0,0.0,36926.0,1637.0,99.0,118.0,152.0,82.0,61.0,32.0,58.0,37.0,60.0,102.0,153.0,290.0,147.0,57.0,32.0,157.0,17031010502,,2023,
157,2844.0,1806.0,1477.0,21924.0,470500.0,1122.0,177.0,1300.0,350.0,256.0,38.0,111.0,1570.0,109.0,510.0,591.0,329.0,88.0,53.0,60.0,22.0,36.0,0.0,3.0,75.0,23.0,18.0,0.0,0.0,0.0,34.0,0.0,0.0,78.0,69.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,66.0,35.0,20.0,0.0,0.0,11.0,0.0,17,31,10503,0.0,0.0,13289.0,1477.0,298.0,249.0,103.0,133.0,46.0,44.0,49.0,13.0,37.0,97.0,92.0,125.0,65.0,48.0,45.0,33.0,17031010503,,2023,
158,6708.0,3804.0,3066.0,71920.0,254500.0,1276.0,1094.0,1972.0,1843.0,760.0,136.0,267.0,3176.0,69.0,1683.0,797.0,45.0,6.0,78.0,249.0,191.0,138.0,59.0,31.0,36.0,0.0,0.0,0.0,0.0,34.0,0.0,0.0,2.0,209.0,26.0,46.0,36.0,50.0,33.0,18.0,0.0,0.0,88.0,0.0,0.0,0.0,0.0,0.0,88.0,17,31,10600,0.0,0.0,38090.0,3066.0,81.0,152.0,49.0,45.0,209.0,130.0,172.0,134.0,28.0,169.0,464.0,374.0,280.0,312.0,176.0,291.0,17031010600,,2023,
159,3573.0,1431.0,1652.0,74208.0,345400.0,1338.0,820.0,832.0,1047.0,382.0,41.0,41.0,1753.0,123.0,847.0,296.0,72.0,0.0,52.0,37.0,34.0,31.0,8.0,62.0,35.0,0.0,0.0,0.0,35.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10701,0.0,0.0,43372.0,1652.0,31.0,51.0,50.0,40.0,51.0,169.0,54.0,49.0,57.0,113.0,193.0,255.0,161.0,92.0,126.0,160.0,17031010701,,2023,


In [13]:
df_2023.shape

(2072, 76)

# 2018 Data

In this section, I processed data from 2018. 

In [14]:
df_2018 = pd.read_csv('Chicago_typology_output.csv')
df_2018.head(10)

Unnamed: 0.1,Unnamed: 0,pop_18,white_18,hh_18,hinc_18,mhval_18,mhval_18_se,mrent_18,mrent_18_se,total_25_18,total_25_col_bd_18,total_25_col_md_18,total_25_col_pd_18,total_25_col_phd_18,tot_units_built_18,units_40_49_built_18,units_39_early_built_18,ohu_18,rhu_18,mmhcosts_18,iinc_18,mov_wc_w_income_18,mov_wc_9000_18,mov_wc_15000_18,mov_wc_25000_18,mov_wc_35000_18,mov_wc_50000_18,mov_wc_65000_18,mov_wc_75000_18,mov_wc_76000_more_18,mov_oc_w_income_18,mov_oc_9000_18,mov_oc_15000_18,mov_oc_25000_18,state_x,county_x,tract_x,mov_oc_35000_18,mov_oc_50000_18,mov_oc_65000_18,mov_oc_75000_18,mov_oc_76000_more_18,mov_os_w_income_18,mov_os_9000_18,mov_os_15000_18,mov_os_25000_18,mov_os_35000_18,mov_os_50000_18,mov_os_65000_18,mov_os_75000_18,mov_os_76000_more_18,mov_fa_w_income_18,mov_fa_9000_18,mov_fa_15000_18,mov_fa_25000_18,mov_fa_35000_18,mov_fa_50000_18,mov_fa_65000_18,mov_fa_75000_18,mov_fa_76000_more_18,FIPS,mhval_12,mhval_12_se,mrent_12,mrent_12_se,mov_wc_w_income_12,mov_wc_9000_12,mov_wc_15000_12,mov_wc_25000_12,mov_wc_35000_12,mov_wc_50000_12,mov_wc_65000_12,mov_wc_75000_12,mov_wc_76000_more_12,mov_oc_w_income_12,mov_oc_9000_12,mov_oc_15000_12,mov_oc_25000_12,mov_oc_35000_12,mov_oc_50000_12,mov_oc_65000_12,mov_oc_75000_12,mov_oc_76000_more_12,mov_os_w_income_12,mov_os_9000_12,mov_os_15000_12,mov_os_25000_12,mov_os_35000_12,mov_os_50000_12,mov_os_65000_12,mov_os_75000_12,mov_os_76000_more_12,mov_fa_w_income_12,mov_fa_9000_12,mov_fa_15000_12,mov_fa_25000_12,mov_fa_35000_12,mov_fa_50000_12,mov_fa_65000_12,mov_fa_75000_12,mov_fa_76000_more_12,iinc_12,pop_00,white_00,hu_00,ohu_00,rhu_00,state_y,county_y,tract_y,trtid_base_x,total_25_00,male_25_col_bd_00,male_25_col_md_00,male_25_col_psd_00,male_25_col_phd_00,female_25_col_bd_00,female_25_col_md_00,female_25_col_psd_00,female_25_col_phd_00,mhval_00,mrent_00,hh_00,hinc_00,trtid00,pop_90,white_90,hh_90,total_25_col_9th_90,total_25_col_12th_90,total_25_col_hs_90,total_25_col_sc_90,total_25_col_ad_90,total_25_col_bd_90,total_25_col_gd_90,mhval_90,mrent_90,hinc_90,ohu_90,rhu_90,state,county,tract,trtid_base_y,trtid90,inc80_18,inc120_18,inc80_00,inc120_00,inc80_90,low_80120_18,mod_80120_18,high_80120_18,low_pdmt_medhhinc_18,high_pdmt_medhhinc_18,mod_pdmt_medhhinc_18,mix_low_medhhinc_18,mix_mod_medhhinc_18,mix_high_medhhinc_18,inc_cat_medhhinc_18,inc_cat_medhhinc_encoded18,low_80120_00,mod_80120_00,high_80120_00,low_pdmt_medhhinc_00,high_pdmt_medhhinc_00,mod_pdmt_medhhinc_00,mix_low_medhhinc_00,mix_mod_medhhinc_00,mix_high_medhhinc_00,inc_cat_medhhinc_00,inc_cat_medhhinc_encoded00,per_all_li_90,per_all_li_00,per_all_li_18,all_li_count_90,all_li_count_00,all_li_count_18,real_mhval_90,real_mrent_90,real_hinc_90,real_mhval_00,real_mrent_00,real_hinc_00,real_mhval_12,real_mrent_12,real_mhval_18,real_mrent_18,real_hinc_18,per_nonwhite_18,per_nonwhite_90,per_nonwhite_00,hu_90,per_rent_90,per_rent_00,hu_18,per_rent_18,total_25_90,per_col_90,male_25_col_00,female_25_col_00,total_25_col_00,per_col_00,per_col_18,per_units_pre50_18,per_limove_18,mov_tot_w_income_18,per_limove_12,mov_tot_w_income_12,lmh_flag_encoded,lmh_flag_category,pctch_real_mhval_00_18,pctch_real_mrent_12_18,rent_decrease,rent_marginal,rent_increase,rent_rapid_increase,house_decrease,house_marginal,house_increase,house_rapid_increase,tot_decrease,tot_marginal,tot_increase,tot_rapid_increase,change_flag_encoded,change_flag_category,per_ch_zillow_12_18,ab_50pct_ch,ab_90percentile_ch,rent_50pct_ch,rent_90percentile_ch,hv_abrm_ch,rent_abrm_ch,pctch_real_mhval_90_00,pctch_real_mrent_90_00,pctch_real_hinc_90_00,pctch_real_mrent_00_18,pctch_real_hinc_00_18,ch_all_li_count_90_00,ch_all_li_count_00_18,ch_per_col_90_00,ch_per_col_00_18,ch_per_limove_12_18,pop00flag,aboverm_per_all_li_90,aboverm_per_all_li_00,aboverm_per_all_li_18,aboverm_per_nonwhite_18,aboverm_per_nonwhite_90,aboverm_per_nonwhite_00,aboverm_per_rent_90,aboverm_per_rent_00,aboverm_per_rent_18,aboverm_per_col_90,aboverm_per_col_00,aboverm_per_col_18,aboverm_real_mrent_90,aboverm_real_mrent_00,aboverm_real_mrent_12,aboverm_real_mrent_18,aboverm_real_mhval_90,aboverm_real_mhval_00,aboverm_real_mhval_18,aboverm_pctch_real_mhval_00_18,aboverm_pctch_real_mrent_00_18,aboverm_pctch_real_mrent_12_18,aboverm_pctch_real_mhval_90_00,aboverm_pctch_real_mrent_90_00,lostli_00,lostli_18,aboverm_pctch_real_hinc_90_00,aboverm_pctch_real_hinc_00_18,aboverm_ch_per_col_90_00,aboverm_ch_per_col_00_18,aboverm_per_units_pre50_18,GEOID,rail,presence_ph_LIHTC,vul_gent_90,vul_gent_00,vul_gent_18,hotmarket_00,hotmarket_18,gent_90_00,gent_90_00_urban,gent_00_18,gent_00_18_urban,dp_PChRent,dp_RentGap,tr_rent_gap,rm_rent_gap,dense,SAE,AdvG,ARE,BE,SMMI,ARG,EOG,OD,OD_loss,SLI,double_counted,typology,typ_cat
0,0,2344.0,1199.0,866.0,49565.0,124400.0,6926.0,969.0,38.0,1532.0,98.0,58.0,8.0,4.0,950.0,127.0,295.0,427.0,439.0,965.0,26602.0,164.0,54.0,6.0,25.0,46.0,12.0,9.0,3.0,9.0,24.0,4.0,4.0,7.0,17,197,882900,0.0,4.0,5.0,0.0,0.0,26.0,0.0,10.0,5.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197882900,143800.0,17014.0,864.0,60.0,279.0,60.0,21.0,50.0,49.0,39.0,42.0,3.0,15.0,51.0,9.0,0.0,3.0,0.0,0.0,31.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,29330.0,2296.07,1774.18,932.47,577.41,355.06,17.0,197.0,882900.0,51593648707.0,1490.4,36.28,3.08,11.04,3.0,52.35,15.1,0.02,0.02,93093.6,597.4,935.46,40208.99,51593648707.0,2156.15,1859.8,882.78,160.54,319.18,590.94,227.59,60.39,67.74,21.46,53826.48,419.96,31982.8,597.51,289.11,17.0,197.0,882900.0,68791532008.0,68791532008.0,0.52,0.7,0.4,0.63,0.36,0.52,0.18,0.3,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.4,0.23,0.37,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.36,0.4,0.52,313.56,373.35,450.78,111959.07,873.53,66524.21,142433.21,914.02,61519.76,159618.0,959.04,124400.0,969.0,49565.0,0.49,0.14,0.23,886.63,0.33,0.38,866.0,0.51,1447.85,0.06,42.36,67.47,109.83,0.07,0.11,0.44,0.56,214.0,0.43,338.0,1,aff_predominantly_LI,-0.13,0.01,0,1,0,0,1,0,0,0,1,1,0,0,1,ch_decrease_marginal,0.3,0,0,0,0,1,1,0.27,0.05,-0.08,0.06,-0.19,59.79,77.43,0.01,0.04,0.13,1,1,1,1,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,17197882900,0,False,0,1,1,0.0,0.0,0,0,0,0,0,1,81.78,20.09,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0,0.0,0,1.0,3.0,['ARG']
1,1,3759.0,1276.0,1183.0,46175.0,123400.0,10896.0,1019.0,273.0,2665.0,168.0,47.0,39.0,11.0,1266.0,206.0,153.0,542.0,641.0,1010.0,21376.0,127.0,21.0,7.0,39.0,34.0,22.0,0.0,0.0,4.0,69.0,15.0,7.0,0.0,17,197,883000,37.0,0.0,10.0,0.0,0.0,26.0,0.0,8.0,0.0,7.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883000,142800.0,30771.0,814.0,310.0,572.0,155.0,90.0,185.0,132.0,6.0,4.0,0.0,0.0,105.0,77.0,19.0,9.0,0.0,0.0,0.0,0.0,0.0,111.0,42.0,60.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,16370.0,4106.0,1900.0,1254.0,839.0,415.0,17.0,197.0,883000.0,17197883000.0,2622.0,46.0,17.0,2.0,0.0,51.0,9.0,22.0,1.0,89800.0,380.0,1258.0,33900.0,17197883000.0,4199.0,2399.0,1220.0,258.0,556.0,903.0,561.0,135.0,104.0,90.0,56300.0,366.0,32029.0,831.0,458.0,17.0,197.0,883000.0,17197883000.0,17197883000.0,0.58,0.78,0.5,0.64,0.34,0.58,0.2,0.22,1.0,0.0,0.0,0.0,0.0,0.0,1.0,low_pdmt,0.5,0.13,0.36,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.34,0.5,0.58,414.1,632.54,690.35,117104.0,761.28,66620.32,137394.0,581.4,51867.0,158508.0,903.54,123400.0,1019.0,46175.0,0.66,0.43,0.54,1289.0,0.36,0.33,1183.0,0.54,2607.0,0.07,63.0,61.0,124.0,0.05,0.1,0.28,0.47,222.0,0.79,788.0,5,aff_mix_mod,-0.1,0.13,0,0,1,0,1,0,0,0,1,0,1,0,2,ch_increase,,0,0,0,0,0,1,0.17,-0.24,-0.22,0.75,-0.11,218.44,57.82,-0.03,0.05,-0.32,1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,17197883000,0,False,1,1,1,0.0,1.0,0,0,0,0,1,0,-6.29,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI']
2,2,3726.0,1295.0,1099.0,80230.0,159400.0,6619.0,1764.0,87.0,2278.0,439.0,93.0,30.0,10.0,1186.0,9.0,14.0,893.0,206.0,1471.0,28768.0,10.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,27.0,0.0,0.0,10.0,17,197,880111,0.0,17.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197880111,183200.0,7572.0,1457.0,158.0,88.0,0.0,0.0,41.0,0.0,14.0,33.0,0.0,0.0,71.0,22.0,0.0,0.0,29.0,13.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,27360.0,3288.0,2024.0,929.0,869.0,60.0,17.0,197.0,880111.0,17197880111.0,1899.0,89.0,12.0,0.0,0.0,95.0,36.0,11.0,0.0,115300.0,1106.0,939.0,59958.0,17197880111.0,3326.0,2637.0,917.0,69.0,284.0,578.0,538.0,106.0,147.0,56.0,84500.0,867.0,47934.0,864.0,79.0,17.0,197.0,880111.0,17197880111.0,17197880111.0,0.31,0.51,0.11,0.37,0.09,0.31,0.2,0.49,0.0,0.0,0.0,0.0,0.0,1.0,5.0,mix_high,0.11,0.25,0.63,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.11,0.31,83.62,107.27,342.21,175760.0,1803.36,99702.72,176409.0,1692.18,91735.74,203352.0,1617.27,159400.0,1764.0,80230.0,0.65,0.21,0.38,943.0,0.08,0.06,1099.0,0.19,1778.0,0.11,101.0,131.0,232.0,0.12,0.25,0.02,0.23,47.0,0.37,165.0,2,aff_predominantly_MI,-0.1,0.09,0,0,1,0,1,0,0,0,1,0,1,0,2,ch_increase,0.23,0,0,0,0,0,1,0.0,-0.06,-0.08,0.04,-0.13,23.65,234.94,0.01,0.13,-0.14,1,0,0,0,1,1,1,0,0,0,0,0,0,1,1,1,1,1,0,0,0,0,1,0,0,0,0,0,0,0,1,0,17197880111,0,False,0,0,0,0.0,1.0,0,0,0,0,1,0,-179.07,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE']
3,3,5692.0,4076.0,2429.0,71444.0,168400.0,16402.0,854.0,56.0,4421.0,703.0,364.0,21.0,0.0,2617.0,28.0,254.0,2233.0,196.0,1329.0,41679.0,77.0,0.0,0.0,31.0,25.0,0.0,0.0,8.0,13.0,456.0,136.0,13.0,31.0,17,197,883602,76.0,72.0,45.0,0.0,83.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883602,188900.0,16717.0,931.0,334.0,62.0,0.0,0.0,19.0,14.0,29.0,0.0,0.0,0.0,133.0,34.0,1.0,43.0,43.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,37740.0,4097.97,3736.98,1605.99,1407.99,198.0,17.0,197.0,883602.0,17197883602.0,2897.98,159.0,41.0,11.0,4.0,236.0,87.0,8.0,4.0,150598.99,640.0,1606.99,62265.58,17197883602.0,6073.76,2337.39,1960.68,170.75,316.79,1032.76,936.15,232.17,375.96,323.53,49653.58,406.67,28005.97,1285.15,715.22,17.0,197.0,883602.0,17197883602.0,17197883602.0,0.26,0.58,0.26,0.4,0.29,0.26,0.32,0.42,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.26,0.14,0.6,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.29,0.26,0.26,571.46,418.4,622.73,103279.45,845.86,58252.41,230416.46,979.19,95266.34,209679.0,1033.41,168400.0,854.0,71444.0,0.28,0.62,0.09,2000.37,0.36,0.12,2429.0,0.08,3388.13,0.21,204.0,327.0,531.0,0.18,0.25,0.11,0.41,533.0,0.46,195.0,5,aff_mix_mod,-0.27,-0.17,1,0,0,0,1,0,0,0,1,0,0,0,1,ch_decrease_marginal,0.09,0,0,0,0,0,0,1.23,0.16,0.64,-0.13,-0.25,-153.05,204.33,-0.02,0.06,-0.05,1,1,0,0,0,1,0,1,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,1,1,0,1,0,0,0,0,17197883602,0,False,1,0,0,1.0,0.0,0,0,0,0,0,1,386.87,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE']
4,4,2756.0,368.0,1439.0,41193.0,119200.0,19150.0,947.0,64.0,1847.0,273.0,133.0,0.0,0.0,1570.0,52.0,35.0,248.0,1191.0,960.0,30259.0,52.0,0.0,0.0,8.0,0.0,11.0,0.0,33.0,0.0,254.0,25.0,19.0,33.0,17,197,883803,83.0,54.0,40.0,0.0,0.0,33.0,33.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,17197883803,138500.0,10735.0,858.0,30.0,195.0,13.0,9.0,27.0,93.0,17.0,36.0,0.0,0.0,374.0,74.0,86.0,48.0,38.0,82.0,0.0,0.0,46.0,21.0,0.0,0.0,0.0,0.0,21.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,26544.0,2526.0,1599.3,1064.81,444.22,620.59,17.0,197.0,883803.0,17197883803.0,1577.18,90.28,22.12,0.0,0.0,96.85,51.42,0.0,0.0,65108.02,403.56,1064.21,24623.87,17197883803.0,2483.55,1914.38,1058.23,71.15,286.38,507.59,460.96,69.35,143.49,48.43,35752.62,290.56,17876.31,382.64,704.89,17.0,197.0,883803.0,17197883803.0,17197883803.0,0.64,0.84,0.39,0.61,0.33,0.64,0.19,0.16,1.0,0.0,0.0,0.0,0.0,0.0,1.0,low_pdmt,0.39,0.21,0.39,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.33,0.39,0.64,350.89,419.07,925.01,74365.44,604.37,37182.72,99615.28,617.45,37674.52,153735.0,952.38,119200.0,947.0,41193.0,0.87,0.23,0.37,1087.53,0.65,0.58,1439.0,0.83,1587.34,0.12,112.4,148.27,260.67,0.17,0.22,0.06,0.35,358.0,0.42,590.0,1,aff_predominantly_LI,0.2,-0.01,0,1,0,0,0,0,1,0,0,1,1,0,2,ch_increase,-0.05,0,0,0,0,0,0,0.34,0.02,0.01,0.53,0.09,68.18,505.94,0.04,0.05,-0.07,1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,1,1,0,0,17197883803,0,False,1,1,1,0.0,1.0,0,0,0,0,0,1,85.8,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI']
5,5,3375.0,2384.0,1320.0,69250.0,161300.0,10246.0,1199.0,228.0,2373.0,537.0,324.0,16.0,20.0,1485.0,255.0,502.0,1066.0,254.0,1201.0,34135.0,145.0,35.0,26.0,15.0,10.0,31.0,22.0,0.0,6.0,97.0,12.0,33.0,9.0,17,197,881700,0.0,0.0,0.0,34.0,9.0,21.0,0.0,0.0,0.0,0.0,21.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,17197881700,181200.0,10238.0,1063.0,428.0,211.0,0.0,87.0,17.0,16.0,71.0,20.0,0.0,0.0,46.0,27.0,0.0,0.0,0.0,13.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40685.0,3358.0,3061.89,1420.12,1205.48,214.64,17.0,197.0,881700.0,17197881700.0,2387.31,334.66,72.71,37.67,8.76,261.95,73.59,31.54,0.0,109159.09,576.46,1417.49,45708.4,17197881700.0,3442.1,3296.67,1425.38,130.54,253.19,622.89,540.54,217.27,456.44,275.09,73152.36,459.06,33754.34,1213.37,192.74,17.0,197.0,881700.0,17197881700.0,17197881700.0,0.35,0.56,0.3,0.5,0.27,0.35,0.2,0.44,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.3,0.2,0.5,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.27,0.3,0.35,381.7,425.84,464.44,152156.91,954.85,70209.03,167013.41,881.98,69933.85,201132.0,1179.93,161300.0,1199.0,69250.0,0.29,0.04,0.09,1406.1,0.14,0.15,1320.0,0.19,2495.94,0.29,416.14,335.54,751.67,0.31,0.38,0.51,0.46,282.0,0.5,257.0,5,aff_mix_mod,-0.03,0.02,0,1,0,0,0,1,0,0,0,1,0,0,1,ch_decrease_marginal,0.23,0,0,0,0,0,1,0.1,-0.08,-0.0,0.36,-0.01,44.14,38.61,0.02,0.06,-0.04,1,1,0,0,0,0,0,0,0,0,1,1,1,1,0,1,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,17197881700,0,False,0,0,0,0.0,0.0,0,0,0,0,0,0,-101.65,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE']
6,6,5358.0,4574.0,2158.0,92984.0,306400.0,23669.0,2073.0,833.0,4089.0,955.0,572.0,123.0,133.0,2261.0,16.0,110.0,1981.0,177.0,1442.0,47201.0,70.0,32.0,0.0,0.0,7.0,24.0,0.0,0.0,7.0,83.0,7.0,0.0,0.0,17,197,883504,0.0,0.0,22.0,0.0,54.0,26.0,0.0,6.0,0.0,0.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883504,278700.0,15238.0,1652.0,568.0,56.0,8.0,15.0,24.0,5.0,0.0,0.0,4.0,0.0,127.0,40.0,0.0,9.0,0.0,41.0,0.0,9.0,28.0,85.0,29.0,0.0,11.0,0.0,30.0,0.0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40232.0,3774.0,3527.0,1359.0,1230.0,129.0,17.0,197.0,883504.0,17197883504.0,2690.0,256.0,114.0,34.0,7.0,296.0,109.0,21.0,6.0,200300.0,695.0,1366.0,67708.0,17197883504.0,2784.0,2730.0,824.0,171.0,195.0,540.0,331.0,108.0,283.0,190.0,123600.0,539.0,46742.0,663.0,158.0,17.0,197.0,883504.0,17197883504.0,17197883504.0,0.3,0.45,0.24,0.38,0.09,0.3,0.16,0.55,0.0,0.0,0.0,0.0,0.0,1.0,5.0,mix_high,0.24,0.13,0.62,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.24,0.3,73.8,334.27,643.31,257088.0,1121.12,97223.36,306459.0,1063.35,103593.24,309357.0,1833.72,306400.0,2073.0,92984.0,0.15,0.02,0.07,821.0,0.19,0.09,2158.0,0.08,1818.0,0.26,377.0,411.0,788.0,0.29,0.44,0.06,0.26,179.0,0.49,268.0,5,aff_mix_mod,-0.0,0.13,0,0,1,0,0,1,0,0,0,1,1,0,2,ch_increase,0.08,0,0,0,0,0,1,0.19,-0.05,0.07,0.95,-0.1,260.47,309.04,0.03,0.14,-0.23,1,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,0,1,1,0,0,0,0,0,0,0,1,0,17197883504,0,False,0,0,0,0.0,1.0,0,0,0,0,1,0,-583.76,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE']
7,7,3204.0,2267.0,1460.0,49732.0,95700.0,20588.0,767.0,147.0,2219.0,204.0,140.0,0.0,18.0,1639.0,152.0,274.0,1033.0,427.0,874.0,27875.0,85.0,12.0,11.0,0.0,43.0,0.0,0.0,19.0,0.0,26.0,0.0,5.0,21.0,17,197,883700,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883700,123700.0,15719.0,722.0,97.0,93.0,9.0,0.0,17.0,42.0,0.0,0.0,25.0,0.0,116.0,21.0,35.0,31.0,0.0,29.0,0.0,0.0,0.0,23.0,13.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,23560.0,3293.0,2794.0,1354.0,909.0,445.0,17.0,197.0,883700.0,17197883700.0,2245.0,148.0,18.0,6.0,0.0,64.0,34.0,6.0,10.0,98400.0,497.0,1348.0,40500.0,17197883700.0,2940.76,2708.47,1139.56,333.2,333.2,692.11,315.12,100.91,104.72,34.27,49123.76,393.18,25749.04,815.87,329.4,17.0,197.0,883700.0,17197883700.0,17197883700.0,0.52,0.74,0.47,0.58,0.36,0.52,0.22,0.26,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.47,0.12,0.42,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.36,0.47,0.52,414.52,628.54,766.19,102177.42,817.82,53558.0,150552.0,760.41,61965.0,137307.0,801.42,95700.0,767.0,49732.0,0.29,0.08,0.15,1145.27,0.29,0.33,1460.0,0.29,1913.54,0.07,166.0,108.0,274.0,0.12,0.16,0.26,0.47,114.0,0.56,232.0,1,aff_predominantly_LI,-0.36,-0.04,0,1,0,0,1,0,0,0,1,1,0,0,1,ch_decrease_marginal,-0.05,0,0,0,0,0,0,0.47,-0.07,0.16,0.01,-0.2,214.02,137.65,0.05,0.04,-0.09,1,1,1,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,1,0,1,17197883700,0,True,0,1,0,1.0,0.0,0,0,0,0,0,1,160.21,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI']
8,8,5139.0,4759.0,1746.0,78750.0,215000.0,20691.0,1424.0,294.0,3487.0,482.0,167.0,16.0,27.0,1924.0,58.0,55.0,1424.0,322.0,1425.0,32700.0,163.0,39.0,0.0,43.0,30.0,21.0,21.0,0.0,9.0,138.0,14.0,0.0,26.0,17,197,880502,13.0,10.0,15.0,11.0,49.0,20.0,12.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197880502,199000.0,19822.0,973.0,48.0,217.0,78.0,31.0,19.0,0.0,45.0,44.0,0.0,0.0,241.0,123.0,0.0,42.0,8.0,20.0,48.0,0.0,0.0,24.0,9.0,0.0,7.0,0.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,32531.0,5259.0,4922.0,1749.0,1516.0,233.0,17.0,197.0,880502.0,17197880502.0,3275.0,131.0,42.0,6.0,18.0,162.0,38.0,6.0,0.0,146200.0,692.0,1760.0,59636.0,17197880502.0,3968.0,3819.0,1348.0,228.0,456.0,1058.0,375.0,115.0,169.0,68.0,76900.0,510.0,38920.0,1093.0,260.0,17.0,197.0,880502.0,17197880502.0,17197880502.0,0.32,0.51,0.19,0.42,0.18,0.32,0.19,0.49,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.19,0.22,0.58,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.18,0.19,0.32,247.8,335.94,557.54,159952.0,1060.8,80953.6,223686.0,1058.76,91243.08,220890.0,1080.03,215000.0,1424.0,78750.0,0.07,0.04,0.06,1353.0,0.19,0.13,1746.0,0.18,2469.0,0.1,191.0,200.0,391.0,0.12,0.2,0.06,0.43,321.0,0.63,482.0,5,aff_mix_mod,-0.04,0.32,0,0,0,1,0,1,0,0,0,1,0,1,3,ch_rapid_increase,0.14,0,0,0,0,0,1,0.4,-0.0,0.13,0.34,-0.14,88.14,221.6,0.02,0.08,-0.19,1,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,1,1,1,0,0,1,1,1,0,0,0,1,0,0,0,0,17197880502,0,False,0,0,0,1.0,1.0,0,0,0,0,1,0,-157.36,20.09,0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0,0.0,0,1.0,6.0,['SMMI']
9,9,5370.0,5048.0,1820.0,102889.0,286700.0,8272.0,2039.0,323.0,3669.0,993.0,454.0,17.0,16.0,1869.0,25.0,13.0,1582.0,238.0,1907.0,40410.0,36.0,0.0,0.0,0.0,9.0,0.0,19.0,0.0,8.0,189.0,22.0,0.0,31.0,17,197,881002,24.0,70.0,0.0,15.0,27.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197881002,285700.0,21281.0,1698.0,151.0,76.0,0.0,0.0,0.0,9.0,9.0,30.0,19.0,9.0,146.0,80.0,17.0,0.0,8.0,0.0,41.0,0.0,0.0,12.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,16.0,9.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,35250.0,4847.39,4599.52,1458.38,1420.03,38.35,17.0,197.0,881002.0,34395762003.0,2906.57,288.43,81.97,26.86,6.95,240.57,66.03,15.9,9.93,194338.75,1063.27,1468.3,77838.46,34395762003.0,3785.43,3709.8,1135.68,51.82,147.94,666.03,614.76,205.65,411.26,171.52,133824.44,474.46,50706.91,1077.34,38.39,17.0,197.0,881002.0,34395762003.0,34395762003.0,0.25,0.37,0.13,0.24,0.09,0.25,0.13,0.63,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.13,0.11,0.76,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.13,0.25,97.29,189.95,451.14,278354.84,986.88,105470.38,297338.29,1626.8,119092.84,317127.0,1884.78,286700.0,2039.0,102889.0,0.06,0.02,0.05,1115.73,0.03,0.03,1820.0,0.13,2268.98,0.26,377.36,316.54,693.9,0.24,0.4,0.02,0.25,225.0,0.45,250.0,5,aff_mix_mod,-0.04,0.08,0,0,1,0,0,1,0,0,0,1,1,0,2,ch_increase,0.1,0,0,0,0,0,1,0.07,0.65,0.13,0.25,-0.14,92.66,261.2,-0.02,0.16,-0.2,1,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,0,1,1,0,1,0,0,1,0,0,1,0,17197881002,0,False,0,0,0,1.0,1.0,0,0,0,0,1,0,-788.29,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE']


In [15]:
df_2018['FIPS'] = df_2018['FIPS'].astype(str)

In [16]:
df_2018.drop(columns=['Unnamed: 0'], inplace=True)

Add in household income data.

In [17]:
var_hinc_18 = []
for i in range(1, 18):
    var_hinc_18.append('B19001_' + str(i).zfill(3) + 'E')
var_hinc_18
    

['B19001_001E',
 'B19001_002E',
 'B19001_003E',
 'B19001_004E',
 'B19001_005E',
 'B19001_006E',
 'B19001_007E',
 'B19001_008E',
 'B19001_009E',
 'B19001_010E',
 'B19001_011E',
 'B19001_012E',
 'B19001_013E',
 'B19001_014E',
 'B19001_015E',
 'B19001_016E',
 'B19001_017E']

In [18]:
var_dict_18 = c.acs5.get(var_hinc_18, geo = {'for': 'tract:*',
                                 'in': sql_query}, year=2018)

In [19]:
df_hinc_18 = pd.DataFrame.from_dict(var_dict_18)
df_hinc_18['FIPS']= df_hinc_18['state'] + df_hinc_18['county'] + df_hinc_18['tract']
df_hinc_18 = filter_FIPS(df_hinc_18)
df_hinc_18.head(10)

Unnamed: 0,B19001_001E,B19001_002E,B19001_003E,B19001_004E,B19001_005E,B19001_006E,B19001_007E,B19001_008E,B19001_009E,B19001_010E,B19001_011E,B19001_012E,B19001_013E,B19001_014E,B19001_015E,B19001_016E,B19001_017E,state,county,tract,FIPS
0,2379.0,749.0,175.0,198.0,116.0,93.0,94.0,224.0,52.0,38.0,133.0,159.0,49.0,84.0,57.0,39.0,119.0,17,31,430200,17031430200
1,1585.0,413.0,231.0,252.0,139.0,45.0,94.0,22.0,13.0,68.0,105.0,71.0,53.0,9.0,25.0,45.0,0.0,17,31,430500,17031430500
2,3336.0,521.0,175.0,472.0,398.0,115.0,175.0,189.0,260.0,56.0,295.0,275.0,186.0,120.0,38.0,34.0,27.0,17,31,431400,17031431400
3,607.0,68.0,31.0,27.0,44.0,97.0,16.0,28.0,6.0,40.0,42.0,74.0,55.0,48.0,6.0,20.0,5.0,17,31,440700,17031440700
4,1046.0,150.0,198.0,102.0,66.0,76.0,18.0,71.0,77.0,27.0,4.0,59.0,74.0,117.0,7.0,0.0,0.0,17,31,470100,17031470100
5,1632.0,342.0,171.0,109.0,202.0,143.0,117.0,54.0,70.0,46.0,56.0,128.0,137.0,38.0,19.0,0.0,0.0,17,97,862605,17097862605
6,899.0,81.0,97.0,58.0,59.0,104.0,75.0,30.0,64.0,31.0,108.0,22.0,79.0,51.0,22.0,13.0,5.0,17,97,863100,17097863100
7,1659.0,30.0,11.0,3.0,20.0,17.0,66.0,71.0,70.0,113.0,179.0,180.0,215.0,104.0,101.0,94.0,385.0,17,97,863702,17097863702
8,2051.0,27.0,0.0,63.0,190.0,36.0,64.0,121.0,64.0,27.0,94.0,184.0,392.0,94.0,203.0,272.0,220.0,17,97,864001,17097864001
9,2435.0,0.0,13.0,53.0,92.0,66.0,0.0,42.0,155.0,34.0,123.0,209.0,299.0,376.0,269.0,331.0,373.0,17,97,864105,17097864105


In [20]:
df_hinc_18.drop(columns=['state', 'county', 'tract'], inplace=True)


In [21]:
df_hinc_18['FIPS'] = df_hinc_18['FIPS'].astype(str)
merged_18 = pd.merge(df_2018, df_hinc_18, on='FIPS', how='inner')
merged_18.head(10)

Unnamed: 0,pop_18,white_18,hh_18,hinc_18,mhval_18,mhval_18_se,mrent_18,mrent_18_se,total_25_18,total_25_col_bd_18,total_25_col_md_18,total_25_col_pd_18,total_25_col_phd_18,tot_units_built_18,units_40_49_built_18,units_39_early_built_18,ohu_18,rhu_18,mmhcosts_18,iinc_18,mov_wc_w_income_18,mov_wc_9000_18,mov_wc_15000_18,mov_wc_25000_18,mov_wc_35000_18,mov_wc_50000_18,mov_wc_65000_18,mov_wc_75000_18,mov_wc_76000_more_18,mov_oc_w_income_18,mov_oc_9000_18,mov_oc_15000_18,mov_oc_25000_18,state_x,county_x,tract_x,mov_oc_35000_18,mov_oc_50000_18,mov_oc_65000_18,mov_oc_75000_18,mov_oc_76000_more_18,mov_os_w_income_18,mov_os_9000_18,mov_os_15000_18,mov_os_25000_18,mov_os_35000_18,mov_os_50000_18,mov_os_65000_18,mov_os_75000_18,mov_os_76000_more_18,mov_fa_w_income_18,mov_fa_9000_18,mov_fa_15000_18,mov_fa_25000_18,mov_fa_35000_18,mov_fa_50000_18,mov_fa_65000_18,mov_fa_75000_18,mov_fa_76000_more_18,FIPS,mhval_12,mhval_12_se,mrent_12,mrent_12_se,mov_wc_w_income_12,mov_wc_9000_12,mov_wc_15000_12,mov_wc_25000_12,mov_wc_35000_12,mov_wc_50000_12,mov_wc_65000_12,mov_wc_75000_12,mov_wc_76000_more_12,mov_oc_w_income_12,mov_oc_9000_12,mov_oc_15000_12,mov_oc_25000_12,mov_oc_35000_12,mov_oc_50000_12,mov_oc_65000_12,mov_oc_75000_12,mov_oc_76000_more_12,mov_os_w_income_12,mov_os_9000_12,mov_os_15000_12,mov_os_25000_12,mov_os_35000_12,mov_os_50000_12,mov_os_65000_12,mov_os_75000_12,mov_os_76000_more_12,mov_fa_w_income_12,mov_fa_9000_12,mov_fa_15000_12,mov_fa_25000_12,mov_fa_35000_12,mov_fa_50000_12,mov_fa_65000_12,mov_fa_75000_12,mov_fa_76000_more_12,iinc_12,pop_00,white_00,hu_00,ohu_00,rhu_00,state_y,county_y,tract_y,trtid_base_x,total_25_00,male_25_col_bd_00,male_25_col_md_00,male_25_col_psd_00,male_25_col_phd_00,female_25_col_bd_00,female_25_col_md_00,female_25_col_psd_00,female_25_col_phd_00,mhval_00,mrent_00,hh_00,hinc_00,trtid00,pop_90,white_90,hh_90,total_25_col_9th_90,total_25_col_12th_90,total_25_col_hs_90,total_25_col_sc_90,total_25_col_ad_90,total_25_col_bd_90,total_25_col_gd_90,mhval_90,mrent_90,hinc_90,ohu_90,rhu_90,state,county,tract,trtid_base_y,trtid90,inc80_18,inc120_18,inc80_00,inc120_00,inc80_90,low_80120_18,mod_80120_18,high_80120_18,low_pdmt_medhhinc_18,high_pdmt_medhhinc_18,mod_pdmt_medhhinc_18,mix_low_medhhinc_18,mix_mod_medhhinc_18,mix_high_medhhinc_18,inc_cat_medhhinc_18,inc_cat_medhhinc_encoded18,low_80120_00,mod_80120_00,high_80120_00,low_pdmt_medhhinc_00,high_pdmt_medhhinc_00,mod_pdmt_medhhinc_00,mix_low_medhhinc_00,mix_mod_medhhinc_00,mix_high_medhhinc_00,inc_cat_medhhinc_00,inc_cat_medhhinc_encoded00,per_all_li_90,per_all_li_00,per_all_li_18,all_li_count_90,all_li_count_00,all_li_count_18,real_mhval_90,real_mrent_90,real_hinc_90,real_mhval_00,real_mrent_00,real_hinc_00,real_mhval_12,real_mrent_12,real_mhval_18,real_mrent_18,real_hinc_18,per_nonwhite_18,per_nonwhite_90,per_nonwhite_00,hu_90,per_rent_90,per_rent_00,hu_18,per_rent_18,total_25_90,per_col_90,male_25_col_00,female_25_col_00,total_25_col_00,per_col_00,per_col_18,per_units_pre50_18,per_limove_18,mov_tot_w_income_18,per_limove_12,mov_tot_w_income_12,lmh_flag_encoded,lmh_flag_category,pctch_real_mhval_00_18,pctch_real_mrent_12_18,rent_decrease,rent_marginal,rent_increase,rent_rapid_increase,house_decrease,house_marginal,house_increase,house_rapid_increase,tot_decrease,tot_marginal,tot_increase,tot_rapid_increase,change_flag_encoded,change_flag_category,per_ch_zillow_12_18,ab_50pct_ch,ab_90percentile_ch,rent_50pct_ch,rent_90percentile_ch,hv_abrm_ch,rent_abrm_ch,pctch_real_mhval_90_00,pctch_real_mrent_90_00,pctch_real_hinc_90_00,pctch_real_mrent_00_18,pctch_real_hinc_00_18,ch_all_li_count_90_00,ch_all_li_count_00_18,ch_per_col_90_00,ch_per_col_00_18,ch_per_limove_12_18,pop00flag,aboverm_per_all_li_90,aboverm_per_all_li_00,aboverm_per_all_li_18,aboverm_per_nonwhite_18,aboverm_per_nonwhite_90,aboverm_per_nonwhite_00,aboverm_per_rent_90,aboverm_per_rent_00,aboverm_per_rent_18,aboverm_per_col_90,aboverm_per_col_00,aboverm_per_col_18,aboverm_real_mrent_90,aboverm_real_mrent_00,aboverm_real_mrent_12,aboverm_real_mrent_18,aboverm_real_mhval_90,aboverm_real_mhval_00,aboverm_real_mhval_18,aboverm_pctch_real_mhval_00_18,aboverm_pctch_real_mrent_00_18,aboverm_pctch_real_mrent_12_18,aboverm_pctch_real_mhval_90_00,aboverm_pctch_real_mrent_90_00,lostli_00,lostli_18,aboverm_pctch_real_hinc_90_00,aboverm_pctch_real_hinc_00_18,aboverm_ch_per_col_90_00,aboverm_ch_per_col_00_18,aboverm_per_units_pre50_18,GEOID,rail,presence_ph_LIHTC,vul_gent_90,vul_gent_00,vul_gent_18,hotmarket_00,hotmarket_18,gent_90_00,gent_90_00_urban,gent_00_18,gent_00_18_urban,dp_PChRent,dp_RentGap,tr_rent_gap,rm_rent_gap,dense,SAE,AdvG,ARE,BE,SMMI,ARG,EOG,OD,OD_loss,SLI,double_counted,typology,typ_cat,B19001_001E,B19001_002E,B19001_003E,B19001_004E,B19001_005E,B19001_006E,B19001_007E,B19001_008E,B19001_009E,B19001_010E,B19001_011E,B19001_012E,B19001_013E,B19001_014E,B19001_015E,B19001_016E,B19001_017E
0,2344.0,1199.0,866.0,49565.0,124400.0,6926.0,969.0,38.0,1532.0,98.0,58.0,8.0,4.0,950.0,127.0,295.0,427.0,439.0,965.0,26602.0,164.0,54.0,6.0,25.0,46.0,12.0,9.0,3.0,9.0,24.0,4.0,4.0,7.0,17,197,882900,0.0,4.0,5.0,0.0,0.0,26.0,0.0,10.0,5.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197882900,143800.0,17014.0,864.0,60.0,279.0,60.0,21.0,50.0,49.0,39.0,42.0,3.0,15.0,51.0,9.0,0.0,3.0,0.0,0.0,31.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,29330.0,2296.07,1774.18,932.47,577.41,355.06,17.0,197.0,882900.0,51593648707.0,1490.4,36.28,3.08,11.04,3.0,52.35,15.1,0.02,0.02,93093.6,597.4,935.46,40208.99,51593648707.0,2156.15,1859.8,882.78,160.54,319.18,590.94,227.59,60.39,67.74,21.46,53826.48,419.96,31982.8,597.51,289.11,17.0,197.0,882900.0,68791532008.0,68791532008.0,0.52,0.7,0.4,0.63,0.36,0.52,0.18,0.3,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.4,0.23,0.37,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.36,0.4,0.52,313.56,373.35,450.78,111959.07,873.53,66524.21,142433.21,914.02,61519.76,159618.0,959.04,124400.0,969.0,49565.0,0.49,0.14,0.23,886.63,0.33,0.38,866.0,0.51,1447.85,0.06,42.36,67.47,109.83,0.07,0.11,0.44,0.56,214.0,0.43,338.0,1,aff_predominantly_LI,-0.13,0.01,0,1,0,0,1,0,0,0,1,1,0,0,1,ch_decrease_marginal,0.3,0,0,0,0,1,1,0.27,0.05,-0.08,0.06,-0.19,59.79,77.43,0.01,0.04,0.13,1,1,1,1,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,17197882900,0,False,0,1,1,0.0,0.0,0,0,0,0,0,1,81.78,20.09,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0,0.0,0,1.0,3.0,['ARG'],866.0,45.0,30.0,31.0,74.0,22.0,57.0,76.0,53.0,49.0,44.0,102.0,115.0,80.0,43.0,23.0,22.0
1,3759.0,1276.0,1183.0,46175.0,123400.0,10896.0,1019.0,273.0,2665.0,168.0,47.0,39.0,11.0,1266.0,206.0,153.0,542.0,641.0,1010.0,21376.0,127.0,21.0,7.0,39.0,34.0,22.0,0.0,0.0,4.0,69.0,15.0,7.0,0.0,17,197,883000,37.0,0.0,10.0,0.0,0.0,26.0,0.0,8.0,0.0,7.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883000,142800.0,30771.0,814.0,310.0,572.0,155.0,90.0,185.0,132.0,6.0,4.0,0.0,0.0,105.0,77.0,19.0,9.0,0.0,0.0,0.0,0.0,0.0,111.0,42.0,60.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,16370.0,4106.0,1900.0,1254.0,839.0,415.0,17.0,197.0,883000.0,17197883000.0,2622.0,46.0,17.0,2.0,0.0,51.0,9.0,22.0,1.0,89800.0,380.0,1258.0,33900.0,17197883000.0,4199.0,2399.0,1220.0,258.0,556.0,903.0,561.0,135.0,104.0,90.0,56300.0,366.0,32029.0,831.0,458.0,17.0,197.0,883000.0,17197883000.0,17197883000.0,0.58,0.78,0.5,0.64,0.34,0.58,0.2,0.22,1.0,0.0,0.0,0.0,0.0,0.0,1.0,low_pdmt,0.5,0.13,0.36,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.34,0.5,0.58,414.1,632.54,690.35,117104.0,761.28,66620.32,137394.0,581.4,51867.0,158508.0,903.54,123400.0,1019.0,46175.0,0.66,0.43,0.54,1289.0,0.36,0.33,1183.0,0.54,2607.0,0.07,63.0,61.0,124.0,0.05,0.1,0.28,0.47,222.0,0.79,788.0,5,aff_mix_mod,-0.1,0.13,0,0,1,0,1,0,0,0,1,0,1,0,2,ch_increase,,0,0,0,0,0,1,0.17,-0.24,-0.22,0.75,-0.11,218.44,57.82,-0.03,0.05,-0.32,1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,17197883000,0,False,1,1,1,0.0,1.0,0,0,0,0,1,0,-6.29,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI'],1183.0,121.0,124.0,54.0,36.0,52.0,51.0,51.0,79.0,71.0,164.0,107.0,78.0,69.0,59.0,61.0,6.0
2,3726.0,1295.0,1099.0,80230.0,159400.0,6619.0,1764.0,87.0,2278.0,439.0,93.0,30.0,10.0,1186.0,9.0,14.0,893.0,206.0,1471.0,28768.0,10.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,27.0,0.0,0.0,10.0,17,197,880111,0.0,17.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197880111,183200.0,7572.0,1457.0,158.0,88.0,0.0,0.0,41.0,0.0,14.0,33.0,0.0,0.0,71.0,22.0,0.0,0.0,29.0,13.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,27360.0,3288.0,2024.0,929.0,869.0,60.0,17.0,197.0,880111.0,17197880111.0,1899.0,89.0,12.0,0.0,0.0,95.0,36.0,11.0,0.0,115300.0,1106.0,939.0,59958.0,17197880111.0,3326.0,2637.0,917.0,69.0,284.0,578.0,538.0,106.0,147.0,56.0,84500.0,867.0,47934.0,864.0,79.0,17.0,197.0,880111.0,17197880111.0,17197880111.0,0.31,0.51,0.11,0.37,0.09,0.31,0.2,0.49,0.0,0.0,0.0,0.0,0.0,1.0,5.0,mix_high,0.11,0.25,0.63,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.11,0.31,83.62,107.27,342.21,175760.0,1803.36,99702.72,176409.0,1692.18,91735.74,203352.0,1617.27,159400.0,1764.0,80230.0,0.65,0.21,0.38,943.0,0.08,0.06,1099.0,0.19,1778.0,0.11,101.0,131.0,232.0,0.12,0.25,0.02,0.23,47.0,0.37,165.0,2,aff_predominantly_MI,-0.1,0.09,0,0,1,0,1,0,0,0,1,0,1,0,2,ch_increase,0.23,0,0,0,0,0,1,0.0,-0.06,-0.08,0.04,-0.13,23.65,234.94,0.01,0.13,-0.14,1,0,0,0,1,1,1,0,0,0,0,0,0,1,1,1,1,1,0,0,0,0,1,0,0,0,0,0,0,0,1,0,17197880111,0,False,0,0,0,0.0,1.0,0,0,0,0,1,0,-179.07,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],1099.0,7.0,20.0,23.0,0.0,14.0,40.0,106.0,56.0,64.0,39.0,136.0,299.0,154.0,76.0,48.0,17.0
3,5692.0,4076.0,2429.0,71444.0,168400.0,16402.0,854.0,56.0,4421.0,703.0,364.0,21.0,0.0,2617.0,28.0,254.0,2233.0,196.0,1329.0,41679.0,77.0,0.0,0.0,31.0,25.0,0.0,0.0,8.0,13.0,456.0,136.0,13.0,31.0,17,197,883602,76.0,72.0,45.0,0.0,83.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883602,188900.0,16717.0,931.0,334.0,62.0,0.0,0.0,19.0,14.0,29.0,0.0,0.0,0.0,133.0,34.0,1.0,43.0,43.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,37740.0,4097.97,3736.98,1605.99,1407.99,198.0,17.0,197.0,883602.0,17197883602.0,2897.98,159.0,41.0,11.0,4.0,236.0,87.0,8.0,4.0,150598.99,640.0,1606.99,62265.58,17197883602.0,6073.76,2337.39,1960.68,170.75,316.79,1032.76,936.15,232.17,375.96,323.53,49653.58,406.67,28005.97,1285.15,715.22,17.0,197.0,883602.0,17197883602.0,17197883602.0,0.26,0.58,0.26,0.4,0.29,0.26,0.32,0.42,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.26,0.14,0.6,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.29,0.26,0.26,571.46,418.4,622.73,103279.45,845.86,58252.41,230416.46,979.19,95266.34,209679.0,1033.41,168400.0,854.0,71444.0,0.28,0.62,0.09,2000.37,0.36,0.12,2429.0,0.08,3388.13,0.21,204.0,327.0,531.0,0.18,0.25,0.11,0.41,533.0,0.46,195.0,5,aff_mix_mod,-0.27,-0.17,1,0,0,0,1,0,0,0,1,0,0,0,1,ch_decrease_marginal,0.09,0,0,0,0,0,0,1.23,0.16,0.64,-0.13,-0.25,-153.05,204.33,-0.02,0.06,-0.05,1,1,0,0,0,1,0,1,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,1,1,0,1,0,0,0,0,17197883602,0,False,1,0,0,1.0,0.0,0,0,0,0,0,1,386.87,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],2429.0,30.0,13.0,85.0,67.0,23.0,92.0,73.0,64.0,89.0,277.0,546.0,225.0,225.0,261.0,264.0,95.0
4,2756.0,368.0,1439.0,41193.0,119200.0,19150.0,947.0,64.0,1847.0,273.0,133.0,0.0,0.0,1570.0,52.0,35.0,248.0,1191.0,960.0,30259.0,52.0,0.0,0.0,8.0,0.0,11.0,0.0,33.0,0.0,254.0,25.0,19.0,33.0,17,197,883803,83.0,54.0,40.0,0.0,0.0,33.0,33.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,17197883803,138500.0,10735.0,858.0,30.0,195.0,13.0,9.0,27.0,93.0,17.0,36.0,0.0,0.0,374.0,74.0,86.0,48.0,38.0,82.0,0.0,0.0,46.0,21.0,0.0,0.0,0.0,0.0,21.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,26544.0,2526.0,1599.3,1064.81,444.22,620.59,17.0,197.0,883803.0,17197883803.0,1577.18,90.28,22.12,0.0,0.0,96.85,51.42,0.0,0.0,65108.02,403.56,1064.21,24623.87,17197883803.0,2483.55,1914.38,1058.23,71.15,286.38,507.59,460.96,69.35,143.49,48.43,35752.62,290.56,17876.31,382.64,704.89,17.0,197.0,883803.0,17197883803.0,17197883803.0,0.64,0.84,0.39,0.61,0.33,0.64,0.19,0.16,1.0,0.0,0.0,0.0,0.0,0.0,1.0,low_pdmt,0.39,0.21,0.39,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.33,0.39,0.64,350.89,419.07,925.01,74365.44,604.37,37182.72,99615.28,617.45,37674.52,153735.0,952.38,119200.0,947.0,41193.0,0.87,0.23,0.37,1087.53,0.65,0.58,1439.0,0.83,1587.34,0.12,112.4,148.27,260.67,0.17,0.22,0.06,0.35,358.0,0.42,590.0,1,aff_predominantly_LI,0.2,-0.01,0,1,0,0,0,0,1,0,0,1,1,0,2,ch_increase,-0.05,0,0,0,0,0,0,0.34,0.02,0.01,0.53,0.09,68.18,505.94,0.04,0.05,-0.07,1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,1,1,0,0,17197883803,0,False,1,1,1,0.0,1.0,0,0,0,0,0,1,85.8,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI'],1439.0,117.0,0.0,61.0,157.0,125.0,192.0,57.0,92.0,88.0,115.0,178.0,120.0,17.0,94.0,19.0,7.0
5,3375.0,2384.0,1320.0,69250.0,161300.0,10246.0,1199.0,228.0,2373.0,537.0,324.0,16.0,20.0,1485.0,255.0,502.0,1066.0,254.0,1201.0,34135.0,145.0,35.0,26.0,15.0,10.0,31.0,22.0,0.0,6.0,97.0,12.0,33.0,9.0,17,197,881700,0.0,0.0,0.0,34.0,9.0,21.0,0.0,0.0,0.0,0.0,21.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,17197881700,181200.0,10238.0,1063.0,428.0,211.0,0.0,87.0,17.0,16.0,71.0,20.0,0.0,0.0,46.0,27.0,0.0,0.0,0.0,13.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40685.0,3358.0,3061.89,1420.12,1205.48,214.64,17.0,197.0,881700.0,17197881700.0,2387.31,334.66,72.71,37.67,8.76,261.95,73.59,31.54,0.0,109159.09,576.46,1417.49,45708.4,17197881700.0,3442.1,3296.67,1425.38,130.54,253.19,622.89,540.54,217.27,456.44,275.09,73152.36,459.06,33754.34,1213.37,192.74,17.0,197.0,881700.0,17197881700.0,17197881700.0,0.35,0.56,0.3,0.5,0.27,0.35,0.2,0.44,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.3,0.2,0.5,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.27,0.3,0.35,381.7,425.84,464.44,152156.91,954.85,70209.03,167013.41,881.98,69933.85,201132.0,1179.93,161300.0,1199.0,69250.0,0.29,0.04,0.09,1406.1,0.14,0.15,1320.0,0.19,2495.94,0.29,416.14,335.54,751.67,0.31,0.38,0.51,0.46,282.0,0.5,257.0,5,aff_mix_mod,-0.03,0.02,0,1,0,0,0,1,0,0,0,1,0,0,1,ch_decrease_marginal,0.23,0,0,0,0,0,1,0.1,-0.08,-0.0,0.36,-0.01,44.14,38.61,0.02,0.06,-0.04,1,1,0,0,0,0,0,0,0,0,1,1,1,1,0,1,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,17197881700,0,False,0,0,0,0.0,0.0,0,0,0,0,0,0,-101.65,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],1320.0,58.0,37.0,38.0,28.0,42.0,41.0,52.0,81.0,53.0,110.0,158.0,191.0,154.0,80.0,138.0,59.0
6,5358.0,4574.0,2158.0,92984.0,306400.0,23669.0,2073.0,833.0,4089.0,955.0,572.0,123.0,133.0,2261.0,16.0,110.0,1981.0,177.0,1442.0,47201.0,70.0,32.0,0.0,0.0,7.0,24.0,0.0,0.0,7.0,83.0,7.0,0.0,0.0,17,197,883504,0.0,0.0,22.0,0.0,54.0,26.0,0.0,6.0,0.0,0.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883504,278700.0,15238.0,1652.0,568.0,56.0,8.0,15.0,24.0,5.0,0.0,0.0,4.0,0.0,127.0,40.0,0.0,9.0,0.0,41.0,0.0,9.0,28.0,85.0,29.0,0.0,11.0,0.0,30.0,0.0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40232.0,3774.0,3527.0,1359.0,1230.0,129.0,17.0,197.0,883504.0,17197883504.0,2690.0,256.0,114.0,34.0,7.0,296.0,109.0,21.0,6.0,200300.0,695.0,1366.0,67708.0,17197883504.0,2784.0,2730.0,824.0,171.0,195.0,540.0,331.0,108.0,283.0,190.0,123600.0,539.0,46742.0,663.0,158.0,17.0,197.0,883504.0,17197883504.0,17197883504.0,0.3,0.45,0.24,0.38,0.09,0.3,0.16,0.55,0.0,0.0,0.0,0.0,0.0,1.0,5.0,mix_high,0.24,0.13,0.62,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.24,0.3,73.8,334.27,643.31,257088.0,1121.12,97223.36,306459.0,1063.35,103593.24,309357.0,1833.72,306400.0,2073.0,92984.0,0.15,0.02,0.07,821.0,0.19,0.09,2158.0,0.08,1818.0,0.26,377.0,411.0,788.0,0.29,0.44,0.06,0.26,179.0,0.49,268.0,5,aff_mix_mod,-0.0,0.13,0,0,1,0,0,1,0,0,0,1,1,0,2,ch_increase,0.08,0,0,0,0,0,1,0.19,-0.05,0.07,0.95,-0.1,260.47,309.04,0.03,0.14,-0.23,1,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,0,1,1,0,0,0,0,0,0,0,1,0,17197883504,0,False,0,0,0,0.0,1.0,0,0,0,0,1,0,-583.76,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],2158.0,28.0,35.0,31.0,49.0,117.0,63.0,45.0,154.0,59.0,199.0,162.0,209.0,197.0,71.0,360.0,379.0
7,3204.0,2267.0,1460.0,49732.0,95700.0,20588.0,767.0,147.0,2219.0,204.0,140.0,0.0,18.0,1639.0,152.0,274.0,1033.0,427.0,874.0,27875.0,85.0,12.0,11.0,0.0,43.0,0.0,0.0,19.0,0.0,26.0,0.0,5.0,21.0,17,197,883700,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883700,123700.0,15719.0,722.0,97.0,93.0,9.0,0.0,17.0,42.0,0.0,0.0,25.0,0.0,116.0,21.0,35.0,31.0,0.0,29.0,0.0,0.0,0.0,23.0,13.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,23560.0,3293.0,2794.0,1354.0,909.0,445.0,17.0,197.0,883700.0,17197883700.0,2245.0,148.0,18.0,6.0,0.0,64.0,34.0,6.0,10.0,98400.0,497.0,1348.0,40500.0,17197883700.0,2940.76,2708.47,1139.56,333.2,333.2,692.11,315.12,100.91,104.72,34.27,49123.76,393.18,25749.04,815.87,329.4,17.0,197.0,883700.0,17197883700.0,17197883700.0,0.52,0.74,0.47,0.58,0.36,0.52,0.22,0.26,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.47,0.12,0.42,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.36,0.47,0.52,414.52,628.54,766.19,102177.42,817.82,53558.0,150552.0,760.41,61965.0,137307.0,801.42,95700.0,767.0,49732.0,0.29,0.08,0.15,1145.27,0.29,0.33,1460.0,0.29,1913.54,0.07,166.0,108.0,274.0,0.12,0.16,0.26,0.47,114.0,0.56,232.0,1,aff_predominantly_LI,-0.36,-0.04,0,1,0,0,1,0,0,0,1,1,0,0,1,ch_decrease_marginal,-0.05,0,0,0,0,0,0,0.47,-0.07,0.16,0.01,-0.2,214.02,137.65,0.05,0.04,-0.09,1,1,1,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,1,0,1,17197883700,0,True,0,1,0,1.0,0.0,0,0,0,0,0,1,160.21,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI'],1460.0,110.0,123.0,143.0,61.0,98.0,62.0,64.0,32.0,40.0,106.0,205.0,231.0,95.0,51.0,34.0,5.0
8,5139.0,4759.0,1746.0,78750.0,215000.0,20691.0,1424.0,294.0,3487.0,482.0,167.0,16.0,27.0,1924.0,58.0,55.0,1424.0,322.0,1425.0,32700.0,163.0,39.0,0.0,43.0,30.0,21.0,21.0,0.0,9.0,138.0,14.0,0.0,26.0,17,197,880502,13.0,10.0,15.0,11.0,49.0,20.0,12.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197880502,199000.0,19822.0,973.0,48.0,217.0,78.0,31.0,19.0,0.0,45.0,44.0,0.0,0.0,241.0,123.0,0.0,42.0,8.0,20.0,48.0,0.0,0.0,24.0,9.0,0.0,7.0,0.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,32531.0,5259.0,4922.0,1749.0,1516.0,233.0,17.0,197.0,880502.0,17197880502.0,3275.0,131.0,42.0,6.0,18.0,162.0,38.0,6.0,0.0,146200.0,692.0,1760.0,59636.0,17197880502.0,3968.0,3819.0,1348.0,228.0,456.0,1058.0,375.0,115.0,169.0,68.0,76900.0,510.0,38920.0,1093.0,260.0,17.0,197.0,880502.0,17197880502.0,17197880502.0,0.32,0.51,0.19,0.42,0.18,0.32,0.19,0.49,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.19,0.22,0.58,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.18,0.19,0.32,247.8,335.94,557.54,159952.0,1060.8,80953.6,223686.0,1058.76,91243.08,220890.0,1080.03,215000.0,1424.0,78750.0,0.07,0.04,0.06,1353.0,0.19,0.13,1746.0,0.18,2469.0,0.1,191.0,200.0,391.0,0.12,0.2,0.06,0.43,321.0,0.63,482.0,5,aff_mix_mod,-0.04,0.32,0,0,0,1,0,1,0,0,0,1,0,1,3,ch_rapid_increase,0.14,0,0,0,0,0,1,0.4,-0.0,0.13,0.34,-0.14,88.14,221.6,0.02,0.08,-0.19,1,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,1,1,1,0,0,1,1,1,0,0,0,1,0,0,0,0,17197880502,0,False,0,0,0,1.0,1.0,0,0,0,0,1,0,-157.36,20.09,0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0,0.0,0,1.0,6.0,['SMMI'],1746.0,35.0,18.0,115.0,39.0,34.0,29.0,66.0,114.0,54.0,171.0,163.0,233.0,302.0,120.0,219.0,34.0
9,5370.0,5048.0,1820.0,102889.0,286700.0,8272.0,2039.0,323.0,3669.0,993.0,454.0,17.0,16.0,1869.0,25.0,13.0,1582.0,238.0,1907.0,40410.0,36.0,0.0,0.0,0.0,9.0,0.0,19.0,0.0,8.0,189.0,22.0,0.0,31.0,17,197,881002,24.0,70.0,0.0,15.0,27.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197881002,285700.0,21281.0,1698.0,151.0,76.0,0.0,0.0,0.0,9.0,9.0,30.0,19.0,9.0,146.0,80.0,17.0,0.0,8.0,0.0,41.0,0.0,0.0,12.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,16.0,9.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,35250.0,4847.39,4599.52,1458.38,1420.03,38.35,17.0,197.0,881002.0,34395762003.0,2906.57,288.43,81.97,26.86,6.95,240.57,66.03,15.9,9.93,194338.75,1063.27,1468.3,77838.46,34395762003.0,3785.43,3709.8,1135.68,51.82,147.94,666.03,614.76,205.65,411.26,171.52,133824.44,474.46,50706.91,1077.34,38.39,17.0,197.0,881002.0,34395762003.0,34395762003.0,0.25,0.37,0.13,0.24,0.09,0.25,0.13,0.63,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.13,0.11,0.76,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.13,0.25,97.29,189.95,451.14,278354.84,986.88,105470.38,297338.29,1626.8,119092.84,317127.0,1884.78,286700.0,2039.0,102889.0,0.06,0.02,0.05,1115.73,0.03,0.03,1820.0,0.13,2268.98,0.26,377.36,316.54,693.9,0.24,0.4,0.02,0.25,225.0,0.45,250.0,5,aff_mix_mod,-0.04,0.08,0,0,1,0,0,1,0,0,0,1,1,0,2,ch_increase,0.1,0,0,0,0,0,1,0.07,0.65,0.13,0.25,-0.14,92.66,261.2,-0.02,0.16,-0.2,1,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,0,1,1,0,1,0,0,1,0,0,1,0,17197881002,0,False,0,0,0,1.0,1.0,0,0,0,0,1,0,-788.29,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],1820.0,59.0,43.0,68.0,48.0,32.0,81.0,48.0,56.0,8.0,26.0,160.0,274.0,156.0,244.0,259.0,258.0


In [22]:
merged_18 = merged_18.rename(
    columns={
        'hinc_18': 'medhinc_18',
        'total_25_col_bd_18': 'total_bd_18',
        'total_25_col_md_18': 'total_md_18',
        'total_25_col_pd_18': 'total_pd_18',
        'total_25_col_phd_18': 'total_phd_18',
        'units_40_49_built_18': 'units_40_49_18',
        'units_39_early_built_18': 'units_39_earlier_18',
        'B19001_001E':'hinc_18',
        'B19001_002E':'I_10000_18',
        'B19001_003E':'I_15000_18',
        'B19001_004E':'I_20000_18',
        'B19001_005E':'I_25000_18',
        'B19001_006E':'I_30000_18',
        'B19001_007E':'I_35000_18',
        'B19001_008E':'I_40000_18',
        'B19001_009E':'I_45000_18',
        'B19001_010E':'I_50000_18',
        'B19001_011E':'I_60000_18',
        'B19001_012E':'I_75000_18',
        'B19001_013E':'I_100000_18',
        'B19001_014E':'I_125000_18',
        'B19001_015E':'I_150000_18',
        'B19001_016E':'I_200000_18',
        'B19001_017E':'I_201000_18'})
merged_18.head(10)

Unnamed: 0,pop_18,white_18,hh_18,medhinc_18,mhval_18,mhval_18_se,mrent_18,mrent_18_se,total_25_18,total_bd_18,total_md_18,total_pd_18,total_phd_18,tot_units_built_18,units_40_49_18,units_39_earlier_18,ohu_18,rhu_18,mmhcosts_18,iinc_18,mov_wc_w_income_18,mov_wc_9000_18,mov_wc_15000_18,mov_wc_25000_18,mov_wc_35000_18,mov_wc_50000_18,mov_wc_65000_18,mov_wc_75000_18,mov_wc_76000_more_18,mov_oc_w_income_18,mov_oc_9000_18,mov_oc_15000_18,mov_oc_25000_18,state_x,county_x,tract_x,mov_oc_35000_18,mov_oc_50000_18,mov_oc_65000_18,mov_oc_75000_18,mov_oc_76000_more_18,mov_os_w_income_18,mov_os_9000_18,mov_os_15000_18,mov_os_25000_18,mov_os_35000_18,mov_os_50000_18,mov_os_65000_18,mov_os_75000_18,mov_os_76000_more_18,mov_fa_w_income_18,mov_fa_9000_18,mov_fa_15000_18,mov_fa_25000_18,mov_fa_35000_18,mov_fa_50000_18,mov_fa_65000_18,mov_fa_75000_18,mov_fa_76000_more_18,FIPS,mhval_12,mhval_12_se,mrent_12,mrent_12_se,mov_wc_w_income_12,mov_wc_9000_12,mov_wc_15000_12,mov_wc_25000_12,mov_wc_35000_12,mov_wc_50000_12,mov_wc_65000_12,mov_wc_75000_12,mov_wc_76000_more_12,mov_oc_w_income_12,mov_oc_9000_12,mov_oc_15000_12,mov_oc_25000_12,mov_oc_35000_12,mov_oc_50000_12,mov_oc_65000_12,mov_oc_75000_12,mov_oc_76000_more_12,mov_os_w_income_12,mov_os_9000_12,mov_os_15000_12,mov_os_25000_12,mov_os_35000_12,mov_os_50000_12,mov_os_65000_12,mov_os_75000_12,mov_os_76000_more_12,mov_fa_w_income_12,mov_fa_9000_12,mov_fa_15000_12,mov_fa_25000_12,mov_fa_35000_12,mov_fa_50000_12,mov_fa_65000_12,mov_fa_75000_12,mov_fa_76000_more_12,iinc_12,pop_00,white_00,hu_00,ohu_00,rhu_00,state_y,county_y,tract_y,trtid_base_x,total_25_00,male_25_col_bd_00,male_25_col_md_00,male_25_col_psd_00,male_25_col_phd_00,female_25_col_bd_00,female_25_col_md_00,female_25_col_psd_00,female_25_col_phd_00,mhval_00,mrent_00,hh_00,hinc_00,trtid00,pop_90,white_90,hh_90,total_25_col_9th_90,total_25_col_12th_90,total_25_col_hs_90,total_25_col_sc_90,total_25_col_ad_90,total_25_col_bd_90,total_25_col_gd_90,mhval_90,mrent_90,hinc_90,ohu_90,rhu_90,state,county,tract,trtid_base_y,trtid90,inc80_18,inc120_18,inc80_00,inc120_00,inc80_90,low_80120_18,mod_80120_18,high_80120_18,low_pdmt_medhhinc_18,high_pdmt_medhhinc_18,mod_pdmt_medhhinc_18,mix_low_medhhinc_18,mix_mod_medhhinc_18,mix_high_medhhinc_18,inc_cat_medhhinc_18,inc_cat_medhhinc_encoded18,low_80120_00,mod_80120_00,high_80120_00,low_pdmt_medhhinc_00,high_pdmt_medhhinc_00,mod_pdmt_medhhinc_00,mix_low_medhhinc_00,mix_mod_medhhinc_00,mix_high_medhhinc_00,inc_cat_medhhinc_00,inc_cat_medhhinc_encoded00,per_all_li_90,per_all_li_00,per_all_li_18,all_li_count_90,all_li_count_00,all_li_count_18,real_mhval_90,real_mrent_90,real_hinc_90,real_mhval_00,real_mrent_00,real_hinc_00,real_mhval_12,real_mrent_12,real_mhval_18,real_mrent_18,real_hinc_18,per_nonwhite_18,per_nonwhite_90,per_nonwhite_00,hu_90,per_rent_90,per_rent_00,hu_18,per_rent_18,total_25_90,per_col_90,male_25_col_00,female_25_col_00,total_25_col_00,per_col_00,per_col_18,per_units_pre50_18,per_limove_18,mov_tot_w_income_18,per_limove_12,mov_tot_w_income_12,lmh_flag_encoded,lmh_flag_category,pctch_real_mhval_00_18,pctch_real_mrent_12_18,rent_decrease,rent_marginal,rent_increase,rent_rapid_increase,house_decrease,house_marginal,house_increase,house_rapid_increase,tot_decrease,tot_marginal,tot_increase,tot_rapid_increase,change_flag_encoded,change_flag_category,per_ch_zillow_12_18,ab_50pct_ch,ab_90percentile_ch,rent_50pct_ch,rent_90percentile_ch,hv_abrm_ch,rent_abrm_ch,pctch_real_mhval_90_00,pctch_real_mrent_90_00,pctch_real_hinc_90_00,pctch_real_mrent_00_18,pctch_real_hinc_00_18,ch_all_li_count_90_00,ch_all_li_count_00_18,ch_per_col_90_00,ch_per_col_00_18,ch_per_limove_12_18,pop00flag,aboverm_per_all_li_90,aboverm_per_all_li_00,aboverm_per_all_li_18,aboverm_per_nonwhite_18,aboverm_per_nonwhite_90,aboverm_per_nonwhite_00,aboverm_per_rent_90,aboverm_per_rent_00,aboverm_per_rent_18,aboverm_per_col_90,aboverm_per_col_00,aboverm_per_col_18,aboverm_real_mrent_90,aboverm_real_mrent_00,aboverm_real_mrent_12,aboverm_real_mrent_18,aboverm_real_mhval_90,aboverm_real_mhval_00,aboverm_real_mhval_18,aboverm_pctch_real_mhval_00_18,aboverm_pctch_real_mrent_00_18,aboverm_pctch_real_mrent_12_18,aboverm_pctch_real_mhval_90_00,aboverm_pctch_real_mrent_90_00,lostli_00,lostli_18,aboverm_pctch_real_hinc_90_00,aboverm_pctch_real_hinc_00_18,aboverm_ch_per_col_90_00,aboverm_ch_per_col_00_18,aboverm_per_units_pre50_18,GEOID,rail,presence_ph_LIHTC,vul_gent_90,vul_gent_00,vul_gent_18,hotmarket_00,hotmarket_18,gent_90_00,gent_90_00_urban,gent_00_18,gent_00_18_urban,dp_PChRent,dp_RentGap,tr_rent_gap,rm_rent_gap,dense,SAE,AdvG,ARE,BE,SMMI,ARG,EOG,OD,OD_loss,SLI,double_counted,typology,typ_cat,hinc_18,I_10000_18,I_15000_18,I_20000_18,I_25000_18,I_30000_18,I_35000_18,I_40000_18,I_45000_18,I_50000_18,I_60000_18,I_75000_18,I_100000_18,I_125000_18,I_150000_18,I_200000_18,I_201000_18
0,2344.0,1199.0,866.0,49565.0,124400.0,6926.0,969.0,38.0,1532.0,98.0,58.0,8.0,4.0,950.0,127.0,295.0,427.0,439.0,965.0,26602.0,164.0,54.0,6.0,25.0,46.0,12.0,9.0,3.0,9.0,24.0,4.0,4.0,7.0,17,197,882900,0.0,4.0,5.0,0.0,0.0,26.0,0.0,10.0,5.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197882900,143800.0,17014.0,864.0,60.0,279.0,60.0,21.0,50.0,49.0,39.0,42.0,3.0,15.0,51.0,9.0,0.0,3.0,0.0,0.0,31.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,29330.0,2296.07,1774.18,932.47,577.41,355.06,17.0,197.0,882900.0,51593648707.0,1490.4,36.28,3.08,11.04,3.0,52.35,15.1,0.02,0.02,93093.6,597.4,935.46,40208.99,51593648707.0,2156.15,1859.8,882.78,160.54,319.18,590.94,227.59,60.39,67.74,21.46,53826.48,419.96,31982.8,597.51,289.11,17.0,197.0,882900.0,68791532008.0,68791532008.0,0.52,0.7,0.4,0.63,0.36,0.52,0.18,0.3,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.4,0.23,0.37,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.36,0.4,0.52,313.56,373.35,450.78,111959.07,873.53,66524.21,142433.21,914.02,61519.76,159618.0,959.04,124400.0,969.0,49565.0,0.49,0.14,0.23,886.63,0.33,0.38,866.0,0.51,1447.85,0.06,42.36,67.47,109.83,0.07,0.11,0.44,0.56,214.0,0.43,338.0,1,aff_predominantly_LI,-0.13,0.01,0,1,0,0,1,0,0,0,1,1,0,0,1,ch_decrease_marginal,0.3,0,0,0,0,1,1,0.27,0.05,-0.08,0.06,-0.19,59.79,77.43,0.01,0.04,0.13,1,1,1,1,1,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,17197882900,0,False,0,1,1,0.0,0.0,0,0,0,0,0,1,81.78,20.09,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0,0.0,0,1.0,3.0,['ARG'],866.0,45.0,30.0,31.0,74.0,22.0,57.0,76.0,53.0,49.0,44.0,102.0,115.0,80.0,43.0,23.0,22.0
1,3759.0,1276.0,1183.0,46175.0,123400.0,10896.0,1019.0,273.0,2665.0,168.0,47.0,39.0,11.0,1266.0,206.0,153.0,542.0,641.0,1010.0,21376.0,127.0,21.0,7.0,39.0,34.0,22.0,0.0,0.0,4.0,69.0,15.0,7.0,0.0,17,197,883000,37.0,0.0,10.0,0.0,0.0,26.0,0.0,8.0,0.0,7.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883000,142800.0,30771.0,814.0,310.0,572.0,155.0,90.0,185.0,132.0,6.0,4.0,0.0,0.0,105.0,77.0,19.0,9.0,0.0,0.0,0.0,0.0,0.0,111.0,42.0,60.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,16370.0,4106.0,1900.0,1254.0,839.0,415.0,17.0,197.0,883000.0,17197883000.0,2622.0,46.0,17.0,2.0,0.0,51.0,9.0,22.0,1.0,89800.0,380.0,1258.0,33900.0,17197883000.0,4199.0,2399.0,1220.0,258.0,556.0,903.0,561.0,135.0,104.0,90.0,56300.0,366.0,32029.0,831.0,458.0,17.0,197.0,883000.0,17197883000.0,17197883000.0,0.58,0.78,0.5,0.64,0.34,0.58,0.2,0.22,1.0,0.0,0.0,0.0,0.0,0.0,1.0,low_pdmt,0.5,0.13,0.36,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.34,0.5,0.58,414.1,632.54,690.35,117104.0,761.28,66620.32,137394.0,581.4,51867.0,158508.0,903.54,123400.0,1019.0,46175.0,0.66,0.43,0.54,1289.0,0.36,0.33,1183.0,0.54,2607.0,0.07,63.0,61.0,124.0,0.05,0.1,0.28,0.47,222.0,0.79,788.0,5,aff_mix_mod,-0.1,0.13,0,0,1,0,1,0,0,0,1,0,1,0,2,ch_increase,,0,0,0,0,0,1,0.17,-0.24,-0.22,0.75,-0.11,218.44,57.82,-0.03,0.05,-0.32,1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,1,17197883000,0,False,1,1,1,0.0,1.0,0,0,0,0,1,0,-6.29,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI'],1183.0,121.0,124.0,54.0,36.0,52.0,51.0,51.0,79.0,71.0,164.0,107.0,78.0,69.0,59.0,61.0,6.0
2,3726.0,1295.0,1099.0,80230.0,159400.0,6619.0,1764.0,87.0,2278.0,439.0,93.0,30.0,10.0,1186.0,9.0,14.0,893.0,206.0,1471.0,28768.0,10.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,27.0,0.0,0.0,10.0,17,197,880111,0.0,17.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197880111,183200.0,7572.0,1457.0,158.0,88.0,0.0,0.0,41.0,0.0,14.0,33.0,0.0,0.0,71.0,22.0,0.0,0.0,29.0,13.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,27360.0,3288.0,2024.0,929.0,869.0,60.0,17.0,197.0,880111.0,17197880111.0,1899.0,89.0,12.0,0.0,0.0,95.0,36.0,11.0,0.0,115300.0,1106.0,939.0,59958.0,17197880111.0,3326.0,2637.0,917.0,69.0,284.0,578.0,538.0,106.0,147.0,56.0,84500.0,867.0,47934.0,864.0,79.0,17.0,197.0,880111.0,17197880111.0,17197880111.0,0.31,0.51,0.11,0.37,0.09,0.31,0.2,0.49,0.0,0.0,0.0,0.0,0.0,1.0,5.0,mix_high,0.11,0.25,0.63,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.11,0.31,83.62,107.27,342.21,175760.0,1803.36,99702.72,176409.0,1692.18,91735.74,203352.0,1617.27,159400.0,1764.0,80230.0,0.65,0.21,0.38,943.0,0.08,0.06,1099.0,0.19,1778.0,0.11,101.0,131.0,232.0,0.12,0.25,0.02,0.23,47.0,0.37,165.0,2,aff_predominantly_MI,-0.1,0.09,0,0,1,0,1,0,0,0,1,0,1,0,2,ch_increase,0.23,0,0,0,0,0,1,0.0,-0.06,-0.08,0.04,-0.13,23.65,234.94,0.01,0.13,-0.14,1,0,0,0,1,1,1,0,0,0,0,0,0,1,1,1,1,1,0,0,0,0,1,0,0,0,0,0,0,0,1,0,17197880111,0,False,0,0,0,0.0,1.0,0,0,0,0,1,0,-179.07,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],1099.0,7.0,20.0,23.0,0.0,14.0,40.0,106.0,56.0,64.0,39.0,136.0,299.0,154.0,76.0,48.0,17.0
3,5692.0,4076.0,2429.0,71444.0,168400.0,16402.0,854.0,56.0,4421.0,703.0,364.0,21.0,0.0,2617.0,28.0,254.0,2233.0,196.0,1329.0,41679.0,77.0,0.0,0.0,31.0,25.0,0.0,0.0,8.0,13.0,456.0,136.0,13.0,31.0,17,197,883602,76.0,72.0,45.0,0.0,83.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883602,188900.0,16717.0,931.0,334.0,62.0,0.0,0.0,19.0,14.0,29.0,0.0,0.0,0.0,133.0,34.0,1.0,43.0,43.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,37740.0,4097.97,3736.98,1605.99,1407.99,198.0,17.0,197.0,883602.0,17197883602.0,2897.98,159.0,41.0,11.0,4.0,236.0,87.0,8.0,4.0,150598.99,640.0,1606.99,62265.58,17197883602.0,6073.76,2337.39,1960.68,170.75,316.79,1032.76,936.15,232.17,375.96,323.53,49653.58,406.67,28005.97,1285.15,715.22,17.0,197.0,883602.0,17197883602.0,17197883602.0,0.26,0.58,0.26,0.4,0.29,0.26,0.32,0.42,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.26,0.14,0.6,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.29,0.26,0.26,571.46,418.4,622.73,103279.45,845.86,58252.41,230416.46,979.19,95266.34,209679.0,1033.41,168400.0,854.0,71444.0,0.28,0.62,0.09,2000.37,0.36,0.12,2429.0,0.08,3388.13,0.21,204.0,327.0,531.0,0.18,0.25,0.11,0.41,533.0,0.46,195.0,5,aff_mix_mod,-0.27,-0.17,1,0,0,0,1,0,0,0,1,0,0,0,1,ch_decrease_marginal,0.09,0,0,0,0,0,0,1.23,0.16,0.64,-0.13,-0.25,-153.05,204.33,-0.02,0.06,-0.05,1,1,0,0,0,1,0,1,0,0,1,0,0,0,1,0,0,0,1,0,0,0,0,1,1,1,0,1,0,0,0,0,17197883602,0,False,1,0,0,1.0,0.0,0,0,0,0,0,1,386.87,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],2429.0,30.0,13.0,85.0,67.0,23.0,92.0,73.0,64.0,89.0,277.0,546.0,225.0,225.0,261.0,264.0,95.0
4,2756.0,368.0,1439.0,41193.0,119200.0,19150.0,947.0,64.0,1847.0,273.0,133.0,0.0,0.0,1570.0,52.0,35.0,248.0,1191.0,960.0,30259.0,52.0,0.0,0.0,8.0,0.0,11.0,0.0,33.0,0.0,254.0,25.0,19.0,33.0,17,197,883803,83.0,54.0,40.0,0.0,0.0,33.0,33.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,17197883803,138500.0,10735.0,858.0,30.0,195.0,13.0,9.0,27.0,93.0,17.0,36.0,0.0,0.0,374.0,74.0,86.0,48.0,38.0,82.0,0.0,0.0,46.0,21.0,0.0,0.0,0.0,0.0,21.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,26544.0,2526.0,1599.3,1064.81,444.22,620.59,17.0,197.0,883803.0,17197883803.0,1577.18,90.28,22.12,0.0,0.0,96.85,51.42,0.0,0.0,65108.02,403.56,1064.21,24623.87,17197883803.0,2483.55,1914.38,1058.23,71.15,286.38,507.59,460.96,69.35,143.49,48.43,35752.62,290.56,17876.31,382.64,704.89,17.0,197.0,883803.0,17197883803.0,17197883803.0,0.64,0.84,0.39,0.61,0.33,0.64,0.19,0.16,1.0,0.0,0.0,0.0,0.0,0.0,1.0,low_pdmt,0.39,0.21,0.39,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.33,0.39,0.64,350.89,419.07,925.01,74365.44,604.37,37182.72,99615.28,617.45,37674.52,153735.0,952.38,119200.0,947.0,41193.0,0.87,0.23,0.37,1087.53,0.65,0.58,1439.0,0.83,1587.34,0.12,112.4,148.27,260.67,0.17,0.22,0.06,0.35,358.0,0.42,590.0,1,aff_predominantly_LI,0.2,-0.01,0,1,0,0,0,0,1,0,0,1,1,0,2,ch_increase,-0.05,0,0,0,0,0,0,0.34,0.02,0.01,0.53,0.09,68.18,505.94,0.04,0.05,-0.07,1,1,1,1,1,1,1,1,1,1,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,1,1,0,0,17197883803,0,False,1,1,1,0.0,1.0,0,0,0,0,0,1,85.8,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI'],1439.0,117.0,0.0,61.0,157.0,125.0,192.0,57.0,92.0,88.0,115.0,178.0,120.0,17.0,94.0,19.0,7.0
5,3375.0,2384.0,1320.0,69250.0,161300.0,10246.0,1199.0,228.0,2373.0,537.0,324.0,16.0,20.0,1485.0,255.0,502.0,1066.0,254.0,1201.0,34135.0,145.0,35.0,26.0,15.0,10.0,31.0,22.0,0.0,6.0,97.0,12.0,33.0,9.0,17,197,881700,0.0,0.0,0.0,34.0,9.0,21.0,0.0,0.0,0.0,0.0,21.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,17197881700,181200.0,10238.0,1063.0,428.0,211.0,0.0,87.0,17.0,16.0,71.0,20.0,0.0,0.0,46.0,27.0,0.0,0.0,0.0,13.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40685.0,3358.0,3061.89,1420.12,1205.48,214.64,17.0,197.0,881700.0,17197881700.0,2387.31,334.66,72.71,37.67,8.76,261.95,73.59,31.54,0.0,109159.09,576.46,1417.49,45708.4,17197881700.0,3442.1,3296.67,1425.38,130.54,253.19,622.89,540.54,217.27,456.44,275.09,73152.36,459.06,33754.34,1213.37,192.74,17.0,197.0,881700.0,17197881700.0,17197881700.0,0.35,0.56,0.3,0.5,0.27,0.35,0.2,0.44,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.3,0.2,0.5,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.27,0.3,0.35,381.7,425.84,464.44,152156.91,954.85,70209.03,167013.41,881.98,69933.85,201132.0,1179.93,161300.0,1199.0,69250.0,0.29,0.04,0.09,1406.1,0.14,0.15,1320.0,0.19,2495.94,0.29,416.14,335.54,751.67,0.31,0.38,0.51,0.46,282.0,0.5,257.0,5,aff_mix_mod,-0.03,0.02,0,1,0,0,0,1,0,0,0,1,0,0,1,ch_decrease_marginal,0.23,0,0,0,0,0,1,0.1,-0.08,-0.0,0.36,-0.01,44.14,38.61,0.02,0.06,-0.04,1,1,0,0,0,0,0,0,0,0,1,1,1,1,0,1,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,17197881700,0,False,0,0,0,0.0,0.0,0,0,0,0,0,0,-101.65,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],1320.0,58.0,37.0,38.0,28.0,42.0,41.0,52.0,81.0,53.0,110.0,158.0,191.0,154.0,80.0,138.0,59.0
6,5358.0,4574.0,2158.0,92984.0,306400.0,23669.0,2073.0,833.0,4089.0,955.0,572.0,123.0,133.0,2261.0,16.0,110.0,1981.0,177.0,1442.0,47201.0,70.0,32.0,0.0,0.0,7.0,24.0,0.0,0.0,7.0,83.0,7.0,0.0,0.0,17,197,883504,0.0,0.0,22.0,0.0,54.0,26.0,0.0,6.0,0.0,0.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883504,278700.0,15238.0,1652.0,568.0,56.0,8.0,15.0,24.0,5.0,0.0,0.0,4.0,0.0,127.0,40.0,0.0,9.0,0.0,41.0,0.0,9.0,28.0,85.0,29.0,0.0,11.0,0.0,30.0,0.0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40232.0,3774.0,3527.0,1359.0,1230.0,129.0,17.0,197.0,883504.0,17197883504.0,2690.0,256.0,114.0,34.0,7.0,296.0,109.0,21.0,6.0,200300.0,695.0,1366.0,67708.0,17197883504.0,2784.0,2730.0,824.0,171.0,195.0,540.0,331.0,108.0,283.0,190.0,123600.0,539.0,46742.0,663.0,158.0,17.0,197.0,883504.0,17197883504.0,17197883504.0,0.3,0.45,0.24,0.38,0.09,0.3,0.16,0.55,0.0,0.0,0.0,0.0,0.0,1.0,5.0,mix_high,0.24,0.13,0.62,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.24,0.3,73.8,334.27,643.31,257088.0,1121.12,97223.36,306459.0,1063.35,103593.24,309357.0,1833.72,306400.0,2073.0,92984.0,0.15,0.02,0.07,821.0,0.19,0.09,2158.0,0.08,1818.0,0.26,377.0,411.0,788.0,0.29,0.44,0.06,0.26,179.0,0.49,268.0,5,aff_mix_mod,-0.0,0.13,0,0,1,0,0,1,0,0,0,1,1,0,2,ch_increase,0.08,0,0,0,0,0,1,0.19,-0.05,0.07,0.95,-0.1,260.47,309.04,0.03,0.14,-0.23,1,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,0,1,1,0,0,0,0,0,0,0,1,0,17197883504,0,False,0,0,0,0.0,1.0,0,0,0,0,1,0,-583.76,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],2158.0,28.0,35.0,31.0,49.0,117.0,63.0,45.0,154.0,59.0,199.0,162.0,209.0,197.0,71.0,360.0,379.0
7,3204.0,2267.0,1460.0,49732.0,95700.0,20588.0,767.0,147.0,2219.0,204.0,140.0,0.0,18.0,1639.0,152.0,274.0,1033.0,427.0,874.0,27875.0,85.0,12.0,11.0,0.0,43.0,0.0,0.0,19.0,0.0,26.0,0.0,5.0,21.0,17,197,883700,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197883700,123700.0,15719.0,722.0,97.0,93.0,9.0,0.0,17.0,42.0,0.0,0.0,25.0,0.0,116.0,21.0,35.0,31.0,0.0,29.0,0.0,0.0,0.0,23.0,13.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,23560.0,3293.0,2794.0,1354.0,909.0,445.0,17.0,197.0,883700.0,17197883700.0,2245.0,148.0,18.0,6.0,0.0,64.0,34.0,6.0,10.0,98400.0,497.0,1348.0,40500.0,17197883700.0,2940.76,2708.47,1139.56,333.2,333.2,692.11,315.12,100.91,104.72,34.27,49123.76,393.18,25749.04,815.87,329.4,17.0,197.0,883700.0,17197883700.0,17197883700.0,0.52,0.74,0.47,0.58,0.36,0.52,0.22,0.26,0.0,0.0,0.0,1.0,0.0,0.0,2.0,mix_low,0.47,0.12,0.42,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.36,0.47,0.52,414.52,628.54,766.19,102177.42,817.82,53558.0,150552.0,760.41,61965.0,137307.0,801.42,95700.0,767.0,49732.0,0.29,0.08,0.15,1145.27,0.29,0.33,1460.0,0.29,1913.54,0.07,166.0,108.0,274.0,0.12,0.16,0.26,0.47,114.0,0.56,232.0,1,aff_predominantly_LI,-0.36,-0.04,0,1,0,0,1,0,0,0,1,1,0,0,1,ch_decrease_marginal,-0.05,0,0,0,0,0,0,0.47,-0.07,0.16,0.01,-0.2,214.02,137.65,0.05,0.04,-0.09,1,1,1,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,1,0,1,17197883700,0,True,0,1,0,1.0,0.0,0,0,0,0,0,1,160.21,20.09,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,1,1.0,1.0,['SLI'],1460.0,110.0,123.0,143.0,61.0,98.0,62.0,64.0,32.0,40.0,106.0,205.0,231.0,95.0,51.0,34.0,5.0
8,5139.0,4759.0,1746.0,78750.0,215000.0,20691.0,1424.0,294.0,3487.0,482.0,167.0,16.0,27.0,1924.0,58.0,55.0,1424.0,322.0,1425.0,32700.0,163.0,39.0,0.0,43.0,30.0,21.0,21.0,0.0,9.0,138.0,14.0,0.0,26.0,17,197,880502,13.0,10.0,15.0,11.0,49.0,20.0,12.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197880502,199000.0,19822.0,973.0,48.0,217.0,78.0,31.0,19.0,0.0,45.0,44.0,0.0,0.0,241.0,123.0,0.0,42.0,8.0,20.0,48.0,0.0,0.0,24.0,9.0,0.0,7.0,0.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,32531.0,5259.0,4922.0,1749.0,1516.0,233.0,17.0,197.0,880502.0,17197880502.0,3275.0,131.0,42.0,6.0,18.0,162.0,38.0,6.0,0.0,146200.0,692.0,1760.0,59636.0,17197880502.0,3968.0,3819.0,1348.0,228.0,456.0,1058.0,375.0,115.0,169.0,68.0,76900.0,510.0,38920.0,1093.0,260.0,17.0,197.0,880502.0,17197880502.0,17197880502.0,0.32,0.51,0.19,0.42,0.18,0.32,0.19,0.49,0.0,0.0,0.0,0.0,1.0,0.0,4.0,mix_mod,0.19,0.22,0.58,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.18,0.19,0.32,247.8,335.94,557.54,159952.0,1060.8,80953.6,223686.0,1058.76,91243.08,220890.0,1080.03,215000.0,1424.0,78750.0,0.07,0.04,0.06,1353.0,0.19,0.13,1746.0,0.18,2469.0,0.1,191.0,200.0,391.0,0.12,0.2,0.06,0.43,321.0,0.63,482.0,5,aff_mix_mod,-0.04,0.32,0,0,0,1,0,1,0,0,0,1,0,1,3,ch_rapid_increase,0.14,0,0,0,0,0,1,0.4,-0.0,0.13,0.34,-0.14,88.14,221.6,0.02,0.08,-0.19,1,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,1,1,1,0,0,1,1,1,0,0,0,1,0,0,0,0,17197880502,0,False,0,0,0,1.0,1.0,0,0,0,0,1,0,-157.36,20.09,0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0,0.0,0,1.0,6.0,['SMMI'],1746.0,35.0,18.0,115.0,39.0,34.0,29.0,66.0,114.0,54.0,171.0,163.0,233.0,302.0,120.0,219.0,34.0
9,5370.0,5048.0,1820.0,102889.0,286700.0,8272.0,2039.0,323.0,3669.0,993.0,454.0,17.0,16.0,1869.0,25.0,13.0,1582.0,238.0,1907.0,40410.0,36.0,0.0,0.0,0.0,9.0,0.0,19.0,0.0,8.0,189.0,22.0,0.0,31.0,17,197,881002,24.0,70.0,0.0,15.0,27.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17197881002,285700.0,21281.0,1698.0,151.0,76.0,0.0,0.0,0.0,9.0,9.0,30.0,19.0,9.0,146.0,80.0,17.0,0.0,8.0,0.0,41.0,0.0,0.0,12.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,16.0,9.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,35250.0,4847.39,4599.52,1458.38,1420.03,38.35,17.0,197.0,881002.0,34395762003.0,2906.57,288.43,81.97,26.86,6.95,240.57,66.03,15.9,9.93,194338.75,1063.27,1468.3,77838.46,34395762003.0,3785.43,3709.8,1135.68,51.82,147.94,666.03,614.76,205.65,411.26,171.52,133824.44,474.46,50706.91,1077.34,38.39,17.0,197.0,881002.0,34395762003.0,34395762003.0,0.25,0.37,0.13,0.24,0.09,0.25,0.13,0.63,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.13,0.11,0.76,0.0,1.0,0.0,0.0,0.0,0.0,6.0,high_pdmt,0.09,0.13,0.25,97.29,189.95,451.14,278354.84,986.88,105470.38,297338.29,1626.8,119092.84,317127.0,1884.78,286700.0,2039.0,102889.0,0.06,0.02,0.05,1115.73,0.03,0.03,1820.0,0.13,2268.98,0.26,377.36,316.54,693.9,0.24,0.4,0.02,0.25,225.0,0.45,250.0,5,aff_mix_mod,-0.04,0.08,0,0,1,0,0,1,0,0,0,1,1,0,2,ch_increase,0.1,0,0,0,0,0,1,0.07,0.65,0.13,0.25,-0.14,92.66,261.2,-0.02,0.16,-0.2,1,0,0,0,0,0,0,0,0,0,1,1,1,1,1,1,1,1,1,1,0,1,1,0,1,0,0,1,0,0,1,0,17197881002,0,False,0,0,0,1.0,1.0,0,0,0,0,1,0,-788.29,20.09,0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0,0.0,0,1.0,7.0,['ARE'],1820.0,59.0,43.0,68.0,48.0,32.0,81.0,48.0,56.0,8.0,26.0,160.0,274.0,156.0,244.0,259.0,258.0


In [23]:
# columns to keep in the 2018 dataset
# lostli_18: loss of low income households from 2012 to 2018
# pctch_real_mrent_12_18: percent change in real home value from 2012 to 2018 (original dataset might have a typo)
# per_ch_zillow_12_18: percent change in rent prices from 2012 to 2018
cols_to_keep = ['state_x', 'county_x', 'tract_x', 'typology', 'FIPS', 'typ_cat', 'rail', 'lostli_18', 'pctch_real_mrent_12_18', 'per_ch_zillow_12_18', 'iinc_12']
cols_additional = ['state', 'county', 'tract', 'GEO_ID', 'FIPS', 'year', 'typology', 'typ_cat']

for col in df_2023.columns:
    if col not in cols_additional:
        to_keep = col + '_18'
        cols_to_keep.append(to_keep)
    

cols_to_keep

['state_x',
 'county_x',
 'tract_x',
 'typology',
 'FIPS',
 'typ_cat',
 'rail',
 'lostli_18',
 'pctch_real_mrent_12_18',
 'per_ch_zillow_12_18',
 'iinc_12',
 'pop_18',
 'white_18',
 'hh_18',
 'medhinc_18',
 'mhval_18',
 'mrent_18',
 'ohu_18',
 'rhu_18',
 'total_bd_18',
 'total_md_18',
 'total_pd_18',
 'total_phd_18',
 'tot_units_built_18',
 'units_40_49_18',
 'units_39_earlier_18',
 'mov_wc_w_income_18',
 'mov_wc_9000_18',
 'mov_wc_15000_18',
 'mov_wc_25000_18',
 'mov_wc_35000_18',
 'mov_wc_50000_18',
 'mov_wc_65000_18',
 'mov_wc_75000_18',
 'mov_wc_76000_more_18',
 'mov_oc_w_income_18',
 'mov_oc_9000_18',
 'mov_oc_15000_18',
 'mov_oc_25000_18',
 'mov_oc_35000_18',
 'mov_oc_50000_18',
 'mov_oc_65000_18',
 'mov_oc_75000_18',
 'mov_oc_76000_more_18',
 'mov_os_w_income_18',
 'mov_os_9000_18',
 'mov_os_15000_18',
 'mov_os_25000_18',
 'mov_os_35000_18',
 'mov_os_50000_18',
 'mov_os_65000_18',
 'mov_os_75000_18',
 'mov_os_76000_more_18',
 'mov_fa_w_income_18',
 'mov_fa_9000_18',
 'mov_fa_150

In [24]:
len(cols_to_keep)

80

In [25]:
df_2018 = merged_18[cols_to_keep]

In [26]:
df_2018['year'] = 2018

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_2018['year'] = 2018


In [27]:
df_2018.head(10)

Unnamed: 0,state_x,county_x,tract_x,typology,FIPS,typ_cat,rail,lostli_18,pctch_real_mrent_12_18,per_ch_zillow_12_18,iinc_12,pop_18,white_18,hh_18,medhinc_18,mhval_18,mrent_18,ohu_18,rhu_18,total_bd_18,total_md_18,total_pd_18,total_phd_18,tot_units_built_18,units_40_49_18,units_39_earlier_18,mov_wc_w_income_18,mov_wc_9000_18,mov_wc_15000_18,mov_wc_25000_18,mov_wc_35000_18,mov_wc_50000_18,mov_wc_65000_18,mov_wc_75000_18,mov_wc_76000_more_18,mov_oc_w_income_18,mov_oc_9000_18,mov_oc_15000_18,mov_oc_25000_18,mov_oc_35000_18,mov_oc_50000_18,mov_oc_65000_18,mov_oc_75000_18,mov_oc_76000_more_18,mov_os_w_income_18,mov_os_9000_18,mov_os_15000_18,mov_os_25000_18,mov_os_35000_18,mov_os_50000_18,mov_os_65000_18,mov_os_75000_18,mov_os_76000_more_18,mov_fa_w_income_18,mov_fa_9000_18,mov_fa_15000_18,mov_fa_25000_18,mov_fa_35000_18,mov_fa_50000_18,mov_fa_65000_18,mov_fa_75000_18,mov_fa_76000_more_18,iinc_18,hinc_18,I_10000_18,I_15000_18,I_20000_18,I_25000_18,I_30000_18,I_35000_18,I_40000_18,I_45000_18,I_50000_18,I_60000_18,I_75000_18,I_100000_18,I_125000_18,I_150000_18,I_200000_18,I_201000_18,year
0,17,197,882900,3.0,17197882900,['ARG'],0,0,0.01,0.3,29330.0,2344.0,1199.0,866.0,49565.0,124400.0,969.0,427.0,439.0,98.0,58.0,8.0,4.0,950.0,127.0,295.0,164.0,54.0,6.0,25.0,46.0,12.0,9.0,3.0,9.0,24.0,4.0,4.0,7.0,0.0,4.0,5.0,0.0,0.0,26.0,0.0,10.0,5.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,26602.0,866.0,45.0,30.0,31.0,74.0,22.0,57.0,76.0,53.0,49.0,44.0,102.0,115.0,80.0,43.0,23.0,22.0,2018
1,17,197,883000,1.0,17197883000,['SLI'],0,0,0.13,,16370.0,3759.0,1276.0,1183.0,46175.0,123400.0,1019.0,542.0,641.0,168.0,47.0,39.0,11.0,1266.0,206.0,153.0,127.0,21.0,7.0,39.0,34.0,22.0,0.0,0.0,4.0,69.0,15.0,7.0,0.0,37.0,0.0,10.0,0.0,0.0,26.0,0.0,8.0,0.0,7.0,11.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,21376.0,1183.0,121.0,124.0,54.0,36.0,52.0,51.0,51.0,79.0,71.0,164.0,107.0,78.0,69.0,59.0,61.0,6.0,2018
2,17,197,880111,7.0,17197880111,['ARE'],0,0,0.09,0.23,27360.0,3726.0,1295.0,1099.0,80230.0,159400.0,1764.0,893.0,206.0,439.0,93.0,30.0,10.0,1186.0,9.0,14.0,10.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,27.0,0.0,0.0,10.0,0.0,17.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,28768.0,1099.0,7.0,20.0,23.0,0.0,14.0,40.0,106.0,56.0,64.0,39.0,136.0,299.0,154.0,76.0,48.0,17.0,2018
3,17,197,883602,7.0,17197883602,['ARE'],0,0,-0.17,0.09,37740.0,5692.0,4076.0,2429.0,71444.0,168400.0,854.0,2233.0,196.0,703.0,364.0,21.0,0.0,2617.0,28.0,254.0,77.0,0.0,0.0,31.0,25.0,0.0,0.0,8.0,13.0,456.0,136.0,13.0,31.0,76.0,72.0,45.0,0.0,83.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,41679.0,2429.0,30.0,13.0,85.0,67.0,23.0,92.0,73.0,64.0,89.0,277.0,546.0,225.0,225.0,261.0,264.0,95.0,2018
4,17,197,883803,1.0,17197883803,['SLI'],0,0,-0.01,-0.05,26544.0,2756.0,368.0,1439.0,41193.0,119200.0,947.0,248.0,1191.0,273.0,133.0,0.0,0.0,1570.0,52.0,35.0,52.0,0.0,0.0,8.0,0.0,11.0,0.0,33.0,0.0,254.0,25.0,19.0,33.0,83.0,54.0,40.0,0.0,0.0,33.0,33.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,19.0,30259.0,1439.0,117.0,0.0,61.0,157.0,125.0,192.0,57.0,92.0,88.0,115.0,178.0,120.0,17.0,94.0,19.0,7.0,2018
5,17,197,881700,7.0,17197881700,['ARE'],0,0,0.02,0.23,40685.0,3375.0,2384.0,1320.0,69250.0,161300.0,1199.0,1066.0,254.0,537.0,324.0,16.0,20.0,1485.0,255.0,502.0,145.0,35.0,26.0,15.0,10.0,31.0,22.0,0.0,6.0,97.0,12.0,33.0,9.0,0.0,0.0,0.0,34.0,9.0,21.0,0.0,0.0,0.0,0.0,21.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,0.0,19.0,0.0,0.0,0.0,34135.0,1320.0,58.0,37.0,38.0,28.0,42.0,41.0,52.0,81.0,53.0,110.0,158.0,191.0,154.0,80.0,138.0,59.0,2018
6,17,197,883504,7.0,17197883504,['ARE'],0,0,0.13,0.08,40232.0,5358.0,4574.0,2158.0,92984.0,306400.0,2073.0,1981.0,177.0,955.0,572.0,123.0,133.0,2261.0,16.0,110.0,70.0,32.0,0.0,0.0,7.0,24.0,0.0,0.0,7.0,83.0,7.0,0.0,0.0,0.0,0.0,22.0,0.0,54.0,26.0,0.0,6.0,0.0,0.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,47201.0,2158.0,28.0,35.0,31.0,49.0,117.0,63.0,45.0,154.0,59.0,199.0,162.0,209.0,197.0,71.0,360.0,379.0,2018
7,17,197,883700,1.0,17197883700,['SLI'],0,0,-0.04,-0.05,23560.0,3204.0,2267.0,1460.0,49732.0,95700.0,767.0,1033.0,427.0,204.0,140.0,0.0,18.0,1639.0,152.0,274.0,85.0,12.0,11.0,0.0,43.0,0.0,0.0,19.0,0.0,26.0,0.0,5.0,21.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,27875.0,1460.0,110.0,123.0,143.0,61.0,98.0,62.0,64.0,32.0,40.0,106.0,205.0,231.0,95.0,51.0,34.0,5.0,2018
8,17,197,880502,6.0,17197880502,['SMMI'],0,0,0.32,0.14,32531.0,5139.0,4759.0,1746.0,78750.0,215000.0,1424.0,1424.0,322.0,482.0,167.0,16.0,27.0,1924.0,58.0,55.0,163.0,39.0,0.0,43.0,30.0,21.0,21.0,0.0,9.0,138.0,14.0,0.0,26.0,13.0,10.0,15.0,11.0,49.0,20.0,12.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,32700.0,1746.0,35.0,18.0,115.0,39.0,34.0,29.0,66.0,114.0,54.0,171.0,163.0,233.0,302.0,120.0,219.0,34.0,2018
9,17,197,881002,7.0,17197881002,['ARE'],0,0,0.08,0.1,35250.0,5370.0,5048.0,1820.0,102889.0,286700.0,2039.0,1582.0,238.0,993.0,454.0,17.0,16.0,1869.0,25.0,13.0,36.0,0.0,0.0,0.0,9.0,0.0,19.0,0.0,8.0,189.0,22.0,0.0,31.0,24.0,70.0,0.0,15.0,27.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,40410.0,1820.0,59.0,43.0,68.0,48.0,32.0,81.0,48.0,56.0,8.0,26.0,160.0,274.0,156.0,244.0,259.0,258.0,2018


In [28]:
for col in df_2018.columns:
    if col[-2:] == '18' and col not in ['pctch_real_mrent_12_18', 'per_ch_zillow_12_18']:
        new_col = col[:-3]
        df_2018 = df_2018.rename(columns={col: new_col})

In [29]:
df_2018.shape

(1982, 81)

In [30]:
df_2018 = df_2018.rename(
    columns={
        'state_x': 'state',
        'county_x': 'county',
        'tract_x': 'tract'
    }
)

In [31]:
df_2018.columns

Index(['state', 'county', 'tract', 'typology', 'FIPS', 'typ_cat', 'rail',
       'lostli', 'pctch_real_mrent_12_18', 'per_ch_zillow_12_18', 'iinc_12',
       'pop', 'white', 'hh', 'medhinc', 'mhval', 'mrent', 'ohu', 'rhu',
       'total_bd', 'total_md', 'total_pd', 'total_phd', 'tot_units_built',
       'units_40_49', 'units_39_earlier', 'mov_wc_w_income', 'mov_wc_9000',
       'mov_wc_15000', 'mov_wc_25000', 'mov_wc_35000', 'mov_wc_50000',
       'mov_wc_65000', 'mov_wc_75000', 'mov_wc_76000_more', 'mov_oc_w_income',
       'mov_oc_9000', 'mov_oc_15000', 'mov_oc_25000', 'mov_oc_35000',
       'mov_oc_50000', 'mov_oc_65000', 'mov_oc_75000', 'mov_oc_76000_more',
       'mov_os_w_income', 'mov_os_9000', 'mov_os_15000', 'mov_os_25000',
       'mov_os_35000', 'mov_os_50000', 'mov_os_65000', 'mov_os_75000',
       'mov_os_76000_more', 'mov_fa_w_income', 'mov_fa_9000', 'mov_fa_15000',
       'mov_fa_25000', 'mov_fa_35000', 'mov_fa_50000', 'mov_fa_65000',
       'mov_fa_75000', 'mov_fa_76000_

# Additional Variables

## Transportation - whether railways exist

In [32]:
# add transportation data
df_transit = pd.read_csv('Transport_fips.csv')
df_transit.head(10)

Unnamed: 0,Buffer,Agency,Line(s),Station Name,Year Opened,Latitude,Longitude,Block_FIPS,FIPS
0,Existing Transit,Amtrak,Hiawatha,Amtrak Milwaukee,Pre-2000,43.03,-87.92,550791874003003,55079187400
1,Existing Transit,Amtrak,Hiawatha,Milwaukee General Mitchell Int Airport,Pre-2000,42.94,-87.92,550790217005018,55079021700
2,Existing Transit,Amtrak,Hiawatha,Sturtevant,Pre-2000,42.72,-87.91,551010017026002,55101001702
3,Existing Transit,CTA,Blue Line,Addison-Blue,Pre-2000,41.95,-87.72,170311609001029,17031160900
4,Existing Transit,CTA,Blue Line,Austin-Blue,Pre-2000,41.87,-87.78,170318131001009,17031813100
5,Existing Transit,CTA,Blue Line,Belmont-Blue,Pre-2000,41.94,-87.71,170312106011005,17031210601
6,Existing Transit,CTA,Blue Line,California-O'Hare,Pre-2000,41.92,-87.7,170312214002003,17031221400
7,Existing Transit,CTA,Blue Line,Chicago-Blue,Pre-2000,41.9,-87.66,170312435002007,17031243500
8,Existing Transit,CTA,Blue Line,Cicero-Forest Park,Pre-2000,41.87,-87.75,170318314001009,17031831400
9,Existing Transit,CTA,Blue Line,Clinton-Blue,Pre-2000,41.88,-87.64,170318419001018,17031841900


In [33]:
df_transit_num = df_transit.groupby('FIPS').size().reset_index(name='num_transit')
df_transit_num.head(10)

Unnamed: 0,FIPS,num_transit
0,17031010202,1
1,17031010300,1
2,17031010503,1
3,17031010600,1
4,17031010701,1
5,17031030101,1
6,17031030102,1
7,17031030701,1
8,17031030703,1
9,17031031200,2


In [34]:
df_transit_num['rail'] = df_transit_num['num_transit'].apply(lambda x: 1 if x > 0 else 0)
df_transit_num.drop(columns=['num_transit'], inplace=True)

In [35]:
df_transit_num.head(10)

Unnamed: 0,FIPS,rail
0,17031010202,1
1,17031010300,1
2,17031010503,1
3,17031010600,1
4,17031010701,1
5,17031030101,1
6,17031030102,1
7,17031030701,1
8,17031030703,1
9,17031031200,1


In [36]:
df_transit_num['FIPS'] = df_transit_num['FIPS'].astype(str)

In [37]:
# join data with df_2023
df_2023_full = pd.merge(df_2023, df_transit_num, on='FIPS', how='left')
df_2023_full.head(20)

Unnamed: 0,pop,white,hh,medhinc,mhval,mrent,ohu,rhu,total_bd,total_md,total_pd,total_phd,tot_units_built,units_40_49,units_39_earlier,mov_wc_w_income,mov_wc_9000,mov_wc_15000,mov_wc_25000,mov_wc_35000,mov_wc_50000,mov_wc_65000,mov_wc_75000,mov_wc_76000_more,mov_oc_w_income,mov_oc_9000,mov_oc_15000,mov_oc_25000,mov_oc_35000,mov_oc_50000,mov_oc_65000,mov_oc_75000,mov_oc_76000_more,mov_os_w_income,mov_os_9000,mov_os_15000,mov_os_25000,mov_os_35000,mov_os_50000,mov_os_65000,mov_os_75000,mov_os_76000_more,mov_fa_w_income,mov_fa_9000,mov_fa_15000,mov_fa_25000,mov_fa_35000,mov_fa_50000,mov_fa_65000,state,county,tract,mov_fa_75000,mov_fa_76000_more,iinc,hinc,I_10000,I_15000,I_20000,I_25000,I_30000,I_35000,I_40000,I_45000,I_50000,I_60000,I_75000,I_100000,I_125000,I_150000,I_200000,I_201000,FIPS,typology,year,typ_cat,rail
0,3726.0,1475.0,2190.0,69460.0,296600.0,1252.0,689.0,1501.0,775.0,385.0,54.0,132.0,2841.0,289.0,1760.0,196.0,80.0,24.0,53.0,0.0,23.0,0.0,0.0,16.0,15.0,5.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,41.0,0.0,0.0,0.0,0.0,0.0,21.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10100,0.0,0.0,37386.0,2190.0,125.0,109.0,41.0,148.0,118.0,191.0,51.0,45.0,96.0,102.0,299.0,418.0,82.0,118.0,124.0,123.0,17031010100,,2023,,
1,7588.0,1883.0,3038.0,49639.0,239100.0,1333.0,823.0,2215.0,684.0,647.0,135.0,106.0,3276.0,196.0,1586.0,564.0,84.0,176.0,37.0,33.0,80.0,0.0,51.0,103.0,8.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,198.0,0.0,9.0,16.0,109.0,43.0,0.0,0.0,21.0,25.0,0.0,0.0,0.0,25.0,0.0,0.0,17,31,10201,0.0,0.0,39311.0,3038.0,223.0,61.0,153.0,0.0,92.0,172.0,355.0,243.0,233.0,49.0,192.0,576.0,220.0,201.0,161.0,107.0,17031010201,,2023,,
2,2609.0,987.0,1130.0,55119.0,231900.0,1292.0,270.0,860.0,656.0,232.0,52.0,42.0,1303.0,76.0,512.0,209.0,41.0,1.0,33.0,24.0,25.0,26.0,25.0,34.0,56.0,35.0,0.0,0.0,10.0,11.0,0.0,0.0,0.0,129.0,28.0,0.0,7.0,0.0,32.0,0.0,24.0,38.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10202,0.0,0.0,34938.0,1130.0,100.0,79.0,12.0,12.0,40.0,52.0,20.0,94.0,103.0,104.0,36.0,236.0,99.0,31.0,66.0,46.0,17031010202,,2023,,1.0
3,6311.0,3558.0,3185.0,65871.0,305000.0,1257.0,859.0,2326.0,1585.0,644.0,121.0,149.0,3377.0,292.0,1655.0,1072.0,191.0,187.0,133.0,105.0,99.0,121.0,93.0,143.0,65.0,10.0,5.0,0.0,0.0,3.0,30.0,0.0,17.0,166.0,0.0,25.0,89.0,23.0,0.0,0.0,29.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10300,0.0,0.0,38532.0,3185.0,44.0,231.0,98.0,259.0,225.0,45.0,69.0,100.0,81.0,293.0,422.0,436.0,242.0,245.0,166.0,229.0,17031010300,,2023,,1.0
4,4282.0,3349.0,2058.0,49017.0,229400.0,1248.0,513.0,1545.0,999.0,400.0,128.0,70.0,2460.0,216.0,1216.0,616.0,121.0,19.0,0.0,51.0,201.0,50.0,18.0,156.0,140.0,72.0,0.0,41.0,0.0,0.0,0.0,0.0,27.0,310.0,245.0,0.0,33.0,22.0,0.0,10.0,0.0,0.0,21.0,12.0,9.0,0.0,0.0,0.0,0.0,17,31,10400,0.0,0.0,33561.0,2058.0,141.0,131.0,298.0,81.0,59.0,41.0,56.0,33.0,268.0,101.0,180.0,218.0,99.0,129.0,85.0,138.0,17031010400,,2023,,
5,3519.0,2298.0,2379.0,48250.0,196600.0,1176.0,341.0,2038.0,1157.0,573.0,0.0,206.0,2705.0,262.0,1198.0,383.0,0.0,0.0,19.0,38.0,156.0,77.0,16.0,77.0,47.0,0.0,0.0,0.0,20.0,27.0,0.0,0.0,0.0,110.0,57.0,0.0,16.0,0.0,0.0,0.0,0.0,37.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10501,0.0,0.0,36258.0,2379.0,171.0,127.0,223.0,152.0,76.0,100.0,57.0,137.0,171.0,231.0,235.0,234.0,191.0,122.0,85.0,67.0,17031010501,,2023,,
6,3329.0,2171.0,1637.0,61367.0,282200.0,1311.0,469.0,1168.0,770.0,550.0,38.0,156.0,1807.0,164.0,1004.0,454.0,156.0,38.0,36.0,54.0,53.0,24.0,27.0,66.0,26.0,13.0,0.0,13.0,0.0,0.0,0.0,0.0,0.0,222.0,88.0,42.0,29.0,11.0,23.0,9.0,0.0,20.0,12.0,0.0,12.0,0.0,0.0,0.0,0.0,17,31,10502,0.0,0.0,36926.0,1637.0,99.0,118.0,152.0,82.0,61.0,32.0,58.0,37.0,60.0,102.0,153.0,290.0,147.0,57.0,32.0,157.0,17031010502,,2023,,
7,2844.0,1806.0,1477.0,21924.0,470500.0,1122.0,177.0,1300.0,350.0,256.0,38.0,111.0,1570.0,109.0,510.0,591.0,329.0,88.0,53.0,60.0,22.0,36.0,0.0,3.0,75.0,23.0,18.0,0.0,0.0,0.0,34.0,0.0,0.0,78.0,69.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,66.0,35.0,20.0,0.0,0.0,11.0,0.0,17,31,10503,0.0,0.0,13289.0,1477.0,298.0,249.0,103.0,133.0,46.0,44.0,49.0,13.0,37.0,97.0,92.0,125.0,65.0,48.0,45.0,33.0,17031010503,,2023,,1.0
8,6708.0,3804.0,3066.0,71920.0,254500.0,1276.0,1094.0,1972.0,1843.0,760.0,136.0,267.0,3176.0,69.0,1683.0,797.0,45.0,6.0,78.0,249.0,191.0,138.0,59.0,31.0,36.0,0.0,0.0,0.0,0.0,34.0,0.0,0.0,2.0,209.0,26.0,46.0,36.0,50.0,33.0,18.0,0.0,0.0,88.0,0.0,0.0,0.0,0.0,0.0,88.0,17,31,10600,0.0,0.0,38090.0,3066.0,81.0,152.0,49.0,45.0,209.0,130.0,172.0,134.0,28.0,169.0,464.0,374.0,280.0,312.0,176.0,291.0,17031010600,,2023,,1.0
9,3573.0,1431.0,1652.0,74208.0,345400.0,1338.0,820.0,832.0,1047.0,382.0,41.0,41.0,1753.0,123.0,847.0,296.0,72.0,0.0,52.0,37.0,34.0,31.0,8.0,62.0,35.0,0.0,0.0,0.0,35.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10701,0.0,0.0,43372.0,1652.0,31.0,51.0,50.0,40.0,51.0,169.0,54.0,49.0,57.0,113.0,193.0,255.0,161.0,92.0,126.0,160.0,17031010701,,2023,,1.0


In [38]:
df_2023_full['rail'] = df_2023_full['rail'].fillna(0)
df_2023_full.isnull().sum()

pop                     0
white                   0
hh                      0
medhinc                 0
mhval                   0
mrent                   0
ohu                     0
rhu                     0
total_bd                0
total_md                0
total_pd                0
total_phd               0
tot_units_built         0
units_40_49             0
units_39_earlier        0
mov_wc_w_income         0
mov_wc_9000             0
mov_wc_15000            0
mov_wc_25000            0
mov_wc_35000            0
mov_wc_50000            0
mov_wc_65000            0
mov_wc_75000            0
mov_wc_76000_more       0
mov_oc_w_income         0
mov_oc_9000             0
mov_oc_15000            0
mov_oc_25000            0
mov_oc_35000            0
mov_oc_50000            0
mov_oc_65000            0
mov_oc_75000            0
mov_oc_76000_more       0
mov_os_w_income         0
mov_os_9000             0
mov_os_15000            0
mov_os_25000            0
mov_os_35000            0
mov_os_50000

In [39]:
df_2023_full.columns

Index(['pop', 'white', 'hh', 'medhinc', 'mhval', 'mrent', 'ohu', 'rhu',
       'total_bd', 'total_md', 'total_pd', 'total_phd', 'tot_units_built',
       'units_40_49', 'units_39_earlier', 'mov_wc_w_income', 'mov_wc_9000',
       'mov_wc_15000', 'mov_wc_25000', 'mov_wc_35000', 'mov_wc_50000',
       'mov_wc_65000', 'mov_wc_75000', 'mov_wc_76000_more', 'mov_oc_w_income',
       'mov_oc_9000', 'mov_oc_15000', 'mov_oc_25000', 'mov_oc_35000',
       'mov_oc_50000', 'mov_oc_65000', 'mov_oc_75000', 'mov_oc_76000_more',
       'mov_os_w_income', 'mov_os_9000', 'mov_os_15000', 'mov_os_25000',
       'mov_os_35000', 'mov_os_50000', 'mov_os_65000', 'mov_os_75000',
       'mov_os_76000_more', 'mov_fa_w_income', 'mov_fa_9000', 'mov_fa_15000',
       'mov_fa_25000', 'mov_fa_35000', 'mov_fa_50000', 'mov_fa_65000', 'state',
       'county', 'tract', 'mov_fa_75000', 'mov_fa_76000_more', 'iinc', 'hinc',
       'I_10000', 'I_15000', 'I_20000', 'I_25000', 'I_30000', 'I_35000',
       'I_40000', 'I_45000'

## Adjust for Price Levels

In [86]:
INFLATION_18_23 = 1.21 # according to https://www.bls.gov/data/inflation_calculator.htm
inflation_adjust = ['medhinc', 'iinc'] # iinc is the median income in the past 12 months

df_23_adjusted = df_2023_full.copy()
for col in inflation_adjust:
    df_23_adjusted[col] = df_23_adjusted[col] / INFLATION_18_23

df_23_adjusted.head()

Unnamed: 0,pop,white,hh,medhinc,mhval,mrent,ohu,rhu,total_bd,total_md,total_pd,total_phd,tot_units_built,units_40_49,units_39_earlier,mov_wc_w_income,mov_wc_9000,mov_wc_15000,mov_wc_25000,mov_wc_35000,mov_wc_50000,mov_wc_65000,mov_wc_75000,mov_wc_76000_more,mov_oc_w_income,mov_oc_9000,mov_oc_15000,mov_oc_25000,mov_oc_35000,mov_oc_50000,mov_oc_65000,mov_oc_75000,mov_oc_76000_more,mov_os_w_income,mov_os_9000,mov_os_15000,mov_os_25000,mov_os_35000,mov_os_50000,mov_os_65000,mov_os_75000,mov_os_76000_more,mov_fa_w_income,mov_fa_9000,mov_fa_15000,mov_fa_25000,mov_fa_35000,mov_fa_50000,mov_fa_65000,state,county,tract,mov_fa_75000,mov_fa_76000_more,iinc,hinc,I_10000,I_15000,I_20000,I_25000,I_30000,I_35000,I_40000,I_45000,I_50000,I_60000,I_75000,I_100000,I_125000,I_150000,I_200000,I_201000,FIPS,typology,year,typ_cat,rail
0,3726.0,1475.0,2190.0,57404.96,296600.0,1252.0,689.0,1501.0,775.0,385.0,54.0,132.0,2841.0,289.0,1760.0,196.0,80.0,24.0,53.0,0.0,23.0,0.0,0.0,16.0,15.0,5.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,41.0,0.0,0.0,0.0,0.0,0.0,21.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10100,0.0,0.0,30897.52,2190.0,125.0,109.0,41.0,148.0,118.0,191.0,51.0,45.0,96.0,102.0,299.0,418.0,82.0,118.0,124.0,123.0,17031010100,,2023,,0.0
1,7588.0,1883.0,3038.0,41023.97,239100.0,1333.0,823.0,2215.0,684.0,647.0,135.0,106.0,3276.0,196.0,1586.0,564.0,84.0,176.0,37.0,33.0,80.0,0.0,51.0,103.0,8.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,198.0,0.0,9.0,16.0,109.0,43.0,0.0,0.0,21.0,25.0,0.0,0.0,0.0,25.0,0.0,0.0,17,31,10201,0.0,0.0,32488.43,3038.0,223.0,61.0,153.0,0.0,92.0,172.0,355.0,243.0,233.0,49.0,192.0,576.0,220.0,201.0,161.0,107.0,17031010201,,2023,,0.0
2,2609.0,987.0,1130.0,45552.89,231900.0,1292.0,270.0,860.0,656.0,232.0,52.0,42.0,1303.0,76.0,512.0,209.0,41.0,1.0,33.0,24.0,25.0,26.0,25.0,34.0,56.0,35.0,0.0,0.0,10.0,11.0,0.0,0.0,0.0,129.0,28.0,0.0,7.0,0.0,32.0,0.0,24.0,38.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10202,0.0,0.0,28874.38,1130.0,100.0,79.0,12.0,12.0,40.0,52.0,20.0,94.0,103.0,104.0,36.0,236.0,99.0,31.0,66.0,46.0,17031010202,,2023,,1.0
3,6311.0,3558.0,3185.0,54438.84,305000.0,1257.0,859.0,2326.0,1585.0,644.0,121.0,149.0,3377.0,292.0,1655.0,1072.0,191.0,187.0,133.0,105.0,99.0,121.0,93.0,143.0,65.0,10.0,5.0,0.0,0.0,3.0,30.0,0.0,17.0,166.0,0.0,25.0,89.0,23.0,0.0,0.0,29.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10300,0.0,0.0,31844.63,3185.0,44.0,231.0,98.0,259.0,225.0,45.0,69.0,100.0,81.0,293.0,422.0,436.0,242.0,245.0,166.0,229.0,17031010300,,2023,,1.0
4,4282.0,3349.0,2058.0,40509.92,229400.0,1248.0,513.0,1545.0,999.0,400.0,128.0,70.0,2460.0,216.0,1216.0,616.0,121.0,19.0,0.0,51.0,201.0,50.0,18.0,156.0,140.0,72.0,0.0,41.0,0.0,0.0,0.0,0.0,27.0,310.0,245.0,0.0,33.0,22.0,0.0,10.0,0.0,0.0,21.0,12.0,9.0,0.0,0.0,0.0,0.0,17,31,10400,0.0,0.0,27736.36,2058.0,141.0,131.0,298.0,81.0,59.0,41.0,56.0,33.0,268.0,101.0,180.0,218.0,99.0,129.0,85.0,138.0,17031010400,,2023,,0.0


In [87]:
# adjust for housing price change
df_23_adjusted['mhval'] = df_23_adjusted['mhval'] / INFLATION_18_23
df_23_adjusted['mrent'] = df_23_adjusted['mrent'] / INFLATION_18_23
df_23_adjusted.head()

# since we will standardize the data later, we will not adjust for rent/selling price INCREASES here; we only care about inflation

Unnamed: 0,pop,white,hh,medhinc,mhval,mrent,ohu,rhu,total_bd,total_md,total_pd,total_phd,tot_units_built,units_40_49,units_39_earlier,mov_wc_w_income,mov_wc_9000,mov_wc_15000,mov_wc_25000,mov_wc_35000,mov_wc_50000,mov_wc_65000,mov_wc_75000,mov_wc_76000_more,mov_oc_w_income,mov_oc_9000,mov_oc_15000,mov_oc_25000,mov_oc_35000,mov_oc_50000,mov_oc_65000,mov_oc_75000,mov_oc_76000_more,mov_os_w_income,mov_os_9000,mov_os_15000,mov_os_25000,mov_os_35000,mov_os_50000,mov_os_65000,mov_os_75000,mov_os_76000_more,mov_fa_w_income,mov_fa_9000,mov_fa_15000,mov_fa_25000,mov_fa_35000,mov_fa_50000,mov_fa_65000,state,county,tract,mov_fa_75000,mov_fa_76000_more,iinc,hinc,I_10000,I_15000,I_20000,I_25000,I_30000,I_35000,I_40000,I_45000,I_50000,I_60000,I_75000,I_100000,I_125000,I_150000,I_200000,I_201000,FIPS,typology,year,typ_cat,rail
0,3726.0,1475.0,2190.0,57404.96,245123.97,1034.71,689.0,1501.0,775.0,385.0,54.0,132.0,2841.0,289.0,1760.0,196.0,80.0,24.0,53.0,0.0,23.0,0.0,0.0,16.0,15.0,5.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,41.0,0.0,0.0,0.0,0.0,0.0,21.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10100,0.0,0.0,30897.52,2190.0,125.0,109.0,41.0,148.0,118.0,191.0,51.0,45.0,96.0,102.0,299.0,418.0,82.0,118.0,124.0,123.0,17031010100,,2023,,0.0
1,7588.0,1883.0,3038.0,41023.97,197603.31,1101.65,823.0,2215.0,684.0,647.0,135.0,106.0,3276.0,196.0,1586.0,564.0,84.0,176.0,37.0,33.0,80.0,0.0,51.0,103.0,8.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,198.0,0.0,9.0,16.0,109.0,43.0,0.0,0.0,21.0,25.0,0.0,0.0,0.0,25.0,0.0,0.0,17,31,10201,0.0,0.0,32488.43,3038.0,223.0,61.0,153.0,0.0,92.0,172.0,355.0,243.0,233.0,49.0,192.0,576.0,220.0,201.0,161.0,107.0,17031010201,,2023,,0.0
2,2609.0,987.0,1130.0,45552.89,191652.89,1067.77,270.0,860.0,656.0,232.0,52.0,42.0,1303.0,76.0,512.0,209.0,41.0,1.0,33.0,24.0,25.0,26.0,25.0,34.0,56.0,35.0,0.0,0.0,10.0,11.0,0.0,0.0,0.0,129.0,28.0,0.0,7.0,0.0,32.0,0.0,24.0,38.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10202,0.0,0.0,28874.38,1130.0,100.0,79.0,12.0,12.0,40.0,52.0,20.0,94.0,103.0,104.0,36.0,236.0,99.0,31.0,66.0,46.0,17031010202,,2023,,1.0
3,6311.0,3558.0,3185.0,54438.84,252066.12,1038.84,859.0,2326.0,1585.0,644.0,121.0,149.0,3377.0,292.0,1655.0,1072.0,191.0,187.0,133.0,105.0,99.0,121.0,93.0,143.0,65.0,10.0,5.0,0.0,0.0,3.0,30.0,0.0,17.0,166.0,0.0,25.0,89.0,23.0,0.0,0.0,29.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10300,0.0,0.0,31844.63,3185.0,44.0,231.0,98.0,259.0,225.0,45.0,69.0,100.0,81.0,293.0,422.0,436.0,242.0,245.0,166.0,229.0,17031010300,,2023,,1.0
4,4282.0,3349.0,2058.0,40509.92,189586.78,1031.4,513.0,1545.0,999.0,400.0,128.0,70.0,2460.0,216.0,1216.0,616.0,121.0,19.0,0.0,51.0,201.0,50.0,18.0,156.0,140.0,72.0,0.0,41.0,0.0,0.0,0.0,0.0,27.0,310.0,245.0,0.0,33.0,22.0,0.0,10.0,0.0,0.0,21.0,12.0,9.0,0.0,0.0,0.0,0.0,17,31,10400,0.0,0.0,27736.36,2058.0,141.0,131.0,298.0,81.0,59.0,41.0,56.0,33.0,268.0,101.0,180.0,218.0,99.0,129.0,85.0,138.0,17031010400,,2023,,0.0


All price indicators are adjusted to align with 2018 data.

## Generate Variables Indicating Change Since Last Period 

Next, we impute missing values for 2023 - variables indicating changes since the last period (2018)

In [88]:
# match variables
df_23 = df_23_adjusted.copy()
df_18 = df_2018.copy()

df_23['total_li'] = df_23['I_10000'] + df_23['I_15000'] + df_23['I_20000'] + df_23['I_25000'] + df_23['I_30000'] + df_23['I_35000']
df_18['total_li'] = df_18['I_10000'] + df_18['I_15000'] + df_18['I_20000'] + df_18['I_25000'] + df_18['I_30000'] + df_18['I_35000']

In [89]:
# generate variable indicating whether median individual income in 2018 is higher than in 2012
df_18['more_ind_inc'] = np.where(df_18['iinc'] > df_18['iinc_12'], 1, 0)
df_18['pctch_ind_inc'] = (df_18['iinc'] - df_18['iinc_12']) / df_18['iinc_12']
df_18.drop(columns=['iinc_12'], inplace=True)

In [90]:
df_18.rename(columns = {'pctch_real_mrent_12_18': 'pctch_real_mhval_sl', 'per_ch_zillow_12_18': 'per_ch_rent_sl'}, inplace=True)
df_18.columns

Index(['state', 'county', 'tract', 'typology', 'FIPS', 'typ_cat', 'rail',
       'lostli', 'pctch_real_mhval_sl', 'per_ch_rent_sl', 'pop', 'white', 'hh',
       'medhinc', 'mhval', 'mrent', 'ohu', 'rhu', 'total_bd', 'total_md',
       'total_pd', 'total_phd', 'tot_units_built', 'units_40_49',
       'units_39_earlier', 'mov_wc_w_income', 'mov_wc_9000', 'mov_wc_15000',
       'mov_wc_25000', 'mov_wc_35000', 'mov_wc_50000', 'mov_wc_65000',
       'mov_wc_75000', 'mov_wc_76000_more', 'mov_oc_w_income', 'mov_oc_9000',
       'mov_oc_15000', 'mov_oc_25000', 'mov_oc_35000', 'mov_oc_50000',
       'mov_oc_65000', 'mov_oc_75000', 'mov_oc_76000_more', 'mov_os_w_income',
       'mov_os_9000', 'mov_os_15000', 'mov_os_25000', 'mov_os_35000',
       'mov_os_50000', 'mov_os_65000', 'mov_os_75000', 'mov_os_76000_more',
       'mov_fa_w_income', 'mov_fa_9000', 'mov_fa_15000', 'mov_fa_25000',
       'mov_fa_35000', 'mov_fa_50000', 'mov_fa_65000', 'mov_fa_75000',
       'mov_fa_76000_more', 'iinc', 'hin

In [91]:
df_23 = pd.merge(df_23, df_18[['FIPS', 'total_li', 'mhval', 'mrent', 'iinc']], on='FIPS', how='left')
df_23.columns

Index(['pop', 'white', 'hh', 'medhinc', 'mhval_x', 'mrent_x', 'ohu', 'rhu',
       'total_bd', 'total_md', 'total_pd', 'total_phd', 'tot_units_built',
       'units_40_49', 'units_39_earlier', 'mov_wc_w_income', 'mov_wc_9000',
       'mov_wc_15000', 'mov_wc_25000', 'mov_wc_35000', 'mov_wc_50000',
       'mov_wc_65000', 'mov_wc_75000', 'mov_wc_76000_more', 'mov_oc_w_income',
       'mov_oc_9000', 'mov_oc_15000', 'mov_oc_25000', 'mov_oc_35000',
       'mov_oc_50000', 'mov_oc_65000', 'mov_oc_75000', 'mov_oc_76000_more',
       'mov_os_w_income', 'mov_os_9000', 'mov_os_15000', 'mov_os_25000',
       'mov_os_35000', 'mov_os_50000', 'mov_os_65000', 'mov_os_75000',
       'mov_os_76000_more', 'mov_fa_w_income', 'mov_fa_9000', 'mov_fa_15000',
       'mov_fa_25000', 'mov_fa_35000', 'mov_fa_50000', 'mov_fa_65000', 'state',
       'county', 'tract', 'mov_fa_75000', 'mov_fa_76000_more', 'iinc_x',
       'hinc', 'I_10000', 'I_15000', 'I_20000', 'I_25000', 'I_30000',
       'I_35000', 'I_40000', 'I_

In [92]:
df_23.shape

(2072, 82)

In [93]:
df_23['pctch_real_mhval_sl'] = df_23['mhval_x'] / df_23['mhval_y'] - 1
df_23['per_ch_rent_sl'] = df_23['mrent_x'] / df_23['mrent_y'] - 1
df_23['lostli'] = df_23['total_li_x'] - df_23['total_li_y']
df_23['more_ind_inc'] = np.where(df_23['iinc_x'] > df_23['iinc_y'], 1, 0)
df_23['pctch_ind_inc'] = (df_23['iinc_x'] - df_23['iinc_y']) / df_23['iinc_y']
df_23.drop(columns=['total_li_y', 'mhval_y', 'mrent_y', 'iinc_y'], inplace=True)
df_23.rename(columns = {'total_li_x': 'total_li', 'mhval_x': 'mhval', 'mrent_x': 'mrent', 'iinc_x': 'iinc'}, inplace=True)
df_23.info() # the variables match

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 2072 entries, 0 to 2071
Data columns (total 83 columns):
 #   Column               Non-Null Count  Dtype  
---  ------               --------------  -----  
 0   pop                  2072 non-null   float64
 1   white                2072 non-null   float64
 2   hh                   2072 non-null   float64
 3   medhinc              2072 non-null   float64
 4   mhval                2072 non-null   float64
 5   mrent                2072 non-null   float64
 6   ohu                  2072 non-null   float64
 7   rhu                  2072 non-null   float64
 8   total_bd             2072 non-null   float64
 9   total_md             2072 non-null   float64
 10  total_pd             2072 non-null   float64
 11  total_phd            2072 non-null   float64
 12  tot_units_built      2072 non-null   float64
 13  units_40_49          2072 non-null   float64
 14  units_39_earlier     2072 non-null   float64
 15  mov_wc_w_income      2072 non-null   f

In [94]:
df_c = pd.concat([df_23, df_18], axis=0)
df_c.head(10)

  df_c = pd.concat([df_23, df_18], axis=0)


Unnamed: 0,pop,white,hh,medhinc,mhval,mrent,ohu,rhu,total_bd,total_md,total_pd,total_phd,tot_units_built,units_40_49,units_39_earlier,mov_wc_w_income,mov_wc_9000,mov_wc_15000,mov_wc_25000,mov_wc_35000,mov_wc_50000,mov_wc_65000,mov_wc_75000,mov_wc_76000_more,mov_oc_w_income,mov_oc_9000,mov_oc_15000,mov_oc_25000,mov_oc_35000,mov_oc_50000,mov_oc_65000,mov_oc_75000,mov_oc_76000_more,mov_os_w_income,mov_os_9000,mov_os_15000,mov_os_25000,mov_os_35000,mov_os_50000,mov_os_65000,mov_os_75000,mov_os_76000_more,mov_fa_w_income,mov_fa_9000,mov_fa_15000,mov_fa_25000,mov_fa_35000,mov_fa_50000,mov_fa_65000,state,county,tract,mov_fa_75000,mov_fa_76000_more,iinc,hinc,I_10000,I_15000,I_20000,I_25000,I_30000,I_35000,I_40000,I_45000,I_50000,I_60000,I_75000,I_100000,I_125000,I_150000,I_200000,I_201000,FIPS,typology,year,typ_cat,rail,total_li,pctch_real_mhval_sl,per_ch_rent_sl,lostli,more_ind_inc,pctch_ind_inc
0,3726.0,1475.0,2190.0,57404.96,245123.97,1034.71,689.0,1501.0,775.0,385.0,54.0,132.0,2841.0,289.0,1760.0,196.0,80.0,24.0,53.0,0.0,23.0,0.0,0.0,16.0,15.0,5.0,5.0,5.0,0.0,0.0,0.0,0.0,0.0,41.0,0.0,0.0,0.0,0.0,0.0,21.0,0.0,20.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10100,0.0,0.0,30897.52,2190.0,125.0,109.0,41.0,148.0,118.0,191.0,51.0,45.0,96.0,102.0,299.0,418.0,82.0,118.0,124.0,123.0,17031010100,,2023,,0.0,732.0,-0.05,0.18,-398.0,1,0.12
1,7588.0,1883.0,3038.0,41023.97,197603.31,1101.65,823.0,2215.0,684.0,647.0,135.0,106.0,3276.0,196.0,1586.0,564.0,84.0,176.0,37.0,33.0,80.0,0.0,51.0,103.0,8.0,0.0,0.0,0.0,8.0,0.0,0.0,0.0,0.0,198.0,0.0,9.0,16.0,109.0,43.0,0.0,0.0,21.0,25.0,0.0,0.0,0.0,25.0,0.0,0.0,17,31,10201,0.0,0.0,32488.43,3038.0,223.0,61.0,153.0,0.0,92.0,172.0,355.0,243.0,233.0,49.0,192.0,576.0,220.0,201.0,161.0,107.0,17031010201,,2023,,0.0,701.0,0.26,0.08,-582.0,1,0.21
2,2609.0,987.0,1130.0,45552.89,191652.89,1067.77,270.0,860.0,656.0,232.0,52.0,42.0,1303.0,76.0,512.0,209.0,41.0,1.0,33.0,24.0,25.0,26.0,25.0,34.0,56.0,35.0,0.0,0.0,10.0,11.0,0.0,0.0,0.0,129.0,28.0,0.0,7.0,0.0,32.0,0.0,24.0,38.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10202,0.0,0.0,28874.38,1130.0,100.0,79.0,12.0,12.0,40.0,52.0,20.0,94.0,103.0,104.0,36.0,236.0,99.0,31.0,66.0,46.0,17031010202,,2023,,1.0,295.0,0.2,0.1,-216.0,1,0.26
3,6311.0,3558.0,3185.0,54438.84,252066.12,1038.84,859.0,2326.0,1585.0,644.0,121.0,149.0,3377.0,292.0,1655.0,1072.0,191.0,187.0,133.0,105.0,99.0,121.0,93.0,143.0,65.0,10.0,5.0,0.0,0.0,3.0,30.0,0.0,17.0,166.0,0.0,25.0,89.0,23.0,0.0,0.0,29.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10300,0.0,0.0,31844.63,3185.0,44.0,231.0,98.0,259.0,225.0,45.0,69.0,100.0,81.0,293.0,422.0,436.0,242.0,245.0,166.0,229.0,17031010300,,2023,,1.0,902.0,0.45,0.06,-447.0,1,0.06
4,4282.0,3349.0,2058.0,40509.92,189586.78,1031.4,513.0,1545.0,999.0,400.0,128.0,70.0,2460.0,216.0,1216.0,616.0,121.0,19.0,0.0,51.0,201.0,50.0,18.0,156.0,140.0,72.0,0.0,41.0,0.0,0.0,0.0,0.0,27.0,310.0,245.0,0.0,33.0,22.0,0.0,10.0,0.0,0.0,21.0,12.0,9.0,0.0,0.0,0.0,0.0,17,31,10400,0.0,0.0,27736.36,2058.0,141.0,131.0,298.0,81.0,59.0,41.0,56.0,33.0,268.0,101.0,180.0,218.0,99.0,129.0,85.0,138.0,17031010400,,2023,,0.0,751.0,-0.13,0.02,-54.0,1,0.38
5,3519.0,2298.0,2379.0,39876.03,162479.34,971.9,341.0,2038.0,1157.0,573.0,0.0,206.0,2705.0,262.0,1198.0,383.0,0.0,0.0,19.0,38.0,156.0,77.0,16.0,77.0,47.0,0.0,0.0,0.0,20.0,27.0,0.0,0.0,0.0,110.0,57.0,0.0,16.0,0.0,0.0,0.0,0.0,37.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10501,0.0,0.0,29965.29,2379.0,171.0,127.0,223.0,152.0,76.0,100.0,57.0,137.0,171.0,231.0,235.0,234.0,191.0,122.0,85.0,67.0,17031010501,,2023,,0.0,849.0,-0.49,0.01,-384.0,1,0.12
6,3329.0,2171.0,1637.0,50716.53,233223.14,1083.47,469.0,1168.0,770.0,550.0,38.0,156.0,1807.0,164.0,1004.0,454.0,156.0,38.0,36.0,54.0,53.0,24.0,27.0,66.0,26.0,13.0,0.0,13.0,0.0,0.0,0.0,0.0,0.0,222.0,88.0,42.0,29.0,11.0,23.0,9.0,0.0,20.0,12.0,0.0,12.0,0.0,0.0,0.0,0.0,17,31,10502,0.0,0.0,30517.36,1637.0,99.0,118.0,152.0,82.0,61.0,32.0,58.0,37.0,60.0,102.0,153.0,290.0,147.0,57.0,32.0,157.0,17031010502,,2023,,0.0,544.0,0.05,0.09,-160.0,1,0.17
7,2844.0,1806.0,1477.0,18119.01,388842.98,927.27,177.0,1300.0,350.0,256.0,38.0,111.0,1570.0,109.0,510.0,591.0,329.0,88.0,53.0,60.0,22.0,36.0,0.0,3.0,75.0,23.0,18.0,0.0,0.0,0.0,34.0,0.0,0.0,78.0,69.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,66.0,35.0,20.0,0.0,0.0,11.0,0.0,17,31,10503,0.0,0.0,10982.64,1477.0,298.0,249.0,103.0,133.0,46.0,44.0,49.0,13.0,37.0,97.0,92.0,125.0,65.0,48.0,45.0,33.0,17031010503,,2023,,1.0,873.0,0.13,0.34,271.0,0,-0.21
8,6708.0,3804.0,3066.0,59438.02,210330.58,1054.55,1094.0,1972.0,1843.0,760.0,136.0,267.0,3176.0,69.0,1683.0,797.0,45.0,6.0,78.0,249.0,191.0,138.0,59.0,31.0,36.0,0.0,0.0,0.0,0.0,34.0,0.0,0.0,2.0,209.0,26.0,46.0,36.0,50.0,33.0,18.0,0.0,0.0,88.0,0.0,0.0,0.0,0.0,0.0,88.0,17,31,10600,0.0,0.0,31479.34,3066.0,81.0,152.0,49.0,45.0,209.0,130.0,172.0,134.0,28.0,169.0,464.0,374.0,280.0,312.0,176.0,291.0,17031010600,,2023,,1.0,666.0,-0.06,0.06,-435.0,1,0.2
9,3573.0,1431.0,1652.0,61328.93,285454.55,1105.79,820.0,832.0,1047.0,382.0,41.0,41.0,1753.0,123.0,847.0,296.0,72.0,0.0,52.0,37.0,34.0,31.0,8.0,62.0,35.0,0.0,0.0,0.0,35.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,17,31,10701,0.0,0.0,35844.63,1652.0,31.0,51.0,50.0,40.0,51.0,169.0,54.0,49.0,57.0,113.0,193.0,255.0,161.0,92.0,126.0,160.0,17031010701,,2023,,1.0,392.0,0.38,0.07,-64.0,1,0.23


In [95]:
df_c.columns # double check columns

Index(['pop', 'white', 'hh', 'medhinc', 'mhval', 'mrent', 'ohu', 'rhu',
       'total_bd', 'total_md', 'total_pd', 'total_phd', 'tot_units_built',
       'units_40_49', 'units_39_earlier', 'mov_wc_w_income', 'mov_wc_9000',
       'mov_wc_15000', 'mov_wc_25000', 'mov_wc_35000', 'mov_wc_50000',
       'mov_wc_65000', 'mov_wc_75000', 'mov_wc_76000_more', 'mov_oc_w_income',
       'mov_oc_9000', 'mov_oc_15000', 'mov_oc_25000', 'mov_oc_35000',
       'mov_oc_50000', 'mov_oc_65000', 'mov_oc_75000', 'mov_oc_76000_more',
       'mov_os_w_income', 'mov_os_9000', 'mov_os_15000', 'mov_os_25000',
       'mov_os_35000', 'mov_os_50000', 'mov_os_65000', 'mov_os_75000',
       'mov_os_76000_more', 'mov_fa_w_income', 'mov_fa_9000', 'mov_fa_15000',
       'mov_fa_25000', 'mov_fa_35000', 'mov_fa_50000', 'mov_fa_65000', 'state',
       'county', 'tract', 'mov_fa_75000', 'mov_fa_76000_more', 'iinc', 'hinc',
       'I_10000', 'I_15000', 'I_20000', 'I_25000', 'I_30000', 'I_35000',
       'I_40000', 'I_45000'

## Dealing with Missing Variables

In [96]:
df_clean = df_c[(df_c['mhval'] > 0) & (df_c['mrent'] > 0)]

# check whether distribution of mhval and mrent is reasonable
df_clean['mhval'].describe()

count      3836.00
mean     271875.53
std      150824.43
min       19400.00
25%      169900.00
50%      235454.55
75%      331625.00
max     1528600.00
Name: mhval, dtype: float64

In [97]:
df_clean['mrent'].describe()

count   3836.00
mean    1251.89
std      407.16
min      283.47
25%      971.00
50%     1150.00
75%     1463.00
max     3501.00
Name: mrent, dtype: float64

In [98]:
# check for missing values
missing_info = df_clean.isnull().sum()
print("col with null val:")
print(missing_info[missing_info > 0])


col with null val:
typology               1917
typ_cat                1917
pctch_real_mhval_sl     134
per_ch_rent_sl          318
lostli                  134
pctch_ind_inc           134
dtype: int64


In [99]:
# impute missing values
df_clean['pctch_real_mhval_sl'] = df_clean['pctch_real_mhval_sl'].fillna(df_clean['pctch_real_mhval_sl'].mean())
df_clean['per_ch_rent_sl'] = df_clean['per_ch_rent_sl'].fillna(df_clean['per_ch_rent_sl'].mean())
df_clean['lostli'] = df_clean['lostli'].fillna(df_clean['lostli'].mean())
df_clean['pctch_ind_inc'] = df_clean['pctch_ind_inc'].fillna(df_clean['pctch_ind_inc'].mean())

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_clean['pctch_real_mhval_sl'] = df_clean['pctch_real_mhval_sl'].fillna(df_clean['pctch_real_mhval_sl'].mean())
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_clean['per_ch_rent_sl'] = df_clean['per_ch_rent_sl'].fillna(df_clean['per_ch_rent_sl'].mean())
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-c

In [100]:
missing_info = df_clean.isnull().sum()
print("col with null val:")
print(missing_info[missing_info > 0])  
# there are no missing data, exept for typology, which is expected

col with null val:
typology    1917
typ_cat     1917
dtype: int64


## Dealing with Abnormal Values

In [101]:
df_clean['medhinc'].describe() # there are some values below 0; we remove them

count         3836.00
mean      -1217861.87
std       26663144.11
min     -550964186.78
25%          49268.29
50%          68756.68
75%          93908.75
max         250001.00
Name: medhinc, dtype: float64

In [102]:
# check which rows have negative median income
df_clean.loc[df_clean['medhinc'] < 0, 'medhinc']

129    -550964186.78
335    -550964186.78
414    -550964186.78
528    -550964186.78
556    -550964186.78
1265   -550964186.78
1268   -550964186.78
1278   -550964186.78
1279   -550964186.78
Name: medhinc, dtype: float64

In [103]:
df_clean = df_clean.drop(df_clean[df_clean['medhinc'] < 0].index)
df_clean.loc[df_clean['medhinc'] < 0, 'medhinc']

Series([], Name: medhinc, dtype: float64)

In [104]:
# do the same for individual income
df_clean.loc[df_clean['iinc'] < 0, 'iinc']

601    -550964186.78
1276   -550964186.78
Name: iinc, dtype: float64

In [105]:
df_clean = df_clean.drop(df_clean[df_clean['iinc'] < 0].index)
df_clean.loc[df_clean['iinc'] < 0, 'iinc']

Series([], Name: iinc, dtype: float64)

In [106]:
# export data
df_clean.to_csv('training_data.csv')