In [205]:
# Import Dependencies
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import plotly.express as px

## Data Cleaning and Processing

#### Housing Inventory Counts by State

In [206]:
years = list(map(str, range(2014, 2023)))

# Read 2012-2022 sheets of an Excel file into a dictionary of DataFrames
dict_of_dfs = {year: pd.read_excel('2007-2022-HIC-Counts-by-State.xlsx', sheet_name=year, skiprows=1) for year in years}

In [207]:
# Find the common set of columns
common_columns = set.intersection(*[set(df.columns) for df in dict_of_dfs.values()])

In [208]:
# Realign data and add "Year" column
all_data = pd.DataFrame()
for year, df in dict_of_dfs.items():
    missing_cols = common_columns - set(df.columns)
    extra_cols = set(df.columns) - common_columns
    df.drop(columns=extra_cols, errors='ignore', inplace=True)
    for col in missing_cols:
        df[col] = np.nan
    df['Year'] = year
    all_data = pd.concat([all_data, df], ignore_index=True)

In [209]:
# Concatenate all of the DataFrames in the dictionary into a single DataFrame
HIC_Counts = pd.concat(dict_of_dfs.values(), ignore_index=True)

In [210]:
# Remove US Territories and Total rows for each year
HIC_Counts = HIC_Counts[~HIC_Counts['State'].isin(['MP', 'GU', 'VI', 'PR', 'Total'])]

In [211]:
row_count = HIC_Counts.shape[0]
print("Number of rows:", row_count)

Number of rows: 459


In [212]:
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)

In [213]:
HIC_Counts.dtypes

State                                                         object
Total Year-Round Beds (ES, TH, SH)                             int64
Total Non-DV Year-Round Beds (ES, TH, SH)                      int64
Total HMIS Year-Round Beds (ES, TH, SH)                        int64
HMIS Participation Rate for Year-Round Beds (ES, TH, SH)     float64
Total Year-Round Beds (ES)                                     int64
Total Year-Round Beds (TH)                                     int64
Total Year-Round Beds (SH)                                     int64
Total Units for Households with Children (ES, TH, SH)          int64
Total Beds for Households with Children (ES, TH, SH)           int64
Total Beds for Households without Children (ES, TH, SH)        int64
Total Beds for Households with only Children (ES, TH, SH)      int64
Total Year-Round Beds (ES).1                                   int64
Total Non-DV Year-Round Beds (ES)                              int64
Total HMIS Year-Round Beds (ES)   

In [214]:
participation_columns = ['HMIS Participation Rate for Year-Round Beds (ES, TH, SH)',
                         'HMIS Participation Rate for Year-Round Beds (ES)',
                         'HMIS Participation Rate for Year-Round Beds (TH)',
                         'HMIS Participation Rate for Year-Round Beds (SH)',
                         'HMIS Participation Rate for Year-Round Beds (RRH)',
                         'HMIS Participation Rate for Year-Round Beds (PSH)',
                         'HMIS Participation Rate for Year-Round Beds (OPH)']

# Replace '.' with NaN
HIC_Counts[participation_columns] = HIC_Counts[participation_columns].replace('.', np.nan)

# Convert to float
HIC_Counts[participation_columns] = HIC_Counts[participation_columns].astype(float)

In [215]:
missing_values = HIC_Counts.isnull().sum()
missing_values

State                                                          0
Total Year-Round Beds (ES, TH, SH)                             0
Total Non-DV Year-Round Beds (ES, TH, SH)                      0
Total HMIS Year-Round Beds (ES, TH, SH)                        0
HMIS Participation Rate for Year-Round Beds (ES, TH, SH)       0
Total Year-Round Beds (ES)                                     0
Total Year-Round Beds (TH)                                     0
Total Year-Round Beds (SH)                                     0
Total Units for Households with Children (ES, TH, SH)          0
Total Beds for Households with Children (ES, TH, SH)           0
Total Beds for Households without Children (ES, TH, SH)        0
Total Beds for Households with only Children (ES, TH, SH)      0
Total Year-Round Beds (ES).1                                   0
Total Non-DV Year-Round Beds (ES)                              0
Total HMIS Year-Round Beds (ES)                                0
HMIS Participation Rate f

In [216]:
HIC_Counts['HMIS Participation Rate for Year-Round Beds (OPH)'] = HIC_Counts['HMIS Participation Rate for Year-Round Beds (OPH)'].fillna('0%')
HIC_Counts['HMIS Participation Rate for Year-Round Beds (SH)'] = HIC_Counts['HMIS Participation Rate for Year-Round Beds (SH)'].fillna('0%')
HIC_Counts['HMIS Participation Rate for Year-Round Beds (RRH)'] = HIC_Counts['HMIS Participation Rate for Year-Round Beds (RRH)'].fillna('0%')

In [217]:
missing_values = HIC_Counts.isnull().sum()
missing_values

State                                                        0
Total Year-Round Beds (ES, TH, SH)                           0
Total Non-DV Year-Round Beds (ES, TH, SH)                    0
Total HMIS Year-Round Beds (ES, TH, SH)                      0
HMIS Participation Rate for Year-Round Beds (ES, TH, SH)     0
Total Year-Round Beds (ES)                                   0
Total Year-Round Beds (TH)                                   0
Total Year-Round Beds (SH)                                   0
Total Units for Households with Children (ES, TH, SH)        0
Total Beds for Households with Children (ES, TH, SH)         0
Total Beds for Households without Children (ES, TH, SH)      0
Total Beds for Households with only Children (ES, TH, SH)    0
Total Year-Round Beds (ES).1                                 0
Total Non-DV Year-Round Beds (ES)                            0
Total HMIS Year-Round Beds (ES)                              0
HMIS Participation Rate for Year-Round Beds (ES)       

In [218]:
southeast = {'AL', 'AR', 'FL', 'GA', 'KY', 'LA', 'MS', 'NC', 'SC', 'TN', 'VA', 'DC', 'WV'}
northeast = {'CT', 'DE', 'ME', 'MD', 'MA', 'NH', 'NJ', 'NY', 'PA', 'RI', 'VT', 'DC'}
west = {'AK', 'CA', 'CO', 'HI', 'ID', 'MT', 'NV', 'OR', 'UT', 'WA', 'WY'}
midwest = {'IL', 'IN', 'IA', 'KS', 'MI', 'MN', 'MO', 'NE', 'ND', 'OH', 'SD', 'WI'}
southwest = {'AZ', 'NM', 'OK', 'TX'}

state_to_region = {state: 'Southeast' for state in southeast}
state_to_region.update({state: 'Northeast' for state in northeast})
state_to_region.update({state: 'West' for state in west})
state_to_region.update({state: 'Midwest' for state in midwest})
state_to_region.update({state: 'Southwest' for state in southwest})

In [219]:
# Add Region column 
HIC_Counts['Region'] = HIC_Counts['State'].map(state_to_region)

#### Census Data 

In [220]:
census_data_pre2020 = pd.read_csv('Census2010_to_2019.csv', skiprows=3)

In [221]:
New_Labels = ['Geographic Area', 'Census', 'Estimates Base', '2010', '2011', '2012', '2013', '2014', '2015', '2016', '2017', '2018', '2019']
census_data_pre2020.columns = New_Labels

In [222]:
census_data_pre2020.head()

Unnamed: 0,Geographic Area,Census,Estimates Base,2010,2011,2012,2013,2014,2015,2016,2017,2018,2019
0,United States,308745538,308758105,309321666,311556874,313830990,315993715,318301008,320635163,322941311,324985539,326687501,328239523
1,Northeast,55317240,55318443,55380134,55604223,55775216,55901806,56006011,56034684,56042330,56059240,56046620,55982803
2,Midwest,66927001,66929725,66974416,67157800,67336743,67560379,67745167,67860583,67987540,68126781,68236628,68329004
3,South,114555744,114563030,114866680,116006522,117241208,118364400,119624037,120997341,122351760,123542189,124569433,125580448
4,West,71945553,71946907,72100436,72788329,73477823,74167130,74925793,75742555,76559681,77257329,77834820,78347268


In [223]:
census_data_post2020 = pd.read_csv('Census2020_to_2022.csv', skiprows=3)

In [224]:
New_Labels = ['Geographic Area', 'Estimates Base', '2020', '2021', '2022']
census_data_post2020.columns = New_Labels

In [225]:
census_data_post2020.head()

Unnamed: 0,Geographic Area,Estimates Base,2020,2021,2022
0,United States,331449520,331511512,332031554,333287557
1,Northeast,57609156,57448898,57259257,57040406
2,Midwest,68985537,68961043,68836505,68787595
3,South,126266262,126450613,127346029,128716192
4,West,78588565,78650958,78589763,78743364


In [226]:
census_data = census_data_pre2020.merge(census_data_post2020, on='Geographic Area')
census_data.head(10)

Unnamed: 0,Geographic Area,Census,Estimates Base_x,2010,2011,2012,2013,2014,2015,2016,2017,2018,2019,Estimates Base_y,2020,2021,2022
0,United States,308745538,308758105,309321666,311556874,313830990,315993715,318301008,320635163,322941311,324985539,326687501,328239523,331449520,331511512,332031554,333287557
1,Northeast,55317240,55318443,55380134,55604223,55775216,55901806,56006011,56034684,56042330,56059240,56046620,55982803,57609156,57448898,57259257,57040406
2,Midwest,66927001,66929725,66974416,67157800,67336743,67560379,67745167,67860583,67987540,68126781,68236628,68329004,68985537,68961043,68836505,68787595
3,South,114555744,114563030,114866680,116006522,117241208,118364400,119624037,120997341,122351760,123542189,124569433,125580448,126266262,126450613,127346029,128716192
4,West,71945553,71946907,72100436,72788329,73477823,74167130,74925793,75742555,76559681,77257329,77834820,78347268,78588565,78650958,78589763,78743364
5,.Alabama,4779736,4780125,4785437,4799069,4815588,4830081,4841799,4852347,4863525,4874486,4887681,4903185,5024356,5031362,5049846,5074296
6,.Alaska,710231,710249,713910,722128,730443,737068,736283,737498,741456,739700,735139,731545,733378,732923,734182,733583
7,.Arizona,6392017,6392288,6407172,6472643,6554978,6632764,6730413,6829676,6941072,7044008,7158024,7278717,7151507,7179943,7264877,7359197
8,.Arkansas,2915918,2916031,2921964,2940667,2952164,2959400,2967392,2978048,2989918,3001345,3009733,3017804,3011555,3014195,3028122,3045637
9,.California,37253956,37254519,37319502,37638369,37948800,38260787,38596972,38918045,39167117,39358497,39461588,39512223,39538245,39501653,39142991,39029342


In [227]:
state_abbr = {
    '.Alabama': 'AL',
    '.Alaska': 'AK',
    '.Arizona': 'AZ',
    '.Arkansas': 'AR',
    '.California': 'CA',
    '.Colorado': 'CO',
    '.Connecticut': 'CT',
    '.Delaware': 'DE',
    '.Florida': 'FL',
    '.Georgia': 'GA',
    '.Hawaii': 'HI',
    '.Idaho': 'ID',
    '.Illinois': 'IL',
    '.Indiana': 'IN',
    '.Iowa': 'IA',
    '.Kansas': 'KS',
    '.Kentucky': 'KY',
    '.Louisiana': 'LA',
    '.Maine': 'ME',
    '.Maryland': 'MD',
    '.Massachusetts': 'MA',
    '.Michigan': 'MI',
    '.Minnesota': 'MN',
    '.Mississippi': 'MS',
    '.Missouri': 'MO',
    '.Montana': 'MT',
    '.Nebraska': 'NE',
    '.Nevada': 'NV',
    '.New Hampshire': 'NH',
    '.New Jersey': 'NJ',
    '.New Mexico': 'NM',
    '.New York': 'NY',
    '.North Carolina': 'NC',
    '.North Dakota': 'ND',
    '.Ohio': 'OH',
    '.Oklahoma': 'OK',
    '.Oregon': 'OR',
    '.Pennsylvania': 'PA',
    '.Rhode Island': 'RI',
    '.South Carolina': 'SC',
    '.South Dakota': 'SD',
    '.Tennessee': 'TN',
    '.Texas': 'TX',
    '.Utah': 'UT',
    '.Vermont': 'VT',
    '.Virginia': 'VA',
    '.Washington': 'WA',
    '.West Virginia': 'WV',
    '.Wisconsin': 'WI',
    '.Wyoming': 'WY',
    '.District of Columbia': 'DC'
}

census_data['Geographic Area'] = census_data['Geographic Area'].map(state_abbr)

In [228]:
census_data.head(10)

Unnamed: 0,Geographic Area,Census,Estimates Base_x,2010,2011,2012,2013,2014,2015,2016,2017,2018,2019,Estimates Base_y,2020,2021,2022
0,,308745538,308758105,309321666,311556874,313830990,315993715,318301008,320635163,322941311,324985539,326687501,328239523,331449520,331511512,332031554,333287557
1,,55317240,55318443,55380134,55604223,55775216,55901806,56006011,56034684,56042330,56059240,56046620,55982803,57609156,57448898,57259257,57040406
2,,66927001,66929725,66974416,67157800,67336743,67560379,67745167,67860583,67987540,68126781,68236628,68329004,68985537,68961043,68836505,68787595
3,,114555744,114563030,114866680,116006522,117241208,118364400,119624037,120997341,122351760,123542189,124569433,125580448,126266262,126450613,127346029,128716192
4,,71945553,71946907,72100436,72788329,73477823,74167130,74925793,75742555,76559681,77257329,77834820,78347268,78588565,78650958,78589763,78743364
5,AL,4779736,4780125,4785437,4799069,4815588,4830081,4841799,4852347,4863525,4874486,4887681,4903185,5024356,5031362,5049846,5074296
6,AK,710231,710249,713910,722128,730443,737068,736283,737498,741456,739700,735139,731545,733378,732923,734182,733583
7,AZ,6392017,6392288,6407172,6472643,6554978,6632764,6730413,6829676,6941072,7044008,7158024,7278717,7151507,7179943,7264877,7359197
8,AR,2915918,2916031,2921964,2940667,2952164,2959400,2967392,2978048,2989918,3001345,3009733,3017804,3011555,3014195,3028122,3045637
9,CA,37253956,37254519,37319502,37638369,37948800,38260787,38596972,38918045,39167117,39358497,39461588,39512223,39538245,39501653,39142991,39029342


In [229]:
census_data = census_data.dropna(subset=['Geographic Area'])
census_data.head()

Unnamed: 0,Geographic Area,Census,Estimates Base_x,2010,2011,2012,2013,2014,2015,2016,2017,2018,2019,Estimates Base_y,2020,2021,2022
5,AL,4779736,4780125,4785437,4799069,4815588,4830081,4841799,4852347,4863525,4874486,4887681,4903185,5024356,5031362,5049846,5074296
6,AK,710231,710249,713910,722128,730443,737068,736283,737498,741456,739700,735139,731545,733378,732923,734182,733583
7,AZ,6392017,6392288,6407172,6472643,6554978,6632764,6730413,6829676,6941072,7044008,7158024,7278717,7151507,7179943,7264877,7359197
8,AR,2915918,2916031,2921964,2940667,2952164,2959400,2967392,2978048,2989918,3001345,3009733,3017804,3011555,3014195,3028122,3045637
9,CA,37253956,37254519,37319502,37638369,37948800,38260787,38596972,38918045,39167117,39358497,39461588,39512223,39538245,39501653,39142991,39029342


#### Adding Census Data to Housing Inventory Counts by State

In [230]:
HIC_Counts['Population'] = np.nan

In [231]:
for index, row in HIC_Counts.iterrows():
    state = row['State']
    year = row['Year']
    population = census_data.loc[census_data['Geographic Area'] == state, str(year)].values[0]
    HIC_Counts.at[index, 'Population'] = population

In [232]:
HIC_Counts.head()

Unnamed: 0,State,"Total Year-Round Beds (ES, TH, SH)","Total Non-DV Year-Round Beds (ES, TH, SH)","Total HMIS Year-Round Beds (ES, TH, SH)","HMIS Participation Rate for Year-Round Beds (ES, TH, SH)",Total Year-Round Beds (ES),Total Year-Round Beds (TH),Total Year-Round Beds (SH),"Total Units for Households with Children (ES, TH, SH)","Total Beds for Households with Children (ES, TH, SH)","Total Beds for Households without Children (ES, TH, SH)","Total Beds for Households with only Children (ES, TH, SH)",Total Year-Round Beds (ES).1,Total Non-DV Year-Round Beds (ES),Total HMIS Year-Round Beds (ES),HMIS Participation Rate for Year-Round Beds (ES),Total Seasonal Beds (ES),Total Overflow Beds (ES),Total Units for Households with Children (ES),Total Beds for Households with Children (ES),Total Beds for Households without Children (ES),Total Beds for Households with only Children (ES),Total Year-Round Beds (TH).1,Total Non-DV Year-Round Beds (TH),Total HMIS Year-Round Beds (TH),HMIS Participation Rate for Year-Round Beds (TH),Total Units for Households with Children (TH),Total Beds for Households with Children (TH),Total Beds for Households without Children (TH),Total Beds for Households with only Children (TH),Total Year-Round Beds (SH).1,Total Non-DV Year-Round Beds (SH),Total HMIS Year-Round Beds (SH),HMIS Participation Rate for Year-Round Beds (SH),Total Units for Households with Children (SH),Total Beds for Households with Children (SH),Total Beds for Households without Children (SH),Total Beds for Households with only Children (SH),Total Year-Round Beds (RRH),Total Non-DV Year-Round Beds (RRH),Total HMIS Year-Round Beds (RRH),HMIS Participation Rate for Year-Round Beds (RRH),Total Units for Households with Children (RRH),Total Beds for Households with Children (RRH),Total Beds for Households without Children (RRH),Total Beds for Households with only Children (RRH),Total Year-Round Beds (PSH),Total Non-DV Year-Round Beds (PSH),Total HMIS Year-Round Beds (PSH),HMIS Participation Rate for Year-Round Beds (PSH),Total Units for Households with Children (PSH),Total Beds for Households with Children (PSH),Total Beds for Households without Children (PSH),Total Beds for Households with only Children (PSH),Total Year-Round Beds (OPH),Total Non-DV Year-Round Beds (OPH),Total HMIS Year-Round Beds (OPH),HMIS Participation Rate for Year-Round Beds (OPH),Total Units for Households with Children (OPH),Total Beds for Households with Children (OPH),Total Beds for Households without Children (OPH),Total Beds for Households with only Children (OPH),Year,Region,Population
0,AK,1814,1382,1031,0.5684,1189,625,0,186,646,1117,51,1189,831,650,0.5467,20,122,117,401,766,22,625,551,381,0.6096,69,245,351,29,0,0,0,0%,0,0,0,0,158,158,158,1.0,30,123,35,0,715,715,715,1.0,55,167,548,0,0,0,0,0%,0,0,0,0,2014,West,736283
1,AL,3724,3212,1985,0.533,1838,1852,34,477,1394,2294,36,1838,1527,965,0.525,10,430,202,540,1276,22,1852,1651,986,0.5324,275,854,984,14,34,34,34,1.0,0,0,34,0,53,53,43,0.8113,11,39,14,0,2891,2891,1775,0.614,417,1206,1685,0,0,0,0,0%,0,0,0,0,2014,Southeast,4841799
2,AR,2151,1687,944,0.4389,1466,685,0,179,690,1428,33,1466,1114,559,0.3813,0,308,103,449,1002,15,685,573,385,0.562,76,241,426,18,0,0,0,0%,0,0,0,0,157,157,157,1.0,37,93,64,0,923,923,613,0.6641,122,331,592,0,22,16,16,0.7273,2,9,13,0,2014,Southeast,2967392
3,AZ,8873,7411,6063,0.6833,4481,4352,40,1418,4845,3983,45,4481,3305,2769,0.6179,229,434,636,2222,2231,28,4352,4066,3254,0.7477,782,2623,1712,17,40,40,40,1.0,0,0,40,0,441,345,344,0.78,117,339,102,0,7358,7358,5568,0.7567,836,2794,4564,0,707,707,47,0.0665,99,292,415,0,2014,Southwest,6730413
4,CA,44035,38960,31075,0.7057,17869,25959,207,5831,19739,23854,442,17869,15351,11796,0.6601,5300,1450,1827,6424,11065,380,25959,23402,19072,0.7347,4004,13315,12582,62,207,207,207,1.0,0,0,207,0,3504,3432,2938,0.8385,1097,3068,430,6,45580,45250,32954,0.723,4942,14412,31167,1,2516,2516,1763,0.7007,684,2110,406,0,2014,West,38596972


In [233]:
s = HIC_Counts.select_dtypes('number').columns

HIC_Counts_Per_Capita = pd.DataFrame(columns=s)

HIC_Counts['Population'] = HIC_Counts['Population'].str.replace(',', '').astype(float)

HIC_Counts_Per_Capita[s] = HIC_Counts[s].div(HIC_Counts['Population'].values, axis=0)

In [234]:
HIC_Counts_Per_Capita.head()

Unnamed: 0,"Total Year-Round Beds (ES, TH, SH)","Total Non-DV Year-Round Beds (ES, TH, SH)","Total HMIS Year-Round Beds (ES, TH, SH)","HMIS Participation Rate for Year-Round Beds (ES, TH, SH)",Total Year-Round Beds (ES),Total Year-Round Beds (TH),Total Year-Round Beds (SH),"Total Units for Households with Children (ES, TH, SH)","Total Beds for Households with Children (ES, TH, SH)","Total Beds for Households without Children (ES, TH, SH)","Total Beds for Households with only Children (ES, TH, SH)",Total Year-Round Beds (ES).1,Total Non-DV Year-Round Beds (ES),Total HMIS Year-Round Beds (ES),HMIS Participation Rate for Year-Round Beds (ES),Total Seasonal Beds (ES),Total Overflow Beds (ES),Total Units for Households with Children (ES),Total Beds for Households with Children (ES),Total Beds for Households without Children (ES),Total Beds for Households with only Children (ES),Total Year-Round Beds (TH).1,Total Non-DV Year-Round Beds (TH),Total HMIS Year-Round Beds (TH),HMIS Participation Rate for Year-Round Beds (TH),Total Units for Households with Children (TH),Total Beds for Households with Children (TH),Total Beds for Households without Children (TH),Total Beds for Households with only Children (TH),Total Year-Round Beds (SH).1,Total Non-DV Year-Round Beds (SH),Total HMIS Year-Round Beds (SH),Total Units for Households with Children (SH),Total Beds for Households with Children (SH),Total Beds for Households without Children (SH),Total Beds for Households with only Children (SH),Total Year-Round Beds (RRH),Total Non-DV Year-Round Beds (RRH),Total HMIS Year-Round Beds (RRH),Total Units for Households with Children (RRH),Total Beds for Households with Children (RRH),Total Beds for Households without Children (RRH),Total Beds for Households with only Children (RRH),Total Year-Round Beds (PSH),Total Non-DV Year-Round Beds (PSH),Total HMIS Year-Round Beds (PSH),HMIS Participation Rate for Year-Round Beds (PSH),Total Units for Households with Children (PSH),Total Beds for Households with Children (PSH),Total Beds for Households without Children (PSH),Total Beds for Households with only Children (PSH),Total Year-Round Beds (OPH),Total Non-DV Year-Round Beds (OPH),Total HMIS Year-Round Beds (OPH),Total Units for Households with Children (OPH),Total Beds for Households with Children (OPH),Total Beds for Households without Children (OPH),Total Beds for Households with only Children (OPH)
0,0.002464,0.001877,0.0014,7.719858e-07,0.001615,0.000849,0.0,0.000253,0.000877,0.001517,6.9e-05,0.001615,0.001129,0.000883,7.425134e-07,2.7e-05,0.000166,0.000159,0.000545,0.00104,3e-05,0.000849,0.000748,0.000517,8.279425e-07,9.4e-05,0.000333,0.000477,3.9e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000215,0.000215,0.000215,4.1e-05,0.000167,4.8e-05,0.0,0.000971,0.000971,0.000971,1.358173e-06,7.5e-05,0.000227,0.000744,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,0.000769,0.000663,0.00041,1.10083e-07,0.00038,0.000383,7e-06,9.9e-05,0.000288,0.000474,7e-06,0.00038,0.000315,0.000199,1.084308e-07,2e-06,8.9e-05,4.2e-05,0.000112,0.000264,5e-06,0.000383,0.000341,0.000204,1.099591e-07,5.7e-05,0.000176,0.000203,3e-06,7e-06,7e-06,7e-06,0.0,0.0,7e-06,0.0,1.1e-05,1.1e-05,9e-06,2e-06,8e-06,3e-06,0.0,0.000597,0.000597,0.000367,1.268124e-07,8.6e-05,0.000249,0.000348,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,0.000725,0.000569,0.000318,1.479077e-07,0.000494,0.000231,0.0,6e-05,0.000233,0.000481,1.1e-05,0.000494,0.000375,0.000188,1.284967e-07,0.0,0.000104,3.5e-05,0.000151,0.000338,5e-06,0.000231,0.000193,0.00013,1.893919e-07,2.6e-05,8.1e-05,0.000144,6e-06,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.3e-05,5.3e-05,5.3e-05,1.2e-05,3.1e-05,2.2e-05,0.0,0.000311,0.000311,0.000207,2.237992e-07,4.1e-05,0.000112,0.0002,0.0,7e-06,5e-06,5e-06,6.739925e-07,3e-06,4e-06,0.0
3,0.001318,0.001101,0.000901,1.015242e-07,0.000666,0.000647,6e-06,0.000211,0.00072,0.000592,7e-06,0.000666,0.000491,0.000411,9.180714e-08,3.4e-05,6.4e-05,9.4e-05,0.00033,0.000331,4e-06,0.000647,0.000604,0.000483,1.110927e-07,0.000116,0.00039,0.000254,3e-06,6e-06,6e-06,6e-06,0.0,0.0,6e-06,0.0,6.6e-05,5.1e-05,5.1e-05,1.7e-05,5e-05,1.5e-05,0.0,0.001093,0.001093,0.000827,1.1243e-07,0.000124,0.000415,0.000678,0.0,0.000105,0.000105,7e-06,1.470935e-05,4.3e-05,6.2e-05,0.0
4,0.001141,0.001009,0.000805,1.828382e-08,0.000463,0.000673,5e-06,0.000151,0.000511,0.000618,1.1e-05,0.000463,0.000398,0.000306,1.710238e-08,0.000137,3.8e-05,4.7e-05,0.000166,0.000287,1e-05,0.000673,0.000606,0.000494,1.903517e-08,0.000104,0.000345,0.000326,2e-06,5e-06,5e-06,5e-06,0.0,0.0,5e-06,0.0,9.1e-05,8.9e-05,7.6e-05,2.8e-05,7.9e-05,1.1e-05,1.554526e-07,0.001181,0.001172,0.000854,1.873204e-08,0.000128,0.000373,0.000807,2.590877e-08,6.5e-05,6.5e-05,4.6e-05,1.77216e-05,5.5e-05,1.1e-05,0.0


## Exploratory Data Analysis

In [235]:
HIC_Counts_Per_Capita_stats = HIC_Counts_Per_Capita.describe()
HIC_Counts_Per_Capita_stats

Unnamed: 0,"Total Year-Round Beds (ES, TH, SH)","Total Non-DV Year-Round Beds (ES, TH, SH)","Total HMIS Year-Round Beds (ES, TH, SH)","HMIS Participation Rate for Year-Round Beds (ES, TH, SH)",Total Year-Round Beds (ES),Total Year-Round Beds (TH),Total Year-Round Beds (SH),"Total Units for Households with Children (ES, TH, SH)","Total Beds for Households with Children (ES, TH, SH)","Total Beds for Households without Children (ES, TH, SH)","Total Beds for Households with only Children (ES, TH, SH)",Total Year-Round Beds (ES).1,Total Non-DV Year-Round Beds (ES),Total HMIS Year-Round Beds (ES),HMIS Participation Rate for Year-Round Beds (ES),Total Seasonal Beds (ES),Total Overflow Beds (ES),Total Units for Households with Children (ES),Total Beds for Households with Children (ES),Total Beds for Households without Children (ES),Total Beds for Households with only Children (ES),Total Year-Round Beds (TH).1,Total Non-DV Year-Round Beds (TH),Total HMIS Year-Round Beds (TH),HMIS Participation Rate for Year-Round Beds (TH),Total Units for Households with Children (TH),Total Beds for Households with Children (TH),Total Beds for Households without Children (TH),Total Beds for Households with only Children (TH),Total Year-Round Beds (SH).1,Total Non-DV Year-Round Beds (SH),Total HMIS Year-Round Beds (SH),Total Units for Households with Children (SH),Total Beds for Households with Children (SH),Total Beds for Households without Children (SH),Total Beds for Households with only Children (SH),Total Year-Round Beds (RRH),Total Non-DV Year-Round Beds (RRH),Total HMIS Year-Round Beds (RRH),Total Units for Households with Children (RRH),Total Beds for Households with Children (RRH),Total Beds for Households without Children (RRH),Total Beds for Households with only Children (RRH),Total Year-Round Beds (PSH),Total Non-DV Year-Round Beds (PSH),Total HMIS Year-Round Beds (PSH),HMIS Participation Rate for Year-Round Beds (PSH),Total Units for Households with Children (PSH),Total Beds for Households with Children (PSH),Total Beds for Households without Children (PSH),Total Beds for Households with only Children (PSH),Total Year-Round Beds (OPH),Total Non-DV Year-Round Beds (OPH),Total HMIS Year-Round Beds (OPH),Total Units for Households with Children (OPH),Total Beds for Households with Children (OPH),Total Beds for Households without Children (OPH),Total Beds for Households with only Children (OPH)
count,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0
mean,0.001368,0.001183,0.00097,2.726265e-07,0.000933,0.00043,6e-06,0.000204,0.000645,0.000709,1.4e-05,0.000933,0.000797,0.00066,2.639511e-07,8.2e-05,9e-05,0.00013,0.000425,0.000498,1e-05,0.00043,0.00038,0.000304,2.79141e-07,7.4e-05,0.000221,0.000205,4e-06,6e-06,6e-06,6e-06,2.485847e-09,5.189379e-09,6e-06,1.042471e-09,0.000426,0.000406,0.000385,0.00011,0.000332,9.4e-05,3.028103e-07,0.001173,0.001165,0.000895,2.910222e-07,0.000155,0.000447,0.000726,5.279138e-07,0.000189,0.000187,0.0001281912,4e-05,0.00012,7e-05,9.470181e-08
std,0.001427,0.001372,0.001324,3.070581e-07,0.001109,0.000401,7e-06,0.000246,0.000773,0.000714,1.6e-05,0.001109,0.001092,0.001072,3.086006e-07,0.00014,0.000245,0.000194,0.000628,0.000539,1e-05,0.000401,0.000365,0.000334,3.126388e-07,7.6e-05,0.000234,0.000198,9e-06,7e-06,7e-06,7e-06,3.810579e-08,8.017453e-08,7e-06,2.23342e-08,0.001054,0.00105,0.001023,0.000344,0.001004,8.4e-05,1.713368e-06,0.001767,0.001751,0.001475,2.90699e-07,0.000273,0.000866,0.000924,4.626542e-06,0.000764,0.000758,0.000584041,0.00019,0.000576,0.000212,5.390656e-07
min,0.000254,0.000193,9.9e-05,1.470585e-08,0.000166,7.6e-05,0.0,3.8e-05,9.7e-05,0.000154,0.0,0.000166,0.000108,4e-06,3.836157e-09,0.0,0.0,2.1e-05,8e-05,8.1e-05,0.0,7.6e-05,4.1e-05,8e-06,1.551634e-08,0.0,0.0,2.2e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000105,0.000102,2.4e-05,1.64296e-08,1.1e-05,3.5e-05,6.5e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25%,0.000806,0.000652,0.000482,8.166423e-08,0.000538,0.00023,0.0,0.0001,0.000331,0.00045,5e-06,0.000538,0.000417,0.000283,7.664974e-08,1.9e-05,2.4e-05,5.8e-05,0.000212,0.000304,4e-06,0.00023,0.000188,0.000134,8.587269e-08,3.2e-05,9.7e-05,0.00011,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.000148,0.000136,0.00013,3.1e-05,9.5e-05,4.2e-05,0.0,0.00059,0.000589,0.00041,1.000669e-07,6.6e-05,0.00018,0.000381,0.0,4e-06,4e-06,3.171029e-07,0.0,0.0,2e-06,0.0
50%,0.000984,0.000834,0.000639,1.335374e-07,0.00063,0.000336,5e-06,0.000135,0.000432,0.000521,9e-06,0.00063,0.000509,0.000409,1.320544e-07,4.9e-05,4.5e-05,7.9e-05,0.00026,0.000358,8e-06,0.000336,0.00029,0.000223,1.409772e-07,5.3e-05,0.000156,0.000158,1e-06,5e-06,5e-06,4e-06,0.0,0.0,5e-06,0.0,0.000243,0.000226,0.000217,5.3e-05,0.000169,6.9e-05,0.0,0.000834,0.000832,0.000609,1.607098e-07,0.000112,0.000297,0.000522,0.0,4.2e-05,3.7e-05,2.555543e-05,5e-06,1.6e-05,1.9e-05,0.0
75%,0.001343,0.001116,0.000875,3.264421e-07,0.000901,0.000498,8e-06,0.00021,0.000636,0.000705,1.7e-05,0.000901,0.000719,0.00054,3.152606e-07,9.7e-05,9e-05,0.000119,0.000346,0.000483,1.2e-05,0.000498,0.000458,0.000362,3.468031e-07,9.3e-05,0.000268,0.000229,4e-06,8e-06,8e-06,8e-06,0.0,0.0,8e-06,0.0,0.000377,0.000343,0.000338,8.5e-05,0.000262,0.000117,0.0,0.001244,0.001226,0.000953,3.63879e-07,0.000165,0.000468,0.000819,0.0,0.000108,0.000108,7.417279e-05,1.8e-05,5.5e-05,6.3e-05,0.0
max,0.012123,0.011591,0.011216,1.540883e-06,0.008861,0.003262,7.1e-05,0.002361,0.007362,0.006877,0.000141,0.008861,0.00875,0.008549,1.466241e-06,0.001268,0.0034,0.001725,0.005548,0.00525,6.6e-05,0.003262,0.003142,0.00267,1.720042e-06,0.000655,0.001814,0.001654,9.3e-05,7.1e-05,7.1e-05,7.1e-05,6.625096e-07,1.435483e-06,7.1e-05,4.784943e-07,0.0118,0.011714,0.01074,0.004042,0.011301,0.000579,2.262731e-05,0.021535,0.02134,0.018968,1.358173e-06,0.003099,0.009671,0.011864,9.441558e-05,0.009672,0.009597,0.007738876,0.002346,0.007081,0.002592,5.438251e-06


In [236]:
HIC_Counts_stats = HIC_Counts.describe()
HIC_Counts_stats

Unnamed: 0,"Total Year-Round Beds (ES, TH, SH)","Total Non-DV Year-Round Beds (ES, TH, SH)","Total HMIS Year-Round Beds (ES, TH, SH)","HMIS Participation Rate for Year-Round Beds (ES, TH, SH)",Total Year-Round Beds (ES),Total Year-Round Beds (TH),Total Year-Round Beds (SH),"Total Units for Households with Children (ES, TH, SH)","Total Beds for Households with Children (ES, TH, SH)","Total Beds for Households without Children (ES, TH, SH)","Total Beds for Households with only Children (ES, TH, SH)",Total Year-Round Beds (ES).1,Total Non-DV Year-Round Beds (ES),Total HMIS Year-Round Beds (ES),HMIS Participation Rate for Year-Round Beds (ES),Total Seasonal Beds (ES),Total Overflow Beds (ES),Total Units for Households with Children (ES),Total Beds for Households with Children (ES),Total Beds for Households without Children (ES),Total Beds for Households with only Children (ES),Total Year-Round Beds (TH).1,Total Non-DV Year-Round Beds (TH),Total HMIS Year-Round Beds (TH),HMIS Participation Rate for Year-Round Beds (TH),Total Units for Households with Children (TH),Total Beds for Households with Children (TH),Total Beds for Households without Children (TH),Total Beds for Households with only Children (TH),Total Year-Round Beds (SH).1,Total Non-DV Year-Round Beds (SH),Total HMIS Year-Round Beds (SH),Total Units for Households with Children (SH),Total Beds for Households with Children (SH),Total Beds for Households without Children (SH),Total Beds for Households with only Children (SH),Total Year-Round Beds (RRH),Total Non-DV Year-Round Beds (RRH),Total HMIS Year-Round Beds (RRH),Total Units for Households with Children (RRH),Total Beds for Households with Children (RRH),Total Beds for Households without Children (RRH),Total Beds for Households with only Children (RRH),Total Year-Round Beds (PSH),Total Non-DV Year-Round Beds (PSH),Total HMIS Year-Round Beds (PSH),HMIS Participation Rate for Year-Round Beds (PSH),Total Units for Households with Children (PSH),Total Beds for Households with Children (PSH),Total Beds for Households without Children (PSH),Total Beds for Households with only Children (PSH),Total Year-Round Beds (OPH),Total Non-DV Year-Round Beds (OPH),Total HMIS Year-Round Beds (OPH),Total Units for Households with Children (OPH),Total Beds for Households with Children (OPH),Total Beds for Households without Children (OPH),Total Beds for Households with only Children (OPH),Population
count,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0,459.0
mean,7925.978214,6978.405229,5740.398693,0.655189,5592.172113,2291.446623,42.359477,1205.339869,3862.936819,3992.019608,71.021786,5592.172113,4905.204793,4099.766885,0.63357,406.413943,411.442266,827.742919,2714.91939,2823.396514,53.856209,2291.446623,2031.664488,1601.525054,0.670389,377.570806,1147.962963,1126.328976,17.154684,42.359477,41.701525,39.106754,0.026144,0.054466,42.294118,0.010893,1946.185185,1824.172113,1736.187364,448.786492,1367.847495,577.08061,1.257081,6890.869281,6837.603486,5159.581699,0.737714,849.08061,2407.8061,4480.973856,2.089325,854.185185,843.488017,553.311547,163.67756,499.810458,353.694989,0.679739,6402224.0
std,13439.490045,12649.362802,11075.348538,0.156946,11520.308598,3066.697532,69.226539,2342.112482,7481.108415,6172.588401,89.627124,11520.308598,10972.801779,9924.162275,0.179344,702.546064,718.117312,2133.591959,6845.078501,4914.340645,70.33995,3066.697532,2752.49929,2183.908326,0.165514,493.668741,1558.22422,1586.347503,29.644989,69.226539,69.073818,60.927148,0.401107,0.840615,69.250499,0.23338,2949.96491,2807.805246,2718.79836,679.277852,1994.849655,1101.742574,5.797843,10449.391994,10361.60369,7355.914678,0.156401,1111.273949,3250.249646,7312.31837,8.864991,2040.442439,2025.102243,1275.091039,399.749218,1277.133096,919.579726,3.65843,7238600.0
min,560.0,383.0,106.0,0.0804,345.0,92.0,0.0,54.0,210.0,277.0,0.0,345.0,290.0,4.0,0.0041,0.0,0.0,27.0,104.0,194.0,0.0,92.0,32.0,6.0,0.0455,0.0,0.0,30.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,207.0,207.0,14.0,0.0673,9.0,27.0,54.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,577601.0
25%,2262.0,1685.0,1141.5,0.56815,1377.0,592.0,0.0,259.0,839.5,1166.5,16.0,1377.0,1078.5,790.0,0.53605,58.0,77.5,159.5,551.5,824.5,13.0,592.0,538.5,386.0,0.57895,92.0,268.0,284.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,373.5,345.5,314.0,77.0,243.5,104.5,0.0,1209.0,1206.0,899.5,0.6517,154.0,429.0,792.5,0.0,14.0,13.0,1.0,0.0,0.0,6.5,0.0,1786296.0
50%,3880.0,3348.0,2837.0,0.6728,2625.0,1453.0,18.0,500.0,1623.0,2318.0,38.0,2625.0,2132.0,1664.0,0.6578,242.0,212.0,277.0,971.0,1557.0,29.0,1453.0,1244.0,986.0,0.6979,216.0,658.0,673.0,5.0,18.0,16.0,16.0,0.0,0.0,17.0,0.0,1058.0,968.0,936.0,235.0,707.0,287.0,0.0,3347.0,3317.0,2657.0,0.7584,422.0,1207.0,2327.0,0.0,154.0,152.0,96.0,22.0,64.0,82.0,0.0,4461153.0
75%,7580.5,6591.5,5530.0,0.7562,4796.5,2738.5,55.5,1189.0,3734.0,4292.0,88.5,4796.5,4194.5,3616.0,0.7482,490.5,400.0,639.0,2196.0,2810.5,64.0,2738.5,2441.0,1878.0,0.7842,484.0,1373.5,1283.5,23.0,55.5,54.0,51.0,0.0,0.0,55.5,0.0,2445.5,2308.5,2187.5,560.5,1749.0,622.5,0.0,8203.0,8152.5,6684.0,0.8341,1161.5,3173.5,5103.0,0.0,658.5,655.5,387.5,107.5,328.5,315.5,0.0,7326984.0
max,89238.0,85088.0,81126.0,0.9549,83571.0,25959.0,634.0,17280.0,55035.0,41848.0,512.0,83571.0,79663.0,76549.0,0.9648,5722.0,6615.0,16618.0,53180.0,36323.0,383.0,25959.0,23402.0,19072.0,1.0,4004.0,13315.0,12632.0,253.0,634.0,632.0,453.0,7.0,15.0,634.0,5.0,29487.0,28568.0,28094.0,6364.0,17207.0,16496.0,75.0,72086.0,71913.0,55492.0,1.0,7001.0,20439.0,52164.0,72.0,22218.0,22197.0,14878.0,4690.0,16152.0,12167.0,36.0,39512220.0
