In [None]:
import pandas as pd
import numpy as np
import os

### [CDC Social Vulnerability Index](https://www.atsdr.cdc.gov/place-health/php/svi/svi-data-documentation-download.html)
Social vulnerability measures how susceptible social groups are to damage from natural hazards through death, injury, monetary loss, and disruption of livelihood.

Data is [downloaded](https://www.atsdr.cdc.gov/place-health/php/svi/svi-data-documentation-download.html) from and [documented](https://svi.cdc.gov/map25/data/docs/SVI2022Documentation_ZCTA.pdf) on the ATSDR CDC website. It is available at the census-tract level for the years 2000, 2010, 2014, 2016, 2018, 2020, and 2022.

In [None]:
# Build a long-format table of state-level SVI with one row per (state, year).
df_list = []
data_years = [2000, 2010, 2014, 2016, 2018, 2020, 2022]

# The 2000 and 2010 files name the overall-ranking and state columns
# differently; map them onto the names used by the other years.
legacy_columns = {
    2000: {'USTP': 'RPL_THEMES', 'STATE_NAME': 'STATE'},
    2010: {'R_PL_THEMES': 'RPL_THEMES', 'STATE_NAME': 'STATE'},
}

for yr in data_years:
    # read data
    print(yr)
    filename = 'data/SVI_Tract_Data/SVI_' + str(yr) + '_US.csv'
    df = pd.read_csv(filename)

    # clean data: keep only the two columns that are aggregated below
    df = df.rename(columns=legacy_columns.get(yr, {}))
    df = df[['STATE', 'RPL_THEMES']].replace(-999., np.nan)  # nan values are labelled -999
    # Vectorised .str methods pass missing state names through as NaN instead
    # of raising AttributeError the way a per-row x.strip() call would.
    df['STATE'] = df['STATE'].str.strip().str.title()  # reformat state strings

    # aggregate to state level
    df_mean = df.groupby('STATE').mean()  # RPL_THEMES overall percentile ranking
    df_mean['Year'] = yr
    df_list.append(df_mean)

# Stack the per-year frames and expose the state name as a regular column.
df_all = (
    pd.concat(df_list)
    .reset_index()
    .rename(columns={'RPL_THEMES': 'SVI', 'STATE': 'State'})
)

2000


FileNotFoundError: [Errno 2] No such file or directory: 'data/SVI_Tract_Data/SVI_2000_US.csv'

In [None]:
# Show the rows of df_all whose State is Virginia.
df_all[df_all['State'].eq("Virginia")]

Unnamed: 0,State,SVI,Year
46,Virginia,0.451728,2000
97,Virginia,0.395867,2010
148,Virginia,0.384048,2014
199,Virginia,0.38756,2016
250,Virginia,0.39453,2018
301,Virginia,0.411145,2020
352,Virginia,0.405825,2022


In [None]:
# Export is disabled: uncomment to write df_all to data/SVI_State.csv without the index column.
# df_all.to_csv('data/SVI_State.csv', index=False)

### [USC's Hazards and Vulnerability Research Institute Baseline Resilience Indicators for Communities](https://www.sc.edu/study/colleges_schools/artsandsciences/centers_and_institutes/hvri/data_and_resources/bric/)
The HVRI BRIC data is used to measure the ability of a community to prepare for, adapt to, and recover from natural hazards.

Data is [downloaded](https://www.sc.edu/study/colleges_schools/artsandsciences/centers_and_institutes/hvri/data_and_resources/bric/bric_data/index.php) from the HVRI website and the methods are documented in this [paper](https://www.sciencedirect.com/science/article/pii/S0959378014001459). Data is available at the county level for the years 2010, 2015, and 2020.

In [None]:
bric_path = 'data/BRIC_County_Data/'
# os.listdir returns entries in arbitrary order and also lists hidden files
# and sub-directories (e.g. .DS_Store, .ipynb_checkpoints). Keep only regular,
# non-hidden files and sort them so the loading loop is deterministic.
files = sorted(
    name for name in os.listdir(bric_path)
    if not name.startswith('.') and os.path.isfile(os.path.join(bric_path, name))
)

In [None]:
# Aggregate the county-level BRIC files to state-level means, producing one
# row per (state FIPS code, year).
# NOTE: this cell rebinds df_list and df_all, which the SVI section also uses,
# so df_all no longer refers to the SVI table once this cell has run.
df_list = []
for f in files:
    path = os.path.join(bric_path, f)
    df = pd.read_csv(path, encoding='latin-1')

    # NOTE(review): assumes characters 4-7 of the file name are the four-digit
    # data year -- confirm against the actual file names.
    yr = int(f[4:8])
    # The total-resilience column carries the year in its name; give it a
    # common name so every year can be stacked into one column.
    yr_name = 'TOT RESIL' + str(yr)
    df = df.rename(columns={yr_name: 'Resilience'})

    # Only the grouping key and the value column are selected, so a plain
    # mean() suffices. The previous mean('Resilience') passed the string
    # positionally as the numeric_only flag rather than as a column name.
    df_mean = df[['State Code (FIPS)', 'Resilience']].groupby('State Code (FIPS)').mean()
    df_mean['Year'] = yr
    df_list.append(df_mean)

# Stack the per-year frames and turn the FIPS code index back into a column.
df_all = pd.concat(df_list).reset_index()

In [None]:
# Display the combined table of mean resilience per state FIPS code and year.
df_all

Unnamed: 0,State Code (FIPS),Resilience,Year
0,1,3.050799,2010
1,4,2.468835,2010
2,5,2.963719,2010
3,6,2.896646,2010
4,8,3.001436,2010
...,...,...,...
146,51,2.611198,2020
147,53,2.598001,2020
148,54,2.537370,2020
149,55,2.726742,2020
