## Visualizing EPA EJSCREEN Data

### Step 1: Import software 

In [34]:
# Import software

import pandas as pd
import geopandas as gpd 
import matplotlib.pyplot as plt 
import contextily as ctx
import numpy as np
import quilt3
from geopandas_view import view 

In [35]:
### Step 3: Retrieve and Adjust Data

In [36]:
# Retrieve EPA EJSCREEN data from the UCR CGS Quilt bucket.
# The parquet file is fetched into the current working directory and then
# loaded into a pandas DataFrame.

# Single source of truth for the local copy, shared by the download and the read.
EJSCREEN_LOCAL_PATH = "./ejscreen_2020.parquet"

b = quilt3.Bucket("s3://spatial-ucr")
b.fetch("epa/ejscreen/ejscreen_2020.parquet", EJSCREEN_LOCAL_PATH)
ej = pd.read_parquet(EJSCREEN_LOCAL_PATH)

100%|██████████| 146M/146M [00:10<00:00, 14.6MB/s] 


In [None]:
# Load the 2018 ACS census block-group geometries straight from the
# spatial-ucr S3 bucket. Only the geometry column is requested.

geoms = gpd.read_parquet(
    's3://spatial-ucr/census/acs/acs_2018_bg.parquet',
    columns=['geometry'],
)

In [None]:
# Merge the EJSCREEN and ACS data sets: each EJSCREEN row is matched on its
# `ID` column against the index of the block-group geometries.
# Note: `ej` is rebound to the merged result here, so re-running this cell on
# its own merges the geometries a second time; re-run the load cell first.

ej_with_geometry = pd.merge(ej, geoms, left_on='ID', right_index=True)
ej = gpd.GeoDataFrame(ej_with_geometry)

In [None]:
# Keep only the California rows of the EJSCREEN data: those whose ID starts
# with '06' (California's state FIPS code, assuming ID is the block-group GEOID).

ca_ej = ej.loc[lambda frame: frame['ID'].str.startswith('06')]

### Step 4 (OPTIONAL): Download EJ Data Output (HTML)

In [None]:
# Delete the leading hashtags (#) on the lines below to run this command

# data, metadata = get_ipython().display_formatter.format(ej)
# with open('EJDataTable.html', 'w') as f:
#    f.write(data['text/html'])

### Step 5: Isolate EJ Index of Interest & Visualize

In [None]:
# Prepare the EJ Index for the air toxics respiratory hazard index (D_RESP_2)
# by converting the column to floats so it can be classified and mapped.

D_RESP_2 = ca_ej.D_RESP_2

# The literal string "None" is replaced with NaN before casting to float.
# `assign` returns a new frame instead of writing into `ca_ej` in place;
# `ca_ej` is a filtered slice of `ej`, and setting a column on such a slice
# triggers pandas' SettingWithCopyWarning.
ca_ej = ca_ej.assign(
    D_RESP_2=D_RESP_2.replace(to_replace="None", value=np.nan).astype(float)
)

In [None]:
# Subset the California data to Riverside County: rows whose ID starts with
# "06065" (state FIPS 06 + county FIPS 065, assuming ID is the block-group GEOID).

riverside = ca_ej.loc[lambda frame: frame['ID'].str.startswith("06065")]

In [None]:
# Visualize the Riverside County block groups, shaded by D_RESP_2 using a
# quantile classification scheme, with the D_RESP_2 value shown in the tooltip.

view(
    riverside,
    column='D_RESP_2',
    scheme='quantiles',
    tooltip=['D_RESP_2'],
)