In [None]:
import altair as alt
from vega_datasets import data
import pandas as pd

# Source: https://data.cdc.gov/NCHS/Provisional-COVID-19-Deaths-by-County-and-Race-and/k8wy-p9cg

# Load the CDC provisional COVID-19 deaths-by-county table.
df = pd.read_csv('Provisional_COVID-19_Deaths_by_County__and_Race_and_Hispanic_Origin.csv')

# Keep only the first row for each FIPS code so that every county shape
# joins to a single record in the lookup below.
df = df.drop_duplicates(subset=['FIPS Code'])

# County boundaries from the US 10m TopoJSON shipped with vega_datasets.
counties = alt.topo_feature(data.us_10m.url, 'counties')
source = df

# Both layers share one view, so they must declare the same size; differing
# sizes either misalign the layers or are rejected when the chart is layered.
MAP_WIDTH = 900
MAP_HEIGHT = 600

# Hovering a county selects it by its `id`; nothing is selected otherwise.
highlight = alt.selection_single(on='mouseover', fields=['id'], empty='none')

# Choropleth: the hovered county is red, every other county is coloured by
# its COVID-19 death count pulled in from `source` via the FIPS code.
plot = alt.Chart(counties).mark_geoshape().encode(
    color=alt.condition(highlight, alt.value('red'), 'COVID-19 Deaths:Q'),
    tooltip=['County Name:O', 'COVID-19 Deaths:Q']
).transform_lookup(
    lookup='id',
    from_=alt.LookupData(source, 'FIPS Code', ['COVID-19 Deaths', 'County Name'])
).add_selection(highlight).project(
    type='albersUsa'
).properties(
    width=MAP_WIDTH,
    height=MAP_HEIGHT
)

# Transparent county shapes with a blue stroke, drawn on top of the
# choropleth so the county borders stay visible.
outline = alt.Chart(counties).mark_geoshape(stroke='blue', fillOpacity=0).project(
    type='albersUsa'
).properties(
    width=MAP_WIDTH,
    height=MAP_HEIGHT
)

alt.layer(plot, outline)

In [None]:
import altair as alt
from vega_datasets import data


# Click-and-drag interval selection shared by the two charts below.
brush = alt.selection(type='interval')

print("INSTRUCTIONS: Drag and drop a box over the scatterplot to change data displayed in the histogram")

# Scatterplot of COVID-19 deaths per urban/rural category; the brush is
# drawn on this chart.
# TODO: possible change - x = covid deaths, y = vaccination data.
points = (
    alt.Chart(source)
    .mark_point()
    .encode(
        alt.X('COVID-19 Deaths'),
        alt.Y('Urban Rural Description'),
    )
    .add_selection(brush)
)

# Bar chart over the same two fields, restricted to the rows currently
# inside the brush.
# TODO: possible change - vaccination rate by county or something similar.
bars = (
    alt.Chart(source)
    .mark_bar()
    .encode(
        alt.X('COVID-19 Deaths'),
        alt.Y('Urban Rural Description'),
    )
    .transform_filter(brush)
)

# Stack the scatterplot above the bar chart.
alt.vconcat(points, bars)

INSTRUCTIONS: Drag and drop a box over the scatterplot to change data displayed in the histogram


## **2a. Provide a brief statement about your stakeholders, which informed your decision to select the particular chart (idiom) for your Personal Visualization.**

For our universal visualization, we chose a map showing COVID-19 deaths per county. This is useful to our stakeholders because it lets them compare their own county's death toll with those of neighboring counties and of counties across the United States. Ideally, this map helps them confirm that their county is not a massive outlier in this regard.

For our personalized visualization, we wanted to show which types of areas are associated with more or fewer COVID-19 deaths. On top, we used a scatter plot to show the distribution of counties within each county type so that outliers can be seen clearly. On the bottom is a more typical bar chart that shows the overall trend of the data. This helps our stakeholders better understand what death tolls look like in different types of population centers, and lets them place their own population zone in context with the others so that they know what numbers to expect.

In conjunction, these graphs let our stakeholders determine whether their county is an outlier or on equal footing with other counties. This data could help them show the government that they need more or fewer supplies to deal with the mounting problems the virus brings.
