# AHRF Data Analysis

## Setup
Setup environment and initialize data analyzer class.

In [4]:
import plotly.figure_factory as ff
import plotly.graph_objs as go
from plotly.offline import download_plotlyjs, init_notebook_mode, iplot
from IPython.display import IFrame
from ahrf_analysis import AHRFDataAnalyzer

# Setup global variables

DATA_DIR = '../data'
ASC_FILE = '{}/ahrf2018.asc'.format(DATA_DIR)
SAS_FILE = '{}/AHRF2017-18.sas'.format(DATA_DIR)
NAME = 'State Name'
STATE = 'FIPS State Code'
COUNTY = 'FIPS County Code'
FIPS = 'FIPS'
NE = ('Connecticut', 'Maine', 'Massachusetts', 'New Hampshire', 'Rhode Island', 'Vermont')

init_notebook_mode(connected=True)

# Initialize analyzer object

analyzer = AHRFDataAnalyzer(ASC_FILE, SAS_FILE)

## Data parsing
Read fixed-width AHRF data file and parse into respective CSV files.

In [2]:
analyzer.parse_data()

CHECK!!!


## Data plotting

In [7]:
def plot_data(fips, values, states, column, category):
    """
    Build geocoded choropleth map of <column> data by county for selected <states>.
    """
    fig = go.Choropleth(fips=fips,
                               values=values,
                               scope=states,
                               show_state_data=True,
                               round_legend_values=True,
                               legend_title=column,
                               exponent_format=True)
    iplot(fig, filename='choropleth_map_{}'.format(category))

## Environmental data

Load environmental data and plot map for selected state(s).

In [8]:
# Column in 'ahrf2018_env.csv' file to plot
column = 'Population Density per Sq Mile 2010'
# States to analyze
states = NE

geocodes, results = analyzer.get_environmental_data(column=column, states=states)
plot_data(geocodes, results, states, column, 'env')

ValueError: Invalid properties specified for object of type plotly.graph_objs.Choropleth: ('fips', 'values', 'scope', 'show_state_data', 'round_legend_values', 'legend_title', 'exponent_format')

    Valid properties:
        autocolorscale
            Determines whether the colorscale is a default palette
            (`autocolorscale: true`) or the palette determined by
            `colorscale`. In case `colorscale` is unspecified or
            `autocolorscale` is true, the default  palette will be
            chosen according to whether numbers in the `color`
            array are all positive, all negative or mixed.
        colorbar
            plotly.graph_objs.choropleth.ColorBar instance or dict
            with compatible properties
        colorscale
            Sets the colorscale. The colorscale must be an array
            containing arrays mapping a normalized value to an rgb,
            rgba, hex, hsl, hsv, or named color string. At minimum,
            a mapping for the lowest (0) and highest (1) values are
            required. For example, `[[0, 'rgb(0,0,255)', [1,
            'rgb(255,0,0)']]`. To control the bounds of the
            colorscale in color space, use`zmin` and `zmax`.
            Alternatively, `colorscale` may be a palette name
            string of the following list: Greys,YlGnBu,Greens,YlOrR
            d,Bluered,RdBu,Reds,Blues,Picnic,Rainbow,Portland,Jet,H
            ot,Blackbody,Earth,Electric,Viridis,Cividis.
        customdata
            Assigns extra data each datum. This may be useful when
            listening to hover, click and selection events. Note
            that, "scatter" traces also appends customdata items in
            the markers DOM elements
        customdatasrc
            Sets the source reference on plot.ly for  customdata .
        geo
            Sets a reference between this trace's geospatial
            coordinates and a geographic map. If "geo" (the default
            value), the geospatial coordinates refer to
            `layout.geo`. If "geo2", the geospatial coordinates
            refer to `layout.geo2`, and so on.
        hoverinfo
            Determines which trace information appear on hover. If
            `none` or `skip` are set, no information is displayed
            upon hovering. But, if `none` is set, click and hover
            events are still fired.
        hoverinfosrc
            Sets the source reference on plot.ly for  hoverinfo .
        hoverlabel
            plotly.graph_objs.choropleth.Hoverlabel instance or
            dict with compatible properties
        hovertemplate
            Template string used for rendering the information that
            appear on hover box. Note that this will override
            `hoverinfo`. Variables are inserted using %{variable},
            for example "y: %{y}". Numbers are formatted using
            d3-format's syntax %{variable:d3-format}, for example
            "Price: %{y:$.2f}". See https://github.com/d3/d3-format
            /blob/master/README.md#locale_format for details on the
            formatting syntax. The variables available in
            `hovertemplate` are the ones emitted as event data
            described at this link
            https://plot.ly/javascript/plotlyjs-events/#event-data.
            Additionally, every attributes that can be specified
            per-point (the ones that are `arrayOk: true`) are
            available.  Anything contained in tag `<extra>` is
            displayed in the secondary box, for example
            "<extra>{fullData.name}</extra>".
        hovertemplatesrc
            Sets the source reference on plot.ly for  hovertemplate
            .
        hovertext
            Same as `text`.
        hovertextsrc
            Sets the source reference on plot.ly for  hovertext .
        ids
            Assigns id labels to each datum. These ids for object
            constancy of data points during animation. Should be an
            array of strings, not numbers or any other type.
        idssrc
            Sets the source reference on plot.ly for  ids .
        legendgroup
            Sets the legend group for this trace. Traces part of
            the same legend group hide/show at the same time when
            toggling legend items.
        locationmode
            Determines the set of locations used to match entries
            in `locations` to regions on the map.
        locations
            Sets the coordinates via location IDs or names. See
            `locationmode` for more info.
        locationssrc
            Sets the source reference on plot.ly for  locations .
        marker
            plotly.graph_objs.choropleth.Marker instance or dict
            with compatible properties
        name
            Sets the trace name. The trace name appear as the
            legend item and on hover.
        opacity
            Sets the opacity of the trace.
        reversescale
            Reverses the color mapping if true. If true, `zmin`
            will correspond to the last color in the array and
            `zmax` will correspond to the first color.
        selected
            plotly.graph_objs.choropleth.Selected instance or dict
            with compatible properties
        selectedpoints
            Array containing integer indices of selected points.
            Has an effect only for traces that support selections.
            Note that an empty array means an empty selection where
            the `unselected` are turned on for all points, whereas,
            any other non-array values means no selection all where
            the `selected` and `unselected` styles have no effect.
        showlegend
            Determines whether or not an item corresponding to this
            trace is shown in the legend.
        showscale
            Determines whether or not a colorbar is displayed for
            this trace.
        stream
            plotly.graph_objs.choropleth.Stream instance or dict
            with compatible properties
        text
            Sets the text elements associated with each location.
        textsrc
            Sets the source reference on plot.ly for  text .
        uid
            Assign an id to this trace, Use this to provide object
            constancy between traces during animations and
            transitions.
        uirevision
            Controls persistence of some user-driven changes to the
            trace: `constraintrange` in `parcoords` traces, as well
            as some `editable: true` modifications such as `name`
            and `colorbar.title`. Defaults to `layout.uirevision`.
            Note that other user-driven trace attribute changes are
            controlled by `layout` attributes: `trace.visible` is
            controlled by `layout.legend.uirevision`,
            `selectedpoints` is controlled by
            `layout.selectionrevision`, and `colorbar.(x|y)`
            (accessible with `config: {editable: true}`) is
            controlled by `layout.editrevision`. Trace changes are
            tracked by `uid`, which only falls back on trace index
            if no `uid` is provided. So if your app can add/remove
            traces before the end of the `data` array, such that
            the same trace has a different index, you can still
            preserve user-driven changes if you give each trace a
            `uid` that stays with it as it moves.
        unselected
            plotly.graph_objs.choropleth.Unselected instance or
            dict with compatible properties
        visible
            Determines whether or not this trace is visible. If
            "legendonly", the trace is not drawn, but can appear as
            a legend item (provided that the legend itself is
            visible).
        z
            Sets the color values.
        zauto
            Determines whether or not the color domain is computed
            with respect to the input data (here in `z`) or the
            bounds set in `zmin` and `zmax`  Defaults to `false`
            when `zmin` and `zmax` are set by the user.
        zmax
            Sets the upper bound of the color domain. Value should
            have the same units as in `z` and if set, `zmin` must
            be set as well.
        zmid
            Sets the mid-point of the color domain by scaling
            `zmin` and/or `zmax` to be equidistant to this point.
            Value should have the same units as in `z`. Has no
            effect when `zauto` is `false`.
        zmin
            Sets the lower bound of the color domain. Value should
            have the same units as in `z` and if set, `zmax` must
            be set as well.
        zsrc
            Sets the source reference on plot.ly for  z .
        

## Expenses data

Load expenses data and plot map for selected state(s).

In [None]:
# Column in 'ahrf2018_exps.csv' file to plot
column = 'Total Actual Medicare Costs Fee for Service 2015'
# States to analyze
states = NE

analyzer.get_expenses_data(column=column, states=states)

## Utilization data

Load utilization data and plot map for selected state(s).

In [None]:
# Column in 'ahrf2018_util.csv' file to plot
column = 'Inpatient Days Incl Nurs Home;Total Hosp 2016'
# States to analyze
states = NE

analyzer.get_utilization_data(column=column, states=states)

## Population data

Load population data and plot map for selected state(s).

In [None]:
# Column in 'ahrf2018_pop.csv' file to plot
column = 'Census Population 2010'
# States to analyze
states = NE

analyzer.get_population_data(column=column, states=states)

## Professions data

Load professions data and plot map for selected state(s).

In [3]:
# Column in 'ahrf2018_prof.csv' file to plot
column = 'Total Active M.D.s Non-Federal 2016'
# States to analyze
states = NE

analyzer.get_professions_data(column=column, states=states)

High five! You successfully sent some data to your account on plotly. View your plot in your browser at https://plot.ly/~jnalviano/0 or inside your plot.ly account where it is named 'choropleth_full_usa'


(array(['009001', '009003', '009005', '009007', '009009', '009011',
        '009013', '009015', '023001', '023003', '023005', '023007',
        '023009', '023011', '023013', '023015', '023017', '023019',
        '023021', '023023', '023025', '023027', '023029', '023031',
        '025001', '025003', '025005', '025007', '025009', '025011',
        '025013', '025015', '025017', '025019', '025021', '025023',
        '025025', '025027', '033001', '033003', '033005', '033007',
        '033009', '033011', '033013', '033015', '033017', '033019',
        '044001', '044003', '044005', '044007', '044009', '050001',
        '050003', '050005', '050007', '050009', '050011', '050013',
        '050015', '050017', '050019', '050021', '050023', '050025',
        '050027'], dtype=object),
 array([3.7270e+03, 3.8260e+03, 3.1700e+02, 4.2100e+02, 4.8380e+03,
        5.6900e+02, 1.7700e+02, 1.2400e+02, 2.4500e+02, 1.3500e+02,
        1.6150e+03, 4.6000e+01, 1.4600e+02, 3.1900e+02, 1.0400e+02,
        6.7000