# Demographic, Economic & Behavioral Data Analysis and Exploration

## Introduction



In [72]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from bs4 import BeautifulSoup as bs
import requests as r
import lxml
import plotly.plotly as py
from plotly.offline import download_plotlyjs, init_notebook_mode, plot, iplot

# Initialise plotly's offline notebook mode (imported from plotly.offline
# above) so that the `iplot` call later in this notebook can render inline.
init_notebook_mode(connected=True)

# IPython magic: show matplotlib figures inline in the notebook output.
%matplotlib inline

## Religion per State

In [56]:
# `import lxml` alone does not load the `lxml.html` submodule, so import it
# explicitly here; otherwise `lxml.html.fromstring` can raise AttributeError
# when this cell runs before anything else has imported the submodule.
import lxml.html

# Read the saved religion page and parse it into an lxml HTML element tree.
with open(r'data/religions.html', "r") as f:
    page = f.read()
tree = lxml.html.fromstring(page)

In [81]:
# Load the first HTML table found in the saved page.
df_religion = pd.read_html('data/religions.html')[0]

# Assumes the table has exactly two columns (state, percentage); the
# assignment below raises if the column count differs.
df_religion.columns = ['state', 'percentage']

# Drop the "N." numbering from the state column, then trim the whitespace
# that the removed prefix may leave behind.
df_religion['state'] = (
    df_religion['state']
    .str.replace(r'[0-9]+\.', '', regex=True)
    .str.strip()
)

# Turn "56%" style strings into fractions (0.56). Parsing as float instead of
# int also accepts decimal percentages such as "45.5%"; for whole numbers the
# result is unchanged.
df_religion['percentage'] = (
    df_religion['percentage']
    .str.replace('%', '', regex=False)
    .astype(float)
    / 100
)

In [89]:
# Derived column: the `percentage` value scaled up by a factor of 10000.
df_religion['percentage2'] = df_religion['percentage'].mul(10000)

In [95]:
# Choropleth map of the per-state percentage held in df_religion.

# Custom sequential colour scale (light lavender -> dark purple), given as
# [position, colour] stops from 0.0 to 1.0.
scl = [
    [0.0, 'rgb(242,240,247)'],
    [0.2, 'rgb(218,218,235)'],
    [0.4, 'rgb(188,189,220)'],
    [0.6, 'rgb(158,154,200)'],
    [0.8, 'rgb(117,107,177)'],
    [1.0, 'rgb(84,39,143)'],
]

data = [dict(
    type='choropleth',
    colorscale=scl,
    # Must be False: with autocolorscale enabled plotly uses its default
    # palette and the custom `colorscale` above is ignored.
    autocolorscale=False,
    # NOTE(review): locationmode 'USA-states' expects two-letter state
    # abbreviations (e.g. 'CA'). Confirm that df_religion['state'] holds
    # abbreviations rather than full state names, otherwise nothing is drawn.
    locations=df_religion['state'],
    # `percentage` is stored as a fraction; plot it as a percent so the
    # values agree with the colorbar title.
    z=df_religion['percentage'].astype(float) * 100,
    locationmode='USA-states',
    text=df_religion['state'],
    # White borders between states.
    marker=dict(
        line=dict(
            color='rgb(255,255,255)',
            width=2,
        ),
    ),
    # The previous title ("Millions USD") was left over from a different
    # dataset and did not describe this data.
    colorbar=dict(title="Percent"),
)]

layout = dict(
    # The previous title described agriculture exports, not this dataset.
    title='Religion per US State<br>(Hover for details)',
    geo=dict(
        scope='usa',
        projection=dict(type='albers usa'),
        showlakes=True,
        lakecolor='rgb(255, 255, 255)',
    ),
)

fig = dict(data=data, layout=layout)
iplot(fig, filename='d3-cloropleth-map')