In [1]:
import pandas as pd
import plotly.express as px
from getpass import getpass
import chart_studio
import chart_studio.plotly as py

# Chart Studio account that the figures in this notebook are published under.
username = "mdong127"
# Ask for the API key interactively so it never appears in the notebook source.
# An explicit prompt replaces getpass()'s generic "Password: " label so it is
# clear that the Chart Studio API key (not the account password) is expected.
api_key = getpass(prompt="Chart Studio API key: ")
# NOTE(review): set_credentials_file appears to persist the credentials to the
# local Chart Studio config file, so this cell only needs to run once per
# machine -- confirm against the chart_studio documentation.
chart_studio.tools.set_credentials_file(username=username, api_key=api_key)

········


In [2]:
# Per-county feature table: residential waste tonnage, 2014 electricity usage
# and 2014 population (column names as shown in the preview below).
# NOTE(review): the preview shows an "Unnamed: 0" column holding 0, 1, 2, ...;
# it looks like a row index that was saved with the CSV -- confirm whether it
# should be read with index_col=0 instead.
complete_feature_df = pd.read_csv(
    "../data/complete_feature_df.csv",
)
# Preview the first five rows.
complete_feature_df.head(5)

Unnamed: 0,County,Total Residential Tons,Electricity Usage_2014,Population_2014
0,ALAMEDA,405147,2891.232325,1607792.0
1,ALPINE,291,11.974975,1080.0
2,AMADOR,8799,134.744387,36726.0
3,BUTTE,55883,718.947064,223516.0
4,CALAVERAS,11400,192.543967,44671.0


In [3]:
# Average every remaining column within each county and preview the first rows.
complete_feature_df.groupby("County").mean().head()

Unnamed: 0_level_0,Total Residential Tons,Electricity Usage_2014,Population_2014
County,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
ALAMEDA,405147,2891.232325,1607792.0
ALPINE,291,11.974975,1080.0
AMADOR,8799,134.744387,36726.0
BUTTE,55883,718.947064,223516.0
CALAVERAS,11400,192.543967,44671.0


In [21]:
# Display names for the raw column headers; plotly uses them for the axis
# titles, legend and hover text.
axis_labels = {
    "Total Residential Tons": "Total Residential Waste (Tons)",
    "Electricity Usage_2014": "Electricity Usage (gWh)",
    "Population_2014": "Population",
}

# Bubble chart of residential waste against electricity usage, with marker
# size driven by population and one color per county.
# Both axes are linear; px.scatter's log_x / log_y options are left off.
fig = px.scatter(
    complete_feature_df,
    x="Electricity Usage_2014",
    y="Total Residential Tons",
    size="Population_2014",
    color="County",
    hover_data=["County"],
    labels=axis_labels,
    title="CA County Waste vs Electricity Usage & Population (2014)",
)
fig.show()

In [22]:
# Upload the figure to Chart Studio under the given filename and open it in a
# browser; the call's return value (the figure URL) is the cell output.
py.plot(
    fig,
    filename='Waste-vs-Energy-Population',
    auto_open=True,
)

'https://plotly.com/~mdong127/59/'

---

## State / County Data

### Cal Recycle

- The Solid Waste Information System (SWIS) database contains information on solid waste facilities, operations, and disposal sites in California. It includes latitude, longitude, and the waste type processed.
- Source: https://www2.calrecycle.ca.gov/SolidWaste/Site/Search

In [37]:
# CalRecycle SWIS export of waste facilities (see the source link above).
# NOTE(review): as the preview shows, the CSV carries an "Unnamed: 0" column
# that looks like a saved row index -- confirm whether it is needed.
cal_waste_facilities = pd.read_csv(
    '../data/calrecycle-waste-facilities.csv',
)
# Preview the first three rows.
cal_waste_facilities.head(n=3)

Unnamed: 0,SWIS Number,Site Name,Activity,Waste Type,Site Is Archived,Site Operational Status,Site Regulatory Status,Site Type,Latitude,Longitude,Point of Contact,Activity Is Archived,Activity Operational Status,Activity Regulatory Status,Activity Category,Activity Classification
0,27-AA-0114,"Return to Earth, LLC",Agricultural Material Composting Operation,Agricultural,Yes,Closed,Surrendered,Non-Disposal Only,36.63163,-121.5477,Eric Kiruja,Yes,Closed,Surrendered,Composting,Solid Waste Operation
1,27-AA-0114,"Return to Earth, LLC",Agricultural Material Composting Operation,Green Materials,Yes,Closed,Surrendered,Non-Disposal Only,36.63163,-121.5477,Eric Kiruja,Yes,Closed,Surrendered,Composting,Solid Waste Operation
2,15-AA-0392,Demler Enterprises-Delano,Agricultural Material Composting Operation,Manure,No,Active,Notification,Non-Disposal Only,35.7588,-119.33784,Christine Karl,No,Active,Notification,Composting,Solid Waste Operation


---

## National Data

### EIA energy consumption

- Residential Energy consumption 
    - Totals and averages for each major end use: space heating, water heating, air-conditioning, refrigerators, and other (other appliances, electronics, and lighting)
    - Grouped by different categories like large census region, climate, housing type, etc.

- Source: https://www.eia.gov/consumption/residential/data/2015/index.php?view=consumption#by%20end%20uses
- Downloads as an Excel file with indentation in the index column, so exporting it directly to CSV scrambles the layout. The rows that have no observations simply separate the different categories.

In [31]:
# EIA residential energy table; the first CSV column (the row labels such as
# "All homes" or "Northeast") becomes the index.
us_region_energy_usage = pd.read_csv(
    '../data/eia-residential-energy-consumption.csv',
    index_col=0,
)
# Preview the first ten rows.
us_region_energy_usage.head(n=10)

Unnamed: 0,Total U.S.2 (Number of housing units (million)),Total Average energy expenditures \n(dollars per household using the end use),Space heating3,Water heating,Air condi-tioning,Refrig-erators,Other4
All homes,118.2,1856.0,543.0,296.0,265.0,103.0,714.0
Census region and division,,,,,,,
Northeast,21.0,2269.0,850.0,335.0,174.0,120.0,834.0
New England,5.6,2541.0,1046.0,379.0,127.0,124.0,926.0
Middle Atlantic,15.4,2169.0,779.0,318.0,188.0,118.0,800.0
Midwest,26.4,1760.0,604.0,246.0,148.0,99.0,681.0
East North Central,18.1,1762.0,612.0,247.0,140.0,101.0,676.0
West North Central,8.3,1757.0,587.0,243.0,166.0,96.0,691.0
South,44.4,1917.0,465.0,323.0,392.0,93.0,694.0
South Atlantic,23.5,1963.0,488.0,344.0,386.0,95.0,714.0


In [40]:
# Rows at positions 17 through 32 (all columns); in the output below this
# covers the urban/rural and metropolitan/micropolitan groupings.
us_region_energy_usage.iloc[17:33, :]

Unnamed: 0,Total U.S.2 (Number of housing units (million)),Total Average energy expenditures \n(dollars per household using the end use),Space heating3,Water heating,Air condi-tioning,Refrig-erators,Other4
Census urban/rural classification5,,,,,,,
Urban,94.7,1773.0,495.0,274.0,269.0,102.0,694.0
Urbanized area,82.2,1782.0,488.0,272.0,279.0,104.0,705.0
Urban cluster,12.5,1710.0,540.0,286.0,202.0,92.0,625.0
Rural,23.5,2190.0,737.0,382.0,253.0,105.0,791.0
Metropolitan or micropolitan statistical area,,,,,,,
In metropolitan statistical area,98.5,1840.0,520.0,287.0,274.0,105.0,723.0
In micropolitan statistical area,12.3,1861.0,626.0,325.0,195.0,91.0,657.0
Not in metropolitan or micropolitan statistical area,7.4,2050.0,714.0,368.0,270.0,96.0,688.0
Climate region6,,,,,,,


### BLS demographic information

- Income levels, expenditures by housing, transportation, food, etc. for major regions (Northeast, Midwest, South, West) and major cities for each region
- Source: https://www.bls.gov/cex/tables.htm#MSA

In [70]:
# Load the BLS consumer-expenditure table for the West and convert every
# column from formatted text to numbers.
#
# Steps:
#   1. Read the CSV with its first column (the expenditure item) as the index.
#   2. Drop rows in which every value is missing.
#   3. Strip every non-digit character from each cell.
#   4. Parse the remaining digit strings as numbers, raising on anything that
#      still cannot be parsed.
#
# regex=True is passed explicitly: pandas 2.0 changed the default of
# Series.str.replace to regex=False, under which r'\D+' is matched literally,
# nothing is stripped, and the to_numeric step fails on the formatted values.
#
# NOTE: r'\D+' also removes decimal points and minus signs, so a value such as
# "1.5" would become 15. The cleaned output shows whole numbers only, but
# verify this holds for the full file.
bls_consumer_expenditures_west = (
    pd.read_csv('../data/bls-consumer-expenditures-west.csv', index_col=0)
    .dropna(axis=0, how="all")
    .apply(lambda column: column.str.replace(r'\D+', '', regex=True))
    .apply(pd.to_numeric, errors='raise')
)
# Show rows at positions 25 through 39 of the cleaned table.
bls_consumer_expenditures_west.iloc[25:40]

Unnamed: 0_level_0,All consumer\nunits in the\nWest,Los\nAngeles,San\nFrancisco,San Diego,Seattle,Phoenix,Denver,Honolulu,Anchorage
Item,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
Household operations,1768,1647,3346,1862,2552,1668,2338,944,1281
Housekeeping supplies,746,673,674,674,765,821,729,871,967
Household furnishings and equipment,2238,1743,1545,2293,3175,2802,2492,1692,2444
Apparel and services,1989,2080,2427,2274,2915,2178,2156,1577,2653
Transportation,11210,10959,11103,11704,11506,12525,12331,8403,13313
Vehicle purchases (net outlay),4187,3435,3796,3334,3902,5890,4641,2865,5539
"Gasoline, other fuels, and motor oil",2397,2890,2123,2576,2290,2151,1943,1851,2363
Other vehicle expenses,3634,3723,3448,4291,3689,3750,4626,2543,3816
Public and other transportation,992,910,1736,1504,1625,734,1121,1143,1594
Healthcare,5005,4158,4898,4645,5140,5972,5977,4233,5179


In [69]:
# Summary statistics (count, mean, std, min, quartiles, max) for each column
# of the BLS expenditure table.
bls_consumer_expenditures_west.describe()

Unnamed: 0,All consumer\nunits in the\nWest,Los\nAngeles,San\nFrancisco,San Diego,Seattle,Phoenix,Denver,Honolulu,Anchorage
count,45.0,45.0,45.0,45.0,45.0,45.0,45.0,45.0,45.0
mean,7222.888889,6941.066667,9081.422222,7525.266667,8128.955556,6071.711111,7501.244444,6588.377778,7259.866667
std,16548.299572,16776.202053,24029.336317,18422.698955,20720.920913,14683.003646,19167.250934,16871.8508,17807.027088
min,2.0,3.0,4.0,2.0,2.0,5.0,2.0,5.0,3.0
25%,606.0,576.0,661.0,648.0,657.0,479.0,600.0,561.0,628.0
50%,1854.0,1743.0,1932.0,1658.0,2098.0,1566.0,1857.0,1376.0,1594.0
75%,5005.0,4593.0,5713.0,5153.0,5140.0,4560.0,4948.0,5345.0,5311.0
max,86301.0,90037.0,138041.0,97853.0,115137.0,74635.0,106128.0,95375.0,94235.0
