In [None]:
# Import packages
import pandas as pd
import matplotlib.pyplot as plt

In [None]:
# Load the EPA daily county-level AQI archives, one zipped CSV per year
url_2017 = "https://aqs.epa.gov/aqsweb/airdata/daily_aqi_by_county_2017.zip"
url_2018 = "https://aqs.epa.gov/aqsweb/airdata/daily_aqi_by_county_2018.zip"
aqi_17 = pd.read_csv(url_2017, compression='zip')
aqi_18 = pd.read_csv(url_2018, compression='zip')

In [None]:
# Stack the 2017 and 2018 records into a single data frame.
# Each yearly frame was read with its own default 0..n-1 row labels, so the
# rows are renumbered here to keep the combined index unique (duplicate
# labels would make label-based lookups on `aqi` ambiguous).
aqi = pd.concat([aqi_17, aqi_18], ignore_index=True)

In [None]:
# Normalise the headers to snake_case: lower-case first, then swap spaces
# for underscores
lowercase_names = aqi.columns.str.lower()
aqi.columns = lowercase_names.str.replace(' ', '_')

In [None]:
# Keep only the rows whose county is Santa Barbara
is_santa_barbara = aqi['county_name'] == "Santa Barbara"
aqi_sb = aqi[is_santa_barbara]

In [None]:
# Drop the state/county identifier columns from the Santa Barbara subset
location_columns = ['state_name', 'county_name', 'state_code', 'county_code']
aqi_sb = aqi_sb.drop(columns=location_columns)

In [None]:
# Convert the `date` column to datetime values.
# Bracket indexing is used instead of attribute access (`aqi_sb.date`):
# attribute-style column access can collide with DataFrame attributes and
# methods, and pandas recommends against using it for assignment.
aqi_sb['date'] = pd.to_datetime(aqi_sb['date'])

In [None]:
# Promote the `date` column to the row index of the data frame
aqi_sb = aqi_sb.set_index(keys='date')

In [None]:
# Store the 5-day rolling mean of AQI as a new `five_day_average` column.
# '5D' is a time-offset window, so it is measured against the frame's index
# rather than as a fixed number of rows.
five_day_window = aqi_sb['aqi'].rolling('5D')
aqi_sb['five_day_average'] = five_day_window.mean()

In [None]:
# Plot the daily AQI together with its 5-day rolling mean.
# `y=` already restricts the plot to the two listed columns, so no other
# column needs to be dropped beforehand. The Axes returned by pandas is
# configured directly instead of going through pyplot's implicit
# "current axes" state.
ax = aqi_sb.plot.line(y=['aqi', 'five_day_average'])
ax.set(
    title="AQI in Santa Barbara County 2017-2018",
    xlabel="Date",
    ylabel="AQI",
)
# Legend entries are given in the same order as the `y` columns above
ax.legend(['AQI', 'Five Day Average'])
# Render the figure explicitly so the cell does not echo the Legend repr
plt.show()