## Create EDD Dataframes for multiple years

### Summary of notebook:
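- Create cut-down EDD dataframes, one per year, for 2014 through 2020.
- Maintenance: when EDD releases a new Current Employment Statistics file, update the path loaded below (currently `data/edd/Current_EDD_1121.csv`).
- Outputs: one EDD dataframe and one CSV file (`data/edd/edd_<year>.csv`) for each year.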

In [1]:
import pandas as pd
import numpy as np
from jqi_functions import *

#### Load necessary data

In [2]:
# EDD Current Employment Statistics extract. Point this path at the newer
# file whenever EDD publishes a fresh release.
edd = pd.read_csv(filepath_or_buffer='data/edd/Current_EDD_1121.csv')

In [3]:
# Industry-title crosswalk table; handed to clean_edd() further down.
edd_crosswalk = pd.read_csv(
    filepath_or_buffer='data/edd/Industry_Title_Crosswalk.csv'
)

In [4]:
# County-to-region lookup key; handed to clean_edd() further down.
county_info = pd.read_csv(
    filepath_or_buffer='data/county_to_regions_key.csv'
)

In [5]:
# EDD-to-IPUMS crosswalk table; handed to clean_edd() further down.
edd_to_ipums_crosswalk = pd.read_csv(
    filepath_or_buffer='data/edd/edd_to_ipums_crosswalk.csv'
)

In [6]:
# Run the project's cleaning helper over the raw EDD frame together with the
# three lookup tables loaded above.
# NOTE: this rebinds `edd` to the cleaned result, so re-running this cell
# without first re-running the load cell feeds already-cleaned data back in.
edd = clean_edd(
    edd,
    edd_crosswalk,
    edd_to_ipums_crosswalk,
    county_info,
)

#### Separate by year

In [7]:
# Slice the cleaned frame into one independent copy per calendar year,
# newest first (2020 down to 2014). `.copy()` detaches each slice from `edd`.
(edd_2020, edd_2019, edd_2018, edd_2017,
 edd_2016, edd_2015, edd_2014) = (
    edd.loc[edd['Year'] == year].copy()
    for year in range(2020, 2013, -1)
)

In [8]:
# Preview the first five rows of the 2020 slice as a quick sanity check.
edd_2020.head(n=5)

Unnamed: 0,Area Type,Area Name,Year,Month,Date,Series Code,Seasonally Adjusted,Current Employment,Industry Title,COUNTYFIP,County,Rural/Urban,CERF Regions,Crosswalk Value
72,County,Alameda,2020,January,01/01/2020,70710000,N,12300,arts entertainment and recreation,1,Alameda,Urban,Bay Area,30
73,County,Alameda,2020,February,02/01/2020,70710000,N,12500,arts entertainment and recreation,1,Alameda,Urban,Bay Area,30
74,County,Alameda,2020,March,03/01/2020,70710000,N,12200,arts entertainment and recreation,1,Alameda,Urban,Bay Area,30
75,County,Alameda,2020,April,04/01/2020,70710000,N,5400,arts entertainment and recreation,1,Alameda,Urban,Bay Area,30
76,County,Alameda,2020,May,05/01/2020,70710000,N,5900,arts entertainment and recreation,1,Alameda,Urban,Bay Area,30


In [9]:
# Apply filter_edd() to every yearly frame with the same set of series codes.
# NOTE(review): `region_series_codes` is not defined in this notebook;
# presumably it arrives via `from jqi_functions import *` -- confirm.
# Each name is rebound to its filtered result, so this cell is not idempotent:
# re-running it filters the already-filtered frames again.
(edd_2020, edd_2019, edd_2018, edd_2017,
 edd_2016, edd_2015, edd_2014) = (
    filter_edd(year_frame, region_series_codes)
    for year_frame in (
        edd_2020, edd_2019, edd_2018, edd_2017,
        edd_2016, edd_2015, edd_2014,
    )
)

#### Export outputs

In [10]:
# Write each filtered yearly frame to its own CSV, without the index column.
# The mapping keeps the destination path next to the frame it receives.
csv_targets = {
    'data/edd/edd_2020.csv': edd_2020,
    'data/edd/edd_2019.csv': edd_2019,
    'data/edd/edd_2018.csv': edd_2018,
    'data/edd/edd_2017.csv': edd_2017,
    'data/edd/edd_2016.csv': edd_2016,
    'data/edd/edd_2015.csv': edd_2015,
    'data/edd/edd_2014.csv': edd_2014,
}
for csv_path, year_frame in csv_targets.items():
    year_frame.to_csv(csv_path, index=False)