# How has the COVID-19 pandemic affected air quality and single-use plastic waste in the U.S.?

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import statsmodels.api as sm
from statsmodels.formula.api import ols
import statsmodels
from scipy import stats
from pingouin import pairwise_ttests #this is for performing the pairwise tests

<p>The following datasets are taken from the Federal Reserve Bank of St. Louis (FRED) plastics manufacturing and trade series:
https://fred.stlouisfed.org/searchresults/?st=plastic&t=plastics%3Bmonthly%3Btrade&rt=trade&ob=sr

Note: U.S. recessions should probably be taken into account as a confounding factor.</p>

In [5]:
# Load the FRED plastics series: one CSV per series, each read from the parent
# directory into its own DataFrame. Every entry below lists the series title,
# its index base / seasonal adjustment, and any known data-quality issue.

# Plastic packaging products
#   Series: Producer Price Index by Commodity: Rubber and Plastic Products: Plastic Packaging Products
#   Index:  Dec 2006 = 100, not seasonally adjusted
Plastic_packaging = pd.read_csv("../WPU072A.csv")

# Recyclable plastics (material recyclers, by industry)
#   Series: Producer Price Index by Industry: Material Recyclers: Recyclable Plastics
#   Index:  Jun 1996 = 100, not seasonally adjusted
#   TODO:   gap in the data between roughly January 2004 and roughly June 2004;
#           might need to impute.
Recyclers_recyclable_plastics = pd.read_csv("../PCU42993042993042.csv")

# Recyclable plastics (by commodity)
#   Series: Producer Price Index by Commodity: Rubber and Plastic Products: Recyclable Plastics
#   Index:  Dec 2011 = 100, not seasonally adjusted
Rubber_and_Plastic_recyclable_plastics = pd.read_csv("../WPU072C.csv")

# Plastics material and resins manufacturing (prices)
#   Series: Producer Price Index by Industry: Plastics Material and Resins Manufacturing
#   Index:  Dec 1980 = 100, not seasonally adjusted
Plastic_and_resin = pd.read_csv("../PCU325211325211.csv")

# Coextruded single-web film for flexible packaging
#   Series: Producer Price Index by Industry: Plastics Packaging Film and Sheet Manufacturing:
#           Coextruded Single-Web Film, for Flexible Packaging Uses
#   Index:  Jun 2007 = 100, not seasonally adjusted
Plastic_film_and_sheet = pd.read_csv("../PCU32611232611212.csv")

# Unlaminated polyethylene film and sheet
#   Series: Producer Price Index by Commodity: Rubber and Plastic Products:
#           Unlaminated Polyethylene Film and Sheet
#   Index:  Jun 1993 = 100, not seasonally adjusted
#   TODO:   data missing from June 2007 until July 2013; impute?
Unlam_poly_film_and_sheet = pd.read_csv("../WPU072205011.csv")

# Packaging polyurethane foam products
#   Series: Producer Price Index by Commodity: Rubber and Plastic Products:
#           Packaging Polyurethane Foam Products
#   Index:  Dec 2009 = 100, not seasonally adjusted
#   TODO:   data missing in the interval May-June 2018; need to impute?
Polyurethane_foam = pd.read_csv("../WPU072A01013.csv")

# Plastics material and resin (production volume, not prices)
#   Series: Industrial Production: Manufacturing: Non-Durable Goods: Plastics Material and Resin
#   Index:  2012 = 100, seasonally adjusted
Plastic_and_resin_manu = pd.read_csv("../IPN325211S.csv")

# Unlaminated vinyl and vinyl copolymer film and sheet
#   Series: Producer Price Index by Commodity: Rubber and Plastic Products:
#           Unlaminated Vinyl and Vinyl Copolymer Film and Sheet
#   Index:  Dec 2011 = 100, not seasonally adjusted
Vinyl_film_and_sheet = pd.read_csv("../WPU072205013.csv")

# Plastics product manufacturing
#   Series: Producer Price Index by Industry: Plastics Product Manufacturing
#   Index:  Jun 1993 = 100, not seasonally adjusted
Plastic_manu = pd.read_csv("../PCU32613261.csv")

# Plastic products (by commodity)
#   Series: Producer Price Index by Commodity: Rubber and Plastic Products: Plastic Products
#   Index:  1982 = 100, not seasonally adjusted
Plastic = pd.read_csv("../WPU072.csv")

# Other polyethylene bags, pouches, and liners
#   Series: Producer Price Index by Industry: Plastics Bag and Pouch Manufacturing:
#           Other Polyethylene Bags, Pouches, and Liners
#   Index:  Jun 2007 = 100, not seasonally adjusted
#   TODO:   delete the first datapoint - it is temporally separated from all the rest.
Plastic_bags = pd.read_csv("../PCU32611132611115.csv")

# Plastics packaging film and sheet manufacturing
#   Series: Producer Price Index by Industry: Plastics Packaging Film and Sheet Manufacturing
#   Index:  Dec 2003 = 100, not seasonally adjusted
Plastic_film_and_sheet_manu = pd.read_csv("../PCU326112326112.csv")

# Polypropylene multiweb laminated rolls and sheets for flexible packaging
#   Series: Producer Price Index by Industry: Plastics Packaging Film and Sheet Manufacturing:
#           Polypropylene/Polypropylene Multiweb Laminated Rolls and Sheets, for Flexible Packaging Uses
#   Index:  Jun 2007 = 100, not seasonally adjusted
Polypropylene_packaging = pd.read_csv("../PCU32611232611231.csv")

# Polyethylene refuse bags
#   Series: Producer Price Index by Industry: Plastics Bag and Pouch Manufacturing:
#           Polyethylene Refuse Bags
#   Index:  Jun 2007 = 100, not seasonally adjusted
#   TODO:   delete the first datapoint - it is temporally separated from all the rest.
Polyethylene_refuse_bags = pd.read_csv("../PCU32611132611112.csv")

In [7]:
# Sanity check: display the (rows, columns) dimensions of the industrial-production series.
Plastic_and_resin_manu.shape

(583, 2)

In [8]:
# Preview the first rows to confirm the column layout (DATE plus the IPN325211S index value).
Plastic_and_resin_manu.head()

Unnamed: 0,DATE,IPN325211S
0,1972-01-01,38.9872
1,1972-02-01,38.8303
2,1972-03-01,40.1707
3,1972-04-01,40.5691
4,1972-05-01,41.0615
