## <center>Regulation, government quality, and green handicraft growth</center>
## <center>Data analysis: regressions</center>

#### DIW Berlin, Caroline Stiel

last modified: October 30, 2024 (cs)

-----------------------------------------

#### 1. Import libraries, define paths

In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import pathlib
import seaborn as sns
import statsmodels.formula.api as smf

In [None]:
# Project root: the current working directory as an absolute path.
MAIN = pathlib.Path(".").resolve()

# Sub-folders of the project root.
ORIG = MAIN.joinpath("origdata")    # original data
DATA = MAIN.joinpath("data")        # working data
RESULTS = MAIN.joinpath("results")  # figures etc.

#### 2. Load green handicraft *(Klimahandwerk)* data set

In [None]:
# data set 2013 till 2022
# -----------------------
# read_csv already returns a DataFrame, so no extra pd.DataFrame() wrapping is needed
dataHanQua = pd.read_csv(DATA / "dataHanQua.csv", delimiter=';', encoding='latin-1')

# consider only years with government quality data (2013,2017,2021)
# -----------------------------------------------------------------
# keep the rows whose EQI value is not missing
dataHanQua = dataHanQua[dataHanQua['EQI'].notna()]

# browse through data frame
# -------------------------
# temporarily lift pandas' display limits so that all rows and columns are shown
with pd.option_context('display.max_rows', None, 'display.max_columns', None):
    display(dataHanQua)

#### 3. Regressions

In [None]:
# regress employees with industry FE, time FE and federal state FE
# ----------------------------------------------------------------
# The fixed-effect terms are wrapped in C() so that patsy always expands them
# into dummy variables. Without C(), a numerically stored `year` would enter
# as a single continuous regressor (a linear trend) instead of time FE.
# NOTE(review): presumably `bl_name` is the federal state and `name` the
# industry - confirm against the data set documentation.
model = smf.ols(
    formula='employees_sum ~ EQI + C(bl_name) + C(name) + C(year)',
    data=dataHanQua,
).fit()
print(model.summary())

In [None]:
# regress turnover with industry FE, time FE and federal state FE
# ---------------------------------------------------------------
# The fixed-effect terms are wrapped in C() so that patsy always expands them
# into dummy variables. Without C(), a numerically stored `year` would enter
# as a single continuous regressor (a linear trend) instead of time FE.
# NOTE(review): presumably `bl_name` is the federal state and `name` the
# industry - confirm against the data set documentation.
model = smf.ols(
    formula='turnover ~ EQI + C(bl_name) + C(name) + C(year)',
    data=dataHanQua,
).fit()
print(model.summary())