In [1]:
import numpy as np
import pandas as pd

from ols_bootstrap.pairs import PairsBootstrap
from ols_bootstrap.residual import ResidualBootstrap
from ols_bootstrap.wild import WildBootstrap

In [2]:
# Load the balance-sheet extract and keep only the three modelling columns.
# Written as a single chain so that re-running the cell always rebuilds `df`
# from the raw file rather than from a previously filtered frame.
#
# NOTE(review): rows whose sales_clean is NaN pass the `!= 0` filter
# (NaN != 0 evaluates to True) and the dropna below only checks the other two
# columns -- confirm that missing sales values are not expected here.
df = (
    pd.read_csv('./balance2018.csv')
    .loc[
        lambda frame: frame['sales_clean'] != 0,
        ['sales_clean', 'tanass_clean', 'tax'],
    ]
    .dropna(subset=['tanass_clean', 'tax'])
)

# log(1 + x) transform of every column. np.log1p is vectorised over the whole
# frame (no per-element Python lambda via the deprecated applymap) and is more
# accurate than np.log(x + 1) for values close to zero.
df_scaled = np.log1p(df)

  exec(code_obj, self.user_global_ns, self.user_ns)


In [3]:
# Draw a 10,000-row random subsample without replacement. The fixed seed pins
# the draw so that Restart & Run All selects the same rows (and therefore the
# same original OLS fit) on every run.
SAMPLE_SEED = 42
df_sample = df_scaled.sample(n=10000, replace=False, random_state=SAMPLE_SEED)

# Column 0 goes to Y_data, all remaining columns to X_data. Indexing with a
# list ([0]) keeps Y_data a one-column DataFrame instead of a Series.
Y_data = df_sample.iloc[:, [0]]
X_data = df_sample.iloc[:, 1:]

In [4]:
# Preview the first rows of X_data (columns tanass_clean and tax in the output below).
X_data.head()

Unnamed: 0,tanass_clean,tax
191097,7.577634,3.135494
283707,0.0,5.342334
336638,0.0,0.0
27500,7.025538,3.850148
223611,10.499848,8.818926


In [5]:
# Preview the first rows of Y_data (the single sales_clean column in the output below).
Y_data.head()

Unnamed: 0,sales_clean
191097,9.412465
283707,11.658972
336638,0.693147
27500,9.439466
223611,13.247478


In [6]:
# One estimator per resampling scheme, all built on the same (Y_data, X_data)
# sample with iter=100.
psb = PairsBootstrap(Y_data, X_data, iter=100)
rsb = ResidualBootstrap(Y_data, X_data, iter=100)

# The three wild-bootstrap variants differ only in the from_distro argument;
# they are constructed in the order standard normal, Rademacher, Mammen.
wb_stdn, wb_rad, wb_mam = (
    WildBootstrap(Y_data, X_data, iter=100, from_distro=distro_name)
    for distro_name in ('standard_normal', 'rademacher', 'mammen')
)

In [7]:
# Show the pairs-bootstrap summary table for the estimator built above.
psb.summary()

+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
|                                            Pairs Bootstrap results with sample size of 10000 and bootstrap resampling size of 100 using 95.00% CI                                            |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     Params     |  Original Coeff  |  Mean of Bootstrapped Coeffs  |  Orig Coeff SE  |  SE of Bootstrapped Coeffs  |  % of Diff in SE  |   Bias   |   RMSE   |         CI         |  CI Diff  |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     const      |      6.1889     

In [8]:
# Show the residual-bootstrap summary table for the estimator built above.
rsb.summary()

+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
|                                          Residual Bootstrap results with sample size of 10000 and bootstrap resampling size of 100 using 95.00% CI                                           |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     Params     |  Original Coeff  |  Mean of Bootstrapped Coeffs  |  Orig Coeff SE  |  SE of Bootstrapped Coeffs  |  % of Diff in SE  |   Bias   |   RMSE   |         CI         |  CI Diff  |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     const      |      6.1889     

In [9]:
# Show the summary table for the wild bootstrap created with from_distro='standard_normal'.
wb_stdn.summary()

+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
|                                  Wild Bootstrap with Standard Normal results with sample size of 10000 and bootstrap resampling size of 100 using 95.00% CI                                  |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     Params     |  Original Coeff  |  Mean of Bootstrapped Coeffs  |  Orig Coeff SE  |  SE of Bootstrapped Coeffs  |  % of Diff in SE  |   Bias   |   RMSE   |         CI         |  CI Diff  |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     const      |      6.1889     

In [10]:
# Show the summary table for the wild bootstrap created with from_distro='rademacher'.
wb_rad.summary()

+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
|                                    Wild Bootstrap with Rademacher results with sample size of 10000 and bootstrap resampling size of 100 using 95.00% CI                                     |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     Params     |  Original Coeff  |  Mean of Bootstrapped Coeffs  |  Orig Coeff SE  |  SE of Bootstrapped Coeffs  |  % of Diff in SE  |   Bias   |   RMSE   |         CI         |  CI Diff  |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     const      |      6.1889     

In [11]:
# Show the summary table for the wild bootstrap created with from_distro='mammen'.
wb_mam.summary()

+----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+
|                                      Wild Bootstrap with Mammen results with sample size of 10000 and bootstrap resampling size of 100 using 95.00% CI                                       |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     Params     |  Original Coeff  |  Mean of Bootstrapped Coeffs  |  Orig Coeff SE  |  SE of Bootstrapped Coeffs  |  % of Diff in SE  |   Bias   |   RMSE   |         CI         |  CI Diff  |
+----------------+------------------+-------------------------------+-----------------+-----------------------------+-------------------+----------+----------+--------------------+-----------+
|     const      |      6.1889     