In [1]:
import numpy as np
import pandas as pd
from pandas.tseries.offsets import Hour, Minute
from pandas.tseries.offsets import Day, MonthEnd
from pandas.tseries.offsets import Hour
from statsmodels.tsa.arima.model import ARIMA
from pmdarima.arima import auto_arima
from sklearn.model_selection import TimeSeriesSplit
from sklearn.metrics import mean_squared_error


In [2]:


# Load the wind series from 'Wind_deseason_15.csv'. The first CSV column is
# parsed as dates and used as the frame's index.
# (An earlier variant of this cell read 'Wind_deseason.csv' with default options.)
df = pd.read_csv(
    'Wind_deseason_15.csv',
    index_col=0,
    parse_dates=[0],
)


In [3]:
def runAutoArima(df):
    """Run the automatic ARIMA order search on the '309_WIND_1' column.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame that contains a '309_WIND_1' column.

    Returns
    -------
    object
        The fitted model returned by ``auto_arima`` so the caller can inspect
        the selected order or reuse the fit. When the call is the last
        expression of a notebook cell, end it with ``;`` to hide the repr.
    """
    autoAR = auto_arima(df['309_WIND_1'], trace = True, random_state = 102)

    # A bare ``autoAR.summary()`` inside a function is evaluated and thrown
    # away (only a cell's last top-level expression is displayed), so print it.
    print(autoAR.summary())
    return autoAR

In [9]:

def model1(tss, df, params, verbose = True):
    """Walk-forward evaluation of a one-step-ahead ARIMA forecast.

    For every fold yielded by ``tss.split(df)`` an ARIMA model of order
    ``params`` is fitted on the training rows of '309_WIND_1'. Its forecast for
    the step right after the training window is compared with the first row
    of the validation window; the remaining validation rows are not scored.

    Parameters
    ----------
    tss : object
        Splitter exposing ``split(df)`` that yields pairs of positional
        (train, validation) index arrays, e.g. ``TimeSeriesSplit``.
    df : pandas.DataFrame
        Frame that contains a '309_WIND_1' column.
    params : tuple
        ARIMA order passed as ``order=`` to ``ARIMA``.
    verbose : bool, default True
        When True (the original behaviour) print every fold's fit summary and
        the final list of errors.

    Returns
    -------
    list
        One value per fold: ``0.5 * (actual - forecast) ** 2``. Despite the
        variable name these are half squared errors, not averaged.
    """
    mse = []

    for train_indx, val_indx in tss.split(df):
        train = df.iloc[train_indx]
        test = df.iloc[val_indx]

        result = ARIMA(train['309_WIND_1'], order = params).fit()
        if verbose:
            print(result.summary())

        # Only the step right after the training window is scored, so request
        # exactly one out-of-sample forecast (previously two were computed).
        pred = result.forecast(steps = 1)

        # Use .iloc for positional access: ``series[0]`` on a non-integer index
        # relies on a deprecated pandas fallback, and raises KeyError when the
        # forecast is integer-labelled starting at len(train).
        error = 0.5*(test['309_WIND_1'].iloc[0] - pred.iloc[0])**2
        mse.append(error)

    if verbose:
        print(mse)
    return mse

    

In [10]:
def model2(tss, df, params = (20,1,2), verbose = True):
    """Walk-forward evaluation of a high-order ARIMA one-step-ahead forecast.

    Same procedure as the tuned-order evaluation, but with a fixed order that
    defaults to ``(20, 1, 2)``: for every fold yielded by ``tss.split(df)`` the
    model is fitted on the training rows of '309_WIND_1' and its forecast for
    the next step is compared with the first validation row only.

    Parameters
    ----------
    tss : object
        Splitter exposing ``split(df)`` that yields pairs of positional
        (train, validation) index arrays, e.g. ``TimeSeriesSplit``.
    df : pandas.DataFrame
        Frame that contains a '309_WIND_1' column.
    params : tuple, default (20, 1, 2)
        ARIMA order passed as ``order=`` to ``ARIMA``. The default reproduces
        the order that used to be hard-coded here.
    verbose : bool, default True
        When True (the original behaviour) print every fold's fit summary and
        the final list of errors.

    Returns
    -------
    list
        One value per fold: ``0.5 * (actual - forecast) ** 2``.
    """
    mse2 = []

    for train_indx, val_indx in tss.split(df):
        train = df.iloc[train_indx]
        test = df.iloc[val_indx]

        result = ARIMA(train['309_WIND_1'], order = params).fit()
        if verbose:
            print(result.summary())

        # Only the step right after the training window is scored, so request
        # exactly one out-of-sample forecast (previously two were computed).
        pred = result.forecast(steps = 1)

        # Use .iloc for positional access: ``series[0]`` on a non-integer index
        # relies on a deprecated pandas fallback, and raises KeyError when the
        # forecast is integer-labelled starting at len(train).
        error = 0.5*(test['309_WIND_1'].iloc[0] - pred.iloc[0])**2
        mse2.append(error)

    if verbose:
        print(mse2)
    return mse2
    

In [11]:
def model3(tss,df):
    """Persistence baseline: forecast the next value as the last observed one.

    For every fold yielded by ``tss.split(df)`` the last training value of
    '309_WIND_1' is used as the prediction for the first validation row.

    Parameters
    ----------
    tss : object
        Splitter exposing ``split(df)`` that yields pairs of positional
        (train, validation) index arrays, e.g. ``TimeSeriesSplit``.
    df : pandas.DataFrame
        Frame that contains a '309_WIND_1' column.

    Returns
    -------
    list
        One value per fold: ``0.5 * (actual - last_train_value) ** 2``.
    """
    mse3 = []

    for train_indx, val_indx in tss.split(df):
        train = df.iloc[train_indx]
        test = df.iloc[val_indx]

        # .iloc makes the positional intent explicit. ``series[-1]`` and
        # ``series[0]`` are label lookups on an integer index (KeyError) and
        # only a deprecated positional fallback on a datetime index.
        pred = train['309_WIND_1'].iloc[-1]

        error = 0.5*(test['309_WIND_1'].iloc[0] - pred)**2
        mse3.append(error)

    print(mse3)
    return mse3


In [12]:
def runModels(df, params):
    """Score the three forecasters on one shared time-series split.

    A single ``TimeSeriesSplit`` (5 splits, 20 validation rows each, no gap)
    is built and handed to ``model1`` (using order ``params``), ``model2`` and
    ``model3`` in that order.

    Returns
    -------
    tuple
        ``(model1 errors, model2 errors, model3 errors)``.
    """
    splitter = TimeSeriesSplit(gap = 0, test_size = 20, n_splits = 5)

    tuned_errors = model1(splitter, df, params)
    fixed_order_errors = model2(splitter, df)
    naive_errors = model3(splitter, df)

    return tuned_errors, fixed_order_errors, naive_errors

    

In [4]:

# Split the frame into four subsets by the calendar month of its index:
# df1 = Jan-Mar, df2 = Apr-Jun, df3 = Jul-Sep, df4 = Oct-Dec.
df1, df2, df3, df4 = (
    df[df.index.month.isin(quarter_months)]
    for quarter_months in ([1,2,3], [4,5,6], [7,8,9], [10,11,12])
)

In [5]:
# Automatic ARIMA order search on df1 (rows whose index month is 1, 2 or 3).
runAutoArima(df1)

Performing stepwise search to minimize aic
 ARIMA(2,1,2)(0,0,0)[0] intercept   : AIC=57561.876, Time=6.75 sec
 ARIMA(0,1,0)(0,0,0)[0] intercept   : AIC=59502.970, Time=0.24 sec
 ARIMA(1,1,0)(0,0,0)[0] intercept   : AIC=57572.085, Time=0.53 sec
 ARIMA(0,1,1)(0,0,0)[0] intercept   : AIC=57799.529, Time=1.40 sec
 ARIMA(0,1,0)(0,0,0)[0]             : AIC=59500.992, Time=0.20 sec
 ARIMA(1,1,2)(0,0,0)[0] intercept   : AIC=57568.451, Time=2.02 sec
 ARIMA(2,1,1)(0,0,0)[0] intercept   : AIC=inf, Time=7.53 sec
 ARIMA(3,1,2)(0,0,0)[0] intercept   : AIC=inf, Time=10.33 sec
 ARIMA(2,1,3)(0,0,0)[0] intercept   : AIC=57557.516, Time=6.98 sec
 ARIMA(1,1,3)(0,0,0)[0] intercept   : AIC=57557.210, Time=3.98 sec
 ARIMA(0,1,3)(0,0,0)[0] intercept   : AIC=57557.464, Time=1.59 sec
 ARIMA(1,1,4)(0,0,0)[0] intercept   : AIC=57557.936, Time=12.18 sec
 ARIMA(0,1,2)(0,0,0)[0] intercept   : AIC=57612.747, Time=1.51 sec
 ARIMA(0,1,4)(0,0,0)[0] intercept   : AIC=57558.301, Time=2.19 sec
 ARIMA(2,1,4)(0,0,0)[0] inter

In [6]:
# Automatic ARIMA order search on df2 (rows whose index month is 4, 5 or 6).
runAutoArima(df2)

Performing stepwise search to minimize aic
 ARIMA(2,1,2)(0,0,0)[0] intercept   : AIC=inf, Time=8.32 sec
 ARIMA(0,1,0)(0,0,0)[0] intercept   : AIC=59744.207, Time=0.17 sec
 ARIMA(1,1,0)(0,0,0)[0] intercept   : AIC=57987.783, Time=0.35 sec
 ARIMA(0,1,1)(0,0,0)[0] intercept   : AIC=58078.569, Time=0.95 sec
 ARIMA(0,1,0)(0,0,0)[0]             : AIC=59742.211, Time=0.14 sec
 ARIMA(2,1,0)(0,0,0)[0] intercept   : AIC=57922.186, Time=0.49 sec
 ARIMA(3,1,0)(0,0,0)[0] intercept   : AIC=57916.347, Time=0.63 sec
 ARIMA(4,1,0)(0,0,0)[0] intercept   : AIC=57916.522, Time=1.51 sec
 ARIMA(3,1,1)(0,0,0)[0] intercept   : AIC=57919.438, Time=1.08 sec
 ARIMA(2,1,1)(0,0,0)[0] intercept   : AIC=57912.705, Time=1.81 sec
 ARIMA(1,1,1)(0,0,0)[0] intercept   : AIC=57931.768, Time=0.97 sec
 ARIMA(1,1,2)(0,0,0)[0] intercept   : AIC=57922.050, Time=1.97 sec
 ARIMA(3,1,2)(0,0,0)[0] intercept   : AIC=57916.686, Time=3.34 sec
 ARIMA(2,1,1)(0,0,0)[0]             : AIC=57910.707, Time=1.22 sec
 ARIMA(1,1,1)(0,0,0)[0]  

In [7]:
# Automatic ARIMA order search on df3 (rows whose index month is 7, 8 or 9).
runAutoArima(df3)

Performing stepwise search to minimize aic
 ARIMA(2,0,2)(0,0,0)[0] intercept   : AIC=54799.906, Time=3.09 sec
 ARIMA(0,0,0)(0,0,0)[0] intercept   : AIC=88642.261, Time=0.14 sec
 ARIMA(1,0,0)(0,0,0)[0] intercept   : AIC=56975.257, Time=0.57 sec
 ARIMA(0,0,1)(0,0,0)[0] intercept   : AIC=77603.157, Time=1.64 sec
 ARIMA(0,0,0)(0,0,0)[0]             : AIC=88772.921, Time=0.07 sec
 ARIMA(1,0,2)(0,0,0)[0] intercept   : AIC=54837.432, Time=2.45 sec
 ARIMA(2,0,1)(0,0,0)[0] intercept   : AIC=54797.951, Time=1.17 sec
 ARIMA(1,0,1)(0,0,0)[0] intercept   : AIC=55021.537, Time=1.36 sec
 ARIMA(2,0,0)(0,0,0)[0] intercept   : AIC=54835.579, Time=0.95 sec
 ARIMA(3,0,1)(0,0,0)[0] intercept   : AIC=54799.722, Time=4.18 sec
 ARIMA(3,0,0)(0,0,0)[0] intercept   : AIC=54798.487, Time=1.10 sec
 ARIMA(3,0,2)(0,0,0)[0] intercept   : AIC=54801.939, Time=4.88 sec
 ARIMA(2,0,1)(0,0,0)[0]             : AIC=54798.138, Time=0.52 sec

Best model:  ARIMA(2,0,1)(0,0,0)[0] intercept
Total fit time: 22.118 seconds


In [8]:
# Automatic ARIMA order search on df4 (rows whose index month is 10, 11 or 12).
runAutoArima(df4)

Performing stepwise search to minimize aic
 ARIMA(2,1,2)(0,0,0)[0] intercept   : AIC=inf, Time=8.63 sec
 ARIMA(0,1,0)(0,0,0)[0] intercept   : AIC=58491.132, Time=0.21 sec
 ARIMA(1,1,0)(0,0,0)[0] intercept   : AIC=56267.213, Time=0.36 sec
 ARIMA(0,1,1)(0,0,0)[0] intercept   : AIC=56577.484, Time=0.78 sec
 ARIMA(0,1,0)(0,0,0)[0]             : AIC=58489.132, Time=0.13 sec
 ARIMA(2,1,0)(0,0,0)[0] intercept   : AIC=56260.842, Time=0.47 sec
 ARIMA(3,1,0)(0,0,0)[0] intercept   : AIC=56261.284, Time=1.06 sec
 ARIMA(2,1,1)(0,0,0)[0] intercept   : AIC=inf, Time=6.03 sec
 ARIMA(1,1,1)(0,0,0)[0] intercept   : AIC=56261.247, Time=0.76 sec
 ARIMA(3,1,1)(0,0,0)[0] intercept   : AIC=inf, Time=8.93 sec
 ARIMA(2,1,0)(0,0,0)[0]             : AIC=56258.842, Time=0.27 sec
 ARIMA(1,1,0)(0,0,0)[0]             : AIC=56265.213, Time=0.20 sec
 ARIMA(3,1,0)(0,0,0)[0]             : AIC=56259.284, Time=0.58 sec
 ARIMA(2,1,1)(0,0,0)[0]             : AIC=inf, Time=2.17 sec
 ARIMA(1,1,1)(0,0,0)[0]             : AIC=5

In [13]:
# Score the three forecasters on df1; model1 is fitted with ARIMA order (1,1,3).
# NOTE(review): presumably the order chosen by the df1 auto_arima search — confirm.
mse1, mse2, mse3 = runModels(df1, (1,1,3))

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8636
Model:                 ARIMA(1, 1, 3)   Log Likelihood              -28392.663
Date:                Mon, 15 May 2023   AIC                          56795.326
Time:                        11:18:19   BIC                          56830.644
Sample:                    01-01-2020   HQIC                         56807.369
                         - 03-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1         -0.2790      0.072     -3.862      0.000      -0.421      -0.137
ma.L1          0.7464      0.073     10.286      0.000       0.604       0.889
ma.L2          0.3187      0.034      9.503      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8656
Model:                 ARIMA(1, 1, 3)   Log Likelihood              -28470.849
Date:                Mon, 15 May 2023   AIC                          56951.699
Time:                        11:18:22   BIC                          56987.028
Sample:                    01-01-2020   HQIC                         56963.744
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1         -0.2736      0.074     -3.696      0.000      -0.419      -0.129
ma.L1          0.7392      0.074      9.943      0.000       0.593       0.885
ma.L2          0.3134      0.034      9.155      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8676
Model:                 ARIMA(1, 1, 3)   Log Likelihood              -28533.364
Date:                Mon, 15 May 2023   AIC                          57076.728
Time:                        11:18:25   BIC                          57112.069
Sample:                    01-01-2020   HQIC                         57088.776
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1         -0.2684      0.075     -3.599      0.000      -0.415      -0.122
ma.L1          0.7337      0.075      9.796      0.000       0.587       0.881
ma.L2          0.3105      0.034      9.009      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8696
Model:                 ARIMA(1, 1, 3)   Log Likelihood              -28590.781
Date:                Mon, 15 May 2023   AIC                          57191.562
Time:                        11:18:27   BIC                          57226.914
Sample:                    01-01-2020   HQIC                         57203.612
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1         -0.2719      0.075     -3.648      0.000      -0.418      -0.126
ma.L1          0.7369      0.075      9.847      0.000       0.590       0.884
ma.L2          0.3117      0.034      9.057      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8716
Model:                 ARIMA(1, 1, 3)   Log Likelihood              -28709.573
Date:                Mon, 15 May 2023   AIC                          57429.146
Time:                        11:18:29   BIC                          57464.510
Sample:                    01-01-2020   HQIC                         57441.199
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1         -0.2848      0.077     -3.693      0.000      -0.436      -0.134
ma.L1          0.7465      0.077      9.639      0.000       0.595       0.898
ma.L2          0.3124      0.035      8.838      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8636
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28327.609
Date:                Mon, 15 May 2023   AIC                          56701.217
Time:                        11:19:16   BIC                          56863.680
Sample:                    01-01-2020   HQIC                         56756.614
                         - 03-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.7418      0.525      3.321      0.001       0.714       2.770
ar.L2         -0.9107      0.760     -1.198      0.231      -2.400       0.579
ar.L3          0.1722      0.255      0.675      0.5

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8656
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28405.890
Date:                Mon, 15 May 2023   AIC                          56857.781
Time:                        11:20:05   BIC                          57020.296
Sample:                    01-01-2020   HQIC                         56913.188
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.6769      0.575      2.919      0.004       0.551       2.803
ar.L2         -0.8177      0.833     -0.981      0.326      -2.451       0.815
ar.L3          0.1439      0.281      0.512      0.6

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8676
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28467.387
Date:                Mon, 15 May 2023   AIC                          56980.774
Time:                        11:20:53   BIC                          57143.342
Sample:                    01-01-2020   HQIC                         57036.193
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.2800      0.420      3.050      0.002       0.458       2.102
ar.L2         -0.2403      0.609     -0.395      0.693      -1.434       0.953
ar.L3         -0.0505      0.205     -0.247      0.8

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8696
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28524.483
Date:                Mon, 15 May 2023   AIC                          57094.966
Time:                        11:21:38   BIC                          57257.588
Sample:                    01-01-2020   HQIC                         57150.397
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.2029      0.394      3.050      0.002       0.430       1.976
ar.L2         -0.1294      0.572     -0.226      0.821      -1.251       0.992
ar.L3         -0.0876      0.192     -0.456      0.6

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8716
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28644.052
Date:                Mon, 15 May 2023   AIC                          57334.105
Time:                        11:22:25   BIC                          57496.779
Sample:                    01-01-2020   HQIC                         57389.548
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.1824      0.411      2.879      0.004       0.378       1.987
ar.L2         -0.1041      0.594     -0.175      0.861      -1.268       1.060
ar.L3         -0.0933      0.199     -0.468      0.6

In [14]:
# Score the three forecasters on df2; model1 is fitted with ARIMA order (2,1,1).
# NOTE(review): presumably the order chosen by the df2 auto_arima search — confirm.
mse4, mse5, mse6 = runModels(df2, (2,1,1))

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8636
Model:                 ARIMA(2, 1, 1)   Log Likelihood              -28648.501
Date:                Mon, 15 May 2023   AIC                          57305.002
Time:                        11:22:26   BIC                          57333.256
Sample:                    04-01-2020   HQIC                         57314.636
                         - 06-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.8912      0.051     17.439      0.000       0.791       0.991
ar.L2         -0.2682      0.021    -12.835      0.000      -0.309      -0.227
ma.L1         -0.4307      0.052     -8.269      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8656
Model:                 ARIMA(2, 1, 1)   Log Likelihood              -28707.688
Date:                Mon, 15 May 2023   AIC                          57423.376
Time:                        11:22:27   BIC                          57451.640
Sample:                    04-01-2020   HQIC                         57433.012
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.8919      0.051     17.471      0.000       0.792       0.992
ar.L2         -0.2684      0.021    -12.859      0.000      -0.309      -0.228
ma.L1         -0.4316      0.052     -8.294      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8676
Model:                 ARIMA(2, 1, 1)   Log Likelihood              -28768.955
Date:                Mon, 15 May 2023   AIC                          57545.910
Time:                        11:22:28   BIC                          57574.183
Sample:                    04-01-2020   HQIC                         57555.549
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.8939      0.051     17.526      0.000       0.794       0.994
ar.L2         -0.2690      0.021    -12.897      0.000      -0.310      -0.228
ma.L1         -0.4337      0.052     -8.343      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8696
Model:                 ARIMA(2, 1, 1)   Log Likelihood              -28825.301
Date:                Mon, 15 May 2023   AIC                          57658.602
Time:                        11:22:29   BIC                          57686.885
Sample:                    04-01-2020   HQIC                         57668.243
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.8939      0.051     17.565      0.000       0.794       0.994
ar.L2         -0.2690      0.021    -12.926      0.000      -0.310      -0.228
ma.L1         -0.4337      0.052     -8.361      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8716
Model:                 ARIMA(2, 1, 1)   Log Likelihood              -28881.650
Date:                Mon, 15 May 2023   AIC                          57771.301
Time:                        11:22:30   BIC                          57799.592
Sample:                    04-01-2020   HQIC                         57780.943
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.8939      0.051     17.603      0.000       0.794       0.993
ar.L2         -0.2690      0.021    -12.953      0.000      -0.310      -0.228
ma.L1         -0.4336      0.052     -8.379      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8636
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28553.855
Date:                Mon, 15 May 2023   AIC                          57153.710
Time:                        11:23:45   BIC                          57316.173
Sample:                    04-01-2020   HQIC                         57209.106
                         - 06-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4408      0.008     56.502      0.000       0.425       0.456
ar.L2          0.9131      0.011     79.846      0.000       0.891       0.935
ar.L3         -0.4795      0.007    -67.162      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8656
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28612.857
Date:                Mon, 15 May 2023   AIC                          57271.714
Time:                        11:25:00   BIC                          57434.230
Sample:                    04-01-2020   HQIC                         57327.122
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4410      0.010     44.871      0.000       0.422       0.460
ar.L2          0.9139      0.014     64.374      0.000       0.886       0.942
ar.L3         -0.4767      0.008    -60.008      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8676
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28673.227
Date:                Mon, 15 May 2023   AIC                          57392.454
Time:                        11:26:11   BIC                          57555.022
Sample:                    04-01-2020   HQIC                         57447.873
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4392      0.007     66.589      0.000       0.426       0.452
ar.L2          0.9166      0.010     95.334      0.000       0.898       0.935
ar.L3         -0.4758      0.007    -69.356      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8696
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28729.694
Date:                Mon, 15 May 2023   AIC                          57505.387
Time:                        11:27:21   BIC                          57668.009
Sample:                    04-01-2020   HQIC                         57560.819
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4407      0.011     40.764      0.000       0.420       0.462
ar.L2          0.9202      0.016     58.973      0.000       0.890       0.951
ar.L3         -0.4741      0.008    -57.686      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8716
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28785.069
Date:                Mon, 15 May 2023   AIC                          57616.138
Time:                        11:28:36   BIC                          57778.813
Sample:                    04-01-2020   HQIC                         57671.581
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4415      0.013     35.177      0.000       0.417       0.466
ar.L2          0.9169      0.018     50.624      0.000       0.881       0.952
ar.L3         -0.4776      0.009    -53.681      0.0

In [16]:
# Score the three forecasters on df3; model1 is fitted with ARIMA order (2,0,1),
# the order reported as "Best model" by the df3 auto_arima search.
mse7, mse8, mse9 = runModels(df3, (2,0,1))

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8732
Model:                 ARIMA(2, 0, 1)   Log Likelihood              -27126.340
Date:                Mon, 15 May 2023   AIC                          54262.681
Time:                        11:48:35   BIC                          54298.055
Sample:                    07-01-2020   HQIC                         54274.736
                         - 09-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          4.8011      4.355      1.102      0.270      -3.734      13.337
ar.L1          1.3313      0.008    161.843      0.000       1.315       1.347
ar.L2         -0.3535      0.008    -43.576      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8752
Model:                 ARIMA(2, 0, 1)   Log Likelihood              -27178.767
Date:                Mon, 15 May 2023   AIC                          54367.535
Time:                        11:48:37   BIC                          54402.920
Sample:                    07-01-2020   HQIC                         54379.592
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          4.7352      4.355      1.087      0.277      -3.800      13.270
ar.L1          1.3313      0.008    162.188      0.000       1.315       1.347
ar.L2         -0.3534      0.008    -43.663      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8772
Model:                 ARIMA(2, 0, 1)   Log Likelihood              -27236.070
Date:                Mon, 15 May 2023   AIC                          54482.140
Time:                        11:48:38   BIC                          54517.536
Sample:                    07-01-2020   HQIC                         54494.200
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          4.6960      4.343      1.081      0.280      -3.816      13.208
ar.L1          1.3312      0.008    162.184      0.000       1.315       1.347
ar.L2         -0.3533      0.008    -43.652      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8792
Model:                 ARIMA(2, 0, 1)   Log Likelihood              -27289.541
Date:                Mon, 15 May 2023   AIC                          54589.082
Time:                        11:48:40   BIC                          54624.490
Sample:                    07-01-2020   HQIC                         54601.144
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          4.6327      4.343      1.067      0.286      -3.878      13.144
ar.L1          1.3314      0.008    162.521      0.000       1.315       1.347
ar.L2         -0.3534      0.008    -43.753      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8812
Model:                 ARIMA(2, 0, 1)   Log Likelihood              -27341.748
Date:                Mon, 15 May 2023   AIC                          54693.497
Time:                        11:48:41   BIC                          54728.916
Sample:                    07-01-2020   HQIC                         54705.562
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          4.5652      4.343      1.051      0.293      -3.947      13.078
ar.L1          1.3314      0.008    162.879      0.000       1.315       1.347
ar.L2         -0.3534      0.008    -43.842      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8732
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27141.600
Date:                Mon, 15 May 2023   AIC                          54329.201
Time:                        11:49:24   BIC                          54491.917
Sample:                    07-01-2020   HQIC                         54384.653
                         - 09-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4428      0.205      2.163      0.031       0.041       0.844
ar.L2         -0.7798      0.172     -4.528      0.000      -1.117      -0.442
ar.L3          0.3555      0.081      4.377      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8752
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27193.732
Date:                Mon, 15 May 2023   AIC                          54433.463
Time:                        11:50:17   BIC                          54596.233
Sample:                    07-01-2020   HQIC                         54488.927
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4582      0.163      2.817      0.005       0.139       0.777
ar.L2         -0.8181      0.147     -5.580      0.000      -1.105      -0.531
ar.L3          0.3694      0.069      5.324      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8772
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27251.223
Date:                Mon, 15 May 2023   AIC                          54548.447
Time:                        11:51:07   BIC                          54711.269
Sample:                    07-01-2020   HQIC                         54603.922
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4448      0.188      2.364      0.018       0.076       0.813
ar.L2         -0.8058      0.162     -4.989      0.000      -1.122      -0.489
ar.L3          0.3674      0.076      4.844      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8792
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27304.413
Date:                Mon, 15 May 2023   AIC                          54654.826
Time:                        11:51:55   BIC                          54817.700
Sample:                    07-01-2020   HQIC                         54710.312
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4748      0.133      3.558      0.000       0.213       0.736
ar.L2         -0.8562      0.123     -6.950      0.000      -1.098      -0.615
ar.L3          0.3885      0.058      6.676      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8812
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27356.938
Date:                Mon, 15 May 2023   AIC                          54759.876
Time:                        11:52:40   BIC                          54922.802
Sample:                    07-01-2020   HQIC                         54815.374
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4875      0.190      2.569      0.010       0.116       0.859
ar.L2         -0.8055      0.158     -5.087      0.000      -1.116      -0.495
ar.L3          0.3591      0.074      4.847      0.0

In [17]:
# Score the models on df4 using ARIMA order (2, 1, 0) and keep the three
# returned error collections for the report cells further down.
# NOTE(review): runModels is defined earlier in the notebook; the fitted sample
# in this cell's output spans 2020-10-01 to 2020-12-31.
(mse10, mse11, mse12) = runModels(df4, (2, 1, 0))

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8732
Model:                 ARIMA(2, 1, 0)   Log Likelihood              -27792.094
Date:                Mon, 15 May 2023   AIC                          55590.188
Time:                        12:04:00   BIC                          55611.412
Sample:                    10-01-2020   HQIC                         55597.421
                         - 12-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4826      0.004    115.484      0.000       0.474       0.491
ar.L2         -0.0279      0.005     -5.221      0.000      -0.038      -0.017
sigma2        34.0763      0.164    208.239      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8752
Model:                 ARIMA(2, 1, 0)   Log Likelihood              -27869.588
Date:                Mon, 15 May 2023   AIC                          55745.176
Time:                        12:04:00   BIC                          55766.407
Sample:                    10-01-2020   HQIC                         55752.410
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4840      0.004    115.566      0.000       0.476       0.492
ar.L2         -0.0282      0.005     -5.276      0.000      -0.039      -0.018
sigma2        34.1842      0.164    207.841      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8772
Model:                 ARIMA(2, 1, 0)   Log Likelihood              -27955.041
Date:                Mon, 15 May 2023   AIC                          55916.082
Time:                        12:04:01   BIC                          55937.320
Sample:                    10-01-2020   HQIC                         55923.318
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4864      0.004    115.926      0.000       0.478       0.495
ar.L2         -0.0313      0.005     -5.862      0.000      -0.042      -0.021
sigma2        34.3542      0.166    207.120      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8792
Model:                 ARIMA(2, 1, 0)   Log Likelihood              -28018.856
Date:                Mon, 15 May 2023   AIC                          56043.713
Time:                        12:04:01   BIC                          56064.957
Sample:                    10-01-2020   HQIC                         56050.950
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4865      0.004    115.989      0.000       0.478       0.495
ar.L2         -0.0308      0.005     -5.763      0.000      -0.041      -0.020
sigma2        34.3548      0.166    207.218      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8812
Model:                 ARIMA(2, 1, 0)   Log Likelihood              -28072.653
Date:                Mon, 15 May 2023   AIC                          56151.306
Time:                        12:04:01   BIC                          56172.557
Sample:                    10-01-2020   HQIC                         56158.545
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.4865      0.004    116.249      0.000       0.478       0.495
ar.L2         -0.0308      0.005     -5.775      0.000      -0.041      -0.020
sigma2        34.2773      0.165    207.698      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8732
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27757.986
Date:                Mon, 15 May 2023   AIC                          55561.971
Time:                        12:04:14   BIC                          55724.688
Sample:                    10-01-2020   HQIC                         55617.423
                         - 12-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.2509      0.810      0.310      0.757      -1.337       1.839
ar.L2          0.0467      0.629      0.074      0.941      -1.185       1.279
ar.L3          0.0183      0.323      0.057      0.9

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8752
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27835.645
Date:                Mon, 15 May 2023   AIC                          55717.289
Time:                        12:04:35   BIC                          55880.059
Sample:                    10-01-2020   HQIC                         55772.753
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.3238      0.651      0.497      0.619      -0.953       1.600
ar.L2         -0.0814      0.591     -0.138      0.890      -1.240       1.077
ar.L3          0.0633      0.289      0.219      0.8

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8772
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27921.524
Date:                Mon, 15 May 2023   AIC                          55889.048
Time:                        12:04:53   BIC                          56051.870
Sample:                    10-01-2020   HQIC                         55944.524
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.3395      0.634      0.536      0.592      -0.903       1.582
ar.L2         -0.0793      0.609     -0.130      0.896      -1.273       1.115
ar.L3          0.0565      0.287      0.197      0.8

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8792
Model:                ARIMA(20, 1, 2)   Log Likelihood              -27985.525
Date:                Mon, 15 May 2023   AIC                          56017.050
Time:                        12:05:04   BIC                          56179.924
Sample:                    10-01-2020   HQIC                         56072.537
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.2532      0.780      0.325      0.746      -1.276       1.782
ar.L2          0.0458      0.547      0.084      0.933      -1.027       1.118
ar.L3          0.0154      0.301      0.051      0.9

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:             309_WIND_1   No. Observations:                 8812
Model:                ARIMA(20, 1, 2)   Log Likelihood              -28039.200
Date:                Mon, 15 May 2023   AIC                          56124.399
Time:                        12:05:25   BIC                          56287.326
Sample:                    10-01-2020   HQIC                         56179.898
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.3290      0.678      0.485      0.628      -1.001       1.659
ar.L2         -0.0765      0.600     -0.127      0.899      -1.253       1.100
ar.L3          0.0587      0.297      0.198      0.8

In [18]:
# Report the per-split error lists of the three models for season 1.
print('season 1')

# Each entry pairs the printed heading with the error list it introduces.
for heading, errors in (('model 1:', mse1), ('model 2:', mse2), ('model 3:', mse3)):
    print(heading)
    print(errors)

season 1
model 1:
[0.002307307035920576, 0.04408290619685475, 7.531547753021891, 9.322766253652572, 78.63151018518468]
model 2:
[0.05412670149355198, 0.002351441107970144, 6.256636935749598, 7.130508179596404, 72.63095048533144]
model 3:
[1.4372685961048244, 8.152266994884567, 3.723118367900999, 8.699540859455698, 51.29608555087137]


In [19]:
# Report the per-split error lists of the three models for season 2.
# The header previously read 'season 1' (copy-paste from the first report cell),
# which mislabelled these results.
# NOTE(review): mse4..mse6 are presumably the results of the second-season
# runModels call — confirm against the cell that assigns them.
print('season 2')

# Each entry pairs the printed heading with the error list it introduces.
for heading, errors in (('model 1:', mse4), ('model 2:', mse5), ('model 3:', mse6)):
    print(heading)
    print(errors)

season 1
model 1:
[0.4249990383871715, 9.854757171131864, 0.21274526265633192, 0.08459618474568688, 0.2331762333341678]
model 2:
[0.3149862990663455, 12.060681074334317, 0.7203025557548489, 0.21219712448738412, 0.15068671664679553]
model 3:
[0.4361406242256827, 39.31444537232737, 0.6043108825320133, 0.044812201668319555, 0.12531352080462788]


In [20]:
# Report the per-split error lists of the three models for season 3.
# The header previously read 'season 1' (copy-paste from the first report cell),
# which mislabelled these results.
# NOTE(review): mse7..mse9 are presumably the results of the third-season
# runModels call — confirm against the cell that assigns them.
print('season 3')

# Each entry pairs the printed heading with the error list it introduces.
for heading, errors in (('model 1:', mse7), ('model 2:', mse8), ('model 3:', mse9)):
    print(heading)
    print(errors)

season 1
model 1:
[0.3755642966572977, 0.2188674606970579, 14.065320080801877, 0.17072930339088027, 0.19818046009606385]
model 2:
[0.04164095134144251, 0.011873010014144859, 14.761320368009338, 0.053605177521764594, 0.0008673118562807803]
model 3:
[0.03592531002914436, 0.020277554938902705, 27.144077893806486, 0.0023153780917547773, 0.0021309790223842497]


In [21]:
# Report the per-split error lists of the three models for season 4.
# mse10..mse12 are assigned from runModels(df4, (2,1,0)), so the header must say
# season 4; it previously read 'season 1' (copy-paste from the first report cell).
print('season 4')

# Each entry pairs the printed heading with the error list it introduces.
for heading, errors in (('model 1:', mse10), ('model 2:', mse11), ('model 3:', mse12)):
    print(heading)
    print(errors)

season 1
model 1:
[257.1657628517167, 7.99609604562359, 205.20233099062744, 0.026718444183807043, 0.0490521573383226]
model 2:
[252.92240689563502, 12.804015659903015, 191.84471170741736, 0.02011203572442258, 0.042526204103490055]
model 3:
[429.2858913652768, 7.214697783115516, 206.75059991821237, 0.05509133720566302, 0.008705038878606425]
