In [1]:
import numpy as np
import pandas as pd
from pandas.tseries.offsets import Hour, Minute
from pandas.tseries.offsets import Day, MonthEnd
from pandas.tseries.offsets import Hour
from statsmodels.tsa.arima.model import ARIMA
from pmdarima.arima import auto_arima
from sklearn.model_selection import TimeSeriesSplit
from sklearn.metrics import mean_squared_error


In [2]:


#df = pd.read_csv('Wind_deseason.csv')
df = pd.read_csv('PV_deseason_15.csv', parse_dates=[0], index_col=0)


In [3]:
def runAutoArima(df):
    autoAR = auto_arima(df['310_PV_1'], trace = True, random_state = 102)
    autoAR.summary()

In [4]:

def model1(tss, df, params):
    mse = []

    for train_indx, val_indx in tss.split(df):
        train = df.iloc[train_indx]
        test = df.iloc[val_indx]
    
        mod = ARIMA(train['310_PV_1'], order = params)
        result = mod.fit()
        print(result.summary())
    
        start = len(train)
        end = len(train)+1
    
        pred = result.predict(start = start, end = end)
    
    
        error = 0.5*(test['310_PV_1'][0] - pred[0])**2
        mse.append(error)

    print(mse)
    return mse

    

In [5]:
def model2(tss, df):

    mse2 = []

    for train_indx, val_indx in tss.split(df):
        train = df.iloc[train_indx]
        test = df.iloc[val_indx]
    
        mod = ARIMA(train['310_PV_1'], order = (8,1,1))
        result = mod.fit()
        print(result.summary())
        
        start = len(train)
        end = len(train)+1
    
        pred = result.predict(start = start, end = end)
    
    
        error = 0.5*(test['310_PV_1'][0] - pred[0])**2
        mse2.append(error)
    
    print(mse2)
    return mse2
    

In [6]:
def model3(tss,df):

    mse3 = []

    for train_indx, val_indx in tss.split(df):
        train = df.iloc[train_indx]
        test = df.iloc[val_indx]
    
        pred = train['310_PV_1'][-1]
    
    
        error = 0.5*(test['310_PV_1'][0] - pred)**2
        mse3.append(error)
        
    print(mse3)
    return mse3


In [7]:
def runModels(df, params):
    tss = TimeSeriesSplit(n_splits = 5, test_size = 20, gap = 0)
    mse1 = model1(tss,df,params)
    mse2 = model2(tss,df)
    mse3 = model3(tss,df)
    
    return mse1, mse2, mse3

    

In [8]:

df1 = df[df.index.month.isin([1,2,3])]
df2 = df[df.index.month.isin([4,5,6])]
df3 = df[df.index.month.isin([7,8,9])]
df4 = df[df.index.month.isin([10,11,12])]

In [9]:
runAutoArima(df1)

Performing stepwise search to minimize aic
 ARIMA(2,1,2)(0,0,0)[0] intercept   : AIC=inf, Time=6.32 sec
 ARIMA(0,1,0)(0,0,0)[0] intercept   : AIC=45536.069, Time=0.14 sec
 ARIMA(1,1,0)(0,0,0)[0] intercept   : AIC=45535.008, Time=0.31 sec
 ARIMA(0,1,1)(0,0,0)[0] intercept   : AIC=45534.329, Time=0.49 sec
 ARIMA(0,1,0)(0,0,0)[0]             : AIC=45534.069, Time=0.13 sec
 ARIMA(1,1,1)(0,0,0)[0] intercept   : AIC=inf, Time=5.90 sec

Best model:  ARIMA(0,1,0)(0,0,0)[0]          
Total fit time: 13.317 seconds


In [10]:
runAutoArima(df2)

Performing stepwise search to minimize aic
 ARIMA(2,0,2)(0,0,0)[0] intercept   : AIC=41791.421, Time=1.33 sec
 ARIMA(0,0,0)(0,0,0)[0] intercept   : AIC=58026.401, Time=0.12 sec
 ARIMA(1,0,0)(0,0,0)[0] intercept   : AIC=41833.582, Time=0.46 sec
 ARIMA(0,0,1)(0,0,0)[0] intercept   : AIC=50392.181, Time=0.92 sec
 ARIMA(0,0,0)(0,0,0)[0]             : AIC=58376.543, Time=0.07 sec
 ARIMA(1,0,2)(0,0,0)[0] intercept   : AIC=41789.427, Time=1.32 sec
 ARIMA(0,0,2)(0,0,0)[0] intercept   : AIC=46492.052, Time=1.64 sec
 ARIMA(1,0,1)(0,0,0)[0] intercept   : AIC=41798.033, Time=0.65 sec
 ARIMA(1,0,3)(0,0,0)[0] intercept   : AIC=41791.426, Time=2.09 sec
 ARIMA(0,0,3)(0,0,0)[0] intercept   : AIC=44743.164, Time=2.07 sec
 ARIMA(2,0,1)(0,0,0)[0] intercept   : AIC=41790.802, Time=2.02 sec
 ARIMA(2,0,3)(0,0,0)[0] intercept   : AIC=41788.345, Time=7.30 sec
 ARIMA(3,0,3)(0,0,0)[0] intercept   : AIC=41789.898, Time=10.04 sec
 ARIMA(2,0,4)(0,0,0)[0] intercept   : AIC=41790.319, Time=6.08 sec
 ARIMA(1,0,4)(0,0,

In [11]:
runAutoArima(df3)

Performing stepwise search to minimize aic
 ARIMA(2,1,2)(0,0,0)[0] intercept   : AIC=inf, Time=7.51 sec
 ARIMA(0,1,0)(0,0,0)[0] intercept   : AIC=39314.800, Time=0.16 sec
 ARIMA(1,1,0)(0,0,0)[0] intercept   : AIC=39310.492, Time=0.39 sec
 ARIMA(0,1,1)(0,0,0)[0] intercept   : AIC=39309.935, Time=0.49 sec
 ARIMA(0,1,0)(0,0,0)[0]             : AIC=39312.800, Time=0.14 sec
 ARIMA(1,1,1)(0,0,0)[0] intercept   : AIC=39305.900, Time=1.35 sec
 ARIMA(2,1,1)(0,0,0)[0] intercept   : AIC=inf, Time=4.32 sec
 ARIMA(1,1,2)(0,0,0)[0] intercept   : AIC=inf, Time=5.64 sec
 ARIMA(0,1,2)(0,0,0)[0] intercept   : AIC=39296.850, Time=0.68 sec
 ARIMA(0,1,3)(0,0,0)[0] intercept   : AIC=39286.163, Time=0.89 sec
 ARIMA(1,1,3)(0,0,0)[0] intercept   : AIC=inf, Time=7.73 sec
 ARIMA(0,1,4)(0,0,0)[0] intercept   : AIC=39257.086, Time=1.42 sec
 ARIMA(1,1,4)(0,0,0)[0] intercept   : AIC=inf, Time=10.01 sec
 ARIMA(0,1,5)(0,0,0)[0] intercept   : AIC=39206.277, Time=1.68 sec
 ARIMA(1,1,5)(0,0,0)[0] intercept   : AIC=inf, T

In [12]:
runAutoArima(df4)

Performing stepwise search to minimize aic
 ARIMA(2,0,2)(0,0,0)[0] intercept   : AIC=39401.329, Time=2.02 sec
 ARIMA(0,0,0)(0,0,0)[0] intercept   : AIC=54749.632, Time=0.14 sec
 ARIMA(1,0,0)(0,0,0)[0] intercept   : AIC=39827.946, Time=0.47 sec
 ARIMA(0,0,1)(0,0,0)[0] intercept   : AIC=46772.946, Time=0.96 sec
 ARIMA(0,0,0)(0,0,0)[0]             : AIC=54941.876, Time=0.08 sec
 ARIMA(1,0,2)(0,0,0)[0] intercept   : AIC=39438.187, Time=1.37 sec
 ARIMA(2,0,1)(0,0,0)[0] intercept   : AIC=39399.484, Time=1.38 sec
 ARIMA(1,0,1)(0,0,0)[0] intercept   : AIC=39473.909, Time=0.98 sec
 ARIMA(2,0,0)(0,0,0)[0] intercept   : AIC=39426.695, Time=0.55 sec
 ARIMA(3,0,1)(0,0,0)[0] intercept   : AIC=39401.389, Time=3.16 sec
 ARIMA(3,0,0)(0,0,0)[0] intercept   : AIC=39406.437, Time=0.70 sec
 ARIMA(3,0,2)(0,0,0)[0] intercept   : AIC=39389.302, Time=4.81 sec
 ARIMA(4,0,2)(0,0,0)[0] intercept   : AIC=39376.574, Time=7.17 sec
 ARIMA(4,0,1)(0,0,0)[0] intercept   : AIC=39380.889, Time=3.44 sec
 ARIMA(5,0,2)(0,0,0

In [13]:
mse1, mse2, mse3 = runModels(df1, (0,1,0))

                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8636
Model:                 ARIMA(0, 1, 0)   Log Likelihood              -22516.255
Date:                Sat, 13 May 2023   AIC                          45034.509
Time:                        09:04:41   BIC                          45041.573
Sample:                    01-01-2020   HQIC                         45036.918
                         - 03-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
sigma2        10.7752      0.050    216.388      0.000      10.678      10.873
Ljung-Box (L1) (Q):                   3.83   Jarque-Bera (JB):            139530.62
Prob(Q):                              0.05   Pr

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8656
Model:                 ARIMA(0, 1, 0)   Log Likelihood              -22558.394
Date:                Sat, 13 May 2023   AIC                          45118.788
Time:                        09:04:41   BIC                          45125.854
Sample:                    01-01-2020   HQIC                         45121.197
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
sigma2        10.7503      0.050    216.900      0.000      10.653      10.847
Ljung-Box (L1) (Q):                   3.84   Jarque-Bera (JB):            140601.25
Prob(Q):                              0.05   Pr

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8696
Model:                 ARIMA(0, 1, 0)   Log Likelihood              -22675.704
Date:                Sat, 13 May 2023   AIC                          45353.408
Time:                        09:04:41   BIC                          45360.479
Sample:                    01-01-2020   HQIC                         45355.818
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
sigma2        10.7826      0.050    216.534      0.000      10.685      10.880
Ljung-Box (L1) (Q):                   3.21   Jarque-Bera (JB):            138800.23
Prob(Q):                              0.07   Pr

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8636
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -22232.634
Date:                Sat, 13 May 2023   AIC                          44485.269
Time:                        09:04:48   BIC                          44555.905
Sample:                    01-01-2020   HQIC                         44509.354
                         - 03-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9175      0.005    181.343      0.000       0.908       0.927
ar.L2         -0.0688      0.006    -11.011      0.000      -0.081      -0.057
ar.L3          0.0133      0.007      2.049      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8656
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -22274.113
Date:                Sat, 13 May 2023   AIC                          44568.226
Time:                        09:04:56   BIC                          44638.885
Sample:                    01-01-2020   HQIC                         44592.317
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9175      0.005    181.762      0.000       0.908       0.927
ar.L2         -0.0688      0.006    -11.037      0.000      -0.081      -0.057
ar.L3          0.0133      0.006      2.057      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8676
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -22329.245
Date:                Sat, 13 May 2023   AIC                          44678.490
Time:                        09:05:03   BIC                          44749.172
Sample:                    01-01-2020   HQIC                         44702.585
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9193      0.005    182.063      0.000       0.909       0.929
ar.L2         -0.0694      0.006    -11.128      0.000      -0.082      -0.057
ar.L3          0.0134      0.006      2.062      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8696
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -22397.633
Date:                Sat, 13 May 2023   AIC                          44815.267
Time:                        09:05:11   BIC                          44885.972
Sample:                    01-01-2020   HQIC                         44839.367
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9212      0.005    181.803      0.000       0.911       0.931
ar.L2         -0.0713      0.006    -11.415      0.000      -0.084      -0.059
ar.L3          0.0145      0.007      2.235      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8716
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -22445.420
Date:                Sat, 13 May 2023   AIC                          44910.840
Time:                        09:05:19   BIC                          44981.568
Sample:                    01-01-2020   HQIC                         44934.946
                         - 03-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9219      0.005    182.006      0.000       0.912       0.932
ar.L2         -0.0710      0.006    -11.380      0.000      -0.083      -0.059
ar.L3          0.0148      0.006      2.275      0.0

In [14]:
mse4, mse5, mse6 = runModels(df2, (4,0,1))

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8636
Model:                 ARIMA(4, 0, 1)   Log Likelihood              -20635.844
Date:                Sat, 13 May 2023   AIC                          41285.688
Time:                        09:05:27   BIC                          41335.134
Sample:                    04-01-2020   HQIC                         41302.548
                         - 06-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          1.5125      0.366      4.136      0.000       0.796       2.229
ar.L1          0.0079      0.024      0.334      0.738      -0.038       0.054
ar.L2          0.9084      0.023     38.848      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8656
Model:                 ARIMA(4, 0, 1)   Log Likelihood              -20673.802
Date:                Sat, 13 May 2023   AIC                          41361.603
Time:                        09:05:35   BIC                          41411.065
Sample:                    04-01-2020   HQIC                         41378.467
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          1.5628      0.368      4.251      0.000       0.842       2.283
ar.L1          0.0247      0.034      0.724      0.469      -0.042       0.092
ar.L2          0.8944      0.034     26.439      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8676
Model:                 ARIMA(4, 0, 1)   Log Likelihood              -20737.755
Date:                Sat, 13 May 2023   AIC                          41489.510
Time:                        09:05:43   BIC                          41538.988
Sample:                    04-01-2020   HQIC                         41506.377
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          1.3713      0.367      3.737      0.000       0.652       2.090
ar.L1          0.0272      0.033      0.820      0.412      -0.038       0.092
ar.L2          0.8911      0.033     27.031      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8696
Model:                 ARIMA(4, 0, 1)   Log Likelihood              -20793.814
Date:                Sat, 13 May 2023   AIC                          41601.628
Time:                        09:05:52   BIC                          41651.122
Sample:                    04-01-2020   HQIC                         41618.498
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          1.3866      0.369      3.758      0.000       0.663       2.110
ar.L1          0.0256      0.032      0.800      0.424      -0.037       0.088
ar.L2          0.8943      0.032     28.168      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8716
Model:                 ARIMA(4, 0, 1)   Log Likelihood              -20849.091
Date:                Sat, 13 May 2023   AIC                          41712.182
Time:                        09:06:02   BIC                          41761.693
Sample:                    04-01-2020   HQIC                         41729.056
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          1.4031      0.370      3.794      0.000       0.678       2.128
ar.L1          0.0155      0.028      0.556      0.579      -0.039       0.070
ar.L2          0.9044      0.028     32.799      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8636
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -20635.049
Date:                Sat, 13 May 2023   AIC                          41290.097
Time:                        09:06:08   BIC                          41360.733
Sample:                    04-01-2020   HQIC                         41314.183
                         - 06-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9753      0.005    215.369      0.000       0.966       0.984
ar.L2         -0.0414      0.006     -7.516      0.000      -0.052      -0.031
ar.L3         -0.0328      0.006     -5.392      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8656
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -20672.836
Date:                Sat, 13 May 2023   AIC                          41365.671
Time:                        09:06:14   BIC                          41436.330
Sample:                    04-01-2020   HQIC                         41389.762
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9754      0.005    216.015      0.000       0.967       0.984
ar.L2         -0.0414      0.005     -7.533      0.000      -0.052      -0.031
ar.L3         -0.0327      0.006     -5.403      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8676
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -20735.503
Date:                Sat, 13 May 2023   AIC                          41491.006
Time:                        09:06:20   BIC                          41561.688
Sample:                    04-01-2020   HQIC                         41515.101
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9749      0.005    213.871      0.000       0.966       0.984
ar.L2         -0.0407      0.006     -7.397      0.000      -0.051      -0.030
ar.L3         -0.0334      0.006     -5.490      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8696
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -20791.076
Date:                Sat, 13 May 2023   AIC                          41602.152
Time:                        09:06:25   BIC                          41672.857
Sample:                    04-01-2020   HQIC                         41626.253
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9741      0.005    212.733      0.000       0.965       0.983
ar.L2         -0.0386      0.006     -7.009      0.000      -0.049      -0.028
ar.L3         -0.0351      0.006     -5.781      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8716
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -20845.568
Date:                Sat, 13 May 2023   AIC                          41711.135
Time:                        09:06:31   BIC                          41781.863
Sample:                    04-01-2020   HQIC                         41735.241
                         - 06-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9747      0.005    212.329      0.000       0.966       0.984
ar.L2         -0.0393      0.006     -7.135      0.000      -0.050      -0.029
ar.L3         -0.0344      0.006     -5.660      0.0

In [15]:
mse7, mse8, mse9 = runModels(df3, (0,1,5))

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8732
Model:                 ARIMA(0, 1, 5)   Log Likelihood              -19405.107
Date:                Sat, 13 May 2023   AIC                          38822.214
Time:                        09:06:32   BIC                          38864.662
Sample:                    07-01-2020   HQIC                         38836.680
                         - 09-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ma.L1          0.0007      0.004      0.177      0.860      -0.007       0.009
ma.L2         -0.0739      0.004    -17.275      0.000      -0.082      -0.065
ma.L3         -0.0620      0.005    -12.922      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8752
Model:                 ARIMA(0, 1, 5)   Log Likelihood              -19439.547
Date:                Sat, 13 May 2023   AIC                          38891.093
Time:                        09:06:32   BIC                          38933.555
Sample:                    07-01-2020   HQIC                         38905.562
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ma.L1          0.0007      0.004      0.177      0.859      -0.007       0.009
ma.L2         -0.0739      0.004    -17.315      0.000      -0.082      -0.066
ma.L3         -0.0620      0.005    -12.951      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8772
Model:                 ARIMA(0, 1, 5)   Log Likelihood              -19481.687
Date:                Sat, 13 May 2023   AIC                          38975.374
Time:                        09:06:33   BIC                          39017.849
Sample:                    07-01-2020   HQIC                         38989.846
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ma.L1          0.0016      0.004      0.389      0.697      -0.006       0.009
ma.L2         -0.0740      0.004    -17.358      0.000      -0.082      -0.066
ma.L3         -0.0625      0.005    -13.075      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8792
Model:                 ARIMA(0, 1, 5)   Log Likelihood              -19517.838
Date:                Sat, 13 May 2023   AIC                          39047.677
Time:                        09:06:34   BIC                          39090.166
Sample:                    07-01-2020   HQIC                         39062.151
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ma.L1          0.0016      0.004      0.404      0.686      -0.006       0.009
ma.L2         -0.0740      0.004    -17.382      0.000      -0.082      -0.066
ma.L3         -0.0623      0.005    -13.045      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8812
Model:                 ARIMA(0, 1, 5)   Log Likelihood              -19561.702
Date:                Sat, 13 May 2023   AIC                          39135.405
Time:                        09:06:36   BIC                          39177.907
Sample:                    07-01-2020   HQIC                         39149.883
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ma.L1          0.0025      0.004      0.631      0.528      -0.005       0.010
ma.L2         -0.0740      0.004    -17.386      0.000      -0.082      -0.066
ma.L3         -0.0633      0.005    -13.257      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8732
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19156.827
Date:                Sat, 13 May 2023   AIC                          38333.654
Time:                        09:06:42   BIC                          38404.401
Sample:                    07-01-2020   HQIC                         38357.764
                         - 09-29-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9538      0.004    220.658      0.000       0.945       0.962
ar.L2         -0.0666      0.005    -13.653      0.000      -0.076      -0.057
ar.L3          0.0101      0.005      1.892      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8752
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19190.720
Date:                Sat, 13 May 2023   AIC                          38401.441
Time:                        09:06:48   BIC                          38472.210
Sample:                    07-01-2020   HQIC                         38425.555
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9539      0.004    221.158      0.000       0.945       0.962
ar.L2         -0.0666      0.005    -13.689      0.000      -0.076      -0.057
ar.L3          0.0101      0.005      1.896      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8772
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19232.294
Date:                Sat, 13 May 2023   AIC                          38484.587
Time:                        09:06:54   BIC                          38555.379
Sample:                    07-01-2020   HQIC                         38508.707
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9548      0.004    221.628      0.000       0.946       0.963
ar.L2         -0.0674      0.005    -13.882      0.000      -0.077      -0.058
ar.L3          0.0098      0.005      1.852      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8792
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19267.944
Date:                Sat, 13 May 2023   AIC                          38555.887
Time:                        09:06:59   BIC                          38626.702
Sample:                    07-01-2020   HQIC                         38580.012
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9548      0.004    222.034      0.000       0.946       0.963
ar.L2         -0.0675      0.005    -13.917      0.000      -0.077      -0.058
ar.L3          0.0100      0.005      1.891      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8812
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19310.683
Date:                Sat, 13 May 2023   AIC                          38641.367
Time:                        09:07:05   BIC                          38712.204
Sample:                    07-01-2020   HQIC                         38665.497
                         - 09-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          0.9557      0.004    222.327      0.000       0.947       0.964
ar.L2         -0.0682      0.005    -14.080      0.000      -0.078      -0.059
ar.L3          0.0093      0.005      1.755      0.0

In [16]:
mse10, mse11, mse12 = runModels(df4, (4,0,2))

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8732
Model:                 ARIMA(4, 0, 2)   Log Likelihood              -19489.431
Date:                Sat, 13 May 2023   AIC                          38994.861
Time:                        09:07:10   BIC                          39051.459
Sample:                    10-01-2020   HQIC                         39014.149
                         - 12-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          0.7851      0.306      2.562      0.010       0.185       1.386
ar.L1          0.7595      0.051     14.810      0.000       0.659       0.860
ar.L2         -0.2548      0.078     -3.287      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8752
Model:                 ARIMA(4, 0, 2)   Log Likelihood              -19524.456
Date:                Sat, 13 May 2023   AIC                          39064.912
Time:                        09:07:15   BIC                          39121.528
Sample:                    10-01-2020   HQIC                         39084.204
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          0.7934      0.306      2.590      0.010       0.193       1.394
ar.L1          0.7599      0.051     14.854      0.000       0.660       0.860
ar.L2         -0.2559      0.077     -3.307      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8772
Model:                 ARIMA(4, 0, 2)   Log Likelihood              -19569.476
Date:                Sat, 13 May 2023   AIC                          39154.951
Time:                        09:07:20   BIC                          39211.586
Sample:                    10-01-2020   HQIC                         39174.247
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          0.7886      0.306      2.581      0.010       0.190       1.388
ar.L1          0.7623      0.051     14.841      0.000       0.662       0.863
ar.L2         -0.2544      0.078     -3.269      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8792
Model:                 ARIMA(4, 0, 2)   Log Likelihood              -19604.875
Date:                Sat, 13 May 2023   AIC                          39225.750
Time:                        09:07:26   BIC                          39282.403
Sample:                    10-01-2020   HQIC                         39245.050
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          0.7964      0.305      2.609      0.009       0.198       1.395
ar.L1          0.7611      0.051     14.835      0.000       0.661       0.862
ar.L2         -0.2518      0.078     -3.243      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8812
Model:                 ARIMA(4, 0, 2)   Log Likelihood              -19645.316
Date:                Sat, 13 May 2023   AIC                          39306.633
Time:                        09:07:32   BIC                          39363.304
Sample:                    10-01-2020   HQIC                         39325.937
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
const          0.7897      0.304      2.595      0.009       0.193       1.386
ar.L1          0.7630      0.051     14.842      0.000       0.662       0.864
ar.L2         -0.2494      0.078     -3.202      0.0

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8732
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19490.114
Date:                Sat, 13 May 2023   AIC                          39000.227
Time:                        09:07:45   BIC                          39070.974
Sample:                    10-01-2020   HQIC                         39024.337
                         - 12-30-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.0801      0.004    249.947      0.000       1.072       1.089
ar.L2         -0.1613      0.005    -30.654      0.000      -0.172      -0.151
ar.L3          0.0083      0.006      1.461      0.1

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8752
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19525.125
Date:                Sat, 13 May 2023   AIC                          39070.251
Time:                        09:07:59   BIC                          39141.020
Sample:                    10-01-2020   HQIC                         39094.366
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.0803      0.004    250.510      0.000       1.072       1.089
ar.L2         -0.1613      0.005    -30.725      0.000      -0.172      -0.151
ar.L3          0.0081      0.006      1.421      0.1

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8772
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19570.178
Date:                Sat, 13 May 2023   AIC                          39160.356
Time:                        09:08:11   BIC                          39231.148
Sample:                    10-01-2020   HQIC                         39184.476
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.0815      0.004    250.978      0.000       1.073       1.090
ar.L2         -0.1623      0.005    -30.933      0.000      -0.173      -0.152
ar.L3          0.0078      0.006      1.375      0.1

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8792
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19605.597
Date:                Sat, 13 May 2023   AIC                          39231.195
Time:                        09:08:24   BIC                          39302.010
Sample:                    10-01-2020   HQIC                         39255.319
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.0815      0.004    251.504      0.000       1.073       1.090
ar.L2         -0.1623      0.005    -30.997      0.000      -0.173      -0.152
ar.L3          0.0078      0.006      1.384      0.1

  self._init_dates(dates, freq)
  self._init_dates(dates, freq)
  self._init_dates(dates, freq)


                               SARIMAX Results                                
Dep. Variable:               310_PV_1   No. Observations:                 8812
Model:                 ARIMA(8, 1, 1)   Log Likelihood              -19646.053
Date:                Sat, 13 May 2023   AIC                          39312.107
Time:                        09:08:35   BIC                          39382.944
Sample:                    10-01-2020   HQIC                         39336.237
                         - 12-31-2020                                         
Covariance Type:                  opg                                         
                 coef    std err          z      P>|z|      [0.025      0.975]
------------------------------------------------------------------------------
ar.L1          1.0824      0.004    251.990      0.000       1.074       1.091
ar.L2         -0.1629      0.005    -31.164      0.000      -0.173      -0.153
ar.L3          0.0078      0.006      1.380      0.1

In [17]:
print('season 1')

print('model 1:')
print(mse1)
print('model 2:')
print(mse2)
print('model 3:')
print(mse3)

season 1
model 1:
[6.585237596444411e-08, 6.367640648241624e-08, 0.047635261339835505, 0.1448118062792337, 1.1679915586611139e-05]
model 2:
[0.0005271222900270099, 0.0004985826129790794, 2.504233616235757, 3.489839165441675, 0.0241032772045714]
model 3:
[6.585237596444411e-08, 6.367640648241624e-08, 0.047635261339835505, 0.1448118062792337, 1.1679915586611139e-05]


In [18]:
print('season 1')

print('model 1:')
print(mse4)
print('model 2:')
print(mse5)
print('model 3:')
print(mse6)

season 1
model 1:
[0.028354618179509933, 0.03217568087818579, 10.722301326982427, 9.978822938691467, 0.036799154377839385]
model 2:
[0.0028227181642028927, 0.0022072300689064865, 12.09145288742478, 7.916610621961014, 0.021532800398056866]
model 3:
[2.3163960404393124e-09, 2.3397900415427924e-09, 21.17608704586783, 3.3299293830482632, 0.004750331027174225]


In [19]:
print('season 1')

print('model 1:')
print(mse7)
print('model 2:')
print(mse8)
print('model 3:')
print(mse9)

season 1
model 1:
[5.8472795664470366e-06, 1.6374282129226117e-07, 0.015428900971092185, 0.009738608873722458, 0.11288018518089919]
model 2:
[0.006508134746365506, 0.005366351340264234, 0.11644537213554854, 0.01033673101596749, 0.04435843840896852]
model 3:
[7.508669485454959e-08, 7.744802287517372e-08, 5.2659079840720344e-05, 0.01386328330780133, 0.00957320037187524]


In [20]:
print('season 1')

print('model 1:')
print(mse10)
print('model 2:')
print(mse11)
print('model 3:')
print(mse12)

season 1
model 1:
[0.10167176051527589, 0.10143354757881852, 0.7136450221548084, 0.001584633709055546, 0.04884286744684924]
model 2:
[0.09745697295899802, 0.0970279010101349, 0.7224988389595439, 0.0010533868549048653, 0.051708917729424805]
model 3:
[9.662277185560306e-08, 9.648390387573474e-08, 0.5056458319608859, 0.05995596125085395, 0.0002996943678626279]
