In [None]:
# grid search ARIMA parameters for time series
import warnings
from math import sqrt
from pandas import read_csv
from datetime import datetime
from statsmodels.tsa.arima.model import ARIMA
from sklearn.metrics import mean_squared_error
 
# evaluate an ARIMA model for a given order (p,d,q)
def evaluate_arima_model(X, arima_order):
    """Return the walk-forward RMSE of an ARIMA model with the given order.

    The first 66% of ``X`` seeds the fitting history. Each remaining
    observation is then forecast in turn: the model is refit on the current
    history, the first forecast value is recorded, and the true observation
    is appended to the history before the next step.

    Args:
        X: Sliceable sequence of observations (presumably in time order).
        arima_order: ``(p, d, q)`` tuple passed to ``ARIMA`` as ``order``.

    Returns:
        The square root of the mean squared error between the held-out
        observations and their forecasts.

    Raises:
        ValueError: If the split leaves the training or the test part empty.
    """
    # prepare training dataset
    train_size = int(len(X) * 0.66)
    train, test = X[0:train_size], X[train_size:]
    # len() rather than truthiness: X may be a numpy array, whose truth
    # value is ambiguous.
    if len(train) == 0 or len(test) == 0:
        raise ValueError(
            'need enough observations for a non-empty train/test split, '
            'got %d' % len(X)
        )
    history = list(train)
    # make predictions
    predictions = []
    # Iterate the held-out values directly instead of indexing test[t], so
    # the walk is positional even when X is a pandas Series.
    for observed in test:
        model_fit = ARIMA(history, order=arima_order).fit()
        predictions.append(model_fit.forecast()[0])
        history.append(observed)
    # calculate out of sample error
    return sqrt(mean_squared_error(test, predictions))
 
# evaluate combinations of p, d and q values for an ARIMA model
def evaluate_models(dataset, p_values, d_values, q_values):
    """Grid-search ARIMA orders, printing each RMSE and the best order found.

    Every ``(p, d, q)`` combination is scored with ``evaluate_arima_model``.
    A combination whose evaluation raises is skipped, so one failing order
    does not abort the whole search.

    Args:
        dataset: Observations; must provide ``astype`` (cast to ``float32``).
        p_values: Iterable of ``p`` values to try.
        d_values: Iterable of ``d`` values to try. It is iterated once per
            ``p`` value, so it must be re-iterable (e.g. a range or list).
        q_values: Iterable of ``q`` values to try. It is iterated once per
            ``(p, d)`` pair, so it must be re-iterable as well.

    Returns:
        None. Results are reported on stdout only.
    """
    dataset = dataset.astype('float32')
    best_score, best_cfg = float("inf"), None
    for p in p_values:
        for d in d_values:
            for q in q_values:
                order = (p, d, q)
                try:
                    rmse = evaluate_arima_model(dataset, order)
                except Exception:
                    # Best-effort search: skip orders that fail to evaluate.
                    # Catching Exception (not a bare except) keeps
                    # KeyboardInterrupt/SystemExit able to stop a long run.
                    continue
                if rmse < best_score:
                    best_score, best_cfg = rmse, order
                print('ARIMA%s RMSE=%.3f' % (order, rmse))
    # If every order failed this prints best_cfg=None with RMSE=inf.
    print('Best ARIMA%s RMSE=%.3f' % (best_cfg, best_score))
 
# load dataset
def parser(x):
    """Parse a ``'%Y-%m'`` (year-month) string into a ``datetime``."""
    month_format = '%Y-%m'
    parsed = datetime.strptime(x, month_format)
    return parsed

# read_csv's ``squeeze`` keyword was removed in pandas 2.0 and ``date_parser``
# is deprecated there, so squeeze the single data column explicitly and
# convert the index labels with the '%Y-%m' parser afterwards.
series = read_csv('predict.csv', header=0, index_col=0).squeeze('columns')
series.index = series.index.astype(str).map(parser)
# evaluate parameters
p_values = range(0, 10)
d_values = range(0, 3)
q_values = range(0, 3)
# Suppress all warnings for the duration of the grid search.
warnings.filterwarnings("ignore")
evaluate_models(series.values, p_values, d_values, q_values)


ARIMA(0, 0, 0) RMSE=11.340
ARIMA(0, 0, 1) RMSE=10.091
ARIMA(0, 0, 2) RMSE=9.515
ARIMA(0, 1, 0) RMSE=10.820
ARIMA(0, 1, 1) RMSE=10.927
ARIMA(0, 1, 2) RMSE=10.091
ARIMA(0, 2, 0) RMSE=16.820
ARIMA(0, 2, 1) RMSE=10.859
ARIMA(0, 2, 2) RMSE=10.946
ARIMA(1, 0, 0) RMSE=9.709
ARIMA(1, 0, 1) RMSE=9.717
ARIMA(1, 0, 2) RMSE=10.342
ARIMA(1, 1, 0) RMSE=10.767
ARIMA(1, 1, 1) RMSE=9.706
ARIMA(1, 1, 2) RMSE=9.713
ARIMA(1, 2, 0) RMSE=13.347
ARIMA(1, 2, 1) RMSE=10.807
ARIMA(1, 2, 2) RMSE=9.957
ARIMA(2, 0, 0) RMSE=9.723
ARIMA(2, 0, 1) RMSE=9.722
ARIMA(2, 0, 2) RMSE=8.458
ARIMA(2, 1, 0) RMSE=10.927
ARIMA(2, 1, 1) RMSE=9.718
ARIMA(2, 1, 2) RMSE=9.745
ARIMA(2, 2, 0) RMSE=13.069
ARIMA(2, 2, 1) RMSE=10.961
ARIMA(2, 2, 2) RMSE=10.907
ARIMA(3, 0, 0) RMSE=9.311
ARIMA(3, 0, 1) RMSE=9.023
ARIMA(3, 0, 2) RMSE=10.142
ARIMA(3, 1, 0) RMSE=10.855
ARIMA(3, 1, 1) RMSE=9.309
ARIMA(3, 1, 2) RMSE=9.268
ARIMA(3, 2, 0) RMSE=12.803
ARIMA(3, 2, 1) RMSE=10.892
ARIMA(3, 2, 2) RMSE=11.022
ARIMA(4, 0, 0) RMSE=9.198
ARIMA(4, 0, 1) RM