In [1]:
import warnings
from pandas import read_csv
from pandas import datetime
from statsmodels.tsa.arima_model import ARIMA
from sklearn.metrics import mean_squared_error
 
# evaluate an ARIMA model for a given order (p,d,q)
def evaluate_arima_model(X, arima_order, train_fraction=0.66):
	"""Return the walk-forward mean squared error of one ARIMA order on X.

	The leading ``train_fraction`` of X seeds the fitting history. Each
	remaining observation is then predicted one step ahead by a model
	refitted on the history so far, after which the true observation is
	appended to the history.

	Args:
		X: sequence of observations supporting ``len`` and slicing.
		arima_order: the ``(p, d, q)`` tuple passed to ``ARIMA`` as ``order``.
		train_fraction: share of X used as the initial history. Defaults
			to 0.66, the split this function originally hard-coded.

	Returns:
		The value of ``mean_squared_error`` between the held-out
		observations and the one-step predictions.
	"""
	# prepare training dataset
	train_size = int(len(X) * train_fraction)
	train, test = X[0:train_size], X[train_size:]
	history = list(train)
	# make predictions
	predictions = []
	for observation in test:
		model_fit = ARIMA(history, order=arima_order).fit(disp=0)
		# the first element of the forecast() result is used as the prediction
		predictions.append(model_fit.forecast()[0])
		# reveal the true value only after predicting it
		history.append(observation)
	# calculate out of sample error
	return mean_squared_error(test, predictions)
 
def evaluate_models(dataset, p_values, d_values, q_values):
	"""Grid-search ARIMA orders, printing each score and the best one found.

	Every ``(p, d, q)`` combination is scored with
	``evaluate_arima_model``; combinations whose evaluation raises are
	skipped without any output.

	Args:
		dataset: array-like exposing ``astype``; it is cast to float32
			before evaluation.
		p_values: iterable of candidate ``p`` values.
		d_values: iterable of candidate ``d`` values.
		q_values: iterable of candidate ``q`` values.

	Returns:
		None. Results are reported via ``print`` only. If no combination
		evaluates successfully the final line reports ``None`` and ``inf``.
	"""
	dataset = dataset.astype('float32')
	best_score, best_cfg = float("inf"), None
	for p in p_values:
		for d in d_values:
			for q in q_values:
				order = (p, d, q)
				try:
					mse = evaluate_arima_model(dataset, order)
				except Exception:
					# Best-effort search: skip orders that cannot be evaluated.
					# Catching Exception rather than using a bare except lets
					# KeyboardInterrupt/SystemExit stop a long-running search.
					continue
				if mse < best_score:
					best_score, best_cfg = mse, order
				print('ARIMA%s MSE=%.3f' % (order, mse))
	print('Best ARIMA%s MSE=%.3f' % (best_cfg, best_score))
 
# load dataset
def parser(x):
	"""Parse a date label by prefixing '190' and reading it as '%Y-%m'.

	For example ``'1-01'`` becomes ``datetime(1901, 1, 1)``.
	"""
	# Use the standard-library class directly instead of the deprecated
	# ``pandas.datetime`` alias.
	from datetime import datetime
	return datetime.strptime('190'+x, '%Y-%m')
# Read the CSV with its first column as the index and collapse the single
# remaining data column into a Series. ``.squeeze('columns')`` and the explicit
# index conversion replace the ``squeeze=`` / ``date_parser=`` keywords of
# ``read_csv``, which newer pandas releases deprecate or remove.
series = read_csv('sales-of-shampoo-over-a-three-ye.csv', header=0, index_col=0).squeeze('columns')
# convert the raw index labels to datetimes with parser()
series.index = series.index.map(parser)
# evaluate parameters
p_values = [0, 1, 2, 4, 6, 8, 10]
d_values = range(0, 3)
q_values = range(0, 3)
# suppress all warnings for the rest of the session before the grid search
warnings.filterwarnings("ignore")
evaluate_models(series.values, p_values, d_values, q_values)

  from pandas import datetime


ARIMA(0, 0, 0) MSE=52425.268
ARIMA(0, 0, 1) MSE=38145.238
ARIMA(0, 0, 2) MSE=23989.616
ARIMA(0, 1, 0) MSE=18003.173
ARIMA(0, 1, 1) MSE=9558.513
ARIMA(0, 1, 2) MSE=6306.175
ARIMA(0, 2, 0) MSE=67339.808
ARIMA(0, 2, 1) MSE=18321.087
ARIMA(1, 0, 0) MSE=23112.983
ARIMA(1, 0, 2) MSE=7332.818
ARIMA(1, 1, 0) MSE=7121.375
ARIMA(1, 1, 1) MSE=7003.683
ARIMA(1, 2, 0) MSE=18608.005
ARIMA(2, 0, 0) MSE=10176.522
ARIMA(2, 1, 0) MSE=5689.929
ARIMA(2, 1, 1) MSE=7759.706
ARIMA(2, 2, 0) MSE=9860.933
ARIMA(4, 0, 0) MSE=9762.462
ARIMA(4, 1, 0) MSE=6649.590
ARIMA(4, 1, 1) MSE=6796.242
ARIMA(4, 2, 0) MSE=7596.329
ARIMA(4, 2, 1) MSE=4694.878
ARIMA(6, 1, 0) MSE=6810.078
ARIMA(6, 1, 1) MSE=4496.088
ARIMA(6, 2, 0) MSE=6261.077
ARIMA(8, 1, 0) MSE=6579.254
ARIMA(10, 1, 0) MSE=7543.371
Best ARIMA(6, 1, 1) MSE=4496.088
