In [3]:
%load_ext jupyternotify

<IPython.core.display.Javascript object>

In [4]:
# Silence TensorFlow warnings
import os
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'  # or any {'0', '1', '2'}
import tensorflow as tf

In [5]:
# Import Statements
#from __future__ import absolute_import
from pandas import DataFrame, Series, concat, read_csv, datetime
from sklearn.metrics import mean_squared_error
from sklearn.preprocessing import MinMaxScaler, StandardScaler
from sklearn.externals import joblib
from keras.models import Sequential
from keras.layers import Dense, LSTM, TimeDistributed
from keras.callbacks import LambdaCallback, History
from math import sqrt
from matplotlib import pyplot
import numpy
import pickle

In [6]:
# date-time parsing function for loading the dataset
def parser(x):
	return datetime.strptime('190'+x, '%Y-%m')

In [8]:
# frame a sequence as a supervised learning problem
def timeseries_to_supervised(data, lag=1):
    df = DataFrame(data)
    columns = [df.shift(i) for i in range(1, lag+1)]
    columns.append(df)
    df = concat(columns, axis=1)
    df.fillna(0, inplace=True)
    return df

In [9]:
# create a differenced series
def difference(dataset, interval=1):
    diff = list()
    for i in range(interval, len(dataset)):
        value = dataset[i] - dataset[i - interval]
        diff.append(value)
    return Series(diff)

In [10]:
# invert differenced value
def inverse_difference(history, yhat, interval=1):
    return yhat + history[-interval]

In [11]:
# scale train and test data to [-1, 1]
def scale(train, test):
    # fit scaler
    '''scaler = MinMaxScaler(feature_range=(-1, 1))'''
    scaler = StandardScaler()
    scaler = scaler.fit(train)
    # transform train
    train = train.reshape(train.shape[0], train.shape[1])
    train_scaled = scaler.transform(train)
    # transform test
    test = test.reshape(test.shape[0], test.shape[1])
    test_scaled = scaler.transform(test)
    return scaler, train_scaled, test_scaled

In [12]:
# fit an LSTM network to training data
def fit_lstm(train, test, batch_size, nb_epoch, neurons):
    X, y = train[:, 0:-1], train[:, -1]
    X = X.reshape(X.shape[0], 1, X.shape[1])

    x_test, y_test = test[:, 0:-1], test[:, -1]
    x_test = x_test.reshape(x_test.shape[0], 1, x_test.shape[1])

    history = History()

    print(X.shape)
    print(x_test.shape)
    model = Sequential()
    model.add(LSTM(neurons, batch_input_shape=(batch_size, X.shape[1], X.shape[2]), stateful=False, return_sequences=True))
    model.add(Dense(2*neurons, activation='relu'))
    model.add(Dense(128, activation='relu'))
    model.add(Dense(neurons, activation='relu'))
    model.add(LSTM(neurons, stateful=True, return_sequences=False))
    model.add(Dense(1, activation='sigmoid'))
    model.compile(loss='mean_squared_error', optimizer='adam')
    h = model.fit(X, y, epochs=nb_epoch, batch_size=batch_size, verbose=1, shuffle=False, validation_data=(x_test, y_test), callbacks=[history])
    return model, h

In [13]:
# load dataset
series = read_csv('./shampoo_sales_data.csv', header=0, parse_dates=[0], index_col=0, squeeze=True, date_parser=parser)

# transform data to be stationary
raw_values = series.values
diff_values = difference(raw_values, 1)

In [14]:
# transform data to be supervised learning
supervised = timeseries_to_supervised(diff_values, 1)
supervised_values = supervised.values

In [15]:
# split data into train and test-sets, saving results
train, test = supervised_values[0:-12], supervised_values[-12:]
numpy.savetxt('train_df.csv', train, delimiter=',')
numpy.savetxt('test_df.csv', test, delimiter=',')

In [16]:
# transform the scale of the data
scaler, train_scaled, test_scaled = scale(train, test)

# Save scaler object and scaled data
joblib.dump(scaler, 'lstm_scaler.pkl')
numpy.savetxt('train_scaled_df.csv', train_scaled, delimiter=',')
numpy.savetxt('test_scaled_df.csv', test_scaled, delimiter=',')

print(train_scaled.shape, test_scaled.shape)

(23, 2) (12, 2)


In [17]:
%%notify
# fit the model
lstm_model, hist = fit_lstm(train_scaled, test_scaled, 1, 256, 8)

(23, 1, 1)
(12, 1, 1)
Train on 23 samples, validate on 12 samples
Epoch 1/256
Epoch 2/256
Epoch 3/256
Epoch 4/256
Epoch 5/256
Epoch 6/256
Epoch 7/256
Epoch 8/256
Epoch 9/256
Epoch 10/256
Epoch 11/256
Epoch 12/256
Epoch 13/256
Epoch 14/256
Epoch 15/256
Epoch 16/256
Epoch 17/256
Epoch 18/256
Epoch 19/256
Epoch 20/256
Epoch 21/256
Epoch 22/256
Epoch 23/256
Epoch 24/256
Epoch 25/256
Epoch 26/256
Epoch 27/256
Epoch 28/256
Epoch 29/256
Epoch 30/256
Epoch 31/256
Epoch 32/256
Epoch 33/256
Epoch 34/256
Epoch 35/256
Epoch 36/256
Epoch 37/256
Epoch 38/256
Epoch 39/256
Epoch 40/256
Epoch 41/256
Epoch 42/256
Epoch 43/256
Epoch 44/256
Epoch 45/256
Epoch 46/256
Epoch 47/256
Epoch 48/256
Epoch 49/256
Epoch 50/256
Epoch 51/256
Epoch 52/256
Epoch 53/256
Epoch 54/256
Epoch 55/256
Epoch 56/256
Epoch 57/256
Epoch 58/256
Epoch 59/256
Epoch 60/256
Epoch 61/256
Epoch 62/256
Epoch 63/256
Epoch 64/256
Epoch 65/256
Epoch 66/256
Epoch 67/256
Epoch 68/256
Epoch 69/256
Epoch 70/256
Epoch 71/256
Epoch 72/256
Epoch 7

Epoch 82/256
Epoch 83/256
Epoch 84/256
Epoch 85/256
Epoch 86/256
Epoch 87/256
Epoch 88/256
Epoch 89/256
Epoch 90/256
Epoch 91/256
Epoch 92/256
Epoch 93/256
Epoch 94/256
Epoch 95/256
Epoch 96/256
Epoch 97/256
Epoch 98/256
Epoch 99/256
Epoch 100/256
Epoch 101/256
Epoch 102/256
Epoch 103/256
Epoch 104/256
Epoch 105/256
Epoch 106/256
Epoch 107/256
Epoch 108/256
Epoch 109/256
Epoch 110/256
Epoch 111/256
Epoch 112/256
Epoch 113/256
Epoch 114/256
Epoch 115/256
Epoch 116/256
Epoch 117/256
Epoch 118/256
Epoch 119/256
Epoch 120/256
Epoch 121/256
Epoch 122/256
Epoch 123/256
Epoch 124/256
Epoch 125/256
Epoch 126/256
Epoch 127/256
Epoch 128/256
Epoch 129/256
Epoch 130/256
Epoch 131/256
Epoch 132/256
Epoch 133/256
Epoch 134/256
Epoch 135/256
Epoch 136/256
Epoch 137/256
Epoch 138/256
Epoch 139/256
Epoch 140/256
Epoch 141/256
Epoch 142/256
Epoch 143/256
Epoch 144/256
Epoch 145/256
Epoch 146/256
Epoch 147/256
Epoch 148/256
Epoch 149/256
Epoch 150/256
Epoch 151/256
Epoch 152/256
Epoch 153/256
Epoch 154/

Epoch 162/256
Epoch 163/256
Epoch 164/256
Epoch 165/256
Epoch 166/256
Epoch 167/256
Epoch 168/256
Epoch 169/256
Epoch 170/256
Epoch 171/256
Epoch 172/256
Epoch 173/256
Epoch 174/256
Epoch 175/256
Epoch 176/256
Epoch 177/256
Epoch 178/256
Epoch 179/256
Epoch 180/256
Epoch 181/256
Epoch 182/256
Epoch 183/256
Epoch 184/256
Epoch 185/256
Epoch 186/256
Epoch 187/256
Epoch 188/256
Epoch 189/256
Epoch 190/256
Epoch 191/256
Epoch 192/256
Epoch 193/256
Epoch 194/256
Epoch 195/256
Epoch 196/256
Epoch 197/256
Epoch 198/256
Epoch 199/256
Epoch 200/256
Epoch 201/256
Epoch 202/256
Epoch 203/256
Epoch 204/256
Epoch 205/256
Epoch 206/256
Epoch 207/256
Epoch 208/256
Epoch 209/256
Epoch 210/256
Epoch 211/256
Epoch 212/256
Epoch 213/256
Epoch 214/256
Epoch 215/256
Epoch 216/256
Epoch 217/256
Epoch 218/256
Epoch 219/256
Epoch 220/256
Epoch 221/256
Epoch 222/256
Epoch 223/256
Epoch 224/256
Epoch 225/256
Epoch 226/256
Epoch 227/256
Epoch 228/256
Epoch 229/256
Epoch 230/256
Epoch 231/256
Epoch 232/256
Epoch 

Epoch 243/256
Epoch 244/256
Epoch 245/256
Epoch 246/256
Epoch 247/256
Epoch 248/256
Epoch 249/256
Epoch 250/256
Epoch 251/256
Epoch 252/256
Epoch 253/256
Epoch 254/256
Epoch 255/256
Epoch 256/256


<IPython.core.display.Javascript object>

In [18]:
# forecast the entire training dataset to build up state for forecasting
train_reshaped = train_scaled[:, 0].reshape(len(train_scaled), 1, 1)
lstm_model.predict(train_reshaped, batch_size=1)

array([[  1.14889222e-03],
       [  4.14664090e-01],
       [  1.04069861e-03],
       [  3.38487893e-01],
       [  9.62449994e-04],
       [  8.10564030e-03],
       [  5.99552179e-04],
       [  2.80909380e-03],
       [  4.81603965e-02],
       [  7.42009342e-01],
       [  2.44079763e-03],
       [  7.19859958e-01],
       [  5.31214941e-03],
       [  6.79030299e-01],
       [  2.71259807e-03],
       [  6.96812465e-04],
       [  5.58013856e-01],
       [  1.34018192e-03],
       [  5.42357624e-01],
       [  1.24095089e-03],
       [  3.23404670e-02],
       [  7.85897311e-04],
       [  5.62866092e-01]], dtype=float32)

In [19]:
# Save model
# serialize model to JSON
model_json = lstm_model.to_json()
with open("model.json", "w") as json_file:
    json_file.write(model_json)
# serialize weights to HDF5
lstm_model.save_weights("model.h5")
print("Saved model to disk")

with open('model_history.pkl', 'wb') as file_pi:
        pickle.dump(hist.history, file_pi)

Saved model to disk


In [20]:
%notify -m 'Notebook has finished running.'

<IPython.core.display.Javascript object>