In [None]:
from sweat4science.workspace.Workspace import Workspace
from sweat4science.evaluation.sessionset import MF_sessionset as mfs
import sweat4science as s4s

import os
import numpy as np

import keras
from keras.models import Sequential
from keras.layers.core import Dense, Activation
from keras.layers.recurrent import LSTM
from keras.preprocessing.sequence import pad_sequences
from keras.models import model_from_json

from matplotlib import pyplot as plt
%matplotlib inline

from sklearn.model_selection import KFold
from s4s_rnn import utils, evaluation

# import sys
# print(sys.path)

In [None]:
# Location of the session data. The path can be overridden through the
# S4S_WORKSPACE environment variable so the notebook runs on other machines
# without editing this cell; the original path remains the default.
workspace_folder = os.environ.get("S4S_WORKSPACE", "/home/minh/workspace/git/rnd/session-data")
ws = Workspace(workspace_folder)
# NOTE(review): presumably returns the list of indoor running sessions -- confirm
# against sweat4science.evaluation.sessionset.
sessions = mfs.ICT_indoor(ws)


In [None]:
import re  # also needed by evaluate_cross_validation, defined further down

# Drop every session whose string representation mentions "slope".
# A new list is built instead of calling sessions.remove() inside the loop:
# removing from a list while iterating over it skips the element that follows
# each removed one, so back-to-back "slope" sessions were left in. Building a
# new list also keeps this cell re-runnable once `sessions` is a numpy array.
sessions = [session for session in sessions
            if re.search("slope", str(session)) is None]

# Converted to an array so that index arrays from KFold can select sessions.
sessions = np.array(sessions)
print("\n".join(map(str, sessions)))


In [None]:
def evaluate_cross_validation(sessions, result_dir, model_name, experiment_name, date_string,
                              time_steps, hidden_neurons, num_epoch, input_dim=4,
                              save_plot=False, time_horizon=None, old_norm=False,
                              plot_input=False):
    """Evaluate previously trained models with leave-one-session-out cross validation.

    The model architecture is read from ``<base_name>model.json`` and, for every
    held-out session, the matching ``<base_name><session>_weights.h5`` file is
    handed to ``utils.evaluate_model``. Per-fold MSE/RMSE are printed, a result
    plot is written next to the weights, and the overall MSE/RMSE across all
    folds are printed at the end.

    Parameters
    ----------
    sessions : array-like
        Sessions to evaluate on; must support indexing with the integer index
        arrays produced by ``KFold.split`` (e.g. a numpy array).
    result_dir : str
        Directory containing the saved model and weight files.
    model_name, experiment_name, date_string : str
        Components of the saved file names.
    time_steps : int
        Lookback length; forwarded to ``utils.get_data_from_sessions`` and part
        of the file name.
    hidden_neurons, num_epoch : int
        Used only to build file names and the prediction label.
    input_dim : int, optional
        Used only to build file names.
    save_plot : bool, optional
        Currently unused; kept for interface compatibility.
    time_horizon : int or None, optional
        Forwarded to ``utils.evaluate_model`` as ``horizon``. ``None`` labels
        the plots as a simulation instead of a prediction.
    old_norm : bool, optional
        Forwarded to ``utils.get_data_from_sessions``.
    plot_input : bool, optional
        When true, ``utils.plot_inputs`` is called on the last time step of the
        test inputs of every fold.

    Returns
    -------
    dict
        Maps ``"<session>_<number>"`` to the ``evaluation.ExperimentEvalutation``
        object of that fold.

    Raises
    ------
    ValueError
        If the string form of a test session does not contain
        ``.../running_indoor_<name>/<number>>``.
    """
    # Construct base name
    base_name = "%s_%s_%s_%02dstep_%02din_%03dhidden_%03depoch_" \
                % (model_name, experiment_name, date_string, time_steps, input_dim, hidden_neurons, num_epoch)
    base_name = os.path.join(result_dir, base_name)
    print("\nBase name: %s\n" % (base_name))

    # Read the serialized architecture once; the context manager closes the
    # file even if reading fails.
    with open(base_name + "model.json", 'r') as json_file:
        loaded_model_json = json_file.read()

    # Raw string so that "\d" reaches the regex engine as written.
    session_pattern = re.compile(r'.+/running_indoor_(.+)/(\d+)>')

    predictions = {}
    fold_predictions = []
    fold_true_outputs = []

    # One fold per session: each session is tested on exactly once.
    kf = KFold(len(sessions))
    for _, test_index in kf.split(sessions):
        test_sessions = sessions[test_index]
        print("\nTesting on:\n" + "\n".join(map(str, test_sessions)))

        # Fail with a clear message instead of an AttributeError on None.
        match = session_pattern.match(str(test_sessions[0]))
        if match is None:
            raise ValueError("Cannot extract session name from %r" % str(test_sessions[0]))
        session_label, session_number = match.groups()[0], match.groups()[1]

        test_data_x, test_data_y, scaler = \
            utils.get_data_from_sessions(test_sessions, time_steps, return_norm=True, old_norm=old_norm)

        # A fresh model per fold; its weights are loaded from the fold's file.
        loaded_model = model_from_json(loaded_model_json)

        cross_validation_name = base_name + session_label + "_" + session_number + "_"
        session_name = "%s_%s" % (session_label, session_number)
        prediction_name = "%2dlookback_%dneurons" % (time_steps, hidden_neurons)
        if time_horizon is not None:
            prediction_name += "%dhorizon" % time_horizon

        experiment_result = evaluation.ExperimentEvalutation(exp_name=session_name, scaler=scaler,
                                                             true_output=test_data_y)

        prediction = utils.evaluate_model(loaded_model, cross_validation_name + "weights.h5",
                                          test_data_x, test_data_y, horizon=time_horizon)
        experiment_result.add_prediction(prediction_name, prediction, unnormalize=True)

        print("MSE: %.5f\nRMSE: %.5f" % (experiment_result.mse[prediction_name],
                                         np.sqrt(experiment_result.mse[prediction_name])))

        if time_horizon is None:
            plot_title = "Heart rate simulation for running_indoor_"
        else:
            plot_title = "Heart rate prediction at %ds horizon for running_indoor_" % time_horizon
        plot_title += session_label + "/" + session_number + ", lookback of " + str(time_steps)

        fold_prediction = experiment_result.predictions[prediction_name]
        # The prediction may be shorter than the true output, so only the
        # trailing part of the true output is compared against it. The same
        # aligned slice is used for the plot and for the overall error below;
        # previously the full true output was accumulated, which breaks the
        # final subtraction whenever the lengths differ.
        aligned_true_output = experiment_result.true_output[-len(prediction):]

        utils.plot_predictions(fold_prediction, aligned_true_output,
                               cross_validation_name + "result.png", plot_title)

        if plot_input:
            # Inputs at the last time step of every sample.
            utils.plot_inputs(test_data_x[:, -1, :])

        fold_predictions.append(fold_prediction)
        fold_true_outputs.append(aligned_true_output)

        predictions[session_name] = experiment_result

    # Overall error across all folds.
    test_predictions = np.concatenate(fold_predictions, axis=0)
    test_actual_outputs = np.concatenate(fold_true_outputs, axis=0)
    mse = np.mean((test_predictions - test_actual_outputs)**2)
    rmse = np.sqrt(mse)
    print("\nOverall results:\n MSE: %.5f\n RMSE: %.5f" % (mse, rmse))

    return predictions


In [None]:
# LSTM trained 2016-12-05, lookback of 5, no prediction horizon (simulation).
evaluate_cross_validation(
    sessions=sessions,
    result_dir="../train_results",
    model_name="lstm",
    experiment_name="indoor",
    date_string="20161205",
    time_steps=5,
    hidden_neurons=400,
    num_epoch=150,
    time_horizon=None,
)

In [None]:
# GRU trained 2016-12-08, lookback of 5, no prediction horizon (simulation).
evaluate_cross_validation(
    sessions=sessions,
    result_dir="../train_results",
    model_name="gru",
    experiment_name="indoor",
    date_string="20161208",
    time_steps=5,
    hidden_neurons=400,
    num_epoch=150,
    time_horizon=None,
)

In [None]:
# LSTM trained 2016-11-14, lookback of 5, evaluated with old_norm=True.
evaluate_cross_validation(
    sessions=sessions,
    result_dir="../train_results",
    model_name="lstm",
    experiment_name="indoor",
    date_string="20161114",
    time_steps=5,
    hidden_neurons=400,
    num_epoch=150,
    time_horizon=None,
    old_norm=True,
)

In [None]:
# LSTM trained 2016-12-05, lookback of 10, no prediction horizon (simulation).
# model_name is a required argument of evaluate_cross_validation; omitting it
# raised a TypeError. "lstm" + "indoor" produces the same "lstm_indoor_..."
# file prefix that the former experiment_name="lstm_indoor" stood for.
evaluate_cross_validation(sessions=sessions, result_dir="../train_results", model_name="lstm", experiment_name="indoor",
                          date_string="20161205", time_steps=10, hidden_neurons=400, num_epoch=150, time_horizon=None,
                          old_norm=False)

In [None]:
# evaluate_cross_validation(sessions=sessions, result_dir="../train_results", experiment_name="lstm_indoor",
#                           date_string="20161114", time_steps=10, hidden_neurons=400, num_epoch=150, time_horizon=None,
#                           old_norm=True)

In [None]:
# LSTM trained 2016-12-05, lookback of 15, no prediction horizon (simulation).
# model_name is a required argument of evaluate_cross_validation; omitting it
# raised a TypeError. "lstm" + "indoor" produces the same "lstm_indoor_..."
# file prefix that the former experiment_name="lstm_indoor" stood for.
evaluate_cross_validation(sessions=sessions, result_dir="../train_results", model_name="lstm", experiment_name="indoor",
                          date_string="20161205", time_steps=15, hidden_neurons=400, num_epoch=150, time_horizon=None,
                          old_norm=False)

In [None]:
# LSTM trained 2016-12-05, lookback of 10, prediction horizon of 30.
evaluate_cross_validation(
    sessions=sessions,
    result_dir="../train_results",
    model_name="lstm",
    experiment_name="indoor",
    date_string="20161205",
    time_steps=10,
    hidden_neurons=400,
    num_epoch=150,
    time_horizon=30,
)

In [None]:
# LSTM trained 2016-12-05, lookback of 10, additionally plotting the inputs.
# model_name is a required argument of evaluate_cross_validation; omitting it
# raised a TypeError. "lstm" + "indoor" produces the same "lstm_indoor_..."
# file prefix that the former experiment_name="lstm_indoor" stood for.
evaluate_cross_validation(sessions=sessions, result_dir="../train_results", model_name="lstm", experiment_name="indoor",
                          date_string="20161205", time_steps=10, hidden_neurons=400, num_epoch=150, old_norm=False,
                          plot_input=True)

In [None]:
# LSTM trained 2016-11-14, lookback of 10, old_norm=True, plotting the inputs.
# model_name is a required argument of evaluate_cross_validation; omitting it
# raised a TypeError. "lstm" + "indoor" produces the same "lstm_indoor_..."
# file prefix that the former experiment_name="lstm_indoor" stood for.
evaluate_cross_validation(sessions=sessions, result_dir="../train_results", model_name="lstm", experiment_name="indoor",
                          date_string="20161114", time_steps=10, hidden_neurons=400, num_epoch=150, old_norm=True,
                          plot_input=True)

In [None]:
# Sigmoid variant trained 2016-11-27, lookback of 10.
# model_name is a required argument of evaluate_cross_validation; omitting it
# raised a TypeError. "lstm" + "indoor_sigmoid" produces the same
# "lstm_indoor_sigmoid_..." file prefix that the former
# experiment_name="lstm_indoor_sigmoid" stood for.
evaluate_cross_validation(sessions=sessions, result_dir="../train_results", model_name="lstm",
                          experiment_name="indoor_sigmoid",
                          date_string="20161127", time_steps=10, hidden_neurons=400, num_epoch=150)

In [None]:
# Evaluate the LSTM models trained on the artificial sin(x) + x data set.
data = np.genfromtxt("artificial_data/sinx_plus_x.csv", delimiter=',')
plt.figure(figsize=(10, 7))
plt.title("Artificially generated data")
plt.plot(data[:, -1:], 'g*')  # last column is treated as the output
plt.show()

# Standardize every column with its own mean and standard deviation.
data_mean = np.mean(data, axis=0)
data_std = np.std(data, axis=0)
data = (data - data_mean) / data_std

# The last 10% of the rows are used for testing; all columns but the last
# are inputs, the last column is the target.
num_train = int(0.9*len(data))
test_data_x_ = data[num_train:, :-1]
test_data_y = data[num_train:, -1:]

input_dim = 2
output_dim = 1
hidden_neurons = 400
num_epoch = 50
for ntsteps in [5, 10, 15]:
    base_name = "lstm_sinx_plus_x_" + str(ntsteps) + "step_" + str(input_dim) +\
                "in_" + str(hidden_neurons) + "hidden_" + "20161116" +\
                "_" + str(num_epoch) + "epoch_"
    base_name = os.path.join("train_results", base_name)

    # The context manager closes the file even if reading fails.
    with open(base_name + "model.json", 'r') as json_file:
        loaded_model_json = json_file.read()

    loaded_model = model_from_json(loaded_model_json)

    test_data_x = utils.reshape_array_by_time_steps(test_data_x_, time_steps=ntsteps)

    # NOTE(review): this call passes mean/std positionally and unpacks three
    # return values, whereas evaluate_cross_validation calls
    # utils.evaluate_model(model, weights, x, y, horizon=...) and uses a single
    # return value. One of the two usages is probably stale -- confirm against
    # the current s4s_rnn.utils.evaluate_model signature.
    test_data_y_unnormed, test_predict_unnormed, mse = \
            utils.evaluate_model(loaded_model, base_name + "weights.h5",
                                 test_data_x, test_data_y, data_mean[-1], data_std[-1])

    print("MSE: %.5f\nRMSE: %.5f" % (mse, np.sqrt(mse)) )

    # Plot
    utils.plot_predictions(test_predict_unnormed, test_data_y_unnormed, base_name + "result.png",
                           "Artificial data of function sin(x) + x, lookback of " + str(ntsteps), y_label="Output")

