In [1]:
from dataset import BPI2012Dataset
from parameters.dataset import BPI2012Parameters
from utils.save import get_json_dict
from parameters.training import TrainingParameters, LossParameters, OptimizerParameters
from parameters.model import LSTMPredNextModelParameters
from model import LSTMPredNextModel
from controller import TrainingController

In [2]:
# Dataset configuration for the BPI Challenge 2012 event log. No arguments are
# passed, so every field keeps the default declared on BPI2012Parameters.
bpi_2012_parms = BPI2012Parameters()

In [3]:
# Show the dataset parameters as a dict so the exact configuration used for
# this run is recorded in the notebook output.
get_json_dict(bpi_2012_parms)

{'file_path': './data/event_logs/BPI_Challenge_2012.xes',
 'preprocessed_folder_path': './data/preprocessed/BPI_Challenge_2012_with_resource',
 'include_types': ['A'],
 'include_complete_only': True}

In [4]:
# Build the dataset from the parameters defined earlier in the notebook.
# NOTE(review): the log line printed by this cell suggests a cached,
# preprocessed copy is loaded when one exists — confirm in BPI2012Dataset.
dataset = BPI2012Dataset(bpi_2012_parms)


| Preprocessed data loaded successfully: ./data/preprocessed/BPI_Challenge_2012_with_resource/A_CompleteOnly 


In [5]:
# Model hyperparameters, left at the LSTMPredNextModelParameters defaults.
model_params = LSTMPredNextModelParameters()

In [6]:
# Show the model hyperparameters (embedding sizes, LSTM/dense widths, dropout)
# so they are recorded alongside the results.
get_json_dict(model_params)

{'activity_embedding_dim': 32,
 'resource_embedding_dim': 128,
 'lstm_hidden': 64,
 'dense_dim': 64,
 'dropout': 0.1}

In [7]:
# Instantiate the next-step prediction model. It receives the activity and
# resource vocabularies exposed by the dataset plus the hyperparameter object.
model = LSTMPredNextModel(
    activity_vocab=dataset.activity_vocab,
    resource_vocab=dataset.resource_vocab,
    parameters=model_params,
)

In [8]:
# Training configuration: only stop_epoch is overridden; every other field
# keeps the TrainingParameters default.
train_params = TrainingParameters(stop_epoch=20)

In [9]:
# Show the full training configuration, including the fields that were left
# at their defaults.
get_json_dict(train_params)

{'stop_epoch': 20,
 'batch_size': 128,
 'verbose_freq': 250,
 'run_validation_freq': 80,
 'train_test_split_portion': [0.8, 0.1],
 'random_seed': 12345}

In [10]:
# Loss configuration, left at the LossParameters defaults.
loss_params = LossParameters()

In [12]:
# Show the loss settings that are later handed to the training controller.
get_json_dict(loss_params)

{'loss': 'CrossEntropy', 'from_logits': False}

In [13]:
# Optimizer configuration, left at the OptimizerParameters defaults.
optim_params = OptimizerParameters()

In [14]:
# Show the optimizer settings (optimizer type, learning rate, regularisation
# and learning-rate scheduler options) used for this run.
get_json_dict(optim_params)

{'optimizer': 'Adam',
 'learning_rate': 0.005,
 'l2': 1e-10,
 'lr_scheduler': 'ExponentialDecay',
 'lr_step_scheduler_step': 800,
 'lr_setp_scheduler_gamma': 0.8,
 'lr_exp_decay_scheduler_step': 1000,
 'lr_exp_decay_scheduler_rate': 0.96,
 'lr_exp_decay_scheduler_staircase': True,
 'SGD_momentum': 0.9}

In [15]:
# Wire everything together: the controller takes, positionally, the dataset,
# the model, and the training / optimizer / loss parameter objects.
controller = TrainingController(
    dataset, model, train_params, optim_params, loss_params
)


| Running on /job:localhost/replica:0/task:0/device:CPU:0  


In [16]:
# Print the model summary: one row per layer with its output shape and
# parameter count.
controller.model_info()

Model: "LSTMPredNextModel"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
embedding (Embedding)        multiple                  416       
_________________________________________________________________
embedding_1 (Embedding)      multiple                  8192      
_________________________________________________________________
lstm (LSTM)                  multiple                  24832     
_________________________________________________________________
lstm_1 (LSTM)                multiple                  33024     
_________________________________________________________________
lstm_2 (LSTM)                multiple                  49408     
_________________________________________________________________
lstm_3 (LSTM)                multiple                  33024     
_________________________________________________________________
sequential (Sequential)      (1, 64)             

In [17]:
# To monitor training live, run TensorBoard in a separate shell:
#   tensorboard --logdir logs/gradient_tape --host localhost --port 8088
# The value returned by train() is kept as `test_accuracy` and is passed to
# model.get_folder_path() later in the notebook.
# NOTE(review): presumably the accuracy on the held-out test split — confirm
# in TrainingController.train().
test_accuracy = controller.train()


| Training records in logs/gradient_tape/20210706-164147 

| Total epochs: 20 

| Total steps: 1640 

| Start epoch 0 

| Evaluation result | Loss [0.9076] | Accuracy [0.3250]  

| Start epoch 1 

| Evaluation result | Loss [0.6171] | Accuracy [0.6012]  

| Start epoch 2 

| Evaluation result | Loss [0.3713] | Accuracy [0.6532]  

| Start epoch 3 

| Evaluation result | Loss [0.2480] | Accuracy [0.8403]  

| Start epoch 4 

| Evaluation result | Loss [0.2161] | Accuracy [0.8398]  

| Start epoch 5 

| Evaluation result | Loss [0.2108] | Accuracy [0.8406]  

| Start epoch 6 

| Evaluation result | Loss [0.2106] | Accuracy [0.8422]  

| Start epoch 7 

| Evaluation result | Loss [0.2104] | Accuracy [0.8441]  

| Start epoch 8 

| Evaluation result | Loss [0.2107] | Accuracy [0.8437]  

| Start epoch 9 

| Evaluation result | Loss [0.2109] | Accuracy [0.8419]  

| Start epoch 10 

| Evaluation result | Loss [0.2110] | Accuracy [0.8422]  

| Start epoch 11 

| Evaluation result | Loss [0.

In [18]:
# Disabled: alternative way to obtain `test_accuracy`. The training cell
# already assigns it from controller.train(), so this call is not needed for a
# normal top-to-bottom run.
# test_accuracy = controller.perform_eval_on_testset()

In [19]:
# Ask the model for the output folder of this run. The notebook file name,
# the accuracy returned by training and the dataset description are passed in.
save_folder_path = model.get_folder_path(
    "bpi_2012_pred_next_training.ipynb",
    test_accuracy,
    dataset.info_str(),
)

In [20]:
# Persist the run into save_folder_path: the parameter objects through the
# controller first, then the model. Keep this order — the log output below is
# emitted in the same sequence.
controller.save_parameters(save_folder_path)
model.save(save_folder_path)


| Parameters saved successfully to: ./SavedModels/0.8441_LSTMPredNextModel_A_CompleteOnly_2021-07-06 16'46'36.809124  

| Vocabs saved successfully to: ./SavedModels/0.8441_LSTMPredNextModel_A_CompleteOnly_2021-07-06 16'46'36.809124  

| Model saved successfully to: ./SavedModels/0.8441_LSTMPredNextModel_A_CompleteOnly_2021-07-06 16'46'36.809124  


In [20]:
# Disabled: counterpart of the save cell.
# NOTE(review): presumably restores the parameters and the model from
# save_folder_path — confirm before re-enabling.
# controller.load_parameters(save_folder_path)
# model.load(save_folder_path)