In [1]:
# Experiment name; used below to build the summary, checkpoint and output (.mat) paths.
exp_name = "RCNN1001_y"

## Running CNN then RNN
A 5-layer CNN (pooling strides [2, 2, 2, 2, 2]) followed by an RNN (LSTM); bias_shape = [32, 64, 64, 64, 64]

In [2]:
%load_ext autoreload
%autoreload 2
import numpy as np
import tensorflow as tf
import sys
from hdf5storage import savemat
import pickle

sys.path.append('../../src')
sys.path.append('../../src/models')

In [3]:
import models.CNN_lstm_model as CNN_lstm_model
import training  
import evaluation.nn_eval as nn_eval 

## Loading synthetic data

In [4]:
# Load the pre-processed synthetic dataset (a pickled mapping keyed by split name).
data_path = '../../data/synthetic2/' + 'processed3.p'

# Pickle streams are bytes, so the file must be opened in binary mode ('rb');
# text mode ('r') fails on Python 3 and is not portable across platforms.
# NOTE(review): pickle.load can execute arbitrary code -- only load files you trust.
with open(data_path, 'rb') as fin:
    data = pickle.load(fin)

# Inputs for each split.
train_data = data['train_data']
validation_data = data['validation_data']
test_data = data['test_data']

# Ground-truth labels for each split, with a trailing singleton axis appended.
train_gt = np.expand_dims(data['train_gt'], axis=-1)
validation_gt = np.expand_dims(data['validation_gt'], axis=-1)
test_gt = np.expand_dims(data['test_gt'], axis=-1)

index_of_changes = data['index_of_changes']

## Model

In [5]:
## Model parameters
n_variables = 12
learning_rate = 0.001
batch_size = 10

# One entry per convolutional layer (5 layers).
pooling_stride = [2, 2, 2, 2, 2]
# NOTE(review): each row looks like [kernel width, input channels, output channels]
# -- confirm against CNN_lstm_model.
weights_shape = [[5, n_variables, 32],
                 [5, 32, 64],
                 [5, 64, 64],
                 [5, 64, 64],
                 [5, 64, 64]]

bias_shape = [32, 64, 64, 64, 64]
activation = tf.nn.relu

lstm_n_hidden = 128
n_classes = 1


# Positive weight for the weighted cross entropy.
# The training labels are regrouped into rows of `resolution` consecutive values
# (resolution = product of the pooling strides). Assuming 0/1 labels, the mean of
# the per-row maxima is the fraction of rows containing a positive, and pos_weight
# is the negative-to-positive ratio of those rows.
s = train_data.shape
resolution = np.prod(pooling_stride)
# Floor division keeps the row count an integer; `/` yields a float on Python 3,
# which np.reshape rejects as a dimension.
gt_effective = np.reshape(train_gt, (s[0] * (s[1] // resolution), resolution))
positive_fraction = gt_effective.max(axis=1).mean()
pos_weight = (1.0 - positive_fraction) / positive_fraction

In [6]:
# Display the positive-class weight computed in the previous cell.
pos_weight

14.854262989736288

In [7]:
# Create the TensorFlow session that the trainer and the evaluation cells below share.
config = tf.ConfigProto()
# allow_growth asks TensorFlow to allocate GPU memory incrementally as needed
# (see the tf.GPUOptions documentation).
config.gpu_options.allow_growth = True
sess = tf.Session(config=config)

In [8]:
# Directory handed to training.Trainer for this experiment's summaries.
summary_path = '../../summary_synthetic/train_abrupt_test_gradual/' + exp_name
# Checkpoint path prefix <exp_name>/<exp_name>, used by the tf.train.Saver cells.
checkpoint_path = ('../../model_synthetic/train_abrupt_test_gradual/'
                   + exp_name + '/' + exp_name)

In [9]:
# Instantiate the model object; its network is built by build_cnn_lstm_net in the next cell.
model = CNN_lstm_model.Model(n_variables, n_classes)

In [10]:
# Build the CNN -> LSTM network from the hyperparameters defined in the
# "Model Parameter" cell. Most arguments are positional, so their order must
# match build_cnn_lstm_net's signature.
# NOTE(review): trainable_conv / trainable_last presumably control whether the
# convolutional layers and the final layer are trained -- confirm in CNN_lstm_model.
model.build_cnn_lstm_net(pooling_stride,
                         weights_shape,
                         bias_shape,
                         activation,
                         lstm_n_hidden,
                         n_classes,
                         learning_rate,
                         pos_weight,
                         trainable_conv=True,
                         trainable_last=True)


In [11]:
# Bundle the model, the train/validation splits and the session into a Trainer.
# global_step=0 starts the step counter at zero (the first log line is "Training: 0").
train_obj = training.Trainer(
    model,
    train_data, train_gt,
    validation_data, validation_gt,
    sess,
    summary_path,
    batch_size,
    global_step=0
)

In [12]:
# First training run: 10000 iterations, with train/validation metrics and the
# minibatch loss reported every 100 steps.
train_obj.train(
    max_iter=10000,
    train_eval_step=100,
    validation_eval_step=100,
    display_step=100
)

Training: 0
AUC = 0.104 vs. 0.056
F1 = 0.126 vs. 0.114
Precision = 0.068 vs. 0.061
Recall = 0.950 vs. 0.975
Validation: 0
AUC = 0.134 vs. 0.075
F1 = 0.247 vs. 0.165
Precision = 0.147 vs. 0.090
Recall = 0.783 vs. 1.000
Minibatch Loss= 1.545129
Training: 100
AUC = 0.985 vs. 0.059
F1 = 0.938 vs. 0.116
Precision = 0.942 vs. 0.062
Recall = 0.934 vs. 0.959
Validation: 100
AUC = 0.119 vs. 0.134
F1 = 0.193 vs. 0.212
Precision = 0.109 vs. 0.163
Recall = 0.826 vs. 0.304
Minibatch Loss= 0.183488
Training: 200
AUC = 0.925 vs. 0.055
F1 = 0.850 vs. 0.113
Precision = 0.833 vs. 0.060
Recall = 0.868 vs. 0.992
Validation: 200
AUC = 0.261 vs. 0.116
F1 = 0.284 vs. 0.174
Precision = 0.202 vs. 0.116
Recall = 0.478 vs. 0.348
Minibatch Loss= 0.247138
Training: 300
AUC = 0.997 vs. 0.067
F1 = 0.983 vs. 0.123
Precision = 1.000 vs. 0.074
Recall = 0.967 vs. 0.364
Validation: 300
AUC = 0.177 vs. 0.158
F1 = 0.276 vs. 0.202
Precision = 0.165 vs. 0.209
Recall = 0.848 vs. 0.196
Minibatch Loss= 0.156044
Training: 400
AU

In [21]:
# Continue training for 5000 more iterations; the Trainer resumes from its
# current global step (the log below starts at step 10000).
# NOTE(review): this cell's execution count (21) is later than that of the
# evaluation cells further down (17-20), so those saved results presumably
# predate this extra training.
train_obj.train(
    max_iter=5000,
    train_eval_step=100,
    validation_eval_step=100,
    display_step=100
)

Training: 10000
AUC = 1.000 vs. 0.063
F1 = 1.000 vs. 0.115
Precision = 1.000 vs. 0.064
Recall = 1.000 vs. 0.587
Validation: 10000
AUC = 0.266 vs. 0.076
F1 = 0.288 vs. 0.172
Precision = 0.259 vs. 0.094
Recall = 0.326 vs. 0.957
Minibatch Loss= 0.147919
Training: 10100
AUC = 1.000 vs. 0.072
F1 = 1.000 vs. 0.135
Precision = 1.000 vs. 0.114
Recall = 1.000 vs. 0.165
Validation: 10100
AUC = 0.266 vs. 0.111
F1 = 0.288 vs. 0.202
Precision = 0.259 vs. 0.157
Recall = 0.326 vs. 0.283
Minibatch Loss= 0.147891
Training: 10200
AUC = 1.000 vs. 0.056
F1 = 1.000 vs. 0.112
Precision = 1.000 vs. 0.060
Recall = 1.000 vs. 1.000
Validation: 10200
AUC = 0.267 vs. 0.119
F1 = 0.288 vs. 0.171
Precision = 0.259 vs. 0.095
Recall = 0.326 vs. 0.848
Minibatch Loss= 0.147880
Training: 10300
AUC = 1.000 vs. 0.060
F1 = 1.000 vs. 0.116
Precision = 1.000 vs. 0.062
Recall = 1.000 vs. 0.893
Validation: 10300
AUC = 0.268 vs. 0.080
F1 = 0.288 vs. 0.165
Precision = 0.259 vs. 0.090
Recall = 0.326 vs. 1.000
Minibatch Loss= 0.147

In [23]:
# Another 5000-iteration continuation (the log below starts at step 15000).
# NOTE(review): the saved output ends in KeyboardInterrupt, so this run was
# interrupted before completing.
train_obj.train(
    max_iter=5000,
    train_eval_step=100,
    validation_eval_step=100,
    display_step=100
)

Training: 15000
AUC = 1.000 vs. 0.065
F1 = 1.000 vs. 0.122
Precision = 1.000 vs. 0.067
Recall = 1.000 vs. 0.711
Validation: 15000
AUC = 0.337 vs. 0.096
F1 = 0.400 vs. 0.197
Precision = 0.310 vs. 0.120
Recall = 0.565 vs. 0.543
Minibatch Loss= 0.147938
Training: 15100
AUC = 1.000 vs. 0.062
F1 = 0.992 vs. 0.114
Precision = 0.984 vs. 0.061
Recall = 1.000 vs. 0.967
Validation: 15100
AUC = 0.337 vs. 0.089
F1 = 0.397 vs. 0.183
Precision = 0.306 vs. 0.107
Recall = 0.565 vs. 0.630
Minibatch Loss= 0.148150
Training: 15200
AUC = 1.000 vs. 0.065
F1 = 1.000 vs. 0.118
Precision = 1.000 vs. 0.064
Recall = 1.000 vs. 0.702
Validation: 15200
AUC = 0.336 vs. 0.087
F1 = 0.400 vs. 0.169
Precision = 0.310 vs. 0.092
Recall = 0.565 vs. 0.978
Minibatch Loss= 0.147904
Training: 15300
AUC = 1.000 vs. 0.059
F1 = 1.000 vs. 0.113
Precision = 1.000 vs. 0.060
Recall = 1.000 vs. 0.893
Validation: 15300
AUC = 0.335 vs. 0.081
F1 = 0.397 vs. 0.165
Precision = 0.306 vs. 0.090
Recall = 0.565 vs. 1.000
Minibatch Loss= 0.147

KeyboardInterrupt: 

In [None]:
# Checkpoint the session's variables under checkpoint_path, tagged with the
# trainer's current global step.
# NOTE(review): TF's Saver is expected to append "-<global_step>" to the file
# name and to need the parent directory to exist already -- confirm for the
# TF version in use.
saver = tf.train.Saver()
saver.save(sess, checkpoint_path, global_step=train_obj.global_step)

In [None]:
# Reload variables into the session from the checkpoint with suffix '-1000'.
# NOTE(review): the suffix is hard-coded, while the save cell tags checkpoints
# with train_obj.global_step; this presumably targets a step-1000 checkpoint --
# confirm that file exists and is the one meant to be evaluated.
# NOTE(review): neither checkpoint cell has an execution count, so the saved
# evaluation outputs below were apparently produced without running them.
saver = tf.train.Saver()
saver.restore(sess, checkpoint_path+'-1000')

In [17]:
# Score the model on the test split; the return value is discarded and only
# the printed metrics are kept.
_ = nn_eval.evaluate_model(model, sess, test_data, test_gt)

AUC = 0.247 vs. 0.068
F1 = 0.254 vs. 0.128
Precision = 0.419 vs. 0.069
Recall = 0.182 vs. 0.829


In [18]:
# Run the model over the test split and keep its output for the squeeze and
# save cells that follow.
out = nn_eval.deploy(model, sess, test_data, test_gt)

In [19]:
# shape of probability_change is (batch size, T, num_classes)
# since num_classes = 1 we squeeze that axis.
# This cell rebinds `out`, so the squeeze is guarded: re-running the cell would
# otherwise fail because the already-squeezed 2-D array has no axis 2.
if np.ndim(out) != 2:
    out = np.squeeze(out, axis=2)

In [20]:
# Write the model outputs to a .mat file named after the experiment, under the key 'poc'.
savemat('../../poc_synthetic/train_abrupt_test_gradual/poc' + exp_name + '.mat',
        {'poc': out})