In [1]:
# useing this variable for saving models and summaries
exp_name = "HRNN_synthetic_1"

## Running CNN then RNN
5 layers CNN [2, 2, 2, 2, 2], then RNN, bias_shape = [32,64,64, 64, 64]

In [4]:
%load_ext autoreload
%autoreload 2
import numpy as np
import tensorflow as tf
import sys
from hdf5storage import savemat
import hickle

sys.path.append('../src')

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


In [3]:
from models.HRNN_model import Model
import training  
import evaluation.nn_eval as nn_eval 

## Loading synthetic data

In [8]:
#loading data
data_path= '/data2/data/zebrahim/synthetic_dataset/data_8192_1000_3_4_4_.03_.03_.2' + 'processed_data2.h'

with open(data_path, 'r') as fin:
    data = hickle.load(fin)
    
train_data = data['train_data']
validation_data = data['validation_data']
test_data = data['test_data']

train_gt = np.expand_dims(data['train_gt'], axis=-1)
validation_gt = np.expand_dims(data['validation_gt'], axis=-1)
test_gt = np.expand_dims(data['test_gt'], axis=-1)

index_of_changes = data['index_of_changes']
 

In [9]:
train_data.shape

(890, 8192, 12)

## Model

In [10]:
## Model Parameter
n_variables= 12
learning_rate = 0.001
batch_size = 10

wavelet_levels= 6
convolution_levels = 5
pooling_stride = [2, 2, 2, 2, 2]
weights_shape = [[5,n_variables, 32],
                 [5, 32, 64],
                 [5, 64, 64],
                 [5, 64, 64],
                 [5, 64, 64]]

bias_shape = [32, 64, 64, 64, 64]
activation = tf.nn.relu
wavelet_weights_shape = [[5, n_variables, n_variables]]    #high_pass and low_pass dimensions

lstm_n_hidden = 128
n_classes = 1

##positive weight for weighted cross entropy
s = train_gt.shape
resolution = np.prod(pooling_stride)

pooled_gt = np.reshape(train_gt[:,:(s[0]*s[1]/resolution)*resolution,:], (s[0]*(s[1]/resolution), resolution, s[2])).max(axis=1)
pos_weight = (1.0 - pooled_gt.mean(axis = 0)) / pooled_gt.mean(axis=0)

variables_weights = np.ones((n_classes,))

In [11]:
pos_weight

array([ 3.18601822])

In [12]:
# Launch the graph
config = tf.ConfigProto()
config.gpu_options.allow_growth = True
sess = tf.Session(config=config)

In [13]:
summary_path = '../summary_synthetic/' + exp_name 
checkpoint_path = '../model_synthetic/' + exp_name + '/' + exp_name 


In [14]:
model = Model(n_variables = n_variables,
                            learning_rate = learning_rate,
                            n_classes = n_classes)

In [15]:
model.build_model(pos_weight = pos_weight, 
                 learning_rate = learning_rate,
                 wavelet_levels = wavelet_levels,    
                 convolution_levels = convolution_levels,    
                 pooling_stride = pooling_stride,     
                 weights_shape = weights_shape,
                 bias_shape = bias_shape,
                 wavelet_weights_shape = wavelet_weights_shape,    
                 activation = activation,
                 lstm_n_hidden = lstm_n_hidden,
                 trainable_wavelet = True,
                 trainable_conv = True,
                 trainable_last = True,
                 variables_weights = variables_weights,
                 optimizer = tf.train.AdamOptimizer
)

6
Tensor("Squeeze_29:0", shape=(?, ?, 64), dtype=float32)
Tensor("Squeeze_29:0", shape=(?, ?, 64), dtype=float32) Tensor("zeros:0", shape=(?, ?, 128), dtype=float32) 5
Tensor("Squeeze_24:0", shape=(?, ?, 64), dtype=float32) Tensor("Reshape:0", shape=(?, ?, ?), dtype=float32) 4
Tensor("Squeeze_19:0", shape=(?, ?, 64), dtype=float32) Tensor("Reshape_1:0", shape=(?, ?, ?), dtype=float32) 3
Tensor("Squeeze_14:0", shape=(?, ?, 64), dtype=float32) Tensor("Reshape_2:0", shape=(?, ?, ?), dtype=float32) 2
Tensor("Squeeze_9:0", shape=(?, ?, 64), dtype=float32) Tensor("Reshape_3:0", shape=(?, ?, ?), dtype=float32) 1
Tensor("Squeeze_4:0", shape=(?, ?, 64), dtype=float32) Tensor("Reshape_4:0", shape=(?, ?, ?), dtype=float32) 0
Tensor("Squeeze_30:0", shape=(?, ?, 1), dtype=float32) Tensor("Reshape_7:0", shape=(?, ?, 1), dtype=float32)


In [16]:
trainer = training.Trainer(model = model,
                    data_train = train_data,
                    ground_truth_train = train_gt,
                    data_validation = test_data,
                    ground_truth_validation = test_gt,
                    sess = sess,
                    summary_path = summary_path,
                    batch_size = batch_size,
                    global_step = 0,
                    eval_type = 'change')

In [17]:
trainer.train(max_iter = 20000,
                train_eval_step=100,
                validation_eval_step=100,
                display_step=100)

Training: 0
AUC = 0.241 vs. 0.242
F1 = 0.392 vs. 0.384
Precision = 0.307 vs. 0.238
Recall = 0.540 vs. 1.000
Validation: 0
AUC = 0.204 vs. 0.232
F1 = 0.376 vs. 0.376
Precision = 0.231 vs. 0.231
Recall = 1.000 vs. 1.000
Minibatch Loss= 1.069105
Training: 100
AUC = 0.589 vs. 0.241
F1 = 0.581 vs. 0.378
Precision = 0.442 vs. 0.238
Recall = 0.847 vs. 0.916
Validation: 100
AUC = 0.503 vs. 0.232
F1 = 0.483 vs. 0.376
Precision = 0.405 vs. 0.232
Recall = 0.597 vs. 0.997
Minibatch Loss= 0.822554
Training: 200
AUC = 0.721 vs. 0.202
F1 = 0.693 vs. 0.346
Precision = 0.673 vs. 0.209
Recall = 0.714 vs. 0.998
Validation: 200
AUC = 0.725 vs. 0.229
F1 = 0.674 vs. 0.376
Precision = 0.660 vs. 0.231
Recall = 0.688 vs. 1.000
Minibatch Loss= 0.692992
Training: 300
AUC = 0.903 vs. 0.207
F1 = 0.837 vs. 0.361
Precision = 0.847 vs. 0.220
Recall = 0.828 vs. 1.000
Validation: 300
AUC = 0.870 vs. 0.226
F1 = 0.785 vs. 0.376
Precision = 0.785 vs. 0.232
Recall = 0.786 vs. 0.997
Minibatch Loss= 0.489919
Training: 400
AU

KeyboardInterrupt: 

In [18]:
saver = tf.train.Saver()
saver.save(sess, checkpoint_path, global_step=trainer.global_step)

'../model_synthetic/HRNN_synthetic_1/HRNN_synthetic_1-6883'

In [None]:
#saver = tf.train.Saver()
#saver.restore(sess, checkpoint_path+'-1000')

In [19]:
_= nn_eval.evaluate_model (model, sess, test_data, test_gt)

AUC = 0.960 vs. 0.232
F1 = 0.893 vs. 0.376
Precision = 0.902 vs. 0.231
Recall = 0.884 vs. 1.000


In [20]:
out = nn_eval.deploy (model, sess, test_data, test_gt)

In [15]:
#shape of probability_change is (batch size, T, num_classes)
#since num_classes = 1 we squeeze that axis
probability_change = np.squeeze(probability_of_pos, axis = 2)

In [21]:
savemat('../poc/poc'+exp_name+'.mat', {'poc':out[:,:,-1]})