In [1]:
# Experiment name; used to build the paths for saved models, summaries and exported results
exp_name = "DWN2001_newWavelet"

# Neural wavelet network
Six wavelet levels followed by a five-layer CNN with pooling strides [2, 2, 2, 2, 2].

## Importing Libraries

In [2]:
%load_ext autoreload
%autoreload 2
import numpy as np
import tensorflow as tf
import sys
from hdf5storage import savemat
import pickle

sys.path.append('../src')

In [3]:
import models.New_wavelet as wavelet_conv_model
import training
import evaluation.nn_eval as nn_eval 

## Loading synthetic data

In [4]:
# Load the pre-processed synthetic dataset from disk.
# NOTE(review): the two string parts are joined without a path separator, so the
# file opened is ".../data_8192_1000_3_4_4_.03_.03_.2processed_data.p" -- confirm
# this is the intended file name. The absolute path is also machine-specific.
data_path= '/data2/data/zebrahim/synthetic_dataset/data_8192_1000_3_4_4_.03_.03_.2' + 'processed_data.p'

# Pickle streams are binary data, so the file must be opened in 'rb' mode
# (text mode only happens to work on Python 2 / POSIX).
# WARNING: pickle.load can execute arbitrary code; only load trusted files.
with open(data_path, 'rb') as fin:
    data = pickle.load(fin)

# Input series for the three splits
train_data = data['train_data']
validation_data = data['validation_data']
test_data = data['test_data']

# Ground-truth labels for the three splits, with a trailing singleton axis appended
train_gt = np.expand_dims(data['train_gt'], axis=-1)
validation_gt = np.expand_dims(data['validation_gt'], axis=-1)
test_gt = np.expand_dims(data['test_gt'], axis=-1)

index_of_changes = data['index_of_changes']
 

In [5]:
# Change indices for the test dataset: entries 900..999 of the full list.
# NOTE(review): the bounds are hard-coded -- confirm they match the test split.
test_rows = slice(900, 1000)
gt_test_idx_changes = index_of_changes[test_rows]

## Model

In [14]:
# Model hyper-parameters
n_variables = 12
learning_rate = 1e-3
batch_size = 10

wavelet_levels = 6        # how many wavelet layers the network contains
convolution_levels = 5    # how many convolution layers the network contains
pooling_stride = [2] * convolution_levels    # pooling stride used after every convolution

# One bias entry per convolution layer; the values match each kernel's last dimension.
bias_shape = [32, 64, 64, 64, 64]

# One kernel shape per convolution layer. The middle entry of each shape equals the
# last entry of the previous layer's shape (n_variables for the first layer).
# Presumably the layout is [kernel_width, in_channels, out_channels] -- TODO confirm.
weights_shape = [[5, n_in, n_out]
                 for n_in, n_out in zip([n_variables] + bias_shape[:-1], bias_shape)]
#wavelet_weights_shape = [[5, n_variables, n_variables]]    #high_pass and low_pass dimensions
wavelet_kernel_size = 3
activation = tf.nn.relu
# Product of all pooling strides, i.e. the combined down-sampling factor of the pooling layers
granularity = np.prod(pooling_stride)
n_classes = 1

## Positive weight for the weighted cross entropy
s = train_data.shape
# Same quantity as `granularity`; the name is kept in case other cells use it.
resolution = granularity
# Group the labels into consecutive windows of `resolution` samples.
# `//` keeps the window count an integer regardless of the interpreter's
# division semantics (plain `/` yields a float under true division, which is
# not a valid reshape dimension).
gt_effective = np.reshape(train_gt, (s[0] * (s[1] // resolution), resolution))
# Fraction of windows whose maximum label is positive (assumes 0/1 labels -- TODO confirm)
positive_fraction = gt_effective.max(axis=1).mean()
# Ratio of negative to positive windows
pos_weight = (1.0 - positive_fraction) / positive_fraction

In [7]:
# Function-call form prints the same text on Python 2 and is also valid on Python 3
print(pos_weight)

3.18601822124


In [8]:
# Create the TensorFlow session with GPU memory growth enabled
# (allow_growth=True), configured declaratively.
config = tf.ConfigProto(gpu_options=tf.GPUOptions(allow_growth=True))
sess = tf.Session(config=config)

In [9]:
# Output locations, both keyed by the experiment name
summary_path = '../summary/' + exp_name
model_dir = '../model/' + exp_name
# Checkpoint prefix: a file named after the experiment inside its own model directory
checkpoint_path = model_dir + '/' + exp_name

In [10]:
# Instantiate the wavelet/convolution model with the basic hyper-parameters
model = wavelet_conv_model.Model(
    n_variables=n_variables,
    learning_rate=learning_rate,
    n_classes=n_classes,
)

In [15]:
# Build the network from the hyper-parameters defined above.
# The wavelet, convolution and last-layer trainable flags are all switched on,
# and no variables_weights are supplied.
model.build_model(
    pos_weight=pos_weight,
    learning_rate=learning_rate,
    wavelet_levels=wavelet_levels,
    convolution_levels=convolution_levels,
    pooling_stride=pooling_stride,
    weights_shape=weights_shape,
    bias_shape=bias_shape,
    wavelet_kernel_size=wavelet_kernel_size,
    activation=activation,
    trainable_wavelet=True,
    trainable_conv=True,
    trainable_last=True,
    variables_weights=None,
)

In [16]:
# Hand the model, the train/validation splits, the session and the summary
# location to the trainer
trainer = training.Trainer(
    model=model,
    data_train=train_data,
    ground_truth_train=train_gt,
    data_validation=validation_data,
    ground_truth_validation=validation_gt,
    sess=sess,
    summary_path=summary_path,
    batch_size=batch_size,
)

In [17]:
# Train for 10000 iterations; the three step arguments are all set to 100
# (the log below reports training/validation metrics and the loss at that cadence)
trainer.train(
    max_iter=10000,
    train_eval_step=100,
    validation_eval_step=100,
    display_step=100,
)

Training: 0
AUC = 0.234 vs. 0.224
F1 = 0.401 vs. 0.363
Precision = 0.295 vs. 0.222
Recall = 0.627 vs. 1.000
Validation: 0
AUC = 0.308 vs. 0.234
F1 = 0.432 vs. 0.371
Precision = 0.292 vs. 0.228
Recall = 0.834 vs. 1.000
Minibatch Loss= 1.028049
Training: 100
AUC = 0.627 vs. 0.244
F1 = 0.627 vs. 0.387
Precision = 0.683 vs. 0.242
Recall = 0.579 vs. 0.962
Validation: 100
AUC = 0.691 vs. 0.218
F1 = 0.656 vs. 0.372
Precision = 0.601 vs. 0.228
Recall = 0.722 vs. 0.998
Minibatch Loss= 0.907921
Training: 200
AUC = 0.662 vs. 0.230
F1 = 0.655 vs. 0.368
Precision = 0.689 vs. 0.225
Recall = 0.623 vs. 1.000
Validation: 200
AUC = 0.707 vs. 0.227
F1 = 0.659 vs. 0.372
Precision = 0.701 vs. 0.229
Recall = 0.623 vs. 0.986
Minibatch Loss= 0.833184
Training: 300
AUC = 0.743 vs. 0.237
F1 = 0.726 vs. 0.387
Precision = 0.716 vs. 0.240
Recall = 0.737 vs. 0.998
Validation: 300
AUC = 0.737 vs. 0.222
F1 = 0.706 vs. 0.371
Precision = 0.783 vs. 0.228
Recall = 0.643 vs. 0.997
Minibatch Loss= 0.791215
Training: 400
AU

In [19]:
# Write a checkpoint of the session's variables; the trainer's global step is
# passed as global_step (it shows up as the numeric suffix of the returned path)
saver = tf.train.Saver()
saver.save(sess=sess,
           save_path=checkpoint_path,
           global_step=trainer.global_step)

'../model/DWN2001_newWavelet/DWN2001_newWavelet-10000'

In [23]:
# Evaluate the trained model on the test dataset (the metrics are printed below)
probability_of_pos = nn_eval.evaluate_model(model, sess, test_data, test_gt)

AUC = 0.839 vs. 0.232
F1 = 0.767 vs. 0.376
Precision = 0.774 vs. 0.231
Recall = 0.760 vs. 0.999


In [25]:
# Run the model on the test dataset through nn_eval.deploy and keep the raw result.
# NOTE(review): presumably the per-step class probabilities -- confirm against nn_eval.
out = nn_eval.deploy(model, sess, test_data, test_gt)

In [27]:
# Shape of `out` is (batch size, T, num_classes);
# since num_classes = 1 we squeeze that last axis.
# The rank guard makes this cell safe to re-run: once `out` is already 2-D there
# is no axis 2 left to remove, and squeezing again would raise an error.
if np.ndim(out) == 3:
    out = np.squeeze(out, axis=2)

In [28]:
# Display the dimensions of `out` after the class axis has been removed
out.shape

(100, 256)

In [30]:
# Export the squeezed output to a MATLAB .mat file under the key 'poc'
mat_path = '../poc/poc' + exp_name + '.mat'
savemat(mat_path, {'poc': out})