In [1]:
# useing this variable for saving models and summaries
exp_name = "DWN9005_opp"

## Importing Libraries

In [2]:
%load_ext autoreload
%autoreload 2
import tensorflow as tf
import numpy as np
from hdf5storage import savemat
import hickle 

import sys
sys.path.append('../src')

In [3]:
import models.wavelet_conv_model_light as wavelet_conv_model
import training
import evaluation.nn_eval_activity as nn_eval

## Loading synthetic data

In [4]:
#loading data
data_path= '../data/opp1.hkl'
with open(data_path, 'r') as fin:
    data = hickle.load(fin)

In [5]:
train_data = data['train_data']
validation_data = data['validation_data']
test_data = data['test_data']

train_gt = data['train_gt']
validation_gt = data['validation_gt']
test_gt = data['test_gt']

In [6]:
train_data.shape, train_gt.shape

((1, 700165, 77), (1, 700165, 18))

In [7]:
test_data.shape, test_gt.shape

((1, 120516, 77), (1, 120516, 18))

## Model

In [8]:
# Model parameters
n_variables = 77
learning_rate = 0.001
batch_size = 1

wavelet_levels = 5    #number of wavelet layer to have in the network
convolution_levels = 3    #number of convolution to have in the network
pooling_stride = [4, 4, 4]
weights_shape = [[5, n_variables, 32],
                 [5, 32, 32],
                 [5, 32, 32]]
bias_shape = [32, 32, 32]
wavelet_kernel_size = 5    #high_pass and low_pass dimensions
activation = tf.nn.relu
n_classes = 18

##positive weight for weighted cross entropy
s = train_gt.shape
resolution = np.prod(pooling_stride)
pooled_gt = np.reshape(train_gt[0,:(s[0]*s[1]/resolution)*resolution,:], (s[0]*(s[1]/resolution), resolution, s[2])).max(axis=1)
pos_weight = (1.0 - pooled_gt.mean(axis = 0)) / pooled_gt.mean(axis=0)


In [9]:
train_data = train_data[:,:-(train_data.shape[1]%((2**(wavelet_levels-1))*resolution)),:]
validation_data = validation_data[:,:-(validation_data.shape[1]%((2**(wavelet_levels-1))*resolution)),:]
test_data = test_data[:,:-(test_data.shape[1]%((2**(wavelet_levels-1))*resolution)),:]

train_gt = train_gt[:,:-(train_gt.shape[1]%((2**(wavelet_levels-1))*resolution)),:]
validation_gt = validation_gt[:,:-(validation_gt.shape[1]%((2**(wavelet_levels-1))*resolution)),:]
test_gt = test_gt[:,:-(test_gt.shape[1]%((2**(wavelet_levels-1))*resolution)),:]


In [10]:
pos_weight.shape

(18,)

In [11]:
pos_weight

array([  0.15400844,  34.75163399,  34.29032258,  35.46666667,
        35.7114094 ,  26.21393035,  26.69620253,  39.51851852,
        40.59695817,  45.55319149,  50.12149533,  48.50226244,
        52.10679612,  43.11290323,  43.11290323,  33.08099688,
        10.4795383 ,  35.83501684])

In [12]:
# Launch the graph
config = tf.ConfigProto()
config.gpu_options.allow_growth = True
sess = tf.Session(config=config)

In [13]:
summary_path = '../summary/' + exp_name 
checkpoint_path = '../model/' + exp_name + '/checkpoint' 

In [14]:
model = wavelet_conv_model.Model(n_variables = n_variables,
                                 learning_rate = learning_rate,
                                 n_classes = n_classes)

In [15]:
model.build_neural_wavelet_layer(pos_weight = pos_weight, 
                                 learning_rate = learning_rate,
                                 wavelet_levels = wavelet_levels,    
                                 convolution_levels = convolution_levels,    
                                 pooling_stride = pooling_stride,     
                                 weights_shape = weights_shape,
                                 bias_shape = bias_shape,
                                 wavelet_kernel_size = wavelet_kernel_size,    
                                 activation = activation)
                        

TypeError: build_neural_wavelet_layer() takes exactly 13 arguments (10 given)

In [None]:
trainer = training.Trainer(model = model,
                    data_train = train_data,
                    ground_truth_train = train_gt,
                    data_validation = test_data,
                    ground_truth_validation = test_gt,
                    sess = sess,
                    summary_path = summary_path,
                    batch_size = batch_size,
                    global_step = 0,
                    eval_type = 'activity')

In [17]:
trainer.run_debug_ops()

{'wavelet_out_shape': [array([     1, 699392,     77], dtype=int32), array([     1, 349696,     77], dtype=int32), array([     1, 174848,     77], dtype=int32), array([    1, 87424,    77], dtype=int32), array([    1, 43712,    77], dtype=int32)], 'cnn_out_shape': [array([    1, 10928,    18], dtype=int32), array([   1, 5464,   18], dtype=int32), array([   1, 2732,   18], dtype=int32), array([   1, 1366,   18], dtype=int32), array([  1, 683,  18], dtype=int32)], 'input_shape': array([     1, 699392,     77], dtype=int32), 'label_shape': array([     1, 699392,     18], dtype=int32)}


In [18]:
trainer.train(max_iter = 4000,
                train_eval_step = 1, 
                validation_eval_step = 1,
                display_step = 1)

Train Batch Evaluation
AUC = 0.079 vs. 0.077
F1 = 0.122 vs. 0.108
Accuracy = 0.003 vs. 0.056
Validation
AUC = 0.074 vs. 0.070
F1 = 0.107 vs. 0.099
Accuracy = 0.000 vs. 0.056
Minibatch Loss= 1.281807
Train Batch Evaluation
AUC = 0.086 vs. 0.077
F1 = 0.132 vs. 0.109
Accuracy = 0.005 vs. 0.056
Validation
AUC = 0.079 vs. 0.070
F1 = 0.117 vs. 0.098
Accuracy = 0.001 vs. 0.056
Minibatch Loss= 1.280940
Train Batch Evaluation
AUC = 0.091 vs. 0.076
F1 = 0.140 vs. 0.107
Accuracy = 0.013 vs. 0.056
Validation
AUC = 0.083 vs. 0.073
F1 = 0.120 vs. 0.108
Accuracy = 0.006 vs. 0.056
Minibatch Loss= 1.280178
Train Batch Evaluation
AUC = 0.094 vs. 0.077
F1 = 0.147 vs. 0.108
Accuracy = 0.032 vs. 0.056
Validation
AUC = 0.082 vs. 0.071
F1 = 0.121 vs. 0.108
Accuracy = 0.013 vs. 0.056
Minibatch Loss= 1.279428
Train Batch Evaluation
AUC = 0.099 vs. 0.077
F1 = 0.154 vs. 0.108
Accuracy = 0.035 vs. 0.056
Validation
AUC = 0.083 vs. 0.072
F1 = 0.123 vs. 0.105
Accuracy = 0.018 vs. 0.056
Minibatch Loss= 1.278616
Train

KeyboardInterrupt: 

In [19]:
#Save the model
saver = tf.train.Saver()
saver.save(sess, checkpoint_path, global_step=trainer.global_step)

[autoreload of models.wavelet_conv_model_light failed: Traceback (most recent call last):
  File "/data2/data/zebrahim/anaconda2/envs/tensorflow/lib/python2.7/site-packages/IPython/extensions/autoreload.py", line 247, in check
    superreload(m, reload, self.old_objects)
  File "../src/models/wavelet_conv_model_light.py", line 109
    trainable=trainable_last
            ^
SyntaxError: invalid syntax
]


'../model/DWN9005_opp/checkpoint-607'

In [None]:
trainer.train(max_iter = 4000,
                train_eval_step = 1, 
                validation_eval_step = 1,
                display_step = 1)

Train Batch Evaluation
AUC = 0.896 vs. 0.077
F1 = 0.879 vs. 0.108
Accuracy = 0.919 vs. 0.056
Validation
AUC = 0.517 vs. 0.069
F1 = 0.556 vs. 0.102
Accuracy = 0.864 vs. 0.056
Minibatch Loss= 0.074121
Train Batch Evaluation
AUC = 0.896 vs. 0.077
F1 = 0.881 vs. 0.109
Accuracy = 0.900 vs. 0.056
Validation
AUC = 0.505 vs. 0.072
F1 = 0.554 vs. 0.103
Accuracy = 0.855 vs. 0.056
Minibatch Loss= 0.072992
Train Batch Evaluation
AUC = 0.897 vs. 0.077
F1 = 0.880 vs. 0.110
Accuracy = 0.897 vs. 0.056
Validation
AUC = 0.517 vs. 0.070
F1 = 0.555 vs. 0.102
Accuracy = 0.849 vs. 0.056
Minibatch Loss= 0.075119
Train Batch Evaluation
AUC = 0.896 vs. 0.077
F1 = 0.880 vs. 0.109
Accuracy = 0.913 vs. 0.056
Validation
AUC = 0.512 vs. 0.070
F1 = 0.556 vs. 0.102
Accuracy = 0.864 vs. 0.056
Minibatch Loss= 0.070315
Train Batch Evaluation
AUC = 0.896 vs. 0.077
F1 = 0.881 vs. 0.108
Accuracy = 0.920 vs. 0.056
Validation
AUC = 0.505 vs. 0.072
F1 = 0.555 vs. 0.105
Accuracy = 0.869 vs. 0.056
Minibatch Loss= 0.073153
Train

In [None]:
#load the model
saver = tf.train.Saver()
#saver.restore(sess, "../model" + "/CNN7002_Gleam" + "/CNN7002_Gleam")
saver.restore(sess, '../model/CNN7002_Gleam/CNN7002_Gleam-10000')


In [23]:
#This is the model evaluation on test dataset
_= nn_eval.evaluate_model (model, sess, test_data, test_gt)

AUC = 0.537 vs. 0.069
F1 = 0.586 vs. 0.103
Accuracy = 0.919 vs. 0.056


In [None]:
#shape of probability_change is (batch size, T, num_classes)
#since num_classes = 1 we squeeze that axis
probability_change = np.squeeze(probability_of_pos, axis = 2)

In [None]:
savemat('../poc/poc'+exp_name+'.mat', {'poc':probability_change})

In [21]:
1

1