In [1]:
# Experiment identifier: used below to build the summary, checkpoint and
# output (.mat) paths for this run.
exp_name = "CNN1002"

## Importing Libraries

In [2]:
%load_ext autoreload
%autoreload 2
import tensorflow as tf
import numpy as np
from hdf5storage import savemat
import pickle 

import sys
sys.path.append('../../src')

In [3]:
import models.CNN_model as CNN_model
import training
import evaluation.nn_eval as nn_eval

## Loading synthetic data

In [4]:
# Load the pre-processed synthetic dataset (a pickled dict of arrays).
# NOTE(review): pickle.load can execute arbitrary code -- only load files
# that come from a trusted source.
data_path = '../../data/synthetic2/' + 'processed2.p'

# Pickles are binary data, so the file is opened in binary mode ('rb').
# Text mode ('r') only happens to work on Python 2 / POSIX.
with open(data_path, 'rb') as fin:
    data = pickle.load(fin)

train_data = data['train_data']
validation_data = data['validation_data']
test_data = data['test_data']

# Append a trailing singleton axis to each ground-truth array so it has the
# same rank as the corresponding data array.
train_gt = np.expand_dims(data['train_gt'], axis=-1)
validation_gt = np.expand_dims(data['validation_gt'], axis=-1)
test_gt = np.expand_dims(data['test_gt'], axis=-1)

index_of_changes = data['index_of_changes']
 

In [5]:
# Sanity check: display the shape of every array loaded above.
tuple(arr.shape for arr in (train_data, validation_data, test_data,
                            train_gt, validation_gt, test_gt,
                            index_of_changes))

((8, 8192, 12),
 (2, 8192, 12),
 (10, 8192, 12),
 (8, 8192, 1),
 (2, 8192, 1),
 (10, 8192, 1),
 (10, 4))

## Model

In [6]:
# Model parameters
n_variables = 12
learning_rate = 0.001
batch_size = 10

convolution_levels = 5    # number of convolution levels in the network
pooling_stride = [2, 2, 2, 2, 2]
# One entry per convolution level.
# NOTE(review): presumably [filter width, input channels, output channels];
# confirm against CNN_model.
weights_shape = [[5, n_variables, 32],
                 [9, 32, 64],
                 [9, 64, 64],
                 [9, 64, 64],
                 [9, 64, 64]]
bias_shape = [32, 64, 64, 64, 64]
activation = tf.nn.relu
n_classes = 1

# Positive weight for the weighted cross entropy.
# The training ground truth is regrouped into rows of `resolution` consecutive
# values (resolution = product of the pooling strides). A row counts as
# positive if any of its values is positive, and pos_weight is the ratio of
# negative rows to positive rows.
s = train_data.shape
resolution = np.prod(pooling_stride)
# Floor division keeps the row count an integer; true division (Python 3 or
# `from __future__ import division`) would yield a float, which np.reshape
# rejects.
gt_effective = np.reshape(train_gt, (s[0] * (s[1] // resolution), resolution))
positive_fraction = gt_effective.max(axis=1).mean()
pos_weight = (1.0 - positive_fraction) / positive_fraction

#variables_weights = np.ones((n_classes,))

In [7]:
# Show the positive-class weight computed above. The call form prints the
# same text on Python 2 and is also valid Python 3.
print(pos_weight)

14.8812031901


In [8]:
# Launch the graph
# Create the TensorFlow session that the trainer, evaluation and checkpoint
# cells below all share.
config = tf.ConfigProto()
# allow_growth: per TensorFlow's GPUOptions, GPU memory is allocated as it is
# needed rather than reserved up front.
config.gpu_options.allow_growth = True
sess = tf.Session(config=config)

In [9]:
# Output locations for this experiment, both keyed by exp_name.
# summary_path is handed to training.Trainer; checkpoint_path is the save
# prefix given to tf.train.Saver.save (<model dir>/<exp_name>/<exp_name>).
summary_path = ''.join(['../../summary_synthetic/train_abrupt_test_gradual/', exp_name])
checkpoint_path = '/'.join(['../../model_synthetic/train_abrupt_test_gradual/' + exp_name,
                            exp_name])

In [10]:
# Instantiate the CNN model wrapper with the hyper-parameters defined above.
model = CNN_model.Model(
    n_variables=n_variables,
    learning_rate=learning_rate,
    n_classes=n_classes,
)

In [11]:
# Build the convolutional network on the model, using the architecture and
# loss settings from the parameter cell. Both the convolutional layers and the
# last layer are flagged as trainable.
conv_net_options = dict(
    pos_weight_values=pos_weight,
    learning_rate=learning_rate,
    convolution_levels=convolution_levels,
    pooling_stride=pooling_stride,
    weights_shape=weights_shape,
    bias_shape=bias_shape,
    n_classes=n_classes,
    activation=activation,
    trainable_conv=True,
    trainable_last=True,
)
model.build_conv_net(**conv_net_options)

In [12]:
# Set up the trainer with the training/validation splits, the shared session
# and the summary directory. global_step is initialised to 0 for a fresh run.
trainer = training.Trainer(
    model=model,
    data_train=train_data,
    ground_truth_train=train_gt,
    data_validation=validation_data,
    ground_truth_validation=validation_gt,
    sess=sess,
    summary_path=summary_path,
    batch_size=batch_size,
    global_step=0,
)

In [13]:
# First training run: max_iter of 10000, with training metrics, validation
# metrics and the minibatch loss all reported every 100 steps.
trainer.train(
    max_iter=10000,
    train_eval_step=100,
    validation_eval_step=100,
    display_step=100,
)

Training: 0
AUC = 0.058 vs. 0.065
F1 = 0.138 vs. 0.120
Precision = 0.080 vs. 0.065
Recall = 0.516 vs. 0.750
Validation: 0
AUC = 0.280 vs. 0.095
F1 = 0.316 vs. 0.177
Precision = 0.300 vs. 0.097
Recall = 0.333 vs. 0.956
Minibatch Loss= 1.298494
Training: 100
AUC = 0.981 vs. 0.060
F1 = 0.948 vs. 0.117
Precision = 0.944 vs. 0.062
Recall = 0.952 vs. 0.992
Validation: 100
AUC = 0.498 vs. 0.084
F1 = 0.507 vs. 0.162
Precision = 0.773 vs. 0.088
Recall = 0.378 vs. 1.000
Minibatch Loss= 0.191954
Training: 200
AUC = 0.997 vs. 0.062
F1 = 0.972 vs. 0.119
Precision = 0.953 vs. 0.065
Recall = 0.992 vs. 0.661
Validation: 200
AUC = 0.475 vs. 0.116
F1 = 0.520 vs. 0.210
Precision = 0.402 vs. 0.165
Recall = 0.733 vs. 0.289
Minibatch Loss= 0.166373
Training: 300
AUC = 0.999 vs. 0.065
F1 = 0.992 vs. 0.120
Precision = 0.984 vs. 0.064
Recall = 1.000 vs. 0.863
Validation: 300
AUC = 0.524 vs. 0.108
F1 = 0.528 vs. 0.204
Precision = 0.412 vs. 0.120
Recall = 0.733 vs. 0.689
Minibatch Loss= 0.151618
Training: 400
AU

In [14]:
# Second training run on the same trainer (the recorded log resumes at step
# 10000), reporting every 1000 steps instead of every 100.
trainer.train(
    max_iter=10000,
    train_eval_step=1000,
    validation_eval_step=1000,
    display_step=1000,
)

Training: 10000
AUC = 1.000 vs. 0.069
F1 = 1.000 vs. 0.117
Precision = 1.000 vs. 0.062
Recall = 1.000 vs. 0.903
Validation: 10000
AUC = 0.574 vs. 0.113
F1 = 0.513 vs. 0.164
Precision = 0.417 vs. 0.090
Recall = 0.667 vs. 0.956
Minibatch Loss= 0.141110
Training: 11000
AUC = 1.000 vs. 0.066
F1 = 1.000 vs. 0.118
Precision = 1.000 vs. 0.065
Recall = 1.000 vs. 0.597
Validation: 11000
AUC = 0.613 vs. 0.118
F1 = 0.575 vs. 0.165
Precision = 0.750 vs. 0.090
Recall = 0.467 vs. 1.000
Minibatch Loss= 0.141006
Training: 12000
AUC = 1.000 vs. 0.064
F1 = 1.000 vs. 0.116
Precision = 1.000 vs. 0.062
Recall = 1.000 vs. 1.000
Validation: 12000
AUC = 0.593 vs. 0.125
F1 = 0.597 vs. 0.214
Precision = 0.909 vs. 0.231
Recall = 0.444 vs. 0.200
Minibatch Loss= 0.140994
Training: 13000
AUC = 1.000 vs. 0.069
F1 = 1.000 vs. 0.119
Precision = 1.000 vs. 0.063
Recall = 1.000 vs. 0.952
Validation: 13000
AUC = 0.550 vs. 0.097
F1 = 0.541 vs. 0.164
Precision = 0.690 vs. 0.089
Recall = 0.444 vs. 1.000
Minibatch Loss= 0.140

In [14]:
# Save the model
# Writes a checkpoint using checkpoint_path as the prefix, suffixed with the
# trainer's current global step. The call is the last expression, so the
# returned checkpoint path is displayed as the cell output.
saver = tf.train.Saver()
saver.save(sess, checkpoint_path, global_step=trainer.global_step)

'../../model_synthetic/train_abrupt_test_gradual/CNN1002/CNN1002-10000'

In [None]:
# Load the model
# Restore the most recent checkpoint from the directory that the save cell
# writes to (the directory part of checkpoint_path), so that saving and
# loading always refer to the same location.
saver = tf.train.Saver()
checkpoint_dir = checkpoint_path.rsplit('/', 1)[0]
latest_checkpoint = tf.train.latest_checkpoint(checkpoint_dir)
if latest_checkpoint is None:
    # latest_checkpoint returns None when the directory holds no checkpoint;
    # fail with a clear message instead of passing None to restore().
    raise IOError('No checkpoint found in ' + checkpoint_dir)
saver.restore(sess, latest_checkpoint)

In [28]:
# Evaluate the trained model on the test split. evaluate_model reports
# AUC / F1 / precision / recall, and its return value is kept as
# probability_of_pos.
probability_of_pos = nn_eval.evaluate_model(model, sess, test_data, test_gt)

AUC = 0.494 vs. 0.289
F1 = 0.464 vs. 0.435
Precision = 0.431 vs. 0.279
Recall = 0.502 vs. 0.984


In [29]:
#shape of probability_of_pos is (batch size, T, num_classes)
#since num_classes = 1 we squeeze that axis
#squeezed_probability_of_pos = np.squeeze(probability_of_pos, axis = 2)

In [30]:
# Run the trained model over the test split and keep the raw deployment output.
out = nn_eval.deploy(model, sess, test_data, test_gt)

In [31]:
# Drop the size-1 third axis of the deployment output and display the
# resulting shape.
# Note: `out` is overwritten, so this cell is not idempotent -- running it a
# second time fails because the array no longer has an axis 2.
out = np.squeeze(out, axis=2)
np.shape(out)

(10, 256)

In [32]:
# Export the squeezed deployment output to a MATLAB .mat file under the key 'poc'.
poc_mat_path = '../../poc_synthetic/train_abrupt_test_gradual/poc' + exp_name + '.mat'
savemat(poc_mat_path, {'poc': out})