In [5]:
%load_ext autoreload
%autoreload 2

from config.rnn import default
from models import RNNV2, RNN, RNNV12
import numpy as np
from functional import seq
import tensorflow as tf
from tensorpack import (TrainConfig, SyncMultiGPUTrainerParameterServer as Trainer, 
                        PredictConfig, MultiProcessDatasetPredictor as Predictor,
                        SaverRestore, logger)
from tensorpack.callbacks import (ScheduledHyperParamSetter, MaxSaver, ModelSaver,
                                  DataParallelInferenceRunner as InfRunner)
from tensorpack.predict import SimpleDatasetPredictor
from tensorpack.tfutils.common import get_default_sess_config
from utils import DataManager
from utils.validation import (Accumulator, AggregateMetric, calcu_metrics)

# Checkpoint file that the training cell restores from (via SaverRestore).
resnet_loc = "./data/resnet_v2_101/resnet_v2_101.ckpt"
# Directory that receives this run's logs and saved models.
log_dir = './train_log/rnn_v2/1conv-0aconv/'
# NOTE(review): action='d' presumably deletes an existing log directory without
# prompting, so re-running this cell would discard earlier logs - confirm intended.
logger.set_logger_dir(log_dir, action='d')

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
[32m[1102 09:49:26 @logger.py:74][0m Argv: /home/yangyang/Applications/anaconda3/lib/python3.6/site-packages/ipykernel_launcher.py -f /run/user/1007/jupyter/kernel-f2d6d34e-e919-4aed-acf1-f7d068e9f2ab.json


In [6]:
# NOTE(review): this binds `config` to the imported `default` object itself (no
# copy), so the attribute assignments in later cells also modify `default`.
config = default
# Names passed as `ignore=` to SaverRestore when loading the pretrained checkpoint.
ignore_restore = ['learning_rate', 'global_step']
# File name handed to MaxSaver for the checkpoint with the best 'micro_auc'.
# NOTE(review): the name says "all-stages" while a later cell sets
# config.stages = [6] - confirm the name still describes this run.
save_name = "all-stages-max-micro-auc.tfmodel"

In [7]:
# Build the initial train/test sets from stages 2..6 with a 55/45 split and
# no validation share; the next cell re-splits these sets.
config.stages = list(range(2, 7))
config.proportion = dict(train=0.55, val=0.0, test=0.45)
config.annotation_number = None
dm = DataManager.from_config(config)
train_set, test_set = dm.get_train_set(), dm.get_test_set()

In [8]:
# Rebuild the DataManager from the sets created above: stage 6 only,
# annotation_number = 10, and an 80/20 train/val proportion.
config.proportion = dict(train=0.8, val=0.2, test=0.0)
config.stages = [6]
config.annotation_number = 10
# Note: this rebinds `dm`; the manager built in the previous cell is replaced.
dm = DataManager.from_dataset(train_set, test_set, config)
# Last expression of the cell: displays the size info for each split.
dm.get_num_info()

{'test': (1178, 6583), 'train': (1057, 6116), 'val': (234, 1328)}

In [9]:
# Display the per-label imbalance ratio table (columns: train, val, test).
dm.get_imbalance_ratio()

Unnamed: 0,train,val,test
dorsal prothoracic pharyngeal muscle,5.074713,4.571429,5.299465
embryonic brain,1.936111,1.752941,1.923077
embryonic central nervous system,3.194444,2.836066,3.51341
embryonic dorsal epidermis,2.815884,2.774194,2.99322
embryonic head epidermis,4.62234,4.571429,4.89
embryonic midgut,1.076621,0.983051,1.073944
embryonic ventral epidermis,3.24498,3.333333,3.530769
embryonic/larval muscle system,3.034351,3.105263,3.10453
ubiquitous,5.181287,5.0,5.333333
ventral nerve cord,1.849057,1.629213,1.8523


In [10]:
# Hyper-parameters for this run, set directly on the shared config object.
config.weight_decay = 0.0
config.dropout_keep_prob = 0.7
config.gamma = 2
config.use_glimpse = False
config.doubly_stochastic_lambda = 0
config.read_time = 5
config.batch_size = 64

# Threshold passed to AggregateMetric in the training cell.
threshold = 0.4
train_data = dm.get_train_stream()
# NOTE(review): val_data is also built from dm.get_train_stream(), so the
# metrics computed by the inference callback (and the 'micro_auc' that MaxSaver
# selects on) appear to be measured on training data, not on the 'val' split.
# If DataManager exposes a validation-stream accessor, it should be used here -
# confirm against utils.DataManager.
val_data = dm.get_train_stream()

In [14]:
# Print numpy floats with two decimal places.
np.set_printoptions(formatter={'float_kind': lambda x: '%.2f' % x})

# Clear the default graph BEFORE the model object is constructed. Previously the
# reset happened after RNN(...) was created, so anything the constructor might
# register in the default graph would have been left behind in the discarded
# graph. Resetting first also keeps a re-run of this cell from building on top
# of the previous run's graph.
tf.reset_default_graph()
model = RNN(config, is_finetuning=False,
            label_scale=dm.get_imbalance_ratio().train.values)

train_config = TrainConfig(model=model, dataflow=train_data,
                           callbacks=[
                               # learning_rate: 1e-4 from epoch 0, 1e-5 from epoch 15.
                               ScheduledHyperParamSetter('learning_rate', [(0, 1e-4), (15, 1e-5)]),
                               # Computes config.validation_metrics on val_data after each epoch;
                               # the trailing [1] is presumably the GPU list - confirm.
                               InfRunner(val_data, [AggregateMetric(config.validation_metrics, threshold)],
                                         [1]),
                               # Periodic checkpoints written to the logger directory.
                               ModelSaver(var_collections='model_variables'),
                               # Keeps a separate copy of the checkpoint with the highest 'micro_auc'.
                               MaxSaver('micro_auc', save_name),
                           ],
                           # Initialise from the pretrained checkpoint, skipping the ignored names.
                           session_init=SaverRestore(
                               model_path=resnet_loc, ignore=ignore_restore),
                           max_epoch=20, tower=[1])
Trainer(train_config).train()

[32m[1102 09:55:09 @inference_runner.py:83][0m InferenceRunner will eval on an InputSource of size 16
[32m[1102 09:55:10 @input_source.py:178][0m Setting up the queue 'QueueInput/input_queue' for CPU prefetching ...
[32m[1102 09:55:10 @training.py:92][0m Building graph for training tower 0 on device LeastLoadedDeviceSetter-/gpu:1...
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
[32m[1102 09:55:14 @model_utils.py:47][0m [36mModel Parameters: 
[0

[32m[1102 09:55:19 @base.py:212][0m Creating the session ...
[32m[1102 09:55:21 @base.py:216][0m Initializing the session ...
[32m[1102 09:55:21 @sessinit.py:116][0m Restoring checkpoint from ./data/resnet_v2_101/resnet_v2_101.ckpt ...
INFO:tensorflow:Restoring parameters from ./data/resnet_v2_101/resnet_v2_101.ckpt
[32m[1102 09:55:23 @base.py:223][0m Graph Finalized.
[32m[1102 09:55:23 @param.py:144][0m After epoch 0, learning_rate will change to 0.00010000
[32m[1102 09:55:23 @concurrency.py:36][0m Starting EnqueueThread DataParallelInferenceRunner/QueueInput/input_queue ...
[32m[1102 09:55:24 @concurrency.py:36][0m Starting EnqueueThread QueueInput/input_queue ...
[32m[1102 09:55:24 @base.py:257][0m Start Epoch 1 ...


100%|##########|16/16[00:40<00:00, 0.50it/s]

[32m[1102 09:56:05 @base.py:267][0m Epoch 1 (global_step 16) finished, time:40.06 sec.



  'precision', 'predicted', average, warn_for)
100%|##########|16/16[00:23<00:00, 0.65it/s]


[32m[1102 09:56:29 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-16.
[32m[1102 09:56:30 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 09:56:30 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 24
[32m[1102 09:56:30 @monitor.py:361][0m QueueInput/queue_size_1: 8.3006
[32m[1102 09:56:30 @monitor.py:361][0m coverage: 6.5615
[32m[1102 09:56:30 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 09:56:30 @monitor.py:361][0m loss/value: 0.17339
[32m[1102 09:56:30 @monitor.py:361][0m macro_auc: 0.74763
[32m[1102 09:56:30 @monitor.py:361][0m macro_f1: 0.22897
[32m[1102 09:56:30 @monitor.py:361][0m mean_average_precision: 0.54096
[32m[1102 09:56:30 @monitor.py:361][0m micro_auc: 0.52735
[32m[1102 09:56:30 @monitor.py:361][0m micro_f1: 0.30673
[32m[1102 09:56:30 @monitor.py:361][0m one_error: 0.78027
[32m[1102 09:56:30 @monitor.py:361][0m ranking_loss: 0.49629
[32m[1102 09:56:30 @monitor.py:361][0m r

100%|##########|16/16[00:28<00:00, 0.58it/s]

[32m[1102 09:56:59 @base.py:267][0m Epoch 2 (global_step 32) finished, time:28.80 sec.



100%|##########|16/16[00:24<00:00, 0.69it/s]


[32m[1102 09:57:24 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-32.
[32m[1102 09:57:26 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 09:57:26 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 25.093
[32m[1102 09:57:26 @monitor.py:361][0m QueueInput/queue_size_1: 20.374
[32m[1102 09:57:26 @monitor.py:361][0m coverage: 6.375
[32m[1102 09:57:26 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 09:57:26 @monitor.py:361][0m loss/value: 0.13929
[32m[1102 09:57:26 @monitor.py:361][0m macro_auc: 0.79843
[32m[1102 09:57:26 @monitor.py:361][0m macro_f1: 0.29775
[32m[1102 09:57:26 @monitor.py:361][0m mean_average_precision: 0.61317
[32m[1102 09:57:26 @monitor.py:361][0m micro_auc: 0.57833
[32m[1102 09:57:26 @monitor.py:361][0m micro_f1: 0.36954
[32m[1102 09:57:26 @monitor.py:361][0m one_error: 0.79688
[32m[1102 09:57:26 @monitor.py:361][0m ranking_loss: 0.45362
[32m[1102 09:57:26 @monitor.py:361][0

100%|##########|16/16[00:29<00:00, 0.55it/s]

[32m[1102 09:57:55 @base.py:267][0m Epoch 3 (global_step 48) finished, time:29.18 sec.



100%|##########|16/16[00:25<00:00, 0.70it/s]


[32m[1102 09:58:21 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-48.
[32m[1102 09:58:22 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 09:58:22 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 35.314
[32m[1102 09:58:22 @monitor.py:361][0m QueueInput/queue_size_1: 32.813
[32m[1102 09:58:22 @monitor.py:361][0m coverage: 5.9414
[32m[1102 09:58:22 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 09:58:22 @monitor.py:361][0m loss/value: 0.12239
[32m[1102 09:58:22 @monitor.py:361][0m macro_auc: 0.82081
[32m[1102 09:58:22 @monitor.py:361][0m macro_f1: 0.32952
[32m[1102 09:58:22 @monitor.py:361][0m mean_average_precision: 0.65012
[32m[1102 09:58:22 @monitor.py:361][0m micro_auc: 0.62262
[32m[1102 09:58:22 @monitor.py:361][0m micro_f1: 0.39816
[32m[1102 09:58:22 @monitor.py:361][0m one_error: 0.70508
[32m[1102 09:58:22 @monitor.py:361][0m ranking_loss: 0.40931
[32m[1102 09:58:22 @monitor.py:361][

100%|##########|16/16[00:30<00:00, 0.55it/s]

[32m[1102 09:58:53 @base.py:267][0m Epoch 4 (global_step 64) finished, time:30.20 sec.



100%|##########|16/16[00:23<00:00, 0.71it/s]


[32m[1102 09:59:16 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-64.
[32m[1102 09:59:17 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 09:59:17 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 43.169
[32m[1102 09:59:17 @monitor.py:361][0m QueueInput/queue_size_1: 42.759
[32m[1102 09:59:17 @monitor.py:361][0m coverage: 5.5674
[32m[1102 09:59:17 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 09:59:17 @monitor.py:361][0m loss/value: 0.1093
[32m[1102 09:59:17 @monitor.py:361][0m macro_auc: 0.83807
[32m[1102 09:59:17 @monitor.py:361][0m macro_f1: 0.3049
[32m[1102 09:59:17 @monitor.py:361][0m mean_average_precision: 0.67355
[32m[1102 09:59:17 @monitor.py:361][0m micro_auc: 0.64326
[32m[1102 09:59:17 @monitor.py:361][0m micro_f1: 0.37797
[32m[1102 09:59:17 @monitor.py:361][0m one_error: 0.67969
[32m[1102 09:59:17 @monitor.py:361][0m ranking_loss: 0.38298
[32m[1102 09:59:17 @monitor.py:361][0m

100%|##########|16/16[00:29<00:00, 0.56it/s]

[32m[1102 09:59:47 @base.py:267][0m Epoch 5 (global_step 80) finished, time:29.43 sec.



100%|##########|16/16[00:22<00:00, 0.71it/s]


[32m[1102 10:00:10 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-80.
[32m[1102 10:00:12 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:00:12 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.007
[32m[1102 10:00:12 @monitor.py:361][0m QueueInput/queue_size_1: 46.825
[32m[1102 10:00:12 @monitor.py:361][0m coverage: 5.207
[32m[1102 10:00:12 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:00:12 @monitor.py:361][0m loss/value: 0.10096
[32m[1102 10:00:12 @monitor.py:361][0m macro_auc: 0.85625
[32m[1102 10:00:12 @monitor.py:361][0m macro_f1: 0.34033
[32m[1102 10:00:12 @monitor.py:361][0m mean_average_precision: 0.70117
[32m[1102 10:00:12 @monitor.py:361][0m micro_auc: 0.67417
[32m[1102 10:00:12 @monitor.py:361][0m micro_f1: 0.40766
[32m[1102 10:00:12 @monitor.py:361][0m one_error: 0.64844
[32m[1102 10:00:12 @monitor.py:361][0m ranking_loss: 0.34805
[32m[1102 10:00:12 @monitor.py:361][0

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:00:41 @base.py:267][0m Epoch 6 (global_step 96) finished, time:29.91 sec.



100%|##########|16/16[00:22<00:00, 0.69it/s]


[32m[1102 10:01:04 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-96.
[32m[1102 10:01:06 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:01:06 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 48.407
[32m[1102 10:01:06 @monitor.py:361][0m QueueInput/queue_size_1: 48.547
[32m[1102 10:01:06 @monitor.py:361][0m coverage: 5.0928
[32m[1102 10:01:06 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:01:06 @monitor.py:361][0m loss/value: 0.094641
[32m[1102 10:01:06 @monitor.py:361][0m macro_auc: 0.86784
[32m[1102 10:01:06 @monitor.py:361][0m macro_f1: 0.44258
[32m[1102 10:01:06 @monitor.py:361][0m mean_average_precision: 0.72359
[32m[1102 10:01:06 @monitor.py:361][0m micro_auc: 0.69792
[32m[1102 10:01:06 @monitor.py:361][0m micro_f1: 0.47235
[32m[1102 10:01:06 @monitor.py:361][0m one_error: 0.62109
[32m[1102 10:01:06 @monitor.py:361][0m ranking_loss: 0.33166
[32m[1102 10:01:06 @monitor.py:361]

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:01:36 @base.py:267][0m Epoch 7 (global_step 112) finished, time:29.28 sec.



100%|##########|16/16[00:22<00:00, 0.70it/s]


[32m[1102 10:01:59 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-112.
[32m[1102 10:01:59 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.02
[32m[1102 10:01:59 @monitor.py:361][0m QueueInput/queue_size_1: 49.335
[32m[1102 10:01:59 @monitor.py:361][0m coverage: 5.1006
[32m[1102 10:01:59 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:01:59 @monitor.py:361][0m loss/value: 0.089014
[32m[1102 10:01:59 @monitor.py:361][0m macro_auc: 0.87484
[32m[1102 10:01:59 @monitor.py:361][0m macro_f1: 0.40412
[32m[1102 10:01:59 @monitor.py:361][0m mean_average_precision: 0.74073
[32m[1102 10:01:59 @monitor.py:361][0m micro_auc: 0.68726
[32m[1102 10:01:59 @monitor.py:361][0m micro_f1: 0.44568
[32m[1102 10:01:59 @monitor.py:361][0m one_error: 0.61914
[32m[1102 10:01:59 @monitor.py:361][0m ranking_loss: 0.3378
[32m[1102 10:01:59 @monitor.py:361][0m ranking_mean_average_precision: 0.5322
[32m[1102 10:01:59 @monitor.py:361

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:02:28 @base.py:267][0m Epoch 8 (global_step 128) finished, time:29.40 sec.



100%|##########|16/16[00:22<00:00, 0.70it/s]


[32m[1102 10:02:51 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-128.
[32m[1102 10:02:53 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:02:53 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.357
[32m[1102 10:02:53 @monitor.py:361][0m QueueInput/queue_size_1: 49.708
[32m[1102 10:02:53 @monitor.py:361][0m coverage: 4.8789
[32m[1102 10:02:53 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:02:53 @monitor.py:361][0m loss/value: 0.083679
[32m[1102 10:02:53 @monitor.py:361][0m macro_auc: 0.88593
[32m[1102 10:02:53 @monitor.py:361][0m macro_f1: 0.47573
[32m[1102 10:02:53 @monitor.py:361][0m mean_average_precision: 0.7652
[32m[1102 10:02:53 @monitor.py:361][0m micro_auc: 0.71606
[32m[1102 10:02:53 @monitor.py:361][0m micro_f1: 0.50644
[32m[1102 10:02:53 @monitor.py:361][0m one_error: 0.59082
[32m[1102 10:02:53 @monitor.py:361][0m ranking_loss: 0.30204
[32m[1102 10:02:53 @monitor.py:361]

100%|##########|16/16[00:29<00:00, 0.55it/s]

[32m[1102 10:03:22 @base.py:267][0m Epoch 9 (global_step 144) finished, time:29.39 sec.



100%|##########|16/16[00:22<00:00, 0.71it/s]


[32m[1102 10:03:45 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-144.
[32m[1102 10:03:47 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:03:47 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.558
[32m[1102 10:03:47 @monitor.py:361][0m QueueInput/queue_size_1: 49.824
[32m[1102 10:03:47 @monitor.py:361][0m coverage: 4.5264
[32m[1102 10:03:47 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:03:47 @monitor.py:361][0m loss/value: 0.079322
[32m[1102 10:03:47 @monitor.py:361][0m macro_auc: 0.89361
[32m[1102 10:03:47 @monitor.py:361][0m macro_f1: 0.53997
[32m[1102 10:03:47 @monitor.py:361][0m mean_average_precision: 0.77509
[32m[1102 10:03:47 @monitor.py:361][0m micro_auc: 0.76354
[32m[1102 10:03:47 @monitor.py:361][0m micro_f1: 0.56392
[32m[1102 10:03:47 @monitor.py:361][0m one_error: 0.49023
[32m[1102 10:03:47 @monitor.py:361][0m ranking_loss: 0.25706
[32m[1102 10:03:47 @monitor.py:361]

100%|##########|16/16[00:29<00:00, 0.57it/s]

[32m[1102 10:04:16 @base.py:267][0m Epoch 10 (global_step 160) finished, time:29.09 sec.



100%|##########|16/16[00:22<00:00, 0.71it/s]


[32m[1102 10:04:39 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-160.
[32m[1102 10:04:40 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:04:40 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.566
[32m[1102 10:04:40 @monitor.py:361][0m QueueInput/queue_size_1: 49.854
[32m[1102 10:04:40 @monitor.py:361][0m coverage: 4.2373
[32m[1102 10:04:40 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:04:40 @monitor.py:361][0m loss/value: 0.074488
[32m[1102 10:04:40 @monitor.py:361][0m macro_auc: 0.90041
[32m[1102 10:04:40 @monitor.py:361][0m macro_f1: 0.55376
[32m[1102 10:04:40 @monitor.py:361][0m mean_average_precision: 0.78495
[32m[1102 10:04:40 @monitor.py:361][0m micro_auc: 0.79875
[32m[1102 10:04:40 @monitor.py:361][0m micro_f1: 0.58622
[32m[1102 10:04:40 @monitor.py:361][0m one_error: 0.38379
[32m[1102 10:04:40 @monitor.py:361][0m ranking_loss: 0.22252
[32m[1102 10:04:40 @monitor.py:361]

100%|##########|16/16[00:29<00:00, 0.55it/s]

[32m[1102 10:05:10 @base.py:267][0m Epoch 11 (global_step 176) finished, time:29.07 sec.



100%|##########|16/16[00:22<00:00, 0.70it/s]


[32m[1102 10:05:33 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-176.
[32m[1102 10:05:33 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.604
[32m[1102 10:05:33 @monitor.py:361][0m QueueInput/queue_size_1: 49.936
[32m[1102 10:05:33 @monitor.py:361][0m coverage: 4.3457
[32m[1102 10:05:33 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:05:33 @monitor.py:361][0m loss/value: 0.07031
[32m[1102 10:05:33 @monitor.py:361][0m macro_auc: 0.91067
[32m[1102 10:05:33 @monitor.py:361][0m macro_f1: 0.56313
[32m[1102 10:05:33 @monitor.py:361][0m mean_average_precision: 0.80717
[32m[1102 10:05:33 @monitor.py:361][0m micro_auc: 0.77555
[32m[1102 10:05:33 @monitor.py:361][0m micro_f1: 0.56056
[32m[1102 10:05:33 @monitor.py:361][0m one_error: 0.47461
[32m[1102 10:05:33 @monitor.py:361][0m ranking_loss: 0.24728
[32m[1102 10:05:33 @monitor.py:361][0m ranking_mean_average_precision: 0.6325
[32m[1102 10:05:33 @monitor.py:36

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:06:02 @base.py:267][0m Epoch 12 (global_step 192) finished, time:29.17 sec.



100%|##########|16/16[00:22<00:00, 0.70it/s]


[32m[1102 10:06:25 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-192.
[32m[1102 10:06:25 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.689
[32m[1102 10:06:25 @monitor.py:361][0m QueueInput/queue_size_1: 49.972
[32m[1102 10:06:25 @monitor.py:361][0m coverage: 4.2168
[32m[1102 10:06:25 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:06:25 @monitor.py:361][0m loss/value: 0.06706
[32m[1102 10:06:25 @monitor.py:361][0m macro_auc: 0.91793
[32m[1102 10:06:25 @monitor.py:361][0m macro_f1: 0.58132
[32m[1102 10:06:25 @monitor.py:361][0m mean_average_precision: 0.81416
[32m[1102 10:06:25 @monitor.py:361][0m micro_auc: 0.79297
[32m[1102 10:06:25 @monitor.py:361][0m micro_f1: 0.57727
[32m[1102 10:06:25 @monitor.py:361][0m one_error: 0.50293
[32m[1102 10:06:25 @monitor.py:361][0m ranking_loss: 0.23664
[32m[1102 10:06:25 @monitor.py:361][0m ranking_mean_average_precision: 0.63937
[32m[1102 10:06:25 @monitor.py:3

100%|##########|16/16[00:29<00:00, 0.56it/s]

[32m[1102 10:06:55 @base.py:267][0m Epoch 13 (global_step 208) finished, time:29.54 sec.



100%|##########|16/16[00:22<00:00, 0.72it/s]


[32m[1102 10:07:17 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-208.
[32m[1102 10:07:19 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:07:20 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.428
[32m[1102 10:07:20 @monitor.py:361][0m QueueInput/queue_size_1: 49.988
[32m[1102 10:07:20 @monitor.py:361][0m coverage: 4.2578
[32m[1102 10:07:20 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:07:20 @monitor.py:361][0m loss/value: 0.06456
[32m[1102 10:07:20 @monitor.py:361][0m macro_auc: 0.92195
[32m[1102 10:07:20 @monitor.py:361][0m macro_f1: 0.56037
[32m[1102 10:07:20 @monitor.py:361][0m mean_average_precision: 0.82567
[32m[1102 10:07:20 @monitor.py:361][0m micro_auc: 0.81659
[32m[1102 10:07:20 @monitor.py:361][0m micro_f1: 0.59246
[32m[1102 10:07:20 @monitor.py:361][0m one_error: 0.30664
[32m[1102 10:07:20 @monitor.py:361][0m ranking_loss: 0.21416
[32m[1102 10:07:20 @monitor.py:361]

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:07:49 @base.py:267][0m Epoch 14 (global_step 224) finished, time:29.24 sec.



100%|##########|16/16[00:22<00:00, 0.69it/s]


[32m[1102 10:08:12 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-224.
[32m[1102 10:08:12 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.397
[32m[1102 10:08:12 @monitor.py:361][0m QueueInput/queue_size_1: 49.995
[32m[1102 10:08:12 @monitor.py:361][0m coverage: 4.5117
[32m[1102 10:08:12 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:08:12 @monitor.py:361][0m loss/value: 0.059566
[32m[1102 10:08:12 @monitor.py:361][0m macro_auc: 0.9195
[32m[1102 10:08:12 @monitor.py:361][0m macro_f1: 0.52453
[32m[1102 10:08:12 @monitor.py:361][0m mean_average_precision: 0.83046
[32m[1102 10:08:12 @monitor.py:361][0m micro_auc: 0.79575
[32m[1102 10:08:12 @monitor.py:361][0m micro_f1: 0.55336
[32m[1102 10:08:12 @monitor.py:361][0m one_error: 0.34473
[32m[1102 10:08:12 @monitor.py:361][0m ranking_loss: 0.23826
[32m[1102 10:08:12 @monitor.py:361][0m ranking_mean_average_precision: 0.67736
[32m[1102 10:08:12 @monitor.py:3

100%|##########|16/16[00:29<00:00, 0.56it/s]

[32m[1102 10:08:41 @base.py:267][0m Epoch 15 (global_step 240) finished, time:29.10 sec.
[32m[1102 10:08:41 @param.py:144][0m After epoch 15, learning_rate will change to 0.00001000



100%|##########|16/16[00:22<00:00, 0.71it/s]


[32m[1102 10:09:05 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-240.
[32m[1102 10:09:05 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.705
[32m[1102 10:09:05 @monitor.py:361][0m QueueInput/queue_size_1: 49.998
[32m[1102 10:09:05 @monitor.py:361][0m coverage: 4.791
[32m[1102 10:09:05 @monitor.py:361][0m learning_rate: 0.0001
[32m[1102 10:09:05 @monitor.py:361][0m loss/value: 0.056864
[32m[1102 10:09:05 @monitor.py:361][0m macro_auc: 0.92721
[32m[1102 10:09:05 @monitor.py:361][0m macro_f1: 0.51558
[32m[1102 10:09:05 @monitor.py:361][0m mean_average_precision: 0.83651
[32m[1102 10:09:05 @monitor.py:361][0m micro_auc: 0.77371
[32m[1102 10:09:05 @monitor.py:361][0m micro_f1: 0.50316
[32m[1102 10:09:05 @monitor.py:361][0m one_error: 0.32031
[32m[1102 10:09:05 @monitor.py:361][0m ranking_loss: 0.2607
[32m[1102 10:09:05 @monitor.py:361][0m ranking_mean_average_precision: 0.66815
[32m[1102 10:09:05 @monitor.py:36

100%|##########|16/16[00:29<00:00, 0.55it/s]

[32m[1102 10:09:34 @base.py:267][0m Epoch 16 (global_step 256) finished, time:29.45 sec.



100%|##########|16/16[00:22<00:00, 0.71it/s]


[32m[1102 10:09:57 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-256.
[32m[1102 10:09:59 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:09:59 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.732
[32m[1102 10:09:59 @monitor.py:361][0m QueueInput/queue_size_1: 49.999
[32m[1102 10:09:59 @monitor.py:361][0m coverage: 4.2832
[32m[1102 10:09:59 @monitor.py:361][0m learning_rate: 1e-05
[32m[1102 10:09:59 @monitor.py:361][0m loss/value: 0.052588
[32m[1102 10:09:59 @monitor.py:361][0m macro_auc: 0.93523
[32m[1102 10:09:59 @monitor.py:361][0m macro_f1: 0.56023
[32m[1102 10:09:59 @monitor.py:361][0m mean_average_precision: 0.85124
[32m[1102 10:09:59 @monitor.py:361][0m micro_auc: 0.81851
[32m[1102 10:09:59 @monitor.py:361][0m micro_f1: 0.56017
[32m[1102 10:09:59 @monitor.py:361][0m one_error: 0.27148
[32m[1102 10:09:59 @monitor.py:361][0m ranking_loss: 0.21432
[32m[1102 10:09:59 @monitor.py:361]

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:10:28 @base.py:267][0m Epoch 17 (global_step 272) finished, time:29.11 sec.



100%|##########|16/16[00:22<00:00, 0.71it/s]


[32m[1102 10:10:51 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-272.
[32m[1102 10:10:52 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:10:52 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.526
[32m[1102 10:10:52 @monitor.py:361][0m QueueInput/queue_size_1: 49.87
[32m[1102 10:10:52 @monitor.py:361][0m coverage: 4.0371
[32m[1102 10:10:52 @monitor.py:361][0m learning_rate: 1e-05
[32m[1102 10:10:52 @monitor.py:361][0m loss/value: 0.050051
[32m[1102 10:10:52 @monitor.py:361][0m macro_auc: 0.93334
[32m[1102 10:10:52 @monitor.py:361][0m macro_f1: 0.58547
[32m[1102 10:10:52 @monitor.py:361][0m mean_average_precision: 0.84963
[32m[1102 10:10:52 @monitor.py:361][0m micro_auc: 0.83775
[32m[1102 10:10:52 @monitor.py:361][0m micro_f1: 0.59149
[32m[1102 10:10:52 @monitor.py:361][0m one_error: 0.25781
[32m[1102 10:10:52 @monitor.py:361][0m ranking_loss: 0.19455
[32m[1102 10:10:52 @monitor.py:361][

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:11:22 @base.py:267][0m Epoch 18 (global_step 288) finished, time:29.47 sec.



100%|##########|16/16[00:22<00:00, 0.68it/s]


[32m[1102 10:11:45 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-288.
[32m[1102 10:11:47 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:11:47 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.502
[32m[1102 10:11:47 @monitor.py:361][0m QueueInput/queue_size_1: 49.943
[32m[1102 10:11:47 @monitor.py:361][0m coverage: 3.958
[32m[1102 10:11:47 @monitor.py:361][0m learning_rate: 1e-05
[32m[1102 10:11:47 @monitor.py:361][0m loss/value: 0.047822
[32m[1102 10:11:47 @monitor.py:361][0m macro_auc: 0.93072
[32m[1102 10:11:47 @monitor.py:361][0m macro_f1: 0.57523
[32m[1102 10:11:47 @monitor.py:361][0m mean_average_precision: 0.844
[32m[1102 10:11:47 @monitor.py:361][0m micro_auc: 0.84311
[32m[1102 10:11:47 @monitor.py:361][0m micro_f1: 0.5879
[32m[1102 10:11:47 @monitor.py:361][0m one_error: 0.24219
[32m[1102 10:11:47 @monitor.py:361][0m ranking_loss: 0.18658
[32m[1102 10:11:47 @monitor.py:361][0m 

100%|##########|16/16[00:29<00:00, 0.54it/s]

[32m[1102 10:12:16 @base.py:267][0m Epoch 19 (global_step 304) finished, time:29.11 sec.



100%|##########|16/16[00:22<00:00, 0.71it/s]


[32m[1102 10:12:39 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-304.
[32m[1102 10:12:40 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:12:40 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.665
[32m[1102 10:12:40 @monitor.py:361][0m QueueInput/queue_size_1: 49.932
[32m[1102 10:12:40 @monitor.py:361][0m coverage: 3.8301
[32m[1102 10:12:40 @monitor.py:361][0m learning_rate: 1e-05
[32m[1102 10:12:40 @monitor.py:361][0m loss/value: 0.046396
[32m[1102 10:12:40 @monitor.py:361][0m macro_auc: 0.9345
[32m[1102 10:12:40 @monitor.py:361][0m macro_f1: 0.59859
[32m[1102 10:12:40 @monitor.py:361][0m mean_average_precision: 0.85324
[32m[1102 10:12:40 @monitor.py:361][0m micro_auc: 0.85144
[32m[1102 10:12:40 @monitor.py:361][0m micro_f1: 0.60039
[32m[1102 10:12:40 @monitor.py:361][0m one_error: 0.24414
[32m[1102 10:12:40 @monitor.py:361][0m ranking_loss: 0.17556
[32m[1102 10:12:40 @monitor.py:361][

100%|##########|16/16[00:29<00:00, 0.56it/s]

[32m[1102 10:13:10 @base.py:267][0m Epoch 20 (global_step 320) finished, time:29.29 sec.



100%|##########|16/16[00:22<00:00, 0.69it/s]


[32m[1102 10:13:33 @saver.py:89][0m Model saved to ./train_log/rnn_v2/1conv-0aconv/model-320.
[32m[1102 10:13:34 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1102 10:13:34 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 49.453
[32m[1102 10:13:34 @monitor.py:361][0m QueueInput/queue_size_1: 49.523
[32m[1102 10:13:34 @monitor.py:361][0m coverage: 3.5859
[32m[1102 10:13:34 @monitor.py:361][0m learning_rate: 1e-05
[32m[1102 10:13:34 @monitor.py:361][0m loss/value: 0.045761
[32m[1102 10:13:34 @monitor.py:361][0m macro_auc: 0.93903
[32m[1102 10:13:34 @monitor.py:361][0m macro_f1: 0.62433
[32m[1102 10:13:34 @monitor.py:361][0m mean_average_precision: 0.86014
[32m[1102 10:13:34 @monitor.py:361][0m micro_auc: 0.87231
[32m[1102 10:13:34 @monitor.py:361][0m micro_f1: 0.62473
[32m[1102 10:13:34 @monitor.py:361][0m one_error: 0.22559
[32m[1102 10:13:34 @monitor.py:361][0m ranking_loss: 0.15499
[32m[1102 10:13:34 @monitor.py:361]

In [14]:
# List every variable in the default graph's GLOBAL_VARIABLES collection.
# The output is long; consider slicing it (e.g. [:10]) before sharing the notebook.
tf.global_variables()

[<tf.Variable 'EMA/QueueInput/queue_size:0' shape=() dtype=float32_ref>,
 <tf.Variable 'EMA/QueueInput/queue_size/biased:0' shape=() dtype=float32_ref>,
 <tf.Variable 'EMA/QueueInput/queue_size/local_step:0' shape=() dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/conv1/weights:0' shape=(7, 7, 3, 64) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/conv1/biases:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/beta:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/gamma:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/moving_mean:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/moving_variance:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/shortcut/weights:0' shape=(1, 1, 64, 256) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bot