In [1]:
%load_ext autoreload
%autoreload 2

from config.rnn import default
from models import RNN
import numpy as np
from functional import seq
import tensorflow as tf
from tensorpack import (TrainConfig, SyncMultiGPUTrainerParameterServer as Trainer, 
                        PredictConfig, MultiProcessDatasetPredictor as Predictor,
                        SaverRestore, logger)
from tensorpack.callbacks import (ScheduledHyperParamSetter, MaxSaver, ModelSaver,
                                  DataParallelInferenceRunner as InfRunner)
from tensorpack.predict import SimpleDatasetPredictor
from tensorpack.tfutils.common import get_default_sess_config
from utils import DataManager
from utils.validation import (Accumulator, AggregateMetric, calcu_metrics)

resnet_loc = "./data/resnet_v2_101/resnet_v2_101.ckpt"
log_dir = 'train_log/transfer/all_stages-g4/'
logger.set_logger_dir(log_dir)

[32m[1028 14:44:34 @logger.py:74][0m Argv: /home/yangyang/Applications/anaconda3/lib/python3.6/site-packages/ipykernel_launcher.py -f /run/user/1007/jupyter/kernel-e923b5b8-ab46-403c-80b0-5ee95881bab3.json


In [2]:
config = default
ignore_restore = ['learning_rate', 'global_step']
save_name = "all-stages-max-micro-auc.tfmodel"

#### Split train set and test set

In [10]:
config.stages = [2, 3, 4, 5, 6]
config.proportion = {'train': 0.55, 'val': 0.0, 'test': 0.45}
config.annotation_number = None
dm = DataManager.from_config(config)
train_set = dm.get_train_set()

Group numbers:
train: 5014, validation: 0, test: 4726
Image numbers:
train: 22989, validation: 0, test: 21028


#### Gether data to train rnn

In [12]:
config.proportion = {'train': 0.8, 'val':0.2, 'test': 0.0}
config.annotation_number = 30
dm = DataManager.from_dataset(train_set, config)

Group numbers:
train: 3584, validation: 778, test: 0
Image numbers:
train: 16196, validation: 3364, test: 0


In [13]:
config.weight_decay = 0.0
config.dropout_keep_prob = 0.5
config.gamma = 4
config.use_glimpse = True
config.read_time = 5
config.batch_size = 64
config.use_hidden_dense = False

threshold = 0.5
train_data = dm.get_train_stream()
val_data = dm.get_validation_stream()
model = RNN(config, is_finetuning=False)

In [15]:
tf.reset_default_graph()
train_config = TrainConfig(model=model, dataflow=train_data,
                           callbacks=[
                               ScheduledHyperParamSetter('learning_rate', [(0, 1e-4), (15, 1e-5)]),
                               InfRunner(val_data, [AggregateMetric(config.validation_metrics, threshold)],
                                         [1]),
                               ModelSaver(var_collections='model_variables'),
                               MaxSaver('micro_auc', save_name),
                           ],
                           session_init=SaverRestore(
                               model_path=resnet_loc, ignore=ignore_restore),
                           max_epoch=20, tower=[1])
Trainer(train_config).train()

[32m[1028 14:47:49 @inference_runner.py:83][0m InferenceRunner will eval on an InputSource of size 12
[32m[1028 14:47:49 @input_source.py:178][0m Setting up the queue 'QueueInput/input_queue' for CPU prefetching ...
[32m[1028 14:47:49 @training.py:92][0m Building graph for training tower 0 on device LeastLoadedDeviceSetter-/gpu:1...
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
INFO:tensorflow:Scale of 0 disables regularizer.
[32m[1028 14:47:53 @model_utils.py:47][0m [36mModel Parameters: 
[0

[32m[1028 14:47:58 @base.py:212][0m Creating the session ...
[32m[1028 14:48:03 @base.py:216][0m Initializing the session ...
[32m[1028 14:48:03 @sessinit.py:116][0m Restoring checkpoint from ./data/resnet_v2_101/resnet_v2_101.ckpt ...
INFO:tensorflow:Restoring parameters from ./data/resnet_v2_101/resnet_v2_101.ckpt
[32m[1028 14:48:08 @base.py:223][0m Graph Finalized.
[32m[1028 14:48:08 @param.py:144][0m After epoch 0, learning_rate will change to 0.00010000
[32m[1028 14:48:08 @concurrency.py:36][0m Starting EnqueueThread DataParallelInferenceRunner/QueueInput/input_queue ...
[32m[1028 14:48:09 @concurrency.py:36][0m Starting EnqueueThread QueueInput/input_queue ...
[32m[1028 14:48:09 @base.py:257][0m Start Epoch 1 ...


100%|##########|56/56[03:28<00:00, 0.36it/s]

[32m[1028 14:51:38 @base.py:267][0m Epoch 1 (global_step 56) finished, time:208.37 sec.



  'precision', 'predicted', average, warn_for)
100%|##########|12/12[00:21<00:00, 0.56it/s]


[32m[1028 14:52:00 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-56.
[32m[1028 14:52:02 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 14:52:02 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 50
[32m[1028 14:52:02 @monitor.py:361][0m QueueInput/queue_size_1: 0.17499
[32m[1028 14:52:02 @monitor.py:361][0m coverage: 15.995
[32m[1028 14:52:02 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 14:52:02 @monitor.py:361][0m loss/value: 0.054061
[32m[1028 14:52:02 @monitor.py:361][0m macro_auc: 0.61021
[32m[1028 14:52:02 @monitor.py:361][0m macro_f1: 0.097238
[32m[1028 14:52:02 @monitor.py:361][0m mean_average_precision: 0.21321
[32m[1028 14:52:02 @monitor.py:361][0m micro_auc: 0.62328
[32m[1028 14:52:02 @monitor.py:361][0m micro_f1: 0.21767
[32m[1028 14:52:02 @monitor.py:361][0m one_error: 0.69401
[32m[1028 14:52:02 @monitor.py:361][0m ranking_loss: 0.34084
[32m[1028 14:52:02 @monitor.py:361][

100%|##########|56/56[02:14<00:00, 0.39it/s]

[32m[1028 14:54:16 @base.py:267][0m Epoch 2 (global_step 112) finished, time:134.37 sec.



100%|##########|12/12[00:19<00:00, 0.58it/s]


[32m[1028 14:54:38 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-112.
[32m[1028 14:54:40 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 14:54:40 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.411
[32m[1028 14:54:40 @monitor.py:361][0m QueueInput/queue_size_1: 0.23413
[32m[1028 14:54:40 @monitor.py:361][0m coverage: 15.117
[32m[1028 14:54:40 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 14:54:40 @monitor.py:361][0m loss/value: 0.029075
[32m[1028 14:54:40 @monitor.py:361][0m macro_auc: 0.67565
[32m[1028 14:54:40 @monitor.py:361][0m macro_f1: 0.092022
[32m[1028 14:54:40 @monitor.py:361][0m mean_average_precision: 0.26915
[32m[1028 14:54:40 @monitor.py:361][0m micro_auc: 0.65776
[32m[1028 14:54:40 @monitor.py:361][0m micro_f1: 0.2392
[32m[1028 14:54:40 @monitor.py:361][0m one_error: 0.79557
[32m[1028 14:54:40 @monitor.py:361][0m ranking_loss: 0.31769
[32m[1028 14:54:40 @monitor.py:36

100%|##########|56/56[02:21<00:00, 0.37it/s]

[32m[1028 14:57:01 @base.py:267][0m Epoch 3 (global_step 168) finished, time:141.01 sec.



100%|##########|12/12[00:22<00:00, 0.61it/s]


[32m[1028 14:57:24 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-168.
[32m[1028 14:57:27 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 14:57:27 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.301
[32m[1028 14:57:27 @monitor.py:361][0m QueueInput/queue_size_1: 0.28242
[32m[1028 14:57:27 @monitor.py:361][0m coverage: 14.09
[32m[1028 14:57:27 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 14:57:27 @monitor.py:361][0m loss/value: 0.023807
[32m[1028 14:57:27 @monitor.py:361][0m macro_auc: 0.70623
[32m[1028 14:57:27 @monitor.py:361][0m macro_f1: 0.080561
[32m[1028 14:57:27 @monitor.py:361][0m mean_average_precision: 0.3096
[32m[1028 14:57:27 @monitor.py:361][0m micro_auc: 0.67916
[32m[1028 14:57:27 @monitor.py:361][0m micro_f1: 0.24575
[32m[1028 14:57:27 @monitor.py:361][0m one_error: 0.58464
[32m[1028 14:57:27 @monitor.py:361][0m ranking_loss: 0.28776
[32m[1028 14:57:27 @monitor.py:361

100%|##########|56/56[02:24<00:00, 0.39it/s]

[32m[1028 14:59:52 @base.py:267][0m Epoch 4 (global_step 224) finished, time:144.76 sec.



100%|##########|12/12[00:19<00:00, 0.69it/s]


[32m[1028 15:00:12 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-224.
[32m[1028 15:00:14 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:00:14 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.234
[32m[1028 15:00:14 @monitor.py:361][0m QueueInput/queue_size_1: 0.2849
[32m[1028 15:00:14 @monitor.py:361][0m coverage: 12.941
[32m[1028 15:00:14 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:00:14 @monitor.py:361][0m loss/value: 0.021519
[32m[1028 15:00:14 @monitor.py:361][0m macro_auc: 0.75913
[32m[1028 15:00:14 @monitor.py:361][0m macro_f1: 0.097013
[32m[1028 15:00:14 @monitor.py:361][0m mean_average_precision: 0.35957
[32m[1028 15:00:14 @monitor.py:361][0m micro_auc: 0.70824
[32m[1028 15:00:14 @monitor.py:361][0m micro_f1: 0.26191
[32m[1028 15:00:14 @monitor.py:361][0m one_error: 0.55859
[32m[1028 15:00:14 @monitor.py:361][0m ranking_loss: 0.2572
[32m[1028 15:00:14 @monitor.py:361

100%|##########|56/56[02:11<00:00, 0.39it/s]

[32m[1028 15:02:26 @base.py:267][0m Epoch 5 (global_step 280) finished, time:131.64 sec.



100%|##########|12/12[00:22<00:00, 0.56it/s]


[32m[1028 15:02:48 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-280.
[32m[1028 15:02:50 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:02:50 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.194
[32m[1028 15:02:50 @monitor.py:361][0m QueueInput/queue_size_1: 0.35382
[32m[1028 15:02:50 @monitor.py:361][0m coverage: 12.284
[32m[1028 15:02:50 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:02:50 @monitor.py:361][0m loss/value: 0.020127
[32m[1028 15:02:50 @monitor.py:361][0m macro_auc: 0.77079
[32m[1028 15:02:51 @monitor.py:361][0m macro_f1: 0.10416
[32m[1028 15:02:51 @monitor.py:361][0m mean_average_precision: 0.37339
[32m[1028 15:02:51 @monitor.py:361][0m micro_auc: 0.72447
[32m[1028 15:02:51 @monitor.py:361][0m micro_f1: 0.28036
[32m[1028 15:02:51 @monitor.py:361][0m one_error: 0.65625
[32m[1028 15:02:51 @monitor.py:361][0m ranking_loss: 0.24485
[32m[1028 15:02:51 @monitor.py:36

100%|##########|56/56[02:18<00:00, 0.39it/s]

[32m[1028 15:05:09 @base.py:267][0m Epoch 6 (global_step 336) finished, time:138.04 sec.



100%|##########|12/12[00:21<00:00, 0.58it/s]


[32m[1028 15:05:31 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-336.
[32m[1028 15:05:33 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:05:33 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.291
[32m[1028 15:05:33 @monitor.py:361][0m QueueInput/queue_size_1: 0.40947
[32m[1028 15:05:33 @monitor.py:361][0m coverage: 11.249
[32m[1028 15:05:33 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:05:33 @monitor.py:361][0m loss/value: 0.018894
[32m[1028 15:05:34 @monitor.py:361][0m macro_auc: 0.80886
[32m[1028 15:05:34 @monitor.py:361][0m macro_f1: 0.12405
[32m[1028 15:05:34 @monitor.py:361][0m mean_average_precision: 0.40213
[32m[1028 15:05:34 @monitor.py:361][0m micro_auc: 0.75349
[32m[1028 15:05:34 @monitor.py:361][0m micro_f1: 0.3083
[32m[1028 15:05:34 @monitor.py:361][0m one_error: 0.65625
[32m[1028 15:05:34 @monitor.py:361][0m ranking_loss: 0.21762
[32m[1028 15:05:34 @monitor.py:361

100%|##########|56/56[02:26<00:00, 0.35it/s]

[32m[1028 15:08:01 @base.py:267][0m Epoch 7 (global_step 392) finished, time:146.66 sec.



100%|##########|12/12[00:19<00:00, 0.68it/s]


[32m[1028 15:08:21 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-392.
[32m[1028 15:08:23 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:08:23 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.26
[32m[1028 15:08:23 @monitor.py:361][0m QueueInput/queue_size_1: 0.28372
[32m[1028 15:08:23 @monitor.py:361][0m coverage: 10.306
[32m[1028 15:08:23 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:08:23 @monitor.py:361][0m loss/value: 0.01799
[32m[1028 15:08:23 @monitor.py:361][0m macro_auc: 0.83741
[32m[1028 15:08:23 @monitor.py:361][0m macro_f1: 0.14586
[32m[1028 15:08:23 @monitor.py:361][0m mean_average_precision: 0.43878
[32m[1028 15:08:23 @monitor.py:361][0m micro_auc: 0.78707
[32m[1028 15:08:23 @monitor.py:361][0m micro_f1: 0.34362
[32m[1028 15:08:23 @monitor.py:361][0m one_error: 0.60286
[32m[1028 15:08:23 @monitor.py:361][0m ranking_loss: 0.19079
[32m[1028 15:08:23 @monitor.py:361]

100%|##########|56/56[02:07<00:00, 0.38it/s]

[32m[1028 15:10:30 @base.py:267][0m Epoch 8 (global_step 448) finished, time:127.16 sec.



100%|##########|12/12[00:19<00:00, 0.62it/s]


[32m[1028 15:10:50 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-448.
[32m[1028 15:10:53 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:10:53 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.377
[32m[1028 15:10:53 @monitor.py:361][0m QueueInput/queue_size_1: 0.36255
[32m[1028 15:10:53 @monitor.py:361][0m coverage: 9.026
[32m[1028 15:10:53 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:10:53 @monitor.py:361][0m loss/value: 0.017239
[32m[1028 15:10:53 @monitor.py:361][0m macro_auc: 0.87338
[32m[1028 15:10:53 @monitor.py:361][0m macro_f1: 0.14928
[32m[1028 15:10:53 @monitor.py:361][0m mean_average_precision: 0.50812
[32m[1028 15:10:53 @monitor.py:361][0m micro_auc: 0.82099
[32m[1028 15:10:53 @monitor.py:361][0m micro_f1: 0.37339
[32m[1028 15:10:53 @monitor.py:361][0m one_error: 0.54297
[32m[1028 15:10:53 @monitor.py:361][0m ranking_loss: 0.16777
[32m[1028 15:10:53 @monitor.py:361

100%|##########|56/56[02:12<00:00, 0.38it/s]

[32m[1028 15:13:05 @base.py:267][0m Epoch 9 (global_step 504) finished, time:132.63 sec.



100%|##########|12/12[00:19<00:00, 0.55it/s]


[32m[1028 15:13:26 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-504.
[32m[1028 15:13:28 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:13:28 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.252
[32m[1028 15:13:28 @monitor.py:361][0m QueueInput/queue_size_1: 0.1917
[32m[1028 15:13:28 @monitor.py:361][0m coverage: 8.3086
[32m[1028 15:13:28 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:13:28 @monitor.py:361][0m loss/value: 0.016684
[32m[1028 15:13:28 @monitor.py:361][0m macro_auc: 0.88085
[32m[1028 15:13:28 @monitor.py:361][0m macro_f1: 0.17095
[32m[1028 15:13:28 @monitor.py:361][0m mean_average_precision: 0.52641
[32m[1028 15:13:28 @monitor.py:361][0m micro_auc: 0.84192
[32m[1028 15:13:28 @monitor.py:361][0m micro_f1: 0.40543
[32m[1028 15:13:28 @monitor.py:361][0m one_error: 0.5013
[32m[1028 15:13:28 @monitor.py:361][0m ranking_loss: 0.14753
[32m[1028 15:13:28 @monitor.py:361]

100%|##########|56/56[02:22<00:00, 0.30it/s]

[32m[1028 15:15:50 @base.py:267][0m Epoch 10 (global_step 560) finished, time:142.12 sec.



100%|##########|12/12[00:20<00:00, 0.64it/s]


[32m[1028 15:16:11 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-560.
[32m[1028 15:16:13 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:16:13 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.223
[32m[1028 15:16:13 @monitor.py:361][0m QueueInput/queue_size_1: 0.28713
[32m[1028 15:16:13 @monitor.py:361][0m coverage: 7.418
[32m[1028 15:16:13 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:16:13 @monitor.py:361][0m loss/value: 0.015969
[32m[1028 15:16:13 @monitor.py:361][0m macro_auc: 0.89859
[32m[1028 15:16:13 @monitor.py:361][0m macro_f1: 0.18938
[32m[1028 15:16:13 @monitor.py:361][0m mean_average_precision: 0.55473
[32m[1028 15:16:13 @monitor.py:361][0m micro_auc: 0.86777
[32m[1028 15:16:13 @monitor.py:361][0m micro_f1: 0.43074
[32m[1028 15:16:13 @monitor.py:361][0m one_error: 0.47786
[32m[1028 15:16:13 @monitor.py:361][0m ranking_loss: 0.12656
[32m[1028 15:16:13 @monitor.py:361

100%|##########|56/56[02:07<00:00, 0.39it/s]

[32m[1028 15:18:21 @base.py:267][0m Epoch 11 (global_step 616) finished, time:127.91 sec.



100%|##########|12/12[00:18<00:00, 0.68it/s]


[32m[1028 15:18:41 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-616.
[32m[1028 15:18:44 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:18:44 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.177
[32m[1028 15:18:44 @monitor.py:361][0m QueueInput/queue_size_1: 0.37356
[32m[1028 15:18:44 @monitor.py:361][0m coverage: 6.7799
[32m[1028 15:18:44 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:18:44 @monitor.py:361][0m loss/value: 0.015686
[32m[1028 15:18:44 @monitor.py:361][0m macro_auc: 0.90492
[32m[1028 15:18:44 @monitor.py:361][0m macro_f1: 0.21937
[32m[1028 15:18:44 @monitor.py:361][0m mean_average_precision: 0.57873
[32m[1028 15:18:44 @monitor.py:361][0m micro_auc: 0.88398
[32m[1028 15:18:44 @monitor.py:361][0m micro_f1: 0.45518
[32m[1028 15:18:44 @monitor.py:361][0m one_error: 0.42969
[32m[1028 15:18:44 @monitor.py:361][0m ranking_loss: 0.10912
[32m[1028 15:18:44 @monitor.py:36

100%|##########|56/56[02:10<00:00, 0.34it/s]

[32m[1028 15:20:54 @base.py:267][0m Epoch 12 (global_step 672) finished, time:130.23 sec.



100%|##########|12/12[00:18<00:00, 0.67it/s]


[32m[1028 15:21:14 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-672.
[32m[1028 15:21:16 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:21:16 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.167
[32m[1028 15:21:16 @monitor.py:361][0m QueueInput/queue_size_1: 0.38122
[32m[1028 15:21:16 @monitor.py:361][0m coverage: 6.2708
[32m[1028 15:21:16 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:21:16 @monitor.py:361][0m loss/value: 0.015219
[32m[1028 15:21:16 @monitor.py:361][0m macro_auc: 0.90995
[32m[1028 15:21:16 @monitor.py:361][0m macro_f1: 0.23781
[32m[1028 15:21:16 @monitor.py:361][0m mean_average_precision: 0.58742
[32m[1028 15:21:16 @monitor.py:361][0m micro_auc: 0.89779
[32m[1028 15:21:16 @monitor.py:361][0m micro_f1: 0.472
[32m[1028 15:21:16 @monitor.py:361][0m one_error: 0.40104
[32m[1028 15:21:16 @monitor.py:361][0m ranking_loss: 0.096588
[32m[1028 15:21:16 @monitor.py:361

100%|##########|56/56[02:16<00:00, 0.39it/s]

[32m[1028 15:23:33 @base.py:267][0m Epoch 13 (global_step 728) finished, time:136.44 sec.



100%|##########|12/12[00:20<00:00, 0.62it/s]


[32m[1028 15:23:55 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-728.
[32m[1028 15:23:57 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:23:57 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.24
[32m[1028 15:23:57 @monitor.py:361][0m QueueInput/queue_size_1: 0.35828
[32m[1028 15:23:57 @monitor.py:361][0m coverage: 5.9206
[32m[1028 15:23:57 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:23:57 @monitor.py:361][0m loss/value: 0.014806
[32m[1028 15:23:57 @monitor.py:361][0m macro_auc: 0.91279
[32m[1028 15:23:57 @monitor.py:361][0m macro_f1: 0.22994
[32m[1028 15:23:57 @monitor.py:361][0m mean_average_precision: 0.59209
[32m[1028 15:23:57 @monitor.py:361][0m micro_auc: 0.90448
[32m[1028 15:23:57 @monitor.py:361][0m micro_f1: 0.46589
[32m[1028 15:23:57 @monitor.py:361][0m one_error: 0.36849
[32m[1028 15:23:57 @monitor.py:361][0m ranking_loss: 0.090084
[32m[1028 15:23:57 @monitor.py:36

100%|##########|56/56[02:17<00:00, 0.38it/s]

[32m[1028 15:26:15 @base.py:267][0m Epoch 14 (global_step 784) finished, time:137.71 sec.



100%|##########|12/12[00:20<00:00, 0.64it/s]


[32m[1028 15:26:37 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-784.
[32m[1028 15:26:39 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:26:39 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.284
[32m[1028 15:26:39 @monitor.py:361][0m QueueInput/queue_size_1: 0.51666
[32m[1028 15:26:39 @monitor.py:361][0m coverage: 6.1159
[32m[1028 15:26:39 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:26:39 @monitor.py:361][0m loss/value: 0.014335
[32m[1028 15:26:39 @monitor.py:361][0m macro_auc: 0.91569
[32m[1028 15:26:39 @monitor.py:361][0m macro_f1: 0.2602
[32m[1028 15:26:39 @monitor.py:361][0m mean_average_precision: 0.60465
[32m[1028 15:26:39 @monitor.py:361][0m micro_auc: 0.90621
[32m[1028 15:26:39 @monitor.py:361][0m micro_f1: 0.47959
[32m[1028 15:26:39 @monitor.py:361][0m one_error: 0.37891
[32m[1028 15:26:39 @monitor.py:361][0m ranking_loss: 0.093297
[32m[1028 15:26:39 @monitor.py:36

100%|##########|56/56[02:21<00:00, 0.36it/s]

[32m[1028 15:29:01 @base.py:267][0m Epoch 15 (global_step 840) finished, time:141.98 sec.
[32m[1028 15:29:01 @param.py:144][0m After epoch 15, learning_rate will change to 0.00001000



100%|##########|12/12[00:22<00:00, 0.61it/s]


[32m[1028 15:29:24 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-840.
[32m[1028 15:29:26 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:29:26 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.273
[32m[1028 15:29:26 @monitor.py:361][0m QueueInput/queue_size_1: 0.29955
[32m[1028 15:29:26 @monitor.py:361][0m coverage: 5.724
[32m[1028 15:29:26 @monitor.py:361][0m learning_rate: 0.0001
[32m[1028 15:29:26 @monitor.py:361][0m loss/value: 0.014139
[32m[1028 15:29:26 @monitor.py:361][0m macro_auc: 0.91614
[32m[1028 15:29:26 @monitor.py:361][0m macro_f1: 0.27582
[32m[1028 15:29:26 @monitor.py:361][0m mean_average_precision: 0.6089
[32m[1028 15:29:26 @monitor.py:361][0m micro_auc: 0.91683
[32m[1028 15:29:26 @monitor.py:361][0m micro_f1: 0.48032
[32m[1028 15:29:26 @monitor.py:361][0m one_error: 0.33594
[32m[1028 15:29:26 @monitor.py:361][0m ranking_loss: 0.082618
[32m[1028 15:29:26 @monitor.py:361

100%|##########|56/56[02:16<00:00, 0.39it/s]

[32m[1028 15:31:43 @base.py:267][0m Epoch 16 (global_step 896) finished, time:136.66 sec.



100%|##########|12/12[00:19<00:00, 0.67it/s]


[32m[1028 15:32:03 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-896.
[32m[1028 15:32:05 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:32:05 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.286
[32m[1028 15:32:05 @monitor.py:361][0m QueueInput/queue_size_1: 0.25083
[32m[1028 15:32:05 @monitor.py:361][0m coverage: 5.556
[32m[1028 15:32:05 @monitor.py:361][0m learning_rate: 1e-05
[32m[1028 15:32:05 @monitor.py:361][0m loss/value: 0.013697
[32m[1028 15:32:05 @monitor.py:361][0m macro_auc: 0.91667
[32m[1028 15:32:05 @monitor.py:361][0m macro_f1: 0.27479
[32m[1028 15:32:05 @monitor.py:361][0m mean_average_precision: 0.61485
[32m[1028 15:32:05 @monitor.py:361][0m micro_auc: 0.92023
[32m[1028 15:32:05 @monitor.py:361][0m micro_f1: 0.48558
[32m[1028 15:32:05 @monitor.py:361][0m one_error: 0.34115
[32m[1028 15:32:05 @monitor.py:361][0m ranking_loss: 0.079756
[32m[1028 15:32:05 @monitor.py:361

100%|##########|56/56[02:17<00:00, 0.38it/s]

[32m[1028 15:34:23 @base.py:267][0m Epoch 17 (global_step 952) finished, time:137.78 sec.



100%|##########|12/12[00:23<00:00, 0.52it/s]


[32m[1028 15:34:47 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-952.
[32m[1028 15:34:50 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:34:50 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.078
[32m[1028 15:34:50 @monitor.py:361][0m QueueInput/queue_size_1: 0.27401
[32m[1028 15:34:50 @monitor.py:361][0m coverage: 5.2539
[32m[1028 15:34:50 @monitor.py:361][0m learning_rate: 1e-05
[32m[1028 15:34:50 @monitor.py:361][0m loss/value: 0.013691
[32m[1028 15:34:50 @monitor.py:361][0m macro_auc: 0.9154
[32m[1028 15:34:50 @monitor.py:361][0m macro_f1: 0.27255
[32m[1028 15:34:50 @monitor.py:361][0m mean_average_precision: 0.6161
[32m[1028 15:34:50 @monitor.py:361][0m micro_auc: 0.92432
[32m[1028 15:34:50 @monitor.py:361][0m micro_f1: 0.47299
[32m[1028 15:34:50 @monitor.py:361][0m one_error: 0.33333
[32m[1028 15:34:50 @monitor.py:361][0m ranking_loss: 0.073867
[32m[1028 15:34:50 @monitor.py:361]

100%|##########|56/56[02:18<00:00, 0.36it/s]

[32m[1028 15:37:09 @base.py:267][0m Epoch 18 (global_step 1008) finished, time:138.79 sec.



100%|##########|12/12[00:19<00:00, 0.63it/s]


[32m[1028 15:37:29 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-1008.
[32m[1028 15:37:31 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:37:31 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.12
[32m[1028 15:37:31 @monitor.py:361][0m QueueInput/queue_size_1: 0.32265
[32m[1028 15:37:31 @monitor.py:361][0m coverage: 5.0391
[32m[1028 15:37:31 @monitor.py:361][0m learning_rate: 1e-05
[32m[1028 15:37:31 @monitor.py:361][0m loss/value: 0.013586
[32m[1028 15:37:31 @monitor.py:361][0m macro_auc: 0.91895
[32m[1028 15:37:32 @monitor.py:361][0m macro_f1: 0.27258
[32m[1028 15:37:32 @monitor.py:361][0m mean_average_precision: 0.61192
[32m[1028 15:37:32 @monitor.py:361][0m micro_auc: 0.92777
[32m[1028 15:37:32 @monitor.py:361][0m micro_f1: 0.47274
[32m[1028 15:37:32 @monitor.py:361][0m one_error: 0.34115
[32m[1028 15:37:32 @monitor.py:361][0m ranking_loss: 0.071257
[32m[1028 15:37:32 @monitor.py:36

100%|##########|56/56[02:17<00:00, 0.38it/s]

[32m[1028 15:39:49 @base.py:267][0m Epoch 19 (global_step 1064) finished, time:137.80 sec.



100%|##########|12/12[00:19<00:00, 0.64it/s]


[32m[1028 15:40:10 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-1064.
[32m[1028 15:40:12 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:40:12 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.115
[32m[1028 15:40:12 @monitor.py:361][0m QueueInput/queue_size_1: 0.20894
[32m[1028 15:40:12 @monitor.py:361][0m coverage: 4.944
[32m[1028 15:40:12 @monitor.py:361][0m learning_rate: 1e-05
[32m[1028 15:40:12 @monitor.py:361][0m loss/value: 0.013535
[32m[1028 15:40:12 @monitor.py:361][0m macro_auc: 0.9188
[32m[1028 15:40:12 @monitor.py:361][0m macro_f1: 0.25897
[32m[1028 15:40:12 @monitor.py:361][0m mean_average_precision: 0.61233
[32m[1028 15:40:12 @monitor.py:361][0m micro_auc: 0.9287
[32m[1028 15:40:12 @monitor.py:361][0m micro_f1: 0.45713
[32m[1028 15:40:12 @monitor.py:361][0m one_error: 0.33333
[32m[1028 15:40:12 @monitor.py:361][0m ranking_loss: 0.069966
[32m[1028 15:40:12 @monitor.py:361]

100%|##########|56/56[02:12<00:00, 0.39it/s]

[32m[1028 15:42:25 @base.py:267][0m Epoch 20 (global_step 1120) finished, time:132.26 sec.



100%|##########|12/12[00:19<00:00, 0.68it/s]


[32m[1028 15:42:45 @saver.py:89][0m Model saved to train_log/transfer/all_stages-g4/model-1120.
[32m[1028 15:42:47 @saver.py:158][0m Model with maximum 'micro_auc' saved.
[32m[1028 15:42:47 @monitor.py:361][0m DataParallelInferenceRunner/QueueInput/queue_size_1: 47.148
[32m[1028 15:42:47 @monitor.py:361][0m QueueInput/queue_size_1: 0.2985
[32m[1028 15:42:47 @monitor.py:361][0m coverage: 4.9232
[32m[1028 15:42:47 @monitor.py:361][0m learning_rate: 1e-05
[32m[1028 15:42:47 @monitor.py:361][0m loss/value: 0.013615
[32m[1028 15:42:47 @monitor.py:361][0m macro_auc: 0.91943
[32m[1028 15:42:47 @monitor.py:361][0m macro_f1: 0.25983
[32m[1028 15:42:47 @monitor.py:361][0m mean_average_precision: 0.62163
[32m[1028 15:42:47 @monitor.py:361][0m micro_auc: 0.9297
[32m[1028 15:42:47 @monitor.py:361][0m micro_f1: 0.45549
[32m[1028 15:42:47 @monitor.py:361][0m one_error: 0.32552
[32m[1028 15:42:47 @monitor.py:361][0m ranking_loss: 0.068116
[32m[1028 15:42:47 @monitor.py:361

In [15]:
tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES)

[<tf.Variable 'EMA/QueueInput/queue_size:0' shape=() dtype=float32_ref>,
 <tf.Variable 'EMA/QueueInput/queue_size/biased:0' shape=() dtype=float32_ref>,
 <tf.Variable 'EMA/QueueInput/queue_size/local_step:0' shape=() dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/conv1/weights:0' shape=(7, 7, 3, 64) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/conv1/biases:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/beta:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/gamma:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/moving_mean:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/preact/moving_variance:0' shape=(64,) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bottleneck_v2/shortcut/weights:0' shape=(1, 1, 64, 256) dtype=float32_ref>,
 <tf.Variable 'resnet_v2_101/block1/unit_1/bot

In [1]:
a, b = 1, 2