/
test_get_dataset.py
52 lines (36 loc) · 1.37 KB
/
test_get_dataset.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
"""test_get_dataset.py
This test script could be used to verify either the 'train' or
'validation' dataset, by visualizing data augmented images on
TensorBoard.
Examples:
$ cd ${HOME}/project/keras_imagenet
$ python3 test_get_dataset.py train
$ tensorboard --logdir logs/train
"""
import os
import shutil
import argparse
import tensorflow as tf
from utils.dataset import get_dataset
DATASET_DIR = os.path.join(os.environ['HOME'], 'data/ILSVRC2012/tfrecords')
parser = argparse.ArgumentParser()
parser.add_argument('subset', type=str, choices=['train', 'validation'])
args = parser.parse_args()
log_dir = os.path.join('logs', args.subset)
shutil.rmtree(log_dir, ignore_errors=True) # clear prior log data
dataset = get_dataset(DATASET_DIR, args.subset, batch_size=64)
iterator = dataset.make_initializable_iterator()
batch_xs, batch_ys = iterator.get_next()
mean_rgb = tf.reduce_mean(batch_xs, axis=[0, 1, 2])
# convert normalized image back: [-1, 1] -> [0, 1]
batch_imgs = tf.multiply(batch_xs, 0.5)
batch_imgs = tf.add(batch_imgs, 0.5)
summary_op = tf.summary.image('image_batch', batch_imgs, max_outputs=64)
with tf.Session() as sess:
writer = tf.summary.FileWriter(log_dir, sess.graph)
sess.run(iterator.initializer)
rgb = sess.run(mean_rgb)
print('Mean RGB (-1.0~1.0):', rgb)
summary = sess.run(summary_op)
writer.add_summary(summary)
writer.close()