Merge pull request #4155 from kuenishi/iterator-with
Provide a cleaner way to collect threads and processes in MultiprocessIterator
okuta committed Apr 3, 2018
2 parents 5f3151a + dd6e88e commit 4b9bab9
Showing 4 changed files with 71 additions and 43 deletions.
chainer/dataset/iterator.py (18 additions, 0 deletions)
@@ -61,6 +61,24 @@ def finalize(self):
         """
         pass
 
+    def __enter__(self):
+        """With statement context manager method
+
+        This method does nothing by default. Implementation may override it to
+        better handle the internal resources by with statement.
+
+        """
+        return self
+
+    def __exit__(self, exc_type, exc_value, traceback):
+        """With statement context manager method
+
+        This method does nothing by default. Implementation may override it to
+        better handle the internal resources by with statement.
+
+        """
+        return None
+
     def serialize(self, serializer):
         """Serializes the internal state of the iterator.
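
With these default hooks in the base class, every Iterator subclass can be driven by a with statement, whether or not it holds external resources. A minimal usage sketch (the dataset and batch size below are made up for illustration; SerialIterator simply inherits the no-op hooks):

    import chainer

    # Illustrative toy dataset.
    dataset = list(range(20))

    # Any Iterator subclass now works as a context manager. SerialIterator
    # inherits the no-op __enter__/__exit__; iterators backed by threads or
    # processes override __exit__ to release their workers.
    with chainer.iterators.SerialIterator(dataset, 4, repeat=False) as it:
        for batch in it:
            print(batch)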
chainer/iterators/multiprocess_iterator.py (6 additions, 0 deletions)
@@ -116,6 +116,12 @@ def __del__(self):
 
     finalize = __del__
 
+    def __enter__(self):
+        return self
+
+    def __exit__(self, exc_type, exc_value, traceback):
+        self.finalize()
+
     def __copy__(self):
         other = MultiprocessIterator(
             self.dataset, self.batch_size, self.repeat, self.shuffle,
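
Here __exit__ delegates to finalize(), so leaving the with block shuts down the prefetch workers deterministically rather than waiting for __del__ at garbage-collection time. A minimal sketch, assuming a small in-memory dataset (the data and batch size are illustrative):

    from chainer.iterators import MultiprocessIterator

    data = list(range(100))  # illustrative dataset

    with MultiprocessIterator(data, 10, repeat=False, shuffle=False) as it:
        for batch in it:
            pass  # consume one epoch
    # The worker processes have already been finalized at this point.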
chainer/iterators/multithread_iterator.py (4 additions, 1 deletion)
@@ -61,7 +61,10 @@ def reset(self):
         self._next = None
         self._previous_epoch_detail = None
 
-    def __del__(self):
+    def __enter__(self):
+        return self
+
+    def __exit__(self, exc_type, exc_value, traceback):
         self.finalize()
 
     def finalize(self):
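
MultithreadIterator drops its __del__ in favor of the same explicit pattern: use a with statement, or call finalize() yourself. A sketch of the try/finally equivalent (illustrative dataset and batch size), for code where the iterator's lifetime does not fit a single with block:

    from chainer.iterators import MultithreadIterator

    data = list(range(100))  # illustrative dataset
    it = MultithreadIterator(data, 10, repeat=False, shuffle=False)
    try:
        for batch in it:
            pass
    finally:
        it.finalize()  # join the worker threads explicitly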
examples/mnist/train_mnist_custom_loop.py (43 additions, 42 deletions)
@@ -11,6 +11,7 @@
 
 import chainer
 from chainer.dataset import convert
+from chainer.iterators import MultiprocessIterator
 import chainer.links as L
 from chainer import serializers
 
@@ -62,48 +63,48 @@ def main():
     train_count = len(train)
     test_count = len(test)
 
-    train_iter = chainer.iterators.SerialIterator(train, args.batchsize)
-    test_iter = chainer.iterators.SerialIterator(test, args.batchsize,
-                                                 repeat=False, shuffle=False)
-
-    sum_accuracy = 0
-    sum_loss = 0
-
-    while train_iter.epoch < args.epoch:
-        batch = train_iter.next()
-        x_array, t_array = convert.concat_examples(batch, args.gpu)
-        x = chainer.Variable(x_array)
-        t = chainer.Variable(t_array)
-        optimizer.update(model, x, t)
-        sum_loss += float(model.loss.data) * len(t.data)
-        sum_accuracy += float(model.accuracy.data) * len(t.data)
-
-        if train_iter.is_new_epoch:
-            print('epoch: {}'.format(train_iter.epoch))
-            print('train mean loss: {}, accuracy: {}'.format(
-                sum_loss / train_count, sum_accuracy / train_count))
-            # evaluation
-            sum_accuracy = 0
-            sum_loss = 0
-            for batch in test_iter:
-                x_array, t_array = convert.concat_examples(batch, args.gpu)
-                x = chainer.Variable(x_array)
-                t = chainer.Variable(t_array)
-                loss = model(x, t)
-                sum_loss += float(loss.data) * len(t.data)
-                sum_accuracy += float(model.accuracy.data) * len(t.data)
-
-            test_iter.reset()
-            print('test mean loss: {}, accuracy: {}'.format(
-                sum_loss / test_count, sum_accuracy / test_count))
-            sum_accuracy = 0
-            sum_loss = 0
-
-    # Save the model and the optimizer
-    print('save the model')
-    serializers.save_npz('{}/mlp.model'.format(args.out), model)
-    print('save the optimizer')
-    serializers.save_npz('{}/mlp.state'.format(args.out), optimizer)
+    with MultiprocessIterator(train, args.batchsize) as train_iter, \
+        MultiprocessIterator(test, args.batchsize,
+                             repeat=False, shuffle=False) as test_iter:
+
+        sum_accuracy = 0
+        sum_loss = 0
+
+        while train_iter.epoch < args.epoch:
+            batch = train_iter.next()
+            x_array, t_array = convert.concat_examples(batch, args.gpu)
+            x = chainer.Variable(x_array)
+            t = chainer.Variable(t_array)
+            optimizer.update(model, x, t)
+            sum_loss += float(model.loss.data) * len(t.data)
+            sum_accuracy += float(model.accuracy.data) * len(t.data)
+
+            if train_iter.is_new_epoch:
+                print('epoch: {}'.format(train_iter.epoch))
+                print('train mean loss: {}, accuracy: {}'.format(
+                    sum_loss / train_count, sum_accuracy / train_count))
+                # evaluation
+                sum_accuracy = 0
+                sum_loss = 0
+                for batch in test_iter:
+                    x_array, t_array = convert.concat_examples(batch, args.gpu)
+                    x = chainer.Variable(x_array)
+                    t = chainer.Variable(t_array)
+                    loss = model(x, t)
+                    sum_loss += float(loss.data) * len(t.data)
+                    sum_accuracy += float(model.accuracy.data) * len(t.data)
+
+                test_iter.reset()
+                print('test mean loss: {}, accuracy: {}'.format(
+                    sum_loss / test_count, sum_accuracy / test_count))
+                sum_accuracy = 0
+                sum_loss = 0
+
+        # Save the model and the optimizer
+        print('save the model')
+        serializers.save_npz('{}/mlp.model'.format(args.out), model)
+        print('save the optimizer')
+        serializers.save_npz('{}/mlp.state'.format(args.out), optimizer)
 
 
 if __name__ == '__main__':
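
The rewritten example chains two context managers in a single with statement. When the number of iterators is not fixed in advance, contextlib.ExitStack (standard library, not part of this change) gives the same cleanup guarantee; a minimal sketch with made-up datasets:

    import contextlib

    from chainer.iterators import MultiprocessIterator

    datasets = [list(range(100)), list(range(50))]  # illustrative datasets

    with contextlib.ExitStack() as stack:
        iters = [stack.enter_context(MultiprocessIterator(d, 10, repeat=False))
                 for d in datasets]
        for it in iters:
            for batch in it:
                pass
    # finalize() has run for every iterator once the stack exits.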
