# loop.py
# NOTE: the repository this file belongs to was archived by its owner on
# May 2, 2022 and is now read-only.
# Tai Sakuma <tai.sakuma@gmail.com>
import os
import gzip
try:
import cPickle as pickle
except:
import pickle
##__________________________________________________________________||
class DatasetLoop(object):
    """Run a reader over a collection of datasets.

    Calling an instance calls ``reader.begin()``, then
    ``reader.read(dataset)`` once for each dataset in iteration order,
    and finally returns whatever ``reader.end()`` returns.

    Parameters
    ----------
    datasets : iterable
        The datasets passed to ``reader.read()`` one at a time.
    reader : object
        An object providing ``begin()``, ``read(dataset)`` and ``end()``.
    """

    def __init__(self, datasets, reader):
        self.datasets = datasets
        self.reader = reader

    def __repr__(self):
        """Return ``ClassName(datasets=..., reader=...)`` built from reprs."""
        name_value_pairs = (
            ('datasets', self.datasets),
            ('reader', self.reader),
        )
        return '{}({})'.format(
            self.__class__.__name__,
            ', '.join(['{}={!r}'.format(n, v) for n, v in name_value_pairs]),
        )

    def __call__(self):
        """Read every dataset with the reader and return ``reader.end()``.

        ``reader.begin()`` and ``reader.end()`` are called even when
        ``datasets`` is empty.
        """
        self.reader.begin()
        for dataset in self.datasets:
            self.reader.read(dataset)
        return self.reader.end()
##__________________________________________________________________||
class ResumableDatasetLoop(object):
    """Run a reader over datasets and save the reader before finishing.

    Calling an instance behaves like a plain dataset loop
    (``reader.begin()``, ``reader.read(dataset)`` for each dataset,
    ``reader.end()``), except that the reader is pickled to
    ``<workingarea.path>/reader.p.gz`` after all datasets have been
    read and before ``reader.end()`` is called.

    Parameters
    ----------
    datasets : iterable
        The datasets passed to ``reader.read()`` one at a time.
    reader : object
        An object providing ``begin()``, ``read(dataset)`` and
        ``end()``. It must be picklable.
    workingarea : object
        An object whose ``path`` attribute is the directory in which
        the snapshot is written. The directory is not created here, so
        it is assumed to exist already.
    """

    def __init__(self, datasets, reader, workingarea):
        self.datasets = datasets
        self.reader = reader
        self.workingarea = workingarea

    def __repr__(self):
        """Return ``ClassName(datasets=..., reader=..., workingarea=...)``."""
        name_value_pairs = (
            ('datasets', self.datasets),
            ('reader', self.reader),
            ('workingarea', self.workingarea),
        )
        return '{}({})'.format(
            self.__class__.__name__,
            ', '.join(['{}={!r}'.format(n, v) for n, v in name_value_pairs]),
        )

    def __call__(self):
        """Read every dataset, snapshot the reader, return ``reader.end()``.

        Any error raised while opening or writing the snapshot file
        propagates to the caller; in that case ``reader.end()`` is not
        called.
        """
        self.reader.begin()
        for dataset in self.datasets:
            self.reader.read(dataset)

        # The snapshot is written once, after every dataset has been read
        # and before end() runs, so the file holds the reader's state as it
        # was prior to end(). Presumably a later run reloads it to resume;
        # the loading side is not part of this block.
        path = os.path.join(self.workingarea.path, 'reader.p.gz')
        with gzip.open(path, 'wb') as f:
            pickle.dump(self.reader, f, protocol=pickle.HIGHEST_PROTOCOL)

        return self.reader.end()
##__________________________________________________________________||