forked from h5py/h5py
-
Notifications
You must be signed in to change notification settings - Fork 0
/
base.py
385 lines (293 loc) · 10.2 KB
/
base.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
# This file is part of h5py, a Python interface to the HDF5 library.
#
# http://www.h5py.org
#
# Copyright 2008-2013 Andrew Collette and contributors
#
# License: Standard 3-clause BSD; see "license.txt" for full license terms
# and contributor agreement.
import posixpath
import warnings
import os
import sys
from h5py import h5d, h5i, h5r, h5p, h5f, h5t
# The high-level interface is serialized; every public API function & method
# is wrapped in a lock. We re-use the low-level lock because (1) it's fast,
# and (2) it eliminates the possibility of deadlocks due to out-of-order
# lock acquisition.
from h5py._objects import phil, with_phil
# True when the running interpreter's major version is exactly 3; used below
# to choose between view-returning and list-returning dict-style methods.
py3 = sys.version_info[0] == 3
def is_hdf5(fname):
    """ Report whether *fname* names a valid HDF5 file.

    The path is made absolute first.  Anything that is not an existing
    regular file yields False without consulting the HDF5 library;
    otherwise the answer comes from h5f.is_hdf5.
    """
    with phil:
        path = os.path.abspath(fname)
        if not os.path.isfile(path):
            return False
        try:
            # Hand the low-level layer a filesystem-encoded name when we can.
            path = path.encode(sys.getfilesystemencoding())
        except (UnicodeError, LookupError):
            # Best effort only: fall back to the un-encoded path.
            pass
        return h5f.is_hdf5(path)
def guess_dtype(data):
    """ Attempt to guess an appropriate dtype for the object.

    Returns a special dtype (built with h5t.special_dtype) for region
    references, object references, byte strings and text strings.  Returns
    None if nothing is appropriate (or if it should be left up to the array
    constructor to figure out).
    """
    # The bare name ``unicode`` exists only on Python 2.  Taking the type of
    # a text literal gives ``unicode`` there and ``str`` on Python 3, so the
    # lookup below never raises NameError.
    text_type = type(u'')

    with phil:
        # RegionReference is tested before Reference, as in the original
        # ordering of these checks.
        if isinstance(data, h5r.RegionReference):
            return h5t.special_dtype(ref=h5r.RegionReference)
        if isinstance(data, h5r.Reference):
            return h5t.special_dtype(ref=h5r.Reference)

        # Exact-type comparison: instances of bytes/text subclasses do not
        # match here and fall through to None.
        if type(data) == bytes:
            return h5t.special_dtype(vlen=bytes)
        if type(data) == text_type:
            return h5t.special_dtype(vlen=text_type)
        return None
def default_lapl():
    """ Build the default link access property list.

    The returned list carries a file access property list, with its close
    degree set to h5f.CLOSE_STRONG, as its external-link file access list.
    """
    link_access = h5p.create(h5p.LINK_ACCESS)

    elink_file_access = h5p.create(h5p.FILE_ACCESS)
    elink_file_access.set_fclose_degree(h5f.CLOSE_STRONG)

    link_access.set_elink_fapl(elink_file_access)
    return link_access
def default_lcpl():
    """ Build the default link creation property list.

    Creation of intermediate groups is switched on for the returned list.
    """
    link_create = h5p.create(h5p.LINK_CREATE)
    link_create.set_create_intermediate_group(True)
    return link_create
# Module-level property lists, built once when this module is imported.
# CommonStateObject._lapl and CommonStateObject._lcpl return these objects.
dlapl = default_lapl()
dlcpl = default_lcpl()
class CommonStateObject(object):

    """
    Mixin that lets objects living in the same HDF5 file share state.

    The host class is expected to expose an ".id" attribute returning a
    low-level ObjectID subclass.  The mixin also provides the name
    encoding/decoding helpers (_e / _d) used for Unicode handling.
    """

    @property
    def _lapl(self):
        """ Link access property list to use for this object. """
        return dlapl

    @property
    def _lcpl(self):
        """ Link creation property list to use for this object. """
        return dlcpl

    def _e(self, name, lcpl=None):
        """ Encode a name for the low-level API.

        Returns the encoded name, or the 2-tuple (name, lcpl) when *lcpl*
        is true; in that case the second element is a copy of self._lcpl
        with its character encoding set to match the name.

        - Byte strings pass through untouched and are tagged h5t.CSET_ASCII
        - Text that is pure ASCII is encoded as ASCII, h5t.CSET_ASCII
        - Any other text is encoded as utf8, h5t.CSET_UTF8

        A name of None gives None, or (None, None) when *lcpl* is true.
        """
        if name is None:
            return (None, None) if lcpl else None

        if isinstance(name, bytes):
            charset = h5t.CSET_ASCII
        else:
            try:
                name = name.encode('ascii')
            except UnicodeEncodeError:
                name = name.encode('utf8')
                charset = h5t.CSET_UTF8
            else:
                charset = h5t.CSET_ASCII

        if not lcpl:
            return name

        # Work on a copy so the shared property list is never modified.
        plist = self._lcpl.copy()
        plist.set_char_encoding(charset)
        return name, plist

    def _d(self, name):
        """ Decode a name coming back from the low-level API.

        The name is decoded as utf8 when possible; if that fails the
        original byte string is returned unchanged.  None maps to None.
        """
        if name is None:
            return None

        try:
            decoded = name.decode('utf8')
        except UnicodeDecodeError:
            # Not valid utf8: hand the raw bytes back to the caller.
            return name
        return decoded
class _RegionProxy(object):

    """
    Proxy object for working with region references.

    A new region reference (datasets only) is made with slicing syntax:

    >>> newref = obj.regionref[0:10:2]

    The shape of the dataset an existing reference points at:

    >>> shape = obj.regionref.shape(existingref)

    Here <obj> may be any object in the file.  The shape of the selection
    the reference holds on that dataset:

    >>> selection_shape = obj.regionref.selection(existingref)
    """

    def __init__(self, obj):
        # Only the low-level identifier of the host object is kept.
        self.id = obj.id

    @with_phil
    def __getitem__(self, args):
        """ Create a region reference for the selection described by *args*.

        Raises TypeError when the proxied identifier is not a dataset.
        """
        dsid = self.id
        if isinstance(dsid, h5d.DatasetID):
            from . import selections
            picked = selections.select(dsid.shape, args, dsid=dsid)
            return h5r.create(dsid, b'.', h5r.DATASET_REGION, picked._id)
        raise TypeError("Region references can only be made to datasets")

    def shape(self, ref):
        """ Shape of the target dataspace that *ref* refers to. """
        with phil:
            return h5r.get_region(ref, self.id).shape

    def selection(self, ref):
        """ Shape of the selection that *ref* holds on its target dataspace.
        """
        with phil:
            from . import selections
            region = h5r.get_region(ref, self.id)
            return selections.guess_shape(region)
class HLObject(CommonStateObject):

    """
    Base class for high-level interface objects.

    Wraps a low-level identifier, stored as ``_id`` and exposed through the
    ``id`` property.  Equality and hashing are both defined in terms of
    that identifier.
    """

    @property
    @with_phil
    def file(self):
        """ Return a File instance associated with this object """
        # Explicit relative import: a bare "import files" is an implicit
        # relative import, which Python 3 does not perform.
        from . import files
        return files.File(self.id)

    @property
    @with_phil
    def name(self):
        """ Return the full name of this object.  None if anonymous. """
        return self._d(h5i.get_name(self.id))

    @property
    @with_phil
    def parent(self):
        """Return the parent group of this object.

        This is always equivalent to obj.file[posixpath.dirname(obj.name)].
        ValueError if this object is anonymous.
        """
        # Fetch the name once; each access to .name queries the library.
        name = self.name
        if name is None:
            raise ValueError("Parent of an anonymous object is undefined")
        return self.file[posixpath.dirname(name)]

    @property
    @with_phil
    def id(self):
        """ Low-level identifier appropriate for this object """
        return self._id

    @property
    @with_phil
    def ref(self):
        """ An (opaque) HDF5 reference to this object """
        return h5r.create(self.id, b'.', h5r.OBJECT)

    @property
    @with_phil
    def regionref(self):
        """Create a region reference (Datasets only).

        The syntax is regionref[<slices>]. For example, dset.regionref[...]
        creates a region reference in which the whole dataset is selected.

        The returned proxy can also report the shape of the referenced
        dataset (via its shape(ref) method) or the shape of the selection
        (via its selection(ref) method).
        """
        return _RegionProxy(self)

    @property
    @with_phil
    def attrs(self):
        """ Attributes attached to this object """
        # Explicit relative import so the sibling module in this package is
        # the one that gets loaded, on Python 2 and Python 3 alike.
        from . import attrs
        return attrs.AttributeManager(self)

    @with_phil
    def __init__(self, oid):
        """ Setup this object, given its low-level identifier """
        self._id = oid

    @with_phil
    def __hash__(self):
        """ Hash of the low-level identifier. """
        return hash(self.id)

    @with_phil
    def __eq__(self, other):
        """ Equal when *other* has an ``id`` attribute equal to ours. """
        if hasattr(other, 'id'):
            return self.id == other.id
        return False

    @with_phil
    def __ne__(self, other):
        """ Logical negation of __eq__. """
        return not self.__eq__(other)

    def __nonzero__(self):
        """ Python 2 truth hook: truth value of the low-level identifier. """
        with phil:
            return bool(self.id)

    def __bool__(self):
        """ Python 3 truth hook; gives the same answer as __nonzero__.

        Written out in full rather than aliased so that the class body does
        not depend on the name ``__nonzero__`` still being defined.
        """
        with phil:
            return bool(self.id)
class View(object):

    """
    Common base for the view objects handed out by DictCompat.

    Holds a reference to the underlying container and reports its length.
    """

    def __init__(self, obj):
        # The container being viewed; subclasses read it as self._obj.
        self._obj = obj

    @with_phil
    def __len__(self):
        """ Number of entries in the underlying container. """
        container = self._obj
        return len(container)
class KeyView(View):

    """ View over the member names of the underlying container. """

    @with_phil
    def __contains__(self, what):
        """ True when *what* is a member name of the container. """
        container = self._obj
        return what in container

    @with_phil
    def __iter__(self):
        """ Yield each member name in the container's own iteration order. """
        for member_name in self._obj:
            yield member_name
class ValueView(View):

    """ View over the member objects of the underlying container. """

    def __contains__(self, what):
        """ Membership tests are not supported; always raises TypeError. """
        raise TypeError("Containership testing doesn't work for values. :(")

    @with_phil
    def __iter__(self):
        """ Yield the object stored under each member name, looked up via
        the container's get().
        """
        container = self._obj
        for member_name in container:
            yield container.get(member_name)
class ItemView(View):

    """ View over (name, object) pairs of the underlying container. """

    @with_phil
    def __contains__(self, what):
        """ True when what[0] is a member name and what[1] equals the
        object the container's get() returns for it.
        """
        member_name = what[0]
        if member_name not in self._obj:
            return False
        return what[1] == self._obj.get(member_name)

    @with_phil
    def __iter__(self):
        """ Yield a (name, object) tuple for every member name. """
        container = self._obj
        for member_name in container:
            yield (member_name, container.get(member_name))
class DictCompat(object):

    """
    Dictionary-style compatibility methods shared by groups and attributes.

    The host class supplies item lookup (self[name]) and iteration over
    member names; everything here is built on those two operations.  On
    Python 3 keys/values/items return view objects; otherwise they return
    lists and the iter* variants are provided as well.
    """

    def get(self, name, default=None):
        """ Look up *name*, returning *default* when the lookup raises
        KeyError.
        """
        with phil:
            try:
                member = self[name]
            except KeyError:
                return default
            else:
                return member

    if py3:
        def keys(self):
            """ View object over the member names """
            return KeyView(self)

        def values(self):
            """ View object over the member objects """
            return ValueView(self)

        def items(self):
            """ View object over the (name, object) pairs """
            return ItemView(self)

    else:
        def keys(self):
            """ List of member names """
            with phil:
                return list(self)

        def iterkeys(self):
            """ Iterator over member names """
            return iter(self)

        def values(self):
            """ List of member objects """
            with phil:
                return [self.get(member_name) for member_name in self]

        def itervalues(self):
            """ Iterator over member objects """
            for member_name in self:
                yield self.get(member_name)

        def items(self):
            """ List of (name, object) tuples """
            with phil:
                return [(member_name, self.get(member_name))
                        for member_name in self]

        def iteritems(self):
            """ Iterator over (name, object) tuples """
            for member_name in self:
                yield (member_name, self.get(member_name))