/
readers.py
846 lines (679 loc) · 33.4 KB
/
readers.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
"""
Functions for loading GST objects from text files.
"""
#***************************************************************************************************
# Copyright 2015, 2019 National Technology & Engineering Solutions of Sandia, LLC (NTESS).
# Under the terms of Contract DE-NA0003525 with NTESS, the U.S. Government retains certain rights
# in this software.
# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
# in compliance with the License. You may obtain a copy of the License at
# http://www.apache.org/licenses/LICENSE-2.0 or in the LICENSE file in the root pyGSTi directory.
#***************************************************************************************************
import os as _os
import pathlib as _pathlib
import warnings as _warnings
import json as _json
from pygsti.io import metadir as _metadir
from pygsti.io import mongodb as _mongodb
from pygsti.io import stdinput as _stdinput
from pygsti import baseobjs as _baseobjs
from pygsti import circuits as _circuits
from pygsti import data as _data
from pygsti.tools.legacytools import deprecate as _deprecated_fn
@_deprecated_fn('read_dataset')
def load_dataset(filename, cache=False, collision_action="aggregate",
                 record_zero_counts=True, ignore_zero_count_lines=True,
                 with_times="auto", circuit_parse_cache=None, verbosity=1):
    """
    Deprecated: use :func:`read_dataset` instead.

    Every argument is forwarded unchanged to :func:`read_dataset` (see that
    function for their meaning) and its return value is returned as-is.
    """
    return read_dataset(filename,
                        cache=cache,
                        collision_action=collision_action,
                        record_zero_counts=record_zero_counts,
                        ignore_zero_count_lines=ignore_zero_count_lines,
                        with_times=with_times,
                        circuit_parse_cache=circuit_parse_cache,
                        verbosity=verbosity)
def read_dataset(filename, cache=False, collision_action="aggregate",
                 record_zero_counts=True, ignore_zero_count_lines=True,
                 with_times="auto", circuit_parse_cache=None, verbosity=1):
    """
    Load a DataSet from a file.

    This function first tries to load the file as a saved DataSet object,
    then (optionally via a cache file) as a standard text-formatted DataSet.

    Parameters
    ----------
    filename : string or path-like
        The name of the file.

    cache : bool, optional
        When set to True, a file with the name filename + ".cache" is
        searched for and loaded instead of filename if it exists and is
        newer than filename.  If no cache file exists, it is older than
        filename, or it cannot be loaded, filename is parsed and a cache
        file is written afterwards.

    collision_action : {"aggregate", "keepseparate"}
        Specifies how duplicate circuits should be handled.  "aggregate"
        adds duplicate-circuit counts, whereas "keepseparate" tags duplicate
        circuits by setting their `.occurrence` IDs to sequential positive integers.

    record_zero_counts : bool, optional
        Whether zero-counts are actually recorded (stored) in the returned
        DataSet.  If False, then zero counts are ignored, except for potentially
        registering new outcome labels.  When a cache file is read
        (`cache == True`) this argument is ignored: the cached DataSet is
        returned as it was saved.

    ignore_zero_count_lines : bool, optional
        Whether circuits for which there are no counts should be ignored
        (i.e. omitted from the DataSet) or not.

    with_times : bool or "auto", optional
        Whether the time-stamped data format should be read in.  If
        "auto", then the time-stamped format is allowed but not required on a
        per-circuit basis (so the dataset can contain both formats).  Typically
        you only need to set this to False when reading in a template file.

    circuit_parse_cache : dict, optional
        A dictionary mapping circuit string representations to created
        :class:`Circuit` objects.  NOTE(review): this function does not
        currently pass this argument on to the parser, so it has no effect
        here -- confirm whether it should be forwarded.

    verbosity : int, optional
        If zero, no output is shown.  If greater than zero,
        loading progress is shown.

    Returns
    -------
    DataSet
    """
    printer = _baseobjs.VerbosityPrinter.create_printer(verbosity)
    try:
        # a saved DataSet object is ok
        return _data.DataSet(file_to_load_from=filename)
    except Exception:
        # Not a saved DataSet: fall through to the cache / text-format paths.
        # `Exception` (rather than a bare `except`) keeps KeyboardInterrupt
        # and SystemExit propagating to the caller.
        pass

    # Parser functions don't take a VerbosityPrinter yet, and so
    # always output to stdout (TODO)
    bToStdout = (printer.verbosity > 0 and printer.filename is None)

    cache_filename = None
    if cache:
        # str() so that path-like filenames (e.g. pathlib.Path) work too
        cache_filename = str(filename) + ".cache"
        if _os.path.exists(cache_filename) and \
           _os.path.getmtime(filename) < _os.path.getmtime(cache_filename):
            try:
                printer.log("Reading from cache file: %s" % cache_filename)
                return _data.DataSet(file_to_load_from=cache_filename)
            except Exception:  # pragma: no cover
                # Best effort: an unreadable cache just means we re-parse below.
                _warnings.warn("Failed to load from cache file: %s" % cache_filename)
        else:
            printer.log("Cache file not found or is too old -- one will "
                        "be created after loading is completed")

    # otherwise must use standard dataset file format
    parser = _stdinput.StdInputParser()
    ds = parser.parse_datafile(filename, bToStdout,
                               collision_action=collision_action,
                               record_zero_counts=record_zero_counts,
                               ignore_zero_count_lines=ignore_zero_count_lines,
                               with_times=with_times)

    if cache:
        printer.log("Writing cache file (to speed future loads): %s"
                    % cache_filename)
        ds.save(cache_filename)
    return ds
@_deprecated_fn('read_multidataset')
def load_multidataset(filename, cache=False, collision_action="aggregate",
                      record_zero_counts=True, verbosity=1):
    """
    Deprecated: use :func:`read_multidataset` instead.

    Every argument is forwarded unchanged to :func:`read_multidataset` and
    its return value is returned as-is.
    """
    return read_multidataset(filename,
                             cache=cache,
                             collision_action=collision_action,
                             record_zero_counts=record_zero_counts,
                             verbosity=verbosity)
def read_multidataset(filename, cache=False, collision_action="aggregate",
                      record_zero_counts=True, verbosity=1):
    """
    Load a MultiDataSet from a file.

    This function first tries to load the file as a saved MultiDataSet object,
    then (optionally via a cache file) as a standard text-formatted MultiDataSet.

    Parameters
    ----------
    filename : string or path-like
        The name of the file.

    cache : bool, optional
        When set to True, a file with the name filename + ".cache" is
        searched for and loaded instead of filename if it exists and is
        newer than filename.  If no cache file exists, it is older than
        filename, or it cannot be loaded, filename is parsed and a cache
        file is written afterwards.

    collision_action : {"aggregate", "keepseparate"}
        Specifies how duplicate circuits should be handled.  "aggregate"
        adds duplicate-circuit counts, whereas "keepseparate" tags duplicate
        circuits by setting their `.occurrence` IDs to sequential positive integers.

    record_zero_counts : bool, optional
        Whether zero-counts are actually recorded (stored) in the returned
        MultiDataSet.  If False, then zero counts are ignored, except for
        potentially registering new outcome labels.  When a cache file is
        read (`cache == True`) this argument is ignored: the cached
        MultiDataSet is returned as it was saved.

    verbosity : int, optional
        If zero, no output is shown.  If greater than zero,
        loading progress is shown.

    Returns
    -------
    MultiDataSet
    """
    printer = _baseobjs.VerbosityPrinter.create_printer(verbosity)
    try:
        # a saved MultiDataSet object is ok
        return _data.MultiDataSet(file_to_load_from=filename)
    except Exception:
        # Not a saved MultiDataSet: fall through to the cache / text-format
        # paths.  `Exception` (rather than a bare `except`) keeps
        # KeyboardInterrupt and SystemExit propagating to the caller.
        pass

    # Parser functions don't take a VerbosityPrinter yet, and so
    # always output to stdout (TODO)
    bToStdout = (printer.verbosity > 0 and printer.filename is None)

    cache_filename = None
    if cache:
        # str() so that path-like filenames (e.g. pathlib.Path) work too
        cache_filename = str(filename) + ".cache"
        if _os.path.exists(cache_filename) and \
           _os.path.getmtime(filename) < _os.path.getmtime(cache_filename):
            try:
                printer.log("Reading from cache file: %s" % cache_filename)
                return _data.MultiDataSet(file_to_load_from=cache_filename)
            except Exception:  # pragma: no cover
                # Best effort: an unreadable cache just means we re-parse below.
                _warnings.warn("Failed to load from cache file: %s" % cache_filename)
        else:
            printer.log("Cache file not found or is too old -- one will be "
                        "created after loading is completed")

    # otherwise must use standard dataset file format
    parser = _stdinput.StdInputParser()
    mds = parser.parse_multidatafile(filename, bToStdout,
                                     collision_action=collision_action,
                                     record_zero_counts=record_zero_counts)

    if cache:
        printer.log("Writing cache file (to speed future loads): %s"
                    % cache_filename)
        mds.save(cache_filename)
    return mds
@_deprecated_fn('read_time_dependent_dataset')
def load_time_dependent_dataset(filename, cache=False, record_zero_counts=True):
    """
    Deprecated: use :func:`read_time_dependent_dataset` instead.

    Every argument is forwarded unchanged to
    :func:`read_time_dependent_dataset` and its return value is returned as-is.
    """
    return read_time_dependent_dataset(filename,
                                       cache=cache,
                                       record_zero_counts=record_zero_counts)
def read_time_dependent_dataset(filename, cache=False, record_zero_counts=True):
    """
    Read time-dependent (time-stamped) data from a file into a DataSet.

    Parameters
    ----------
    filename : string
        The name of the file to parse.

    cache : bool, optional
        Reserved for caching similar to that of `read_dataset`.  This
        argument is currently not used by this function.

    record_zero_counts : bool, optional
        Whether zero-counts are actually recorded (stored) in the returned
        DataSet.  If False, then zero counts are ignored, except for
        potentially registering new outcome labels.

    Returns
    -------
    DataSet
    """
    td_parser = _stdinput.StdInputParser()
    # The parser is asked to create sub-circuits exactly when Circuit objects
    # do *not* expand sub-circuits by default.
    expands_by_default = _circuits.Circuit.default_expand_subcircuits
    return td_parser.parse_tddatafile(filename,
                                      record_zero_counts=record_zero_counts,
                                      create_subcircuits=not expands_by_default)
@_deprecated_fn('pygsti.models.Model.read(...)')
def load_model(filename):
    """
    Read a Model from a file written in the standard text format for models.

    Deprecated: see the replacement named in this function's decorator.

    Parameters
    ----------
    filename : string
        The name of the file to parse.

    Returns
    -------
    Model
    """
    parsed_model = _stdinput.parse_model(filename)
    return parsed_model
@_deprecated_fn()
def load_circuit_dict(filename):
    """
    Read a circuit dictionary from a file written in the standard text format.

    Parameters
    ----------
    filename : string
        The name of the file to parse.

    Returns
    -------
    Dictionary with keys = circuit labels and values = :class:`Circuit` objects.
    """
    return _stdinput.StdInputParser().parse_dictfile(filename)
@_deprecated_fn('read_circuit_list')
def load_circuit_list(filename, read_raw_strings=False, line_labels='auto', num_lines=None):
    """
    Deprecated: use :func:`read_circuit_list` instead.

    Every argument is forwarded unchanged to :func:`read_circuit_list` and
    its return value is returned as-is.
    """
    return read_circuit_list(filename,
                             read_raw_strings=read_raw_strings,
                             line_labels=line_labels,
                             num_lines=num_lines)
def read_circuit_list(filename, read_raw_strings=False, line_labels='auto', num_lines=None):
    """
    Load a circuit list from a file, formatted using the standard text-format.

    Parameters
    ----------
    filename : string or path-like
        The name of the file.

    read_raw_strings : boolean
        If True, circuits are not converted to :class:`Circuit` objects.
        Instead the whitespace-stripped text of every line is returned,
        skipping blank lines and comment lines (lines whose first
        non-whitespace character is `#`).

    line_labels : iterable, optional
        The (string valued) line labels used to initialize :class:`Circuit`
        objects when line label information is absent from the one-line text
        representation contained in `filename`.  If `'auto'`, then line labels
        are taken to be the list of all state-space labels present in the
        circuit's layers.  If there are no such labels then the special value
        `'*'` is used as a single line label.

    num_lines : int, optional
        Specify this instead of `line_labels` to set the latter to the
        integers between 0 and `num_lines-1`.

    Returns
    -------
    list of Circuit objects, or list of str when `read_raw_strings` is True.
    """
    if read_raw_strings:
        with open(str(filename), 'r') as circuitlist:
            stripped_lines = (line.strip() for line in circuitlist)
            # The '#' test is applied to the *stripped* text so that comment
            # lines with leading whitespace are skipped rather than being
            # returned as if they were circuits.
            return [text for text in stripped_lines
                    if text and not text.startswith('#')]

    create_subcircuits = not _circuits.Circuit.default_expand_subcircuits
    std = _stdinput.StdInputParser()
    return std.parse_stringfile(filename, line_labels, num_lines, create_subcircuits)
def convert_strings_to_circuits(obj):
    """
    Rebuild an object in which circuits were replaced by their string representations.

    The object is walked recursively: every string is parsed into a circuit,
    a list/tuple whose first element is the marker `'dict_items'` becomes a
    dictionary built from its remaining `(key, value)` pairs, any other
    list/tuple becomes a tuple, dictionaries are rebuilt with converted keys
    and values, and every other value is returned unchanged.

    Parameters
    ----------
    obj : list or tuple or dict
        The object to convert.

    Returns
    -------
    object
    """
    from pygsti.circuits import Circuit as _Circuit
    parser = _stdinput.StdInputParser()

    def _restore(item):
        if isinstance(item, str):
            # NOTE(review): other readers in this module pass
            # `not Circuit.default_expand_subcircuits` as `create_subcircuits`;
            # here the flag is passed un-negated -- confirm this is intended.
            return parser.parse_circuit(item, create_subcircuits=_Circuit.default_expand_subcircuits)
        if isinstance(item, dict):
            # Not written anymore -- kept only to read old-format files (TODO REMOVE LATER)
            return {_restore(key): _restore(val) for key, val in item.items()}
        if not isinstance(item, (list, tuple)):
            return item
        if len(item) > 0 and item[0] == 'dict_items':
            # A marked list encodes a dictionary as a sequence of (key, value) pairs.
            return {_restore(key): _restore(val) for key, val in item[1:]}
        # Always produce a tuple so that the result can be used as a dict key.
        return tuple(_restore(member) for member in item)

    return _restore(obj)
def read_circuit_strings(filename):
    """
    Load an object whose circuits were stored as strings, converting them back.

    Only files whose name ends in `.json` are supported: the file is read as
    JSON and the result is passed through :func:`convert_strings_to_circuits`.

    Parameters
    ----------
    filename : string or path-like
        The name of the file to read.

    Returns
    -------
    object
        Whatever :func:`convert_strings_to_circuits` returns for the loaded JSON.

    Raises
    ------
    ValueError
        If `filename` does not end in `.json`.
    """
    is_json = str(filename).endswith('.json')
    if not is_json:
        raise ValueError("Cannot determine format from extension of filename: %s" % str(filename))

    with open(filename, 'r') as json_file:
        loaded = _json.load(json_file)
    return convert_strings_to_circuits(loaded)
@_deprecated_fn('read_protocol_from_dir')
def load_protocol_from_dir(dirname, quick_load=False, comm=None):
    """
    Deprecated: use :func:`read_protocol_from_dir` instead.

    Every argument is forwarded unchanged to :func:`read_protocol_from_dir`
    and its return value is returned as-is.
    """
    return read_protocol_from_dir(dirname, quick_load=quick_load, comm=comm)
def read_protocol_from_dir(dirname, quick_load=False, comm=None):
    """
    Read a :class:`Protocol` from a directory on disk.

    The class to instantiate is looked up from the directory's meta data and
    its `from_dir` constructor is then used to load the object.

    Parameters
    ----------
    dirname : string
        Directory name.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    Returns
    -------
    Protocol
    """
    dir_path = _pathlib.Path(dirname)
    protocol_cls = _metadir._cls_from_meta_json(dir_path)
    return protocol_cls.from_dir(dir_path, quick_load=quick_load)
@_deprecated_fn('read_edesign_from_dir')
def load_edesign_from_dir(dirname, quick_load=False, comm=None):
    """
    Deprecated: use :func:`read_edesign_from_dir` instead.

    Every argument is forwarded unchanged to :func:`read_edesign_from_dir`
    and its return value is returned as-is.
    """
    return read_edesign_from_dir(dirname, quick_load=quick_load, comm=comm)
def read_edesign_from_dir(dirname, quick_load=False, comm=None):
    """
    Read an :class:`ExperimentDesign` from a directory on disk.

    The class to instantiate is looked up from the meta data of the
    `edesign` sub-directory of `dirname`; that class's `from_dir`
    constructor is then called with `dirname` itself.

    Parameters
    ----------
    dirname : string
        Directory name.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    Returns
    -------
    ExperimentDesign
    """
    base_dir = _pathlib.Path(dirname)
    edesign_cls = _metadir._cls_from_meta_json(base_dir / 'edesign')
    return edesign_cls.from_dir(base_dir, quick_load=quick_load)
def create_edesign_from_dir(dirname):
    """
    Create an experiment design from the contents of a directory.

    The following are tried, in order:

    1. If `dirname/edesign/meta.json` exists, the already-saved experiment
       design is loaded and returned.
    2. Otherwise every regular file in `dirname/edesign` is tentatively read
       as a circuit list (files that fail to parse are skipped), and every
       sub-directory of `dirname` that itself contains an `edesign` directory
       is processed recursively.
    3. If sub-designs were found they are returned as a combined design keyed
       by sub-directory name (any circuit-list files are ignored, with a
       warning).  Otherwise the circuit lists found determine the result.

    Parameters
    ----------
    dirname : string or path-like
        The root directory to examine.

    Returns
    -------
    ExperimentDesign
        A `CombinedExperimentDesign` when sub-designs exist, a
        `CircuitListsDesign` when more than one circuit list was found, or a
        plain `ExperimentDesign` when exactly one was found.

    Raises
    ------
    ValueError
        If neither sub-designs nor circuit-list files could be found.
    """
    from .. import protocols as _proto

    topdir = _pathlib.Path(dirname)
    edesign_dir = topdir / 'edesign'
    circuit_lists = []
    circuit_list_names = []

    if edesign_dir.is_dir():
        if (edesign_dir / 'meta.json').exists():  # load existing edesign
            # Use the Path objects here: `dirname` may be a plain string, for
            # which `dirname / 'edesign'` would raise a TypeError.
            return _metadir._cls_from_meta_json(edesign_dir).from_dir(topdir, quick_load=False)

        # Find any circuit list files in the edesign directory
        for child in sorted(edesign_dir.iterdir()):
            if not child.is_file():
                continue
            try:
                lst = read_circuit_list(child, read_raw_strings=False, line_labels='auto')
            except Exception:
                # Deliberate best effort: a file that doesn't parse as a
                # circuit list is simply not one, so skip it.
                continue
            circuit_lists.append(lst)
            circuit_list_names.append(child.name)

    # Otherwise see if we should recurse or not.  Sub-directories are sorted
    # so that the resulting design doesn't depend on filesystem listing order.
    subdirs = [child for child in sorted(topdir.iterdir())
               if child != edesign_dir  # special case, shouldn't be strictly needed
               and child.is_dir() and (child / 'edesign').is_dir()]
    sub_edesigns = [create_edesign_from_dir(subdir) for subdir in subdirs]

    if len(sub_edesigns) > 0:
        if len(circuit_lists) > 0:
            # The location is formatted with %s: it is a path, not a number.
            _warnings.warn("Ignoring %d circuit-list files [%s] in %s because sub-designs were detected." %
                           (len(circuit_lists), ", ".join(circuit_list_names), str(edesign_dir)))
        return _proto.CombinedExperimentDesign({subdir.name: sub_edesign
                                                for subdir, sub_edesign in zip(subdirs, sub_edesigns)})
    elif len(circuit_lists) > 1:
        return _proto.CircuitListsDesign(circuit_lists)
    elif len(circuit_lists) == 1:
        return _proto.ExperimentDesign(circuit_lists[0])
    else:
        raise ValueError("Could not create an experiment design from the files in this directory!")
def read_edesign_from_mongodb(mongodb, doc_id, quick_load=False, comm=None, custom_collection_names=None):
    """
    Load a :class:`ExperimentDesign` from a MongoDB database.

    The document with `_id == doc_id` is fetched from the `"edesigns"`
    collection; its `'type'` entry names the class whose `from_mongodb`
    constructor is then used to load the design.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the experiment design to load.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    custom_collection_names : dict, optional
        Overrides for the default MongoDB collection names used for storing different
        types of pyGSTi objects.  The `"edesigns"` entry is the one read here;
        the dictionary is also passed on to `from_mongodb`.  Default values are
        given by :method:`pygsti.io.mongodb_collection_names`.

    Returns
    -------
    ExperimentDesign

    Raises
    ------
    ValueError
        If no document with the given `doc_id` exists, or if the document
        lacks a `'type'` key.
    """
    collection_name = _mongodb.mongodb_collection_names(custom_collection_names)['edesigns']
    doc = mongodb[collection_name].find_one({'_id': doc_id})

    # `find_one` yields None when nothing matches; report that clearly rather
    # than failing with a TypeError on the membership test below.
    if doc is None:
        raise ValueError("No experiment design with id '%s' was found in collection '%s'!"
                         % (str(doc_id), str(collection_name)))
    if 'type' not in doc:
        raise ValueError("Document exists, but expected 'type' key within document is missing!")

    return _metadir._class_for_name(doc['type']).from_mongodb(mongodb, doc_id, quick_load=quick_load,
                                                              custom_collection_names=custom_collection_names)
def remove_edesign_from_mongodb(mongodb, doc_id, custom_collection_names=None, session=None):
    """
    Delete an :class:`ExperimentDesign` from a MongoDB database.

    This simply delegates to `ExperimentDesign.remove_from_mongodb` and
    returns its result.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the experiment design to remove.

    custom_collection_names : dict, optional
        Overrides for the default MongoDB collection names used for storing different
        types of pyGSTi objects.  In this case, only the `"edesigns"` key of this dictionary
        is relevant.  Default values are given by :method:`pygsti.io.mongodb_collection_names`.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    Returns
    -------
    bool
        `True` if the specified experiment design was removed, `False` if it didn't exist.
    """
    from ..protocols import ExperimentDesign as _ExperimentDesign
    was_removed = _ExperimentDesign.remove_from_mongodb(mongodb, doc_id, custom_collection_names, session)
    return was_removed
@_deprecated_fn('read_data_from_dir')
def load_data_from_dir(dirname, quick_load=False, comm=None):
    """
    Deprecated: use :func:`read_data_from_dir` instead.

    Every argument is forwarded unchanged to :func:`read_data_from_dir` and
    its return value is returned as-is.
    """
    return read_data_from_dir(dirname, quick_load=quick_load, comm=comm)
def read_data_from_dir(dirname, quick_load=False, comm=None):
    """
    Read a :class:`ProtocolData` from a directory on disk.

    The class to instantiate is looked up from the meta data of the `data`
    sub-directory of `dirname`.  When that lookup raises `FileNotFoundError`,
    :class:`ProtocolData` itself is used.

    Parameters
    ----------
    dirname : string
        Directory name.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    Returns
    -------
    ProtocolData
    """
    base_dir = _pathlib.Path(dirname)
    try:
        data_cls = _metadir._cls_from_meta_json(base_dir / 'data')
    except FileNotFoundError:
        # No meta data on disk: fall back to the default data class.
        from ..protocols import ProtocolData as _ProtocolData
        data_cls = _ProtocolData
    return data_cls.from_dir(base_dir, quick_load=quick_load)
def read_data_from_mongodb(mongodb, doc_id, quick_load=False, comm=None, custom_collection_names=None):
    """
    Read a :class:`ProtocolData` from a MongoDB database.

    The document with `_id == doc_id` is fetched from the `"data"`
    collection.  If it exists and has a `'type'` entry, that entry names the
    class used for loading; otherwise :class:`ProtocolData` is used.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the data to load.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    custom_collection_names : dict, optional
        Overrides for the default MongoDB collection names used for storing different
        types of pyGSTi objects.  Default values are given by
        :method:`pygsti.io.mongodb_collection_names`.

    Returns
    -------
    ProtocolData
    """
    collection_names = _mongodb.mongodb_collection_names(custom_collection_names)
    doc = mongodb[collection_names['data']].find_one({'_id': doc_id})

    names_a_type = doc is not None and 'type' in doc
    if names_a_type:
        data_cls = _metadir._class_for_name(doc['type'])
    else:
        # Missing document or missing type information: use the default class.
        from ..protocols import ProtocolData as _ProtocolData
        data_cls = _ProtocolData

    return data_cls.from_mongodb(mongodb, doc_id, quick_load=quick_load,
                                 custom_collection_names=custom_collection_names)
def remove_data_from_mongodb(mongodb, doc_id, custom_collection_names=None, session=None):
    """
    Delete :class:`ProtocolData` from a MongoDB database.

    This simply delegates to `ProtocolData.remove_from_mongodb` and returns
    its result.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the data to remove.

    custom_collection_names : dict, optional
        Overrides for the default MongoDB collection names used for storing different
        types of pyGSTi objects.  Default values are given by
        :method:`pygsti.io.mongodb_collection_names`.
        NOTE(review): which keys of this dictionary are consulted is decided
        by `ProtocolData.remove_from_mongodb` -- confirm there.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    Returns
    -------
    bool
        `True` if the specified data was removed, `False` if it didn't exist.
    """
    from ..protocols import ProtocolData as _ProtocolData
    was_removed = _ProtocolData.remove_from_mongodb(mongodb, doc_id,
                                                    custom_collection_names, session)
    return was_removed
@_deprecated_fn('read_results_from_dir')
def load_results_from_dir(dirname, name=None, preloaded_data=None, quick_load=False, comm=None):
    """
    Deprecated: use :func:`read_results_from_dir` instead.

    Every argument is forwarded unchanged to :func:`read_results_from_dir`
    and its return value is returned as-is.
    """
    return read_results_from_dir(dirname,
                                 name=name,
                                 preloaded_data=preloaded_data,
                                 quick_load=quick_load,
                                 comm=comm)
def read_results_from_dir(dirname, name=None, preloaded_data=None, quick_load=False, comm=None):
    """
    Read a :class:`ProtocolResults` or :class:`ProtocolsResultsDir` from a directory on disk.

    Which object type is loaded depends on whether `name` is given: if it is,
    then a :class:`ProtocolResults` object is loaded.  If not, a
    :class:`ProtocolsResultsDir` is loaded.

    Parameters
    ----------
    dirname : string
        Directory name.  This should be a "base" directory, containing
        subdirectories like "edesign", "data", and "results"

    name : string or None
        The 'name' of a particular :class:`ProtocolResults` object, which
        is a sub-directory beneath `dirname/results/`.  If None, then *all*
        the results (all names) at the given base-directory are loaded and
        returned as a :class:`ProtocolResultsDir` object.

    preloaded_data : ProtocolData, optional
        The data object belonging to the to-be-loaded results, in cases
        when this has been loaded already (only use this if you know what
        you're doing).

    quick_load : bool, optional
        Setting this to True skips the loading of data and experiment-design
        components that may take a long time to load.  This can be useful
        when all the information of interest lies only within the results objects.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    Returns
    -------
    ProtocolResults or ProtocolResultsDir
    """
    from ..protocols import ProtocolResultsDir as _ProtocolResultsDir

    base_dir = _pathlib.Path(dirname)
    results_dir = base_dir / 'results'

    if name is not None:  # a single, named ProtocolResults object
        results_cls = _metadir._cls_from_meta_json(results_dir / name)
        return results_cls.from_dir(base_dir, name, preloaded_data, quick_load)

    # Otherwise it's a directory object.
    if (results_dir / 'meta.json').exists():
        dir_cls = _metadir._cls_from_meta_json(results_dir)
    else:
        # default if no meta.json (if only a results obj has been written inside dir)
        dir_cls = _ProtocolResultsDir
    return dir_cls.from_dir(base_dir, preloaded_data=preloaded_data, quick_load=quick_load)
def read_results_from_mongodb(mongodb, doc_id, name=None, preloaded_data=None, quick_load=False,
                              comm=None, custom_collection_names=None):
    """
    Load a :class:`ProtocolResults` or :class:`ProtocolsResultsDir` from a MongoDB database.

    Which object type is loaded depends on whether `name` is given: if it is, then
    a :class:`ProtocolResults` object is loaded.  If not, a :class:`ProtocolsResultsDir`
    is loaded.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the results directory to load.

    name : string or None
        The 'name' of a particular :class:`ProtocolResults` object belonging
        to the directory given by `doc_id`.  If None, then *all*
        the results (all names) in the given results directory are loaded and
        returned as a :class:`ProtocolResultsDir` object.

    preloaded_data : ProtocolData, optional
        The data object belonging to the to-be-loaded results, in cases
        when this has been loaded already (only use this if you know what
        you're doing).

    quick_load : bool, optional
        Setting this to True skips the loading of data and experiment-design
        components that may take a long time to load.  This can be useful
        when all the information of interest lies only within the results objects.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    custom_collection_names : dict, optional
        Overrides for the default MongoDB collection names used for storing different
        types of pyGSTi objects.  Default values are given by
        :method:`pygsti.io.mongodb_collection_names`.

    Returns
    -------
    ProtocolResults or ProtocolResultsDir

    Raises
    ------
    ValueError
        If `name` is given but no results document with that name exists for
        the directory `doc_id`.
    """
    if name is None:
        # Currently, there's just a single ProtocolResultsDir class.  If we want to allow
        # custom classes we'll need to use the 'resultdirs' collection to store the class
        # name and look it up here (FUTURE).
        from ..protocols import ProtocolResultsDir as _ProtocolResultsDir
        resultsdir_cls = _ProtocolResultsDir
        return resultsdir_cls.from_mongodb(mongodb, doc_id, None, None, preloaded_data, quick_load,
                                           custom_collection_names)

    # Otherwise it's a ProtocolResults object.
    doc = mongodb[_mongodb.mongodb_collection_names(custom_collection_names)['results']].find_one(
        {'directory_id': doc_id, 'name': name}, ['type'])
    # `find_one` yields None when nothing matches; report that clearly rather
    # than failing with a TypeError when subscripting None below.
    if doc is None:
        raise ValueError("No results named '%s' were found for results directory '%s'!"
                         % (str(name), str(doc_id)))
    results_cls = _metadir._class_for_name(doc['type'])
    return results_cls.from_mongodb(mongodb, doc_id, name, preloaded_data, quick_load, custom_collection_names)
def remove_results_from_mongodb(mongodb, doc_id, name=None, comm=None, custom_collection_names=None, session=None):
    """
    Delete :class:`ProtocolResults` or :class:`ProtocolsResultsDir` data from a MongoDB database.

    Which object type is removed depends on whether `name` is given: if it is,
    then data corresponding to a :class:`ProtocolResults` object is removed.
    If not, that of a :class:`ProtocolsResultsDir` is removed.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the results directory to remove.

    name : string or None
        The 'name' of a particular :class:`ProtocolResults` object belonging
        to the directory given by `doc_id`.  If None, then *all*
        the results (all names) in the given results directory are removed.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  Accepted as part of the interface; it is not
        used within this function's body.

    custom_collection_names : dict, optional
        Overrides for the default MongoDB collection names used for storing different
        types of pyGSTi objects.  Default values are given by
        :method:`pygsti.io.mongodb_collection_names`.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    Returns
    -------
    bool
        `True` if the specified results were removed, `False` if they didn't exist.
    """
    if name is not None:
        results_collection = mongodb[_mongodb.mongodb_collection_names(custom_collection_names)['results']]
        doc = results_collection.find_one({'directory_id': doc_id, 'name': name}, ['type'])
        if doc is None:
            return False  # nothing with this name exists, so there is nothing to remove
        results_cls = _metadir._class_for_name(doc['type'])
        return results_cls.remove_from_mongodb(mongodb, doc_id, name, custom_collection_names, session)

    # No name given: remove the whole results directory.  Only a single
    # results-directory class exists at present, so it is used directly.
    from ..protocols import ProtocolResultsDir as _ProtocolResultsDir
    return _ProtocolResultsDir.remove_from_mongodb(mongodb, doc_id, custom_collection_names, session)