/
readers.py
935 lines (742 loc) · 35.5 KB
/
readers.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
"""
Functions for loading GST objects from text files.
"""
#***************************************************************************************************
# Copyright 2015, 2019 National Technology & Engineering Solutions of Sandia, LLC (NTESS).
# Under the terms of Contract DE-NA0003525 with NTESS, the U.S. Government retains certain rights
# in this software.
# Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except
# in compliance with the License. You may obtain a copy of the License at
# http://www.apache.org/licenses/LICENSE-2.0 or in the LICENSE file in the root pyGSTi directory.
#***************************************************************************************************
import os as _os
import pathlib as _pathlib
import warnings as _warnings
import json as _json
from pygsti.io import metadir as _metadir
from pygsti.io import mongodb as _mongodb
from pygsti.io import stdinput as _stdinput
from pygsti import baseobjs as _baseobjs
from pygsti import circuits as _circuits
from pygsti import data as _data
from pygsti.tools.legacytools import deprecate as _deprecated_fn
@_deprecated_fn('read_dataset')
def load_dataset(filename, cache=False, collision_action="aggregate",
                 record_zero_counts=True, ignore_zero_count_lines=True,
                 with_times="auto", circuit_parse_cache=None, verbosity=1):
    """
    Deprecated alias of :func:`read_dataset`.

    All arguments are forwarded unchanged to :func:`read_dataset`, whose
    result is returned.
    """
    return read_dataset(
        filename,
        cache=cache,
        collision_action=collision_action,
        record_zero_counts=record_zero_counts,
        ignore_zero_count_lines=ignore_zero_count_lines,
        with_times=with_times,
        circuit_parse_cache=circuit_parse_cache,
        verbosity=verbosity,
    )
def read_dataset(filename, cache=False, collision_action="aggregate",
                 record_zero_counts=True, ignore_zero_count_lines=True,
                 with_times="auto", circuit_parse_cache=None, verbosity=1):
    """
    Load a DataSet from a file.

    This function first tries to load the file as a saved DataSet object,
    then falls back to the standard text format for DataSets.

    Parameters
    ----------
    filename : string
        The name of the file

    cache : bool, optional
        When set to True, a file with the name filename + ".cache"
        is searched for and loaded instead of filename if it exists
        and is newer than filename.  If no cache file exists or one
        exists but it is older than filename, a cache file will be
        written after loading from filename.

    collision_action : {"aggregate", "keepseparate"}
        Specifies how duplicate circuits should be handled.  "aggregate"
        adds duplicate-circuit counts, whereas "keepseparate" tags duplicate
        circuits by setting their `.occurrence` IDs to sequential positive integers.

    record_zero_counts : bool, optional
        Whether zero-counts are actually recorded (stored) in the returned
        DataSet.  If False, then zero counts are ignored, except for potentially
        registering new outcome labels.  When reading from a cache file
        (using `cache==True`) this argument is ignored: the presence of zero-
        counts is dictated by the value of `record_zero_counts` when the cache file
        was created.

    ignore_zero_count_lines : bool, optional
        Whether circuits for which there are no counts should be ignored
        (i.e. omitted from the DataSet) or not.

    with_times : bool or "auto", optional
        Whether the time-stamped data format should be read in.  If
        "auto", then the time-stamped format is allowed but not required on a
        per-circuit basis (so the dataset can contain both formats).  Typically
        you only need to set this to False when reading in a template file.

    circuit_parse_cache : dict, optional
        Accepted for interface compatibility.  This function does not
        currently forward it to the parser, so it has no effect here.

    verbosity : int, optional
        If zero, no output is shown.  If greater than zero,
        loading progress is shown.

    Returns
    -------
    DataSet
    """
    printer = _baseobjs.VerbosityPrinter.create_printer(verbosity)

    try:
        # a saved DataSet object is ok
        return _data.DataSet(file_to_load_from=filename)
    except Exception:
        # Not a saved DataSet: fall through to the cache / text-format paths.
        # (`Exception`, not a bare except, so Ctrl-C and SystemExit propagate.)
        pass

    # Parser functions don't take a VerbosityPrinter yet, and so
    # always output to stdout (TODO)
    show_progress = (printer.verbosity > 0 and printer.filename is None)

    cache_filename = None
    if cache:
        # str() so that path-like `filename` values work as well as strings.
        cache_filename = str(filename) + ".cache"
        cache_is_fresh = (_os.path.exists(cache_filename)
                          and _os.path.getmtime(filename) < _os.path.getmtime(cache_filename))
        if cache_is_fresh:
            try:
                printer.log("Reading from cache file: %s" % cache_filename)
                return _data.DataSet(file_to_load_from=cache_filename)
            except Exception:
                # Best effort: an unreadable cache is rebuilt from the text file below.
                print("WARNING: Failed to load from cache file")  # pragma: no cover
        else:
            printer.log("Cache file not found or is too old -- one will "
                        "be created after loading is completed")

    # otherwise must use standard dataset file format
    parser = _stdinput.StdInputParser()
    ds = parser.parse_datafile(filename, show_progress,
                               collision_action=collision_action,
                               record_zero_counts=record_zero_counts,
                               ignore_zero_count_lines=ignore_zero_count_lines,
                               with_times=with_times)

    if cache:
        printer.log("Writing cache file (to speed future loads): %s"
                    % cache_filename)
        ds.save(cache_filename)

    return ds
@_deprecated_fn('read_multidataset')
def load_multidataset(filename, cache=False, collision_action="aggregate",
                      record_zero_counts=True, verbosity=1):
    """
    Deprecated alias of :func:`read_multidataset`.

    All arguments are forwarded unchanged to :func:`read_multidataset`,
    whose result is returned.
    """
    return read_multidataset(
        filename,
        cache=cache,
        collision_action=collision_action,
        record_zero_counts=record_zero_counts,
        verbosity=verbosity,
    )
def read_multidataset(filename, cache=False, collision_action="aggregate",
                      record_zero_counts=True, verbosity=1):
    """
    Load a MultiDataSet from a file.

    This function first tries to load the file as a saved MultiDataSet object,
    then falls back to the standard text format for MultiDataSets.

    Parameters
    ----------
    filename : string
        The name of the file

    cache : bool, optional
        When set to True, a file with the name filename + ".cache"
        is searched for and loaded instead of filename if it exists
        and is newer than filename.  If no cache file exists or one
        exists but it is older than filename, a cache file will be
        written after loading from filename.

    collision_action : {"aggregate", "keepseparate"}
        Specifies how duplicate circuits should be handled.  "aggregate"
        adds duplicate-circuit counts, whereas "keepseparate" tags duplicate
        circuits by setting their `.occurrence` IDs to sequential positive integers.

    record_zero_counts : bool, optional
        Whether zero-counts are actually recorded (stored) in the returned
        MultiDataSet.  If False, then zero counts are ignored, except for
        potentially registering new outcome labels.  When reading from a cache
        file (using `cache==True`) this argument is ignored: the presence of
        zero-counts is dictated by the value of `record_zero_counts` when the cache
        file was created.

    verbosity : int, optional
        If zero, no output is shown.  If greater than zero,
        loading progress is shown.

    Returns
    -------
    MultiDataSet
    """
    printer = _baseobjs.VerbosityPrinter.create_printer(verbosity)

    try:
        # a saved MultiDataSet object is ok
        return _data.MultiDataSet(file_to_load_from=filename)
    except Exception:
        # Not a saved MultiDataSet: fall through to the cache / text-format paths.
        # (`Exception`, not a bare except, so Ctrl-C and SystemExit propagate.)
        pass

    # Parser functions don't take a VerbosityPrinter yet, and so
    # always output to stdout (TODO)
    show_progress = (printer.verbosity > 0 and printer.filename is None)

    cache_filename = None
    if cache:
        # str() so that path-like `filename` values work as well as strings.
        cache_filename = str(filename) + ".cache"
        cache_is_fresh = (_os.path.exists(cache_filename)
                          and _os.path.getmtime(filename) < _os.path.getmtime(cache_filename))
        if cache_is_fresh:
            try:
                printer.log("Reading from cache file: %s" % cache_filename)
                return _data.MultiDataSet(file_to_load_from=cache_filename)
            except Exception:
                # Best effort: an unreadable cache is rebuilt from the text file below.
                print("WARNING: Failed to load from cache file")  # pragma: no cover
        else:
            printer.log("Cache file not found or is too old -- one will be "
                        "created after loading is completed")

    # otherwise must use standard dataset file format
    parser = _stdinput.StdInputParser()
    mds = parser.parse_multidatafile(filename, show_progress,
                                     collision_action=collision_action,
                                     record_zero_counts=record_zero_counts)

    if cache:
        printer.log("Writing cache file (to speed future loads): %s"
                    % cache_filename)
        mds.save(cache_filename)

    return mds
@_deprecated_fn('read_time_dependent_dataset')
def load_time_dependent_dataset(filename, cache=False, record_zero_counts=True):
    """
    Deprecated alias of :func:`read_time_dependent_dataset`.

    All arguments are forwarded unchanged to
    :func:`read_time_dependent_dataset`, whose result is returned.
    """
    return read_time_dependent_dataset(
        filename,
        cache=cache,
        record_zero_counts=record_zero_counts,
    )
def read_time_dependent_dataset(filename, cache=False, record_zero_counts=True):
    """
    Read a file of time-stamped (time-dependent) data into a DataSet.

    Parameters
    ----------
    filename : string
        The name of the file

    cache : bool, optional
        Placeholder for caching like that of :func:`read_dataset`.  It is
        not used by this function.

    record_zero_counts : bool, optional
        Whether zero-counts are actually recorded (stored) in the returned
        DataSet.  If False, then zero counts are ignored, except for
        potentially registering new outcome labels.

    Returns
    -------
    DataSet
    """
    std_parser = _stdinput.StdInputParser()
    # Sub-circuits are created exactly when circuits do not expand them by default.
    keep_subcircuits = not _circuits.Circuit.default_expand_subcircuits
    return std_parser.parse_tddatafile(
        filename,
        record_zero_counts=record_zero_counts,
        create_subcircuits=keep_subcircuits,
    )
@_deprecated_fn('pygsti.models.Model.read(...)')
def load_model(filename):
    """
    Read a Model from a file written in the standard text format for models.

    Deprecated; parsing is delegated to `pygsti.io.stdinput.parse_model`.

    Parameters
    ----------
    filename : string
        The name of the file

    Returns
    -------
    Model
    """
    model = _stdinput.parse_model(filename)
    return model
@_deprecated_fn()
def load_circuit_dict(filename):
    """
    Read a circuit dictionary from a standard text-format file.

    Deprecated; parsing is delegated to `StdInputParser.parse_dictfile`.

    Parameters
    ----------
    filename : string
        The name of the file.

    Returns
    -------
    Dictionary with keys = circuit labels and values = :class:`Circuit` objects.
    """
    return _stdinput.StdInputParser().parse_dictfile(filename)
@_deprecated_fn('read_circuit_list')
def load_circuit_list(filename, read_raw_strings=False, line_labels='auto', num_lines=None):
    """
    Deprecated alias of :func:`read_circuit_list`.

    All arguments are forwarded unchanged to :func:`read_circuit_list`,
    whose result is returned.
    """
    return read_circuit_list(
        filename,
        read_raw_strings=read_raw_strings,
        line_labels=line_labels,
        num_lines=num_lines,
    )
def read_circuit_list(filename, read_raw_strings=False, line_labels='auto', num_lines=None):
    """
    Load a circuit list from a file, formatted using the standard text-format.

    Parameters
    ----------
    filename : string
        The name of the file

    read_raw_strings : boolean
        If True, circuits are not converted to :class:`Circuit` objects.
        Instead the stripped text of every line that is neither blank nor
        a comment (first non-whitespace character `'#'`) is returned.

    line_labels : iterable, optional
        The (string valued) line labels used to initialize :class:`Circuit`
        objects when line label information is absent from the one-line text
        representation contained in `filename`.  If `'auto'`, then line labels
        are taken to be the list of all state-space labels present in the
        circuit's layers.  If there are no such labels then the special value
        `'*'` is used as a single line label.

    num_lines : int, optional
        Specify this instead of `line_labels` to set the latter to the
        integers between 0 and `num_lines-1`.

    Returns
    -------
    list of Circuit objects
        Or a list of strings when `read_raw_strings` is True.
    """
    if read_raw_strings:
        raw_strings = []
        with open(str(filename), 'r') as circuitlist:
            for line in circuitlist:
                text = line.strip()
                # Test the *stripped* text so that an indented '#' comment is
                # skipped rather than returned as a circuit string.
                if not text or text.startswith('#'):
                    continue
                raw_strings.append(text)
        return raw_strings

    create_subcircuits = not _circuits.Circuit.default_expand_subcircuits
    std = _stdinput.StdInputParser()
    return std.parse_stringfile(filename, line_labels, num_lines, create_subcircuits)
def convert_strings_to_circuits(obj):
    """
    Rebuild circuits from an object produced by :func:`convert_circuits_to_strings`.

    The object is walked recursively:

    - every string is parsed into a circuit with `StdInputParser.parse_circuit`;
    - a list or tuple whose first element is `'dict_items'` becomes a dict
      built from its remaining (key, value) pairs;
    - any other list or tuple becomes a tuple (so it can serve as a dict key);
    - a dict has its keys and values converted (old-format files only);
    - anything else is returned unchanged.

    Parameters
    ----------
    obj : list or tuple or dict
        The object to convert.

    Returns
    -------
    object
    """
    from pygsti.circuits import Circuit as _Circuit
    parser = _stdinput.StdInputParser()

    def _decode(item):
        if isinstance(item, str):
            return parser.parse_circuit(item, create_subcircuits=not _Circuit.default_expand_subcircuits)
        if isinstance(item, dict):
            # Not written anymore -- kept only to read old-format files (TODO REMOVE LATER)
            return {_decode(key): _decode(val) for key, val in item.items()}
        if isinstance(item, (list, tuple)):
            if len(item) > 0 and item[0] == 'dict_items':
                # a dictionary stored as ['dict_items', (k1, v1), (k2, v2), ...]
                return {_decode(key): _decode(val) for key, val in item[1:]}
            # always a tuple, so the result can work as a dict key
            return tuple(_decode(member) for member in item)
        return item

    return _decode(obj)
def read_circuit_strings(filename):
    """
    Read a JSON file whose circuits were stored as strings, and restore them.

    The file's JSON content is loaded and passed through
    :func:`convert_strings_to_circuits`.

    Parameters
    ----------
    filename : string or path-like
        The name of the file.  It must end in `.json`.

    Returns
    -------
    object
        The result of :func:`convert_strings_to_circuits` on the loaded JSON.

    Raises
    ------
    ValueError
        If `filename` does not end in `.json`.
    """
    name_text = str(filename)
    if not name_text.endswith('.json'):
        raise ValueError("Cannot determine format from extension of filename: %s" % name_text)

    with open(filename, 'r') as json_file:
        loaded = _json.load(json_file)
        return convert_strings_to_circuits(loaded)
@_deprecated_fn('read_protocol_from_dir')
def load_protocol_from_dir(dirname, quick_load=False, comm=None):
    """
    Deprecated alias of :func:`read_protocol_from_dir`.

    All arguments are forwarded unchanged to :func:`read_protocol_from_dir`,
    whose result is returned.
    """
    return read_protocol_from_dir(dirname, quick_load=quick_load, comm=comm)
def read_protocol_from_dir(dirname, quick_load=False, comm=None):
    """
    Read a :class:`Protocol` stored in a directory on disk.

    The class to instantiate is looked up from the directory's meta
    information, and that class's `from_dir` does the loading.

    Parameters
    ----------
    dirname : string
        Directory name.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    Protocol
    """
    root = _pathlib.Path(dirname)
    protocol_cls = _metadir._cls_from_meta_json(root)
    return protocol_cls.from_dir(root, quick_load=quick_load)
def read_protocol_from_mongodb(mongodb, doc_id, quick_load=False):
    """
    Read a :class:`Protocol` stored in a MongoDB database.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the protocol object to load.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    Returns
    -------
    Protocol
    """
    import pygsti.protocols as _proto
    protocol_cls = _proto.Protocol
    return protocol_cls.from_mongodb(mongodb, doc_id, quick_load=quick_load)
def remove_protocol_from_mongodb(mongodb, doc_id, session=None, recursive=False):
    """
    Delete a :class:`Protocol` from a MongoDB database.

    Returns `False` when no protocol object with `doc_id` exists, and
    `True` otherwise.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the protocol object to remove.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    recursive : RecursiveRemovalSpecification, optional
        An object that filters the type of documents that are removed.
        Used when working with inter-related experiment designs, data,
        and results objects to only remove the types of documents you
        know aren't being shared with other documents.

    Returns
    -------
    bool
        `True` if the specified protocol object was removed, `False` if it didn't exist.
    """
    from ..protocols import Protocol as _Protocol
    was_removed = _Protocol.remove_from_mongodb(
        mongodb, doc_id, session=session, recursive=recursive)
    return was_removed
@_deprecated_fn('read_edesign_from_dir')
def load_edesign_from_dir(dirname, quick_load=False, comm=None):
    """
    Deprecated alias of :func:`read_edesign_from_dir`.

    All arguments are forwarded unchanged to :func:`read_edesign_from_dir`,
    whose result is returned.
    """
    return read_edesign_from_dir(dirname, quick_load=quick_load, comm=comm)
def read_edesign_from_dir(dirname, quick_load=False, comm=None):
    """
    Read an :class:`ExperimentDesign` stored in a directory on disk.

    The class to instantiate is looked up from the meta information in the
    `edesign` sub-directory of `dirname`, and that class's `from_dir` does
    the loading.

    Parameters
    ----------
    dirname : string
        Directory name.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    ExperimentDesign
    """
    root = _pathlib.Path(dirname)
    edesign_cls = _metadir._cls_from_meta_json(root / 'edesign')
    return edesign_cls.from_dir(root, quick_load=quick_load)
def create_edesign_from_dir(dirname):
    """
    Create an experiment design from the contents of a directory.

    The steps, in order:

    1. If `dirname/edesign/meta.json` exists, the existing design is loaded
       and returned.
    2. Otherwise every file in `dirname/edesign` that parses as a circuit
       list is collected (files that fail to parse are skipped).
    3. Every sub-directory of `dirname` that itself contains an `edesign`
       directory is processed recursively.  If any exist, they are returned
       as a `CombinedExperimentDesign` keyed by sub-directory name, and any
       circuit lists found in step 2 are ignored with a warning.
    4. Otherwise a `CircuitListsDesign` (several circuit lists) or an
       `ExperimentDesign` (exactly one circuit list) is returned.

    Parameters
    ----------
    dirname : string or pathlib.Path
        The top-level directory, i.e. the one containing `edesign`.

    Returns
    -------
    ExperimentDesign

    Raises
    ------
    ValueError
        If neither sub-designs nor circuit-list files are found.
    """
    from .. import protocols as _proto

    topdir = _pathlib.Path(dirname)
    edesign_dir = topdir / 'edesign'

    circuit_lists = []
    circuit_list_names = []
    if edesign_dir.is_dir():
        if (edesign_dir / 'meta.json').exists():  # load existing edesign
            # Use the Path objects here: `dirname` may be a plain str, for
            # which `dirname / 'edesign'` raises a TypeError.
            return _metadir._cls_from_meta_json(edesign_dir).from_dir(topdir, quick_load=False)

        # Find any circuit list files in the edesign directory
        for child in sorted(edesign_dir.iterdir()):
            if not child.is_file():
                continue
            try:
                lst = read_circuit_list(child, read_raw_strings=False, line_labels='auto')
            except Exception:
                # Best effort: a file that isn't a valid circuit list is skipped.
                continue
            circuit_lists.append(lst)
            circuit_list_names.append(child.name)

    # Otherwise see if we should recurse or not
    subdirs = []
    for child in topdir.iterdir():
        if child == edesign_dir:
            continue  # special case, shouldn't be strictly needed
        if child.is_dir() and (child / 'edesign').is_dir():
            subdirs.append(child)
    sub_edesigns = [create_edesign_from_dir(subdir) for subdir in subdirs]

    if len(sub_edesigns) > 0:
        if len(circuit_lists) > 0:
            # The directory name is a string, so it must be formatted with %s (not %d).
            _warnings.warn("Ignoring %d circuit-list files [%s] in %s because sub-designs were detected." %
                           (len(circuit_lists), ", ".join(circuit_list_names), edesign_dir.name))
        return _proto.CombinedExperimentDesign({subdir.name: sub_edesign
                                                for subdir, sub_edesign in zip(subdirs, sub_edesigns)})
    elif len(circuit_lists) > 1:
        return _proto.CircuitListsDesign(circuit_lists)
    elif len(circuit_lists) == 1:
        return _proto.ExperimentDesign(circuit_lists[0])
    else:
        raise ValueError("Could not create an experiment design from the files in this directory!")
def read_edesign_from_mongodb(mongodb, doc_id, quick_load=False, comm=None):
    """
    Read an :class:`ExperimentDesign` stored in a MongoDB database.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the experiment design to load.

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    ExperimentDesign
    """
    import pygsti.protocols as _proto
    edesign_cls = _proto.ExperimentDesign
    return edesign_cls.from_mongodb(mongodb, doc_id, quick_load=quick_load)
def remove_edesign_from_mongodb(mongodb, doc_id, session=None, recursive="default"):
    """
    Delete an :class:`ExperimentDesign` from a MongoDB database.

    Returns `False` when no experiment design with `doc_id` exists, and
    `True` otherwise.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the experiment design to remove.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    recursive : RecursiveRemovalSpecification, optional
        An object that filters the type of documents that are removed.
        Used when working with inter-related experiment designs, data,
        and results objects to only remove the types of documents you
        know aren't being shared with other documents.

    Returns
    -------
    bool
        `True` if the specified experiment design was removed, `False` if it didn't exist.
    """
    from ..protocols import ExperimentDesign as _ExperimentDesign
    was_removed = _ExperimentDesign.remove_from_mongodb(
        mongodb, doc_id, session=session, recursive=recursive)
    return was_removed
@_deprecated_fn('read_data_from_dir')
def load_data_from_dir(dirname, quick_load=False, comm=None):
    """
    Deprecated alias of :func:`read_data_from_dir`.

    Parameters
    ----------
    dirname : string
        Directory name.

    quick_load : bool, optional
        Forwarded to :func:`read_data_from_dir` as `quick_load`.

    comm : mpi4py.MPI.Comm, optional
        Forwarded to :func:`read_data_from_dir` as `comm`.

    Returns
    -------
    ProtocolData
    """
    # Forward by keyword: the second positional parameter of
    # read_data_from_dir is `preloaded_edesign`, so positional forwarding
    # would bind `quick_load` to it and `comm` to `quick_load`.
    return read_data_from_dir(dirname, quick_load=quick_load, comm=comm)
def read_data_from_dir(dirname, preloaded_edesign=None, quick_load=False, comm=None):
    """
    Read a :class:`ProtocolData` stored in a directory on disk.

    The class to instantiate is looked up from the meta information in the
    `data` sub-directory of `dirname`.  If that lookup raises
    `FileNotFoundError`, :class:`ProtocolData` itself is used.

    Parameters
    ----------
    dirname : string
        Directory name.

    preloaded_edesign : ExperimentDesign, optional
        The experiment design belonging to the to-be-loaded data object, in cases
        when this has been loaded already (only use this if you know what
        you're doing).

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    ProtocolData
    """
    root = _pathlib.Path(dirname)
    try:
        data_cls = _metadir._cls_from_meta_json(root / 'data')
    except FileNotFoundError:
        # No meta information available: use ProtocolData as the default class.
        from ..protocols import ProtocolData as _ProtocolData
        data_cls = _ProtocolData
    return data_cls.from_dir(root, preloaded_edesign=preloaded_edesign, quick_load=quick_load)
def read_data_from_mongodb(mongodb, doc_id, preloaded_edesign=None, quick_load=False, comm=None):
    """
    Read a :class:`ProtocolData` stored in a MongoDB database.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the data to load.

    preloaded_edesign : ExperimentDesign, optional
        The experiment design belonging to the to-be-loaded data object, in cases
        when this has been loaded already (only use this if you know what
        you're doing).

    quick_load : bool, optional
        Setting this to True skips the loading of components that may take
        a long time to load.  This can be useful when this information isn't
        needed and loading takes a long time.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    ProtocolData
    """
    import pygsti.protocols as _proto
    data_cls = _proto.ProtocolData
    return data_cls.from_mongodb(
        mongodb, doc_id, preloaded_edesign=preloaded_edesign, quick_load=quick_load)
def remove_data_from_mongodb(mongodb, doc_id, session=None, recursive="default"):
    """
    Remove :class:`ProtocolData` from a MongoDB database.

    If no data object with `doc_id` exists, this function returns `False`,
    otherwise it returns `True`.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the data object to remove.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    recursive : RecursiveRemovalSpecification, optional
        An object that filters the type of documents that are removed.
        Used when working with inter-related experiment designs, data,
        and results objects to only remove the types of documents you
        know aren't being shared with other documents.

    Returns
    -------
    bool
        `True` if the specified data object was removed, `False` if it didn't exist.
    """
    from ..protocols import ProtocolData as _ProtocolData
    # Pass `session` by keyword, as the other remove_*_from_mongodb functions
    # in this module do, so the call does not depend on parameter order.
    return _ProtocolData.remove_from_mongodb(mongodb, doc_id, session=session,
                                             recursive=recursive)
@_deprecated_fn('read_results_from_dir')
def load_results_from_dir(dirname, name=None, preloaded_data=None, quick_load=False, comm=None):
    """
    Deprecated alias of :func:`read_results_from_dir`.

    All arguments are forwarded unchanged to :func:`read_results_from_dir`,
    whose result is returned.
    """
    return read_results_from_dir(
        dirname,
        name=name,
        preloaded_data=preloaded_data,
        quick_load=quick_load,
        comm=comm,
    )
def read_results_from_dir(dirname, name=None, preloaded_data=None, quick_load=False, comm=None):
    """
    Read a :class:`ProtocolResults` or :class:`ProtocolResultsDir` from a directory on disk.

    What is loaded depends on `name`: when it is given, the single
    :class:`ProtocolResults` object of that name is loaded; when it is None,
    a :class:`ProtocolResultsDir` is loaded instead.

    Parameters
    ----------
    dirname : string
        Directory name.  This should be a "base" directory, containing
        subdirectories like "edesign", "data", and "results"

    name : string or None
        The 'name' of a particular :class:`ProtocolResults` object, which
        is a sub-directory beneath `dirname/results/`.  If None, then *all*
        the results (all names) at the given base-directory are loaded and
        returned as a :class:`ProtocolResultsDir` object.

    preloaded_data : ProtocolData, optional
        The data object belonging to the to-be-loaded results, in cases
        when this has been loaded already (only use this if you know what
        you're doing).

    quick_load : bool, optional
        Setting this to True skips the loading of data and experiment-design
        components that may take a long time to load.  This can be useful when
        all the information of interest lies only within the results objects.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    ProtocolResults or ProtocolResultsDir
    """
    from ..protocols import ProtocolResultsDir as _ProtocolResultsDir

    root = _pathlib.Path(dirname)
    results_dir = root / 'results'

    if name is not None:  # a single ProtocolResults object
        results_cls = _metadir._cls_from_meta_json(results_dir / name)
        return results_cls.from_dir(root, name, preloaded_data, quick_load)

    # Otherwise it's a directory object.  ProtocolResultsDir is the default when
    # there is no meta.json (if only a results obj has been written inside dir).
    if (results_dir / 'meta.json').exists():
        dir_cls = _metadir._cls_from_meta_json(results_dir)
    else:
        dir_cls = _ProtocolResultsDir
    return dir_cls.from_dir(root, preloaded_data=preloaded_data, quick_load=quick_load)
def read_results_from_mongodb(mongodb, doc_id, preloaded_data=None, quick_load=False, comm=None):
    """
    Read a :class:`ProtocolResults` stored in a MongoDB database.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the results to load.

    preloaded_data : ProtocolData, optional
        The data object belonging to the to-be-loaded results, in cases
        when this has been loaded already (only use this if you know what
        you're doing).

    quick_load : bool, optional
        Setting this to True skips the loading of data and experiment-design
        components that may take a long time to load.  This can be useful when
        all the information of interest lies only within the results objects.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    ProtocolResults
    """
    from ..protocols import ProtocolResults as _ProtocolResults
    results = _ProtocolResults.from_mongodb(
        mongodb, doc_id, preloaded_data=preloaded_data, quick_load=quick_load)
    return results
def read_resultsdir_from_mongodb(mongodb, doc_id, preloaded_data=None, quick_load=False,
                                 read_all_results_for_data=False, comm=None):
    """
    Read a :class:`ProtocolResultsDir` stored in a MongoDB database.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to load data from.

    doc_id : str
        The user-defined identifier of the results directory to load.

    preloaded_data : ProtocolData, optional
        The data object belonging to the to-be-loaded results, in cases
        when this has been loaded already (only use this if you know what
        you're doing).

    quick_load : bool, optional
        Setting this to True skips the loading of data and experiment-design
        components that may take a long time to load.  This can be useful when
        all the information of interest lies only within the results objects.

    read_all_results_for_data : bool, optional
        If `True`, the loaded result directory and sub-directories will read in all the results
        objects stored in the database associated with their :class:`ProtocolData` object.  Duplicate
        keys will be renamed to avoid collisions, and warning messages are printed.  If `False`
        (the default), then only the specific results associated with the directory when it was last
        saved are loaded.  Setting this to `True` can sometimes be useful for loading old results
        that have been overwritten but still exist in the database.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    Returns
    -------
    ProtocolResultsDir
    """
    # Currently, there's just a single ProtocolResultsDir class.  If we want to allow custom classes
    # we'll need to use the 'resultdirs' collection to store this information (FUTURE)
    from ..protocols import ProtocolResultsDir as _ProtocolResultsDir
    results_dir = _ProtocolResultsDir.from_mongodb(
        mongodb,
        doc_id,
        preloaded_data=preloaded_data,
        quick_load=quick_load,
        read_all_results_for_data=read_all_results_for_data,
    )
    return results_dir
def remove_results_from_mongodb(mongodb, doc_id, comm=None, session=None, recursive="default"):
    """
    Delete the data of a :class:`ProtocolResults` object from a MongoDB database.

    The removal is delegated to `ProtocolResults.remove_from_mongodb`.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the results to remove.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    recursive : RecursiveRemovalSpecification, optional
        An object that filters the type of documents that are removed.
        Used when working with inter-related experiment designs, data,
        and results objects to only remove the types of documents you
        know aren't being shared with other documents.

    Returns
    -------
    object
        Whatever `ProtocolResults.remove_from_mongodb` returns.
    """
    from ..protocols import ProtocolResults as _ProtocolResults
    outcome = _ProtocolResults.remove_from_mongodb(
        mongodb, doc_id, session=session, recursive=recursive)
    return outcome
def remove_resultsdir_from_mongodb(mongodb, doc_id, comm=None, session=None, recursive="default"):
    """
    Delete the data of a :class:`ProtocolResultsDir` from a MongoDB database.

    The removal is delegated to `ProtocolResultsDir.remove_from_mongodb`.

    Parameters
    ----------
    mongodb : pymongo.database.Database
        The MongoDB instance to remove data from.

    doc_id : str
        The user-defined identifier of the results directory to remove.

    comm : mpi4py.MPI.Comm, optional
        An MPI communicator.  It is not used by this function.

    session : pymongo.client_session.ClientSession, optional
        MongoDB session object to use when interacting with the MongoDB
        database.  This can be used to implement transactions
        among other things.

    recursive : RecursiveRemovalSpecification, optional
        An object that filters the type of documents that are removed.
        Used when working with inter-related experiment designs, data,
        and results objects to only remove the types of documents you
        know aren't being shared with other documents.

    Returns
    -------
    object
        Whatever `ProtocolResultsDir.remove_from_mongodb` returns.
    """
    # See the FUTURE comment in read_resultsdir_from_mongodb above
    from ..protocols import ProtocolResultsDir as _ProtocolResultsDir
    outcome = _ProtocolResultsDir.remove_from_mongodb(
        mongodb, doc_id, session=session, recursive=recursive)
    return outcome