DM-43499: Add timespan to Butler.get #982

Merged · 10 commits · Mar 27, 2024
11 changes: 6 additions & 5 deletions .github/workflows/build.yaml
@@ -16,12 +16,12 @@ jobs:
        python-version: ["3.11", "3.12"]

    steps:
-     - uses: actions/checkout@v3
+     - uses: actions/checkout@v4
        with:
          # Need to clone everything for the git tags.
          fetch-depth: 0

-     - uses: conda-incubator/setup-miniconda@v2
+     - uses: conda-incubator/setup-miniconda@v3
        with:
          python-version: ${{ matrix.python-version }}
          channels: conda-forge,defaults
@@ -92,9 +92,10 @@ jobs:
        run: |
          pytest -r a -v -n 3 --open-files --cov=lsst.daf.butler --cov=tests --cov-report=xml --cov-report=term --cov-branch
      - name: Upload coverage to codecov
-       uses: codecov/codecov-action@v3
+       uses: codecov/codecov-action@v4
        with:
          files: ./coverage.xml
+         token: ${{ secrets.CODECOV_TOKEN }}

  pypi:
    runs-on: ubuntu-latest
@@ -104,13 +105,13 @@ jobs:
    if: startsWith(github.ref, 'refs/tags') && ! startsWith(github.ref, 'refs/tags/s')

    steps:
-     - uses: actions/checkout@v3
+     - uses: actions/checkout@v4
        with:
          # Need to clone everything to embed the version.
          fetch-depth: 0

      - name: Set up Python
-       uses: actions/setup-python@v4
+       uses: actions/setup-python@v5
        with:
          python-version: "3.11"
4 changes: 2 additions & 2 deletions .github/workflows/build_docs.yaml
@@ -10,13 +10,13 @@ jobs:
  build_sphinx_docs:
    runs-on: ubuntu-latest
    steps:
-     - uses: actions/checkout@v3
+     - uses: actions/checkout@v4
        with:
          # Need to clone everything for the git tags.
          fetch-depth: 0

      - name: Set up Python
-       uses: actions/setup-python@v4
+       uses: actions/setup-python@v5
        with:
          python-version: "3.11"
          cache: "pip"
8 changes: 4 additions & 4 deletions .github/workflows/codeql-analysis.yml
@@ -42,11 +42,11 @@ jobs:

    steps:
      - name: Checkout repository
-       uses: actions/checkout@v2
+       uses: actions/checkout@v4

      # Initializes the CodeQL tools for scanning.
      - name: Initialize CodeQL
-       uses: github/codeql-action/init@v2
+       uses: github/codeql-action/init@v3
        with:
          languages: ${{ matrix.language }}
          # If you wish to specify custom queries, you can do so here or in a config file.
@@ -57,7 +57,7 @@
      # Autobuild attempts to build any compiled languages (C/C++, C#, or Java).
      # If this step fails, then you should remove it and run the build manually (see below)
      - name: Autobuild
-       uses: github/codeql-action/autobuild@v2
+       uses: github/codeql-action/autobuild@v3

      # ℹ️ Command-line programs to run using the OS shell.
      # 📚 https://git.io/JvXDl
@@ -71,4 +71,4 @@
      # make release

      - name: Perform CodeQL Analysis
-       uses: github/codeql-action/analyze@v2
+       uses: github/codeql-action/analyze@v3
2 changes: 1 addition & 1 deletion .github/workflows/do_not_merge.yaml
@@ -26,7 +26,7 @@ jobs:
          'DO NOT MERGE'. Remove this commit from the branch before merging
          or change the commit summary."
-     - uses: actions/checkout@v3
+     - uses: actions/checkout@v4

      - name: Check requirements.txt for branches
        shell: bash
4 changes: 2 additions & 2 deletions .github/workflows/docker.yaml
@@ -41,7 +41,7 @@ jobs:
      packages: write

    steps:
-     - uses: actions/checkout@v3
+     - uses: actions/checkout@v4
        with:
          # Needed to fetch tags, used by Python install process to
          # figure out version number
@@ -65,7 +65,7 @@


      - name: Set up Python
-       uses: actions/setup-python@v4
+       uses: actions/setup-python@v5
        with:
          python-version: "3.11"
4 changes: 2 additions & 2 deletions .github/workflows/docstyle.yaml
@@ -14,10 +14,10 @@ jobs:
  numpydoc:
    runs-on: ubuntu-latest
    steps:
-     - uses: actions/checkout@v3
+     - uses: actions/checkout@v4

      - name: Set up Python
-       uses: actions/setup-python@v4
+       uses: actions/setup-python@v5

      - name: Install numpydoc
        run: |
2 changes: 1 addition & 1 deletion .github/workflows/lint.yaml
@@ -12,5 +12,5 @@ jobs:
  ruff:
    runs-on: ubuntu-latest
    steps:
-     - uses: actions/checkout@v3
+     - uses: actions/checkout@v4
      - uses: chartboost/ruff-action@v1
6 changes: 3 additions & 3 deletions Dockerfile
@@ -62,18 +62,18 @@ RUN python -m venv $VIRTUAL_ENV
 # Make sure we use the virtualenv
 ENV PATH="$VIRTUAL_ENV/bin:$PATH"
 # Put the latest pip and setuptools in the virtualenv
-RUN pip install --upgrade --no-cache-dir pip setuptools wheel
+RUN pip install --upgrade --no-cache-dir pip setuptools wheel uv

 # Install the app's Python runtime dependencies
 COPY requirements/docker.txt ./docker-requirements.txt
-RUN pip install --no-cache-dir -r docker-requirements.txt
+RUN uv pip install --no-cache-dir -r docker-requirements.txt

 # Install dependencies only required by unit tests in a separate image for better caching
 FROM dependencies-image AS test-dependencies-image
 RUN apt-get update
 RUN apt-get install -y --no-install-recommends postgresql postgresql-pgsphere
 COPY requirements/docker-test.txt ./docker-test-requirements.txt
-RUN pip install --no-cache-dir -r docker-test-requirements.txt
+RUN uv pip install --no-cache-dir -r docker-test-requirements.txt

 # Run unit tests
 FROM test-dependencies-image AS unit-test
4 changes: 4 additions & 0 deletions doc/changes/DM-43499.feature.rst
@@ -0,0 +1,4 @@
+Added a ``timespan`` parameter to ``Butler.get()`` (for both direct and remote butlers).
+This parameter can be used to specify an explicit time for calibration selection without requiring that a temporal coordinate be included in the data ID.
+Additionally, if no timespan is specified and none can be found in the data ID, a default full-range timespan will be used for calibration selection.
+This allows a calibration to be selected if there is only one matching calibration in the collection.
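
To make the new parameter concrete, here is a minimal usage sketch. The repository path, collection, and data ID values are hypothetical, not taken from this PR; only the ``timespan`` argument itself is what the change adds.

from astropy.time import Time

from lsst.daf.butler import Butler, Timespan

# Hypothetical repo path, calibration collection, and data ID values.
butler = Butler("/repo/main", collections=["LATISS/calib"])

# Select the flat whose validity range overlaps an explicit timespan,
# without putting an exposure or visit (a temporal coordinate) in the data ID.
timespan = Timespan(
    begin=Time("2024-03-01T00:00:00", scale="tai"),
    end=Time("2024-03-01T01:00:00", scale="tai"),
)
flat = butler.get(
    "flat",
    instrument="LATISS",
    detector=0,
    physical_filter="empty",
    timespan=timespan,
)

# With no timespan available at all, an unbounded default is used; this
# succeeds only if a single matching calibration exists in the collection.
bias = butler.get("bias", instrument="LATISS", detector=0)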
44 changes: 38 additions & 6 deletions python/lsst/daf/butler/direct_butler.py
@@ -779,6 +779,7 @@ def _findDatasetRef(
        predict: bool = False,
        run: str | None = None,
        datastore_records: bool = False,
+       timespan: Timespan | None = None,
        **kwargs: Any,
    ) -> DatasetRef:
        """Shared logic for methods that start with a search for a dataset in
@@ -806,6 +807,11 @@
            datasets. Only used if ``predict`` is `True`.
        datastore_records : `bool`, optional
            If `True` add datastore records to returned `DatasetRef`.
+       timespan : `Timespan` or `None`, optional
+           A timespan that the validity range of the dataset must overlap.
+           If not provided and this is a calibration dataset type, an attempt
+           will be made to find the timespan from any temporal coordinate
+           in the data ID.
        **kwargs
            Additional keyword arguments used to augment or construct a
            `DataId`. See `DataId` parameters.
@@ -836,7 +842,6 @@
            if datastore_records and datasetRefOrType._datastore_records is None:
                datasetRefOrType = self._registry.get_datastore_records(datasetRefOrType)
            return datasetRefOrType
-       timespan: Timespan | None = None

        dataId, kwargs = self._rewrite_data_id(dataId, datasetType, **kwargs)

@@ -849,9 +854,17 @@
            dataId = DataCoordinate.standardize(
                dataId, universe=self.dimensions, defaults=self._registry.defaults.dataId, **kwargs
            )
-           if dataId.dimensions.temporal:
-               dataId = self._registry.expandDataId(dataId)
-               timespan = dataId.timespan
+           if timespan is None:
+               if dataId.dimensions.temporal:
+                   dataId = self._registry.expandDataId(dataId)
+                   # Use the timespan from the data ID to constrain the
+                   # calibration lookup, but only if the caller has not
+                   # specified an explicit timespan.
+                   timespan = dataId.timespan
+               else:
+                   # Try an arbitrary timespan. Downstream will fail if this
+                   # results in more than one matching dataset.
+                   timespan = Timespan(None, None)
        else:
            # Standardize the data ID to just the dimensions of the dataset
            # type instead of letting registry.findDataset do it, so we get the
@@ -988,6 +1001,7 @@ def getDeferred(
        parameters: dict | None = None,
        collections: Any = None,
        storageClass: str | StorageClass | None = None,
+       timespan: Timespan | None = None,
        **kwargs: Any,
    ) -> DeferredDatasetHandle:
        """Create a `DeferredDatasetHandle` which can later retrieve a dataset,
@@ -1015,6 +1029,11 @@
            the dataset type definition for this dataset. Specifying a
            read `StorageClass` can force a different type to be returned.
            This type must be compatible with the original type.
+       timespan : `Timespan` or `None`, optional
+           A timespan that the validity range of the dataset must overlap.
+           If not provided and this is a calibration dataset type, an attempt
+           will be made to find the timespan from any temporal coordinate
+           in the data ID.
        **kwargs
            Additional keyword arguments used to augment or construct a
            `DataId`. See `DataId` parameters.
@@ -1045,7 +1064,9 @@
            else:
                raise LookupError(f"Dataset reference {datasetRefOrType} does not exist.")
        else:
-           ref = self._findDatasetRef(datasetRefOrType, dataId, collections=collections, **kwargs)
+           ref = self._findDatasetRef(
+               datasetRefOrType, dataId, collections=collections, timespan=timespan, **kwargs
+           )
        return DeferredDatasetHandle(butler=self, ref=ref, parameters=parameters, storageClass=storageClass)

@@ -1057,6 +1078,7 @@ def get(
        parameters: dict[str, Any] | None = None,
        collections: Any = None,
        storageClass: StorageClass | str | None = None,
+       timespan: Timespan | None = None,
        **kwargs: Any,
    ) -> Any:
        """Retrieve a stored dataset.
@@ -1085,6 +1107,11 @@
            the dataset type definition for this dataset. Specifying a
            read `StorageClass` can force a different type to be returned.
            This type must be compatible with the original type.
+       timespan : `Timespan` or `None`, optional
+           A timespan that the validity range of the dataset must overlap.
+           If not provided and this is a calibration dataset type, an attempt
+           will be made to find the timespan from any temporal coordinate
+           in the data ID.
        **kwargs
            Additional keyword arguments used to augment or construct a
            `DataCoordinate`. See `DataCoordinate.standardize`
@@ -1114,7 +1141,12 @@
        """
        _LOG.debug("Butler get: %s, dataId=%s, parameters=%s", datasetRefOrType, dataId, parameters)
        ref = self._findDatasetRef(
-           datasetRefOrType, dataId, collections=collections, datastore_records=True, **kwargs
+           datasetRefOrType,
+           dataId,
+           collections=collections,
+           datastore_records=True,
+           timespan=timespan,
+           **kwargs,
        )
        return self._datastore.get(ref, parameters=parameters, storageClass=storageClass)

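The new lookup precedence above can be condensed into a standalone sketch. This is not the Butler code itself, just the same decision order restated: an explicit ``timespan`` argument wins, otherwise a temporal data ID supplies one, otherwise an unbounded timespan is used and the lookup fails downstream if more than one calibration matches.

from lsst.daf.butler import Timespan


def resolve_timespan(
    explicit: Timespan | None, data_id_timespan: Timespan | None
) -> Timespan:
    """Pick the timespan used to constrain a calibration lookup."""
    if explicit is not None:
        # A caller-supplied timespan always takes precedence.
        return explicit
    if data_id_timespan is not None:
        # Otherwise use the timespan implied by a temporal data ID
        # (for example one containing an exposure or visit).
        return data_id_timespan
    # Unbounded timespan: it overlaps every validity range, so the
    # lookup succeeds only when exactly one calibration matches.
    return Timespan(None, None)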
12 changes: 8 additions & 4 deletions python/lsst/daf/butler/remote_butler/_remote_butler.py
@@ -244,9 +244,10 @@ def getDeferred(
        parameters: dict | None = None,
        collections: Any = None,
        storageClass: str | StorageClass | None = None,
+       timespan: Timespan | None = None,
        **kwargs: Any,
    ) -> DeferredDatasetHandle:
-       response = self._get_file_info(datasetRefOrType, dataId, collections, kwargs)
+       response = self._get_file_info(datasetRefOrType, dataId, collections, timespan, kwargs)
        # Check that artifact information is available.
        _to_file_payload(response)
        ref = DatasetRef.from_simple(response.dataset_ref, universe=self.dimensions)
@@ -261,10 +262,11 @@ def get(
        parameters: dict[str, Any] | None = None,
        collections: Any = None,
        storageClass: StorageClass | str | None = None,
+       timespan: Timespan | None = None,
        **kwargs: Any,
    ) -> Any:
        # Docstring inherited.
-       model = self._get_file_info(datasetRefOrType, dataId, collections, kwargs)
+       model = self._get_file_info(datasetRefOrType, dataId, collections, timespan, kwargs)

        ref = DatasetRef.from_simple(model.dataset_ref, universe=self.dimensions)
        # If the caller provided a DatasetRef, they may have overridden the
@@ -287,6 +289,7 @@ def _get_file_info(
        datasetRefOrType: DatasetRef | DatasetType | str,
        dataId: DataId | None,
        collections: CollectionArgType,
+       timespan: Timespan | None,
        kwargs: dict[str, DataIdValue],
    ) -> GetFileResponseModel:
        """Send a request to the server for the file URLs and metadata
@@ -301,6 +304,7 @@
            dataset_type_name=self._normalize_dataset_type_name(datasetRefOrType),
            collections=self._normalize_collections(collections),
            data_id=self._simplify_dataId(dataId, kwargs),
+           timespan=timespan.to_simple() if timespan is not None else None,
        )
        response = self._post("get_file_by_data_id", request)
        return self._parse_model(response, GetFileResponseModel)
@@ -324,7 +328,7 @@ def getURIs(
        if predict or run:
            raise NotImplementedError("Predict mode is not supported by RemoteButler")

-       response = self._get_file_info(datasetRefOrType, dataId, collections, kwargs)
+       response = self._get_file_info(datasetRefOrType, dataId, collections, None, kwargs)
        file_info = _to_file_payload(response).file_info
        if len(file_info) == 1:
            return DatasetRefURIs(primaryURI=ResourcePath(str(file_info[0].url)))
@@ -449,7 +453,7 @@ def exists(
    ) -> DatasetExistence:
        try:
            response = self._get_file_info(
-               dataset_ref_or_type, dataId=data_id, collections=collections, kwargs=kwargs
+               dataset_ref_or_type, dataId=data_id, collections=collections, timespan=None, kwargs=kwargs
            )
        except DatasetNotFoundError:
            return DatasetExistence.UNRECOGNIZED
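Because the timespan now crosses the client/server boundary, the client serializes it with ``to_simple()`` (as in the ``_get_file_info`` hunk above) and the server handler rebuilds it with ``Timespan.from_simple()`` (next hunk). A small round-trip sketch, assuming only the behavior those two calls show in this diff:

from astropy.time import Time

from lsst.daf.butler import Timespan

ts = Timespan(
    begin=Time("2024-03-27T00:00:00", scale="tai"),
    end=Time("2024-03-28T00:00:00", scale="tai"),
)
payload = ts.to_simple()  # pydantic-serializable form sent in the request body
restored = Timespan.from_simple(payload)  # what the server handler does
assert restored == ts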
@@ -171,11 +171,13 @@ def get_file_by_data_id(
    factory: Factory = Depends(factory_dependency),
) -> GetFileResponseModel:
    butler = factory.create_butler()
+   timespan = Timespan.from_simple(request.timespan) if request.timespan is not None else None
    ref = butler._findDatasetRef(
        datasetRefOrType=request.dataset_type_name,
        dataId=request.data_id,
        collections=request.collections,
        datastore_records=True,
+       timespan=timespan,
    )
    return _get_file_by_ref(butler, ref)

1 change: 1 addition & 0 deletions python/lsst/daf/butler/remote_butler/server_models.py
@@ -73,6 +73,7 @@ class GetFileByDataIdRequestModel(pydantic.BaseModel):
    dataset_type_name: DatasetTypeName
    data_id: SerializedDataId
    collections: CollectionList
+   timespan: SerializedTimespan | None = None


class GetFileResponseModel(pydantic.BaseModel):
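Declaring the new field as optional with a ``None`` default is what keeps older clients working: a request body that omits ``timespan`` still validates, and the server-side ``None`` check skips the timespan constraint. A minimal sketch with a stand-in for ``SerializedTimespan``, whose exact shape is not shown in this diff:

import pydantic


class GetFileRequestSketch(pydantic.BaseModel):
    """Trimmed stand-in for GetFileByDataIdRequestModel."""

    dataset_type_name: str
    timespan: list[int] | None = None  # stand-in for SerializedTimespan

# A request from an older client that predates the field still parses.
old_request = GetFileRequestSketch.model_validate({"dataset_type_name": "flat"})
assert old_request.timespan is None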