Remove old MultibandFitTask and Config

This task is essentially an interface that was only ever implemented in lsst-dm repos that are no longer in active use and have likely bitrotted. Furthermore, the design is a monolith that does both PSF and source modelling, which is a pattern we are trying to discourage.
lsst · Feb 9, 2023 · 301e94a · 301e94a
1 parent 1cf34a1
commit 301e94a
Showing 1 changed file with 1 addition and 297 deletions.
diff --git a/python/lsst/pipe/tasks/fit_multiband.py b/python/lsst/pipe/tasks/fit_multiband.py
@@ -19,24 +19,15 @@
 # You should have received a copy of the GNU General Public License
 # along with this program.  If not, see <https://www.gnu.org/licenses/>.
 
-__all__ = [
-    "CatalogExposure", "MultibandFitConfig", "MultibandFitSubConfig", "MultibandFitSubTask",
-    "MultibandFitTask",
-]
+__all__ = ["CatalogExposure", "CatalogExposureConfig", ]
 
-from abc import ABC, abstractmethod
 from functools import cached_property
 from pydantic import Field
 from pydantic.dataclasses import dataclass
-from typing import Iterable
 
 import lsst.afw.image as afwImage
 import lsst.afw.table as afwTable
 import lsst.daf.butler as dafButler
-from lsst.obs.base import ExposureIdInfo
-import lsst.pex.config as pexConfig
-import lsst.pipe.base as pipeBase
-import lsst.pipe.base.connectionTypes as cT
 
 
 class CatalogExposureConfig:
@@ -71,290 +62,3 @@ def __post_init__(self):
             raise ValueError("Must specify at least one of catalog/exposure")
         if 'band' not in self.dataId:
             raise ValueError(f"dataId={self.dataId} must have a band")
-
-
-multibandFitBaseTemplates = {
-    "name_input_coadd": "deep",
-    "name_output_coadd": "deep",
-    "name_output_cat": "fit",
-}
-
-
-class MultibandFitConnections(
-    pipeBase.PipelineTaskConnections,
-    dimensions=("tract", "patch", "skymap"),
-    defaultTemplates=multibandFitBaseTemplates,
-):
-    cat_ref = cT.Input(
-        doc="Reference multiband source catalog",
-        name="{name_input_coadd}Coadd_ref",
-        storageClass="SourceCatalog",
-        dimensions=("tract", "patch", "skymap"),
-    )
-    cats_meas = cT.Input(
-        doc="Deblended single-band source catalogs",
-        name="{name_input_coadd}Coadd_meas",
-        storageClass="SourceCatalog",
-        multiple=True,
-        dimensions=("tract", "patch", "band", "skymap"),
-    )
-    coadds = cT.Input(
-        doc="Exposures on which to run fits",
-        name="{name_input_coadd}Coadd_calexp",
-        storageClass="ExposureF",
-        multiple=True,
-        dimensions=("tract", "patch", "band", "skymap"),
-    )
-    cat_output = cT.Output(
-        doc="Measurement multi-band catalog",
-        name="{name_output_coadd}Coadd_{name_output_cat}",
-        storageClass="SourceCatalog",
-        dimensions=("tract", "patch", "skymap"),
-    )
-    cat_ref_schema = cT.InitInput(
-        doc="Schema associated with a ref source catalog",
-        storageClass="SourceCatalog",
-        name="{name_input_coadd}Coadd_ref_schema",
-    )
-    cat_output_schema = cT.InitOutput(
-        doc="Output of the schema used in deblending task",
-        name="{name_output_coadd}Coadd_{name_output_cat}_schema",
-        storageClass="SourceCatalog"
-    )
-
-    def adjustQuantum(self, inputs, outputs, label, data_id):
-        """Validates the `lsst.daf.butler.DatasetRef` bands against the
-        subtask's list of bands to fit and drops unnecessary bands.
-
-        Parameters
-        ----------
-        inputs : `dict`
-            Dictionary whose keys are an input (regular or prerequisite)
-            connection name and whose values are a tuple of the connection
-            instance and a collection of associated `DatasetRef` objects.
-            The exact type of the nested collections is unspecified; it can be
-            assumed to be multi-pass iterable and support `len` and ``in``, but
-            it should not be mutated in place.  In contrast, the outer
-            dictionaries are guaranteed to be temporary copies that are true
-            `dict` instances, and hence may be modified and even returned; this
-            is especially useful for delegating to `super` (see notes below).
-        outputs : `Mapping`
-            Mapping of output datasets, with the same structure as ``inputs``.
-        label : `str`
-            Label for this task in the pipeline (should be used in all
-            diagnostic messages).
-        data_id : `lsst.daf.butler.DataCoordinate`
-            Data ID for this quantum in the pipeline (should be used in all
-            diagnostic messages).
-
-        Returns
-        -------
-        adjusted_inputs : `Mapping`
-            Mapping of the same form as ``inputs`` with updated containers of
-            input `DatasetRef` objects.  All inputs involving the 'band'
-            dimension are adjusted to put them in consistent order and remove
-            unneeded bands.
-        adjusted_outputs : `Mapping`
-            Mapping of updated output datasets; always empty for this task.
-
-        Raises
-        ------
-        lsst.pipe.base.NoWorkFound
-            Raised if there are not enough of the right bands to run the task
-            on this quantum.
-        """
-        # Check which bands are going to be fit
-        bands_fit, bands_read_only = self.config.get_band_sets()
-        bands_needed = bands_fit.union(bands_read_only)
-
-        adjusted_inputs = {}
-        for connection_name, (connection, dataset_refs) in inputs.items():
-            # Datasets without bands in their dimensions should be fine
-            if 'band' in connection.dimensions:
-                datasets_by_band = {dref.dataId['band']: dref for dref in dataset_refs}
-                if not bands_needed.issubset(datasets_by_band.keys()):
-                    raise pipeBase.NoWorkFound(
-                        f'DatasetRefs={dataset_refs} have data with bands in the'
-                        f' set={set(datasets_by_band.keys())},'
-                        f' which is not a superset of the required bands={bands_needed} defined by'
-                        f' {self.config.__class__}.fit_multiband='
-                        f'{self.config.fit_multiband._value.__class__}\'s attributes'
-                        f' bands_fit={bands_fit} and bands_read_only()={bands_read_only}.'
-                        f' Add the required bands={bands_needed.difference(datasets_by_band.keys())}.'
-                    )
-                # Adjust all datasets with band dimensions to include just
-                # the needed bands, in consistent order.
-                adjusted_inputs[connection_name] = (
-                    connection,
-                    [datasets_by_band[band] for band in bands_needed]
-                )
-
-        # Delegate to super for more checks.
-        inputs.update(adjusted_inputs)
-        super().adjustQuantum(inputs, outputs, label, data_id)
-        return adjusted_inputs, {}
-
-
-class MultibandFitSubConfig(pexConfig.Config):
-    """Config class for the MultibandFitTask to define methods returning
-    values that depend on multiple config settings.
-
-    """
-    def bands_read_only(self) -> set:
-        """Return the set of bands that the Task needs to read (e.g. for
-        defining priors) but not necessarily fit.
-
-        Returns
-        -------
-        The set of such bands.
-        """
-        return set()
-
-
-class MultibandFitSubTask(pipeBase.Task, ABC):
-    """An abstract interface for subtasks of MultibandFitTask to perform
-    multiband fitting of deblended sources.
-
-    Parameters
-    ----------
-    schema : `lsst.afw.table.Schema`
-        The input schema for the reference source catalog, used to initialize
-        the output schema.
-    **kwargs
-        Additional arguments to be passed to the `lsst.pipe.base.Task`
-        constructor.
-    """
-    ConfigClass = MultibandFitSubConfig
-
-    def __init__(self, schema: afwTable.Schema, **kwargs):
-        super().__init__(**kwargs)
-
-    @abstractmethod
-    def run(
-        self, catexps: Iterable[CatalogExposure], cat_ref: afwTable.SourceCatalog
-    ) -> pipeBase.Struct:
-        """Fit sources from a reference catalog using data from multiple
-        exposures in the same patch.
-
-        Parameters
-        ----------
-        catexps : `typing.List [CatalogExposure]`
-            A list of catalog-exposure pairs in a given band.
-        cat_ref : `lsst.afw.table.SourceCatalog`
-            A reference source catalog to fit.
-
-        Returns
-        -------
-        retStruct : `lsst.pipe.base.Struct`
-            A struct with a cat_output attribute containing the output
-            measurement catalog.
-
-        Notes
-        -----
-        Subclasses may have further requirements on the input parameters,
-        including:
-            - Passing only one catexp per band;
-            - Catalogs containing HeavyFootprints with deblended images;
-            - Fitting only a subset of the sources.
-        If any requirements are not met, the subtask should fail as soon as
-        possible.
-        """
-        raise NotImplementedError()
-
-    @property
-    @abstractmethod
-    def schema(self) -> afwTable.Schema:
-        raise NotImplementedError()
-
-
-class MultibandFitConfig(
-    pipeBase.PipelineTaskConfig,
-    pipelineConnections=MultibandFitConnections,
-):
-    """Configure a MultibandFitTask, including a configurable fitting subtask.
-    """
-    fit_multiband = pexConfig.ConfigurableField(
-        target=MultibandFitSubTask,
-        doc="Task to fit sources using multiple bands",
-    )
-
-    def get_band_sets(self):
-        """Get the set of bands required by the fit_multiband subtask.
-
-        Returns
-        -------
-        bands_fit : `set`
-            The set of bands that the subtask will fit.
-        bands_read_only : `set`
-            The set of bands that the subtask will only read data
-            (measurement catalog and exposure) for.
-        """
-        try:
-            bands_fit = self.fit_multiband.bands_fit
-        except AttributeError:
-            raise RuntimeError(f'{__class__}.fit_multiband must have bands_fit attribute') from None
-        bands_read_only = self.fit_multiband.bands_read_only()
-        return set(bands_fit), set(bands_read_only)
-
-
-class MultibandFitTask(pipeBase.PipelineTask):
-    """Fit deblended exposures in multiple bands simultaneously.
-
-    It is generally assumed but not enforced (except optionally by the
-    configurable `fit_multiband` subtask) that there is only one exposure
-    per band, presumably a coadd.
-    """
-    ConfigClass = MultibandFitConfig
-    _DefaultName = "multibandFit"
-
-    def __init__(self, initInputs, **kwargs):
-        super().__init__(initInputs=initInputs, **kwargs)
-        self.makeSubtask("fit_multiband", schema=initInputs["cat_ref_schema"].schema)
-        self.cat_output_schema = afwTable.SourceCatalog(self.fit_multiband.schema)
-
-    def runQuantum(self, butlerQC, inputRefs, outputRefs):
-        inputs = butlerQC.get(inputRefs)
-        id_tp = ExposureIdInfo.fromDataId(butlerQC.quantum.dataId, "tract_patch").expId
-        input_refs_objs = [(inputRefs.cats_meas, inputs['cats_meas']), (inputRefs.coadds, inputs['coadds'])]
-        cats, exps = [
-            {dRef.dataId: obj for dRef, obj in zip(refs, objs)}
-            for refs, objs in input_refs_objs
-        ]
-        dataIds = set(cats).union(set(exps))
-        catexps = [
-            CatalogExposure(
-                catalog=cats.get(dataId), exposure=exps.get(dataId), dataId=dataId, id_tract_patch=id_tp,
-            )
-            for dataId in dataIds
-        ]
-        outputs = self.run(catexps=catexps, cat_ref=inputs['cat_ref'])
-        butlerQC.put(outputs, outputRefs)
-        # Validate the output catalog's schema and raise if inconsistent (after output to allow debugging)
-        if outputs.cat_output.schema != self.cat_output_schema.schema:
-            raise RuntimeError(f'{__class__}.config.fit_multiband.run schema != initOutput schema:'
-                               f' {outputs.cat_output.schema} vs {self.cat_output_schema.schema}')
-
-    def run(self, catexps: list[CatalogExposure], cat_ref: afwTable.SourceCatalog) -> pipeBase.Struct:
-        """Fit sources from a reference catalog using data from multiple
-        exposures in the same region (patch).
-
-        Parameters
-        ----------
-        catexps : `typing.List [CatalogExposure]`
-            A list of catalog-exposure pairs in a given band.
-        cat_ref : `lsst.afw.table.SourceCatalog`
-            A reference source catalog to fit.
-
-        Returns
-        -------
-        retStruct : `lsst.pipe.base.Struct`
-            A struct with a cat_output attribute containing the output
-            measurement catalog.
-
-        Notes
-        -----
-        Subtasks may have further requirements; see `MultibandFitSubTask.run`.
-        """
-        cat_output = self.fit_multiband.run(catexps, cat_ref).output
-        retStruct = pipeBase.Struct(cat_output=cat_output)
-        return retStruct