PyPI - lsst-ctrl-mpexec - Versions diffs - 29.2025.3400__py3-none-any.whl → 29.2025.3600__py3-none-any.whl - Mend

lsst-ctrl-mpexec 29.2025.3400-py3-none-any.whl → 29.2025.3600-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

lsst/ctrl/mpexec/cmdLineFwk.py DELETED Viewed

@@ -1,534 +0,0 @@
-# This file is part of ctrl_mpexec.
-#
-# Developed for the LSST Data Management System.
-# This product includes software developed by the LSST Project
-# (http://www.lsst.org).
-# See the COPYRIGHT file at the top-level directory of this distribution
-# for details of code ownership.
-#
-# This software is dual licensed under the GNU General Public License and also
-# under a 3-clause BSD license. Recipients may choose which of these licenses
-# to use; please see the files gpl-3.0.txt and/or bsd_license.txt,
-# respectively.  If you choose the GPL option then the following text applies
-# (but note that there is still no warranty even if you opt for BSD instead):
-#
-# This program is free software: you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation, either version 3 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program.  If not, see <http://www.gnu.org/licenses/>.
-"""Module defining CmdLineFwk class and related methods."""
-from __future__ import annotations
-__all__ = ["CmdLineFwk"]
-import logging
-import pickle
-from collections.abc import Mapping
-from types import SimpleNamespace
-import astropy.units as u
-from astropy.table import Table
-import lsst.utils.timer
-from lsst.daf.butler import (
-    Butler,
-    Config,
-    DatasetType,
-    DimensionConfig,
-    DimensionUniverse,
-    LimitedButler,
-    Quantum,
-    QuantumBackedButler,
-)
-from lsst.pipe.base import ExecutionResources, QuantumGraph, TaskFactory
-from lsst.pipe.base.all_dimensions_quantum_graph_builder import AllDimensionsQuantumGraphBuilder
-from lsst.pipe.base.dot_tools import graph2dot
-from lsst.pipe.base.execution_graph_fixup import ExecutionGraphFixup
-from lsst.pipe.base.mermaid_tools import graph2mermaid
-from lsst.pipe.base.mp_graph_executor import MPGraphExecutor
-from lsst.pipe.base.quantum_reports import Report
-from lsst.pipe.base.single_quantum_executor import SingleQuantumExecutor
-from lsst.resources import ResourcePath
-from lsst.utils import doImportType
-from lsst.utils.logging import VERBOSE, getLogger
-from lsst.utils.threads import disable_implicit_threading
-from ._pipeline_graph_factory import PipelineGraphFactory
-from .cli.butler_factory import ButlerFactory
-from .preExecInit import PreExecInit, PreExecInitLimited
-_LOG = getLogger(__name__)
-class _QBBFactory:
-    """Class which is a callable for making QBB instances.
-    This class is also responsible for reconstructing correct dimension
-    universe after unpickling. When pickling multiple things that require
-    dimension universe, this class must be unpickled first. The logic in
-    MPGraphExecutor ensures that SingleQuantumExecutor is unpickled first in
-    the subprocess, which causes unpickling of this class.
-    """
-    def __init__(
-        self, butler_config: Config, dimensions: DimensionUniverse, dataset_types: Mapping[str, DatasetType]
-    ):
-        self.butler_config = butler_config
-        self.dimensions = dimensions
-        self.dataset_types = dataset_types
-    def __call__(self, quantum: Quantum) -> LimitedButler:
-        """Return freshly initialized `~lsst.daf.butler.QuantumBackedButler`.
-        Factory method to create QuantumBackedButler instances.
-        """
-        return QuantumBackedButler.initialize(
-            config=self.butler_config,
-            quantum=quantum,
-            dimensions=self.dimensions,
-            dataset_types=self.dataset_types,
-        )
-    @classmethod
-    def _unpickle(
-        cls, butler_config: Config, dimensions_config: DimensionConfig | None, dataset_types_pickle: bytes
-    ) -> _QBBFactory:
-        universe = DimensionUniverse(dimensions_config)
-        dataset_types = pickle.loads(dataset_types_pickle)
-        return _QBBFactory(butler_config, universe, dataset_types)
-    def __reduce__(self) -> tuple:
-        # If dimension universe is not default one, we need to dump/restore
-        # its config.
-        config = self.dimensions.dimensionConfig
-        default = DimensionConfig()
-        # Only send configuration to other side if it is non-default, default
-        # will be instantiated from config=None.
-        if (config["namespace"], config["version"]) != (default["namespace"], default["version"]):
-            dimension_config = config
-        else:
-            dimension_config = None
-        # Dataset types need to be unpickled only after universe is made.
-        dataset_types_pickle = pickle.dumps(self.dataset_types)
-        return (self._unpickle, (self.butler_config, dimension_config, dataset_types_pickle))
-class CmdLineFwk:
-    """PipelineTask framework which executes tasks from command line.
-    In addition to executing tasks this activator provides additional methods
-    for task management like dumping configuration or execution chain.
-    """
-    MP_TIMEOUT = 3600 * 24 * 30  # Default timeout (sec) for multiprocessing
-    def makeGraph(
-        self, pipeline_graph_factory: PipelineGraphFactory | None, args: SimpleNamespace
-    ) -> QuantumGraph | None:
-        """Build a graph from command line arguments.
-        Parameters
-        ----------
-        pipeline_graph_factory : `PipelineGraphFactory`
-            Factory that holds a pipeline and can produce a pipeline graph.
-            Must be ``None`` if and only if graph is read from a file.
-        args : `types.SimpleNamespace`
-            Parsed command line.
-        Returns
-        -------
-        graph : `~lsst.pipe.base.QuantumGraph` or `None`
-            If resulting graph is empty then `None` is returned.
-        """
-        # make sure that --extend-run always enables --skip-existing
-        if args.extend_run:
-            args.skip_existing = True
-        butler, collections, run = ButlerFactory.make_butler_and_collections(args)
-        if args.skip_existing and run:
-            args.skip_existing_in += (run,)
-        if args.qgraph:
-            # click passes empty tuple as default value for qgraph_node_id
-            nodes = args.qgraph_node_id or None
-            qgraph = QuantumGraph.loadUri(args.qgraph, butler.dimensions, nodes=nodes, graphID=args.qgraph_id)
-            # pipeline can not be provided in this case
-            if pipeline_graph_factory:
-                raise ValueError(
-                    "Pipeline must not be given when quantum graph is read from "
-                    f"file: {bool(pipeline_graph_factory)}"
-                )
-            if args.show_qgraph_header:
-                print(QuantumGraph.readHeader(args.qgraph))
-        else:
-            if pipeline_graph_factory is None:
-                raise ValueError("Pipeline must be given when quantum graph is not read from file.")
-            # We can't resolve the pipeline graph if we're mocking until after
-            # we've done the mocking (and the QG build will resolve on its own
-            # anyway).
-            pipeline_graph = pipeline_graph_factory(resolve=False)
-            if args.mock:
-                from lsst.pipe.base.tests.mocks import mock_pipeline_graph
-                pipeline_graph = mock_pipeline_graph(
-                    pipeline_graph,
-                    unmocked_dataset_types=args.unmocked_dataset_types,
-                    force_failures=args.mock_failure,
-                )
-            data_id_tables = []
-            for table_file in args.data_id_table:
-                with ResourcePath(table_file).as_local() as local_path:
-                    table = Table.read(local_path.ospath)
-                    # Add the filename to the metadata for more logging
-                    # information down in the QG builder.
-                    table.meta["filename"] = table_file
-                    data_id_tables.append(table)
-            # make execution plan (a.k.a. DAG) for pipeline
-            graph_builder = AllDimensionsQuantumGraphBuilder(
-                pipeline_graph,
-                butler,
-                where=args.data_query or "",
-                skip_existing_in=args.skip_existing_in if args.skip_existing_in is not None else (),
-                clobber=args.clobber_outputs,
-                dataset_query_constraint=args.dataset_query_constraint,
-                input_collections=collections,
-                output_run=run,
-                data_id_tables=data_id_tables,
-            )
-            # accumulate metadata
-            metadata = {
-                "input": args.input,
-                "output": args.output,
-                "butler_argument": args.butler_config,
-                "output_run": run,
-                "extend_run": args.extend_run,
-                "skip_existing_in": args.skip_existing_in,
-                "skip_existing": args.skip_existing,
-                "data_query": args.data_query or "",
-            }
-            assert run is not None, "Butler output run collection must be defined"
-            qgraph = graph_builder.build(metadata, attach_datastore_records=args.qgraph_datastore_records)
-            if args.show_qgraph_header:
-                qgraph.buildAndPrintHeader()
-        if len(qgraph) == 0:
-            # Nothing to do.
-            return None
-        self._summarize_qgraph(qgraph)
-        if args.save_qgraph:
-            _LOG.verbose("Writing QuantumGraph to %r.", args.save_qgraph)
-            qgraph.saveUri(args.save_qgraph)
-        if args.qgraph_dot:
-            _LOG.verbose("Writing quantum graph DOT visualization to %r.", args.qgraph_dot)
-            graph2dot(qgraph, args.qgraph_dot)
-        if args.qgraph_mermaid:
-            _LOG.verbose("Writing quantum graph Mermaid visualization to %r.", args.qgraph_mermaid)
-            graph2mermaid(qgraph, args.qgraph_mermaid)
-        return qgraph
-    def _make_execution_resources(self, args: SimpleNamespace) -> ExecutionResources:
-        """Construct the execution resource class from arguments.
-        Parameters
-        ----------
-        args : `types.SimpleNamespace`
-            Parsed command line.
-        Returns
-        -------
-        resources : `~lsst.pipe.base.ExecutionResources`
-            The resources available to each quantum.
-        """
-        return ExecutionResources(
-            num_cores=args.cores_per_quantum, max_mem=args.memory_per_quantum, default_mem_units=u.MB
-        )
-    def runPipeline(
-        self,
-        graph: QuantumGraph,
-        taskFactory: TaskFactory,
-        args: SimpleNamespace,
-        butler: Butler | None = None,
-    ) -> None:
-        """Execute complete QuantumGraph.
-        Parameters
-        ----------
-        graph : `~lsst.pipe.base.QuantumGraph`
-            Execution graph.
-        taskFactory : `~lsst.pipe.base.TaskFactory`
-            Task factory.
-        args : `types.SimpleNamespace`
-            Parsed command line.
-        butler : `~lsst.daf.butler.Butler`, optional
-            Data Butler instance, if not defined then new instance is made
-            using command line options.
-        """
-        if not args.enable_implicit_threading:
-            disable_implicit_threading()
-        # Check that output run defined on command line is consistent with
-        # quantum graph.
-        if args.output_run and graph.metadata:
-            graph_output_run = graph.metadata.get("output_run", args.output_run)
-            if graph_output_run != args.output_run:
-                raise ValueError(
-                    f"Output run defined on command line ({args.output_run}) has to be "
-                    f"identical to graph metadata ({graph_output_run}). "
-                    "To update graph metadata run `pipetask update-graph-run` command."
-                )
-        # Make sure that --extend-run always enables --skip-existing,
-        # clobbering should be disabled if --extend-run is not specified.
-        if args.extend_run:
-            args.skip_existing = True
-        else:
-            args.clobber_outputs = False
-        # Make butler instance. QuantumGraph should have an output run defined,
-        # but we ignore it here and let command line decide actual output run.
-        if butler is None:
-            butler = ButlerFactory.make_write_butler(args, graph.pipeline_graph)
-        if args.skip_existing:
-            args.skip_existing_in += (butler.run,)
-        # Enable lsstDebug debugging. Note that this is done once in the
-        # main process before PreExecInit and it is also repeated before
-        # running each task in SingleQuantumExecutor (which may not be
-        # needed if `multiprocessing` always uses fork start method).
-        if args.enableLsstDebug:
-            try:
-                _LOG.debug("Will try to import debug.py")
-                import debug  # type: ignore # noqa:F401
-            except ImportError:
-                _LOG.warning("No 'debug' module found.")
-        # Save all InitOutputs, configs, etc.
-        preExecInit = PreExecInit(butler, taskFactory, extendRun=args.extend_run)
-        preExecInit.initialize(
-            graph,
-            saveInitOutputs=not args.skip_init_writes,
-            registerDatasetTypes=args.register_dataset_types,
-            saveVersions=not args.no_versions,
-        )
-        if not args.init_only:
-            graphFixup = self._importGraphFixup(args)
-            resources = self._make_execution_resources(args)
-            quantumExecutor = SingleQuantumExecutor(
-                butler=butler,
-                task_factory=taskFactory,
-                skip_existing_in=args.skip_existing_in,
-                clobber_outputs=args.clobber_outputs,
-                enable_lsst_debug=args.enableLsstDebug,
-                resources=resources,
-                raise_on_partial_outputs=args.raise_on_partial_outputs,
-            )
-            timeout = self.MP_TIMEOUT if args.timeout is None else args.timeout
-            executor = MPGraphExecutor(
-                num_proc=args.processes,
-                timeout=timeout,
-                start_method=args.start_method,
-                quantum_executor=quantumExecutor,
-                fail_fast=args.fail_fast,
-                pdb=args.pdb,
-                execution_graph_fixup=graphFixup,
-            )
-            # Have to reset connection pool to avoid sharing connections with
-            # forked processes.
-            butler.registry.resetConnectionPool()
-            try:
-                with lsst.utils.timer.profile(args.profile, _LOG):
-                    executor.execute(graph)
-            finally:
-                if args.summary:
-                    report = executor.getReport()
-                    if report:
-                        with open(args.summary, "w") as out:
-                            # Do not save fields that are not set.
-                            out.write(report.model_dump_json(exclude_none=True, indent=2))
-    def _generateTaskTable(self) -> Table:
-        """Generate astropy table listing the number of quanta per task for a
-        given quantum graph.
-        Returns
-        -------
-        qg_task_table : `astropy.table.table.Table`
-            An astropy table containing columns: Quanta and Tasks.
-        """
-        qg_quanta, qg_tasks = [], []
-        for task_label, task_info in self.report.qgraphSummary.qgraphTaskSummaries.items():
-            qg_tasks.append(task_label)
-            qg_quanta.append(task_info.numQuanta)
-        qg_task_table = Table(dict(Quanta=qg_quanta, Tasks=qg_tasks))
-        return qg_task_table
-    def _summarize_qgraph(self, qgraph: QuantumGraph) -> int:
-        """Report a summary of the quanta in the graph.
-        Parameters
-        ----------
-        qgraph : `lsst.pipe.base.QuantumGraph`
-            The graph to be summarized.
-        Returns
-        -------
-        n_quanta : `int`
-            The number of quanta in the graph.
-        """
-        n_quanta = len(qgraph)
-        if n_quanta == 0:
-            _LOG.info("QuantumGraph contains no quanta.")
-        else:
-            self.report = Report(qgraphSummary=qgraph.getSummary())
-            if _LOG.isEnabledFor(logging.INFO):
-                qg_task_table = self._generateTaskTable()
-                qg_task_table_formatted = "\n".join(qg_task_table.pformat())
-                quanta_str = "quantum" if n_quanta == 1 else "quanta"
-                n_tasks = len(qgraph.taskGraph)
-                n_tasks_plural = "" if n_tasks == 1 else "s"
-                _LOG.info(
-                    "QuantumGraph contains %d %s for %d task%s, graph ID: %r\n%s",
-                    n_quanta,
-                    quanta_str,
-                    n_tasks,
-                    n_tasks_plural,
-                    qgraph.graphID,
-                    qg_task_table_formatted,
-                )
-        return n_quanta
-    def _importGraphFixup(self, args: SimpleNamespace) -> ExecutionGraphFixup | None:
-        """Import/instantiate graph fixup object.
-        Parameters
-        ----------
-        args : `types.SimpleNamespace`
-            Parsed command line.
-        Returns
-        -------
-        fixup : `ExecutionGraphFixup` or `None`
-        Raises
-        ------
-        ValueError
-            Raised if import fails, method call raises exception, or returned
-            instance has unexpected type.
-        """
-        if args.graph_fixup:
-            try:
-                factory = doImportType(args.graph_fixup)
-            except Exception as exc:
-                raise ValueError("Failed to import graph fixup class/method") from exc
-            try:
-                fixup = factory()
-            except Exception as exc:
-                raise ValueError("Failed to make instance of graph fixup") from exc
-            if not isinstance(fixup, ExecutionGraphFixup):
-                raise ValueError("Graph fixup is not an instance of ExecutionGraphFixup class")
-            return fixup
-        return None
-    def preExecInitQBB(self, task_factory: TaskFactory, args: SimpleNamespace) -> None:
-        _LOG.verbose("Reading full quantum graph from %s.", args.qgraph)
-        # Load quantum graph. We do not really need individual Quanta here,
-        # but we need datastore records for initInputs, and those are only
-        # available from Quanta, so load the whole thing.
-        qgraph = QuantumGraph.loadUri(args.qgraph, graphID=args.qgraph_id)
-        # Ensure that QBB uses shared datastore cache for writes.
-        ButlerFactory.define_datastore_cache()
-        # Make QBB.
-        _LOG.verbose("Initializing quantum-backed butler.")
-        butler = qgraph.make_init_qbb(args.butler_config, config_search_paths=args.config_search_path)
-        # Save all InitOutputs, configs, etc.
-        _LOG.verbose("Instantiating tasks and saving init-outputs.")
-        preExecInit = PreExecInitLimited(butler, task_factory)
-        preExecInit.initialize(qgraph)
-    def runGraphQBB(self, task_factory: TaskFactory, args: SimpleNamespace) -> None:
-        if not args.enable_implicit_threading:
-            disable_implicit_threading()
-        # Load quantum graph.
-        nodes = args.qgraph_node_id or None
-        with lsst.utils.timer.time_this(
-            _LOG,
-            msg=f"Reading {str(len(nodes)) if nodes is not None else 'all'} quanta.",
-            level=VERBOSE,
-        ) as qg_read_time:
-            qgraph = QuantumGraph.loadUri(args.qgraph, nodes=nodes, graphID=args.qgraph_id)
-        job_metadata = {"qg_read_time": qg_read_time.duration, "qg_size": len(qgraph)}
-        if qgraph.metadata is None:
-            raise ValueError("QuantumGraph is missing metadata, cannot continue.")
-        self._summarize_qgraph(qgraph)
-        dataset_types = {dstype.name: dstype for dstype in qgraph.registryDatasetTypes()}
-        # Ensure that QBB uses shared datastore cache.
-        ButlerFactory.define_datastore_cache()
-        _butler_factory = _QBBFactory(
-            butler_config=args.butler_config,
-            dimensions=qgraph.universe,
-            dataset_types=dataset_types,
-        )
-        # make special quantum executor
-        resources = self._make_execution_resources(args)
-        quantumExecutor = SingleQuantumExecutor(
-            butler=None,
-            task_factory=task_factory,
-            enable_lsst_debug=args.enableLsstDebug,
-            limited_butler_factory=_butler_factory,
-            resources=resources,
-            assume_no_existing_outputs=args.no_existing_outputs,
-            skip_existing=True,
-            clobber_outputs=True,
-            raise_on_partial_outputs=args.raise_on_partial_outputs,
-            job_metadata=job_metadata,
-        )
-        timeout = self.MP_TIMEOUT if args.timeout is None else args.timeout
-        executor = MPGraphExecutor(
-            num_proc=args.processes,
-            timeout=timeout,
-            start_method=args.start_method,
-            quantum_executor=quantumExecutor,
-            fail_fast=args.fail_fast,
-            pdb=args.pdb,
-        )
-        try:
-            with lsst.utils.timer.profile(args.profile, _LOG):
-                executor.execute(qgraph)
-        finally:
-            if args.summary:
-                report = executor.getReport()
-                if report:
-                    with open(args.summary, "w") as out:
-                        # Do not save fields that are not set.
-                        out.write(report.model_dump_json(exclude_none=True, indent=2))