fractal-server 2.13.1__py3-none-any.whl → 2.14.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (119)
  1. fractal_server/__init__.py +1 -1
  2. fractal_server/__main__.py +3 -1
  3. fractal_server/app/models/linkusergroup.py +6 -2
  4. fractal_server/app/models/v2/__init__.py +7 -1
  5. fractal_server/app/models/v2/dataset.py +1 -11
  6. fractal_server/app/models/v2/history.py +78 -0
  7. fractal_server/app/models/v2/job.py +10 -3
  8. fractal_server/app/models/v2/task_group.py +2 -2
  9. fractal_server/app/models/v2/workflow.py +1 -1
  10. fractal_server/app/models/v2/workflowtask.py +1 -1
  11. fractal_server/app/routes/admin/v2/accounting.py +18 -28
  12. fractal_server/app/routes/admin/v2/task.py +1 -1
  13. fractal_server/app/routes/admin/v2/task_group.py +0 -17
  14. fractal_server/app/routes/api/__init__.py +1 -1
  15. fractal_server/app/routes/api/v2/__init__.py +8 -2
  16. fractal_server/app/routes/api/v2/_aux_functions.py +66 -0
  17. fractal_server/app/routes/api/v2/_aux_functions_history.py +166 -0
  18. fractal_server/app/routes/api/v2/dataset.py +0 -17
  19. fractal_server/app/routes/api/v2/history.py +544 -0
  20. fractal_server/app/routes/api/v2/images.py +31 -43
  21. fractal_server/app/routes/api/v2/job.py +30 -0
  22. fractal_server/app/routes/api/v2/project.py +1 -53
  23. fractal_server/app/routes/api/v2/{status.py → status_legacy.py} +6 -6
  24. fractal_server/app/routes/api/v2/submit.py +16 -14
  25. fractal_server/app/routes/api/v2/task.py +3 -10
  26. fractal_server/app/routes/api/v2/task_collection_custom.py +4 -9
  27. fractal_server/app/routes/api/v2/task_group.py +0 -17
  28. fractal_server/app/routes/api/v2/verify_image_types.py +61 -0
  29. fractal_server/app/routes/api/v2/workflow.py +28 -69
  30. fractal_server/app/routes/api/v2/workflowtask.py +53 -50
  31. fractal_server/app/routes/auth/group.py +0 -16
  32. fractal_server/app/routes/auth/oauth.py +5 -3
  33. fractal_server/app/routes/pagination.py +47 -0
  34. fractal_server/app/runner/components.py +0 -3
  35. fractal_server/app/runner/compress_folder.py +57 -29
  36. fractal_server/app/runner/exceptions.py +4 -0
  37. fractal_server/app/runner/executors/base_runner.py +157 -0
  38. fractal_server/app/runner/{v2/_local/_local_config.py → executors/local/get_local_config.py} +7 -9
  39. fractal_server/app/runner/executors/local/runner.py +248 -0
  40. fractal_server/app/runner/executors/{slurm → slurm_common}/_batching.py +1 -1
  41. fractal_server/app/runner/executors/{slurm → slurm_common}/_slurm_config.py +9 -7
  42. fractal_server/app/runner/executors/slurm_common/base_slurm_runner.py +868 -0
  43. fractal_server/app/runner/{v2/_slurm_common → executors/slurm_common}/get_slurm_config.py +48 -17
  44. fractal_server/app/runner/executors/{slurm → slurm_common}/remote.py +36 -47
  45. fractal_server/app/runner/executors/slurm_common/slurm_job_task_models.py +134 -0
  46. fractal_server/app/runner/executors/slurm_ssh/runner.py +268 -0
  47. fractal_server/app/runner/executors/slurm_sudo/__init__.py +0 -0
  48. fractal_server/app/runner/executors/{slurm/sudo → slurm_sudo}/_subprocess_run_as_user.py +2 -83
  49. fractal_server/app/runner/executors/slurm_sudo/runner.py +193 -0
  50. fractal_server/app/runner/extract_archive.py +1 -3
  51. fractal_server/app/runner/task_files.py +134 -87
  52. fractal_server/app/runner/v2/__init__.py +0 -399
  53. fractal_server/app/runner/v2/_local.py +88 -0
  54. fractal_server/app/runner/v2/{_slurm_ssh/__init__.py → _slurm_ssh.py} +20 -19
  55. fractal_server/app/runner/v2/{_slurm_sudo/__init__.py → _slurm_sudo.py} +17 -15
  56. fractal_server/app/runner/v2/db_tools.py +119 -0
  57. fractal_server/app/runner/v2/runner.py +206 -95
  58. fractal_server/app/runner/v2/runner_functions.py +488 -187
  59. fractal_server/app/runner/v2/runner_functions_low_level.py +40 -43
  60. fractal_server/app/runner/v2/submit_workflow.py +358 -0
  61. fractal_server/app/runner/v2/task_interface.py +31 -0
  62. fractal_server/app/schemas/_validators.py +13 -24
  63. fractal_server/app/schemas/user.py +10 -7
  64. fractal_server/app/schemas/user_settings.py +9 -21
  65. fractal_server/app/schemas/v2/__init__.py +9 -1
  66. fractal_server/app/schemas/v2/dataset.py +12 -94
  67. fractal_server/app/schemas/v2/dumps.py +26 -9
  68. fractal_server/app/schemas/v2/history.py +80 -0
  69. fractal_server/app/schemas/v2/job.py +15 -8
  70. fractal_server/app/schemas/v2/manifest.py +14 -7
  71. fractal_server/app/schemas/v2/project.py +9 -7
  72. fractal_server/app/schemas/v2/status_legacy.py +35 -0
  73. fractal_server/app/schemas/v2/task.py +72 -77
  74. fractal_server/app/schemas/v2/task_collection.py +14 -32
  75. fractal_server/app/schemas/v2/task_group.py +10 -9
  76. fractal_server/app/schemas/v2/workflow.py +10 -11
  77. fractal_server/app/schemas/v2/workflowtask.py +2 -21
  78. fractal_server/app/security/__init__.py +3 -3
  79. fractal_server/app/security/signup_email.py +2 -2
  80. fractal_server/config.py +41 -46
  81. fractal_server/images/tools.py +23 -0
  82. fractal_server/migrations/versions/47351f8c7ebc_drop_dataset_filters.py +50 -0
  83. fractal_server/migrations/versions/9db60297b8b2_set_ondelete.py +250 -0
  84. fractal_server/migrations/versions/c90a7c76e996_job_id_in_history_run.py +41 -0
  85. fractal_server/migrations/versions/e81103413827_add_job_type_filters.py +36 -0
  86. fractal_server/migrations/versions/f37aceb45062_make_historyunit_logfile_required.py +39 -0
  87. fractal_server/migrations/versions/fbce16ff4e47_new_history_items.py +120 -0
  88. fractal_server/ssh/_fabric.py +28 -14
  89. fractal_server/tasks/v2/local/collect.py +2 -2
  90. fractal_server/tasks/v2/ssh/collect.py +2 -2
  91. fractal_server/tasks/v2/templates/2_pip_install.sh +1 -1
  92. fractal_server/tasks/v2/templates/4_pip_show.sh +1 -1
  93. fractal_server/tasks/v2/utils_background.py +0 -19
  94. fractal_server/tasks/v2/utils_database.py +30 -17
  95. fractal_server/tasks/v2/utils_templates.py +6 -0
  96. {fractal_server-2.13.1.dist-info → fractal_server-2.14.0.dist-info}/METADATA +4 -4
  97. {fractal_server-2.13.1.dist-info → fractal_server-2.14.0.dist-info}/RECORD +106 -96
  98. {fractal_server-2.13.1.dist-info → fractal_server-2.14.0.dist-info}/WHEEL +1 -1
  99. fractal_server/app/runner/executors/slurm/ssh/_executor_wait_thread.py +0 -126
  100. fractal_server/app/runner/executors/slurm/ssh/_slurm_job.py +0 -116
  101. fractal_server/app/runner/executors/slurm/ssh/executor.py +0 -1386
  102. fractal_server/app/runner/executors/slurm/sudo/_check_jobs_status.py +0 -71
  103. fractal_server/app/runner/executors/slurm/sudo/_executor_wait_thread.py +0 -130
  104. fractal_server/app/runner/executors/slurm/sudo/executor.py +0 -1281
  105. fractal_server/app/runner/v2/_local/__init__.py +0 -132
  106. fractal_server/app/runner/v2/_local/_submit_setup.py +0 -52
  107. fractal_server/app/runner/v2/_local/executor.py +0 -100
  108. fractal_server/app/runner/v2/_slurm_ssh/_submit_setup.py +0 -83
  109. fractal_server/app/runner/v2/_slurm_sudo/_submit_setup.py +0 -83
  110. fractal_server/app/runner/v2/handle_failed_job.py +0 -59
  111. fractal_server/app/schemas/v2/status.py +0 -16
  112. /fractal_server/app/{runner/executors/slurm → history}/__init__.py +0 -0
  113. /fractal_server/app/runner/executors/{slurm/ssh → local}/__init__.py +0 -0
  114. /fractal_server/app/runner/executors/{slurm/sudo → slurm_common}/__init__.py +0 -0
  115. /fractal_server/app/runner/executors/{_job_states.py → slurm_common/_job_states.py} +0 -0
  116. /fractal_server/app/runner/executors/{slurm → slurm_common}/utils_executors.py +0 -0
  117. /fractal_server/app/runner/{v2/_slurm_common → executors/slurm_ssh}/__init__.py +0 -0
  118. {fractal_server-2.13.1.dist-info → fractal_server-2.14.0.dist-info}/LICENSE +0 -0
  119. {fractal_server-2.13.1.dist-info → fractal_server-2.14.0.dist-info}/entry_points.txt +0 -0
@@ -1,100 +1,112 @@
 import functools
-import logging
-import traceback
-from concurrent.futures import Executor
 from pathlib import Path
 from typing import Any
 from typing import Callable
 from typing import Literal
 from typing import Optional
 
-from pydantic import ValidationError
+from pydantic import BaseModel
+from pydantic import ConfigDict
 
 from ..exceptions import JobExecutionError
+from ..exceptions import TaskOutputValidationError
+from .db_tools import update_status_of_history_unit
 from .deduplicate_list import deduplicate_list
-from .merge_outputs import merge_outputs
 from .runner_functions_low_level import run_single_task
 from .task_interface import InitTaskOutput
 from .task_interface import TaskOutput
+from fractal_server.app.db import get_sync_db
+from fractal_server.app.models.v2 import HistoryUnit
 from fractal_server.app.models.v2 import TaskV2
 from fractal_server.app.models.v2 import WorkflowTaskV2
-from fractal_server.app.runner.components import _COMPONENT_KEY_
-from fractal_server.app.runner.components import _index_to_component
-
+from fractal_server.app.runner.executors.base_runner import BaseRunner
+from fractal_server.app.runner.task_files import enrich_task_files_multisubmit
+from fractal_server.app.runner.task_files import SUBMIT_PREFIX
+from fractal_server.app.runner.task_files import TaskFiles
+from fractal_server.app.runner.v2.db_tools import (
+    bulk_update_status_of_history_unit,
+)
+from fractal_server.app.runner.v2.db_tools import bulk_upsert_image_cache_fast
+from fractal_server.app.runner.v2.task_interface import (
+    _cast_and_validate_InitTaskOutput,
+)
+from fractal_server.app.runner.v2.task_interface import (
+    _cast_and_validate_TaskOutput,
+)
+from fractal_server.app.schemas.v2 import HistoryUnitStatus
+from fractal_server.logger import set_logger
 
 __all__ = [
-    "run_v2_task_non_parallel",
     "run_v2_task_parallel",
+    "run_v2_task_non_parallel",
     "run_v2_task_compound",
 ]
 
-MAX_PARALLELIZATION_LIST_SIZE = 20_000
 
+logger = set_logger(__name__)
 
-def _cast_and_validate_TaskOutput(
-    task_output: dict[str, Any]
-) -> Optional[TaskOutput]:
-    try:
-        validated_task_output = TaskOutput(**task_output)
-        return validated_task_output
-    except ValidationError as e:
-        raise JobExecutionError(
-            "Validation of task output failed.\n"
-            f"Original error: {str(e)}\n"
-            f"Original data: {task_output}."
-        )
 
+class SubmissionOutcome(BaseModel):
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+    task_output: TaskOutput | None = None
+    exception: BaseException | None = None
+    invalid_output: bool = False
+
+
+class InitSubmissionOutcome(BaseModel):
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+    task_output: InitTaskOutput | None = None
+    exception: BaseException | None = None
 
-def _cast_and_validate_InitTaskOutput(
-    init_task_output: dict[str, Any],
-) -> Optional[InitTaskOutput]:
-    try:
-        validated_init_task_output = InitTaskOutput(**init_task_output)
-        return validated_init_task_output
-    except ValidationError as e:
-        raise JobExecutionError(
-            "Validation of init-task output failed.\n"
-            f"Original error: {str(e)}\n"
-            f"Original data: {init_task_output}."
-        )
+
+MAX_PARALLELIZATION_LIST_SIZE = 20_000
 
 
-def no_op_submit_setup_call(
+def _process_task_output(
     *,
-    wftask: WorkflowTaskV2,
-    workflow_dir_local: Path,
-    workflow_dir_remote: Path,
-    which_type: Literal["non_parallel", "parallel"],
-) -> dict:
-    """
-    Default (no-operation) interface of submit_setup_call in V2.
-    """
-    return {}
+    result: dict[str, Any] | None = None,
+    exception: BaseException | None = None,
+) -> SubmissionOutcome:
+    invalid_output = False
+    if exception is not None:
+        task_output = None
+    else:
+        if result is None:
+            task_output = TaskOutput()
+        else:
+            try:
+                task_output = _cast_and_validate_TaskOutput(result)
+            except TaskOutputValidationError as e:
+                task_output = None
+                exception = e
+                invalid_output = True
+    return SubmissionOutcome(
+        task_output=task_output,
+        exception=exception,
+        invalid_output=invalid_output,
+    )
 
 
-# Backend-specific configuration
-def _get_executor_options(
+def _process_init_task_output(
     *,
-    wftask: WorkflowTaskV2,
-    workflow_dir_local: Path,
-    workflow_dir_remote: Path,
-    submit_setup_call: Callable,
-    which_type: Literal["non_parallel", "parallel"],
-) -> dict:
-    try:
-        options = submit_setup_call(
-            wftask=wftask,
-            workflow_dir_local=workflow_dir_local,
-            workflow_dir_remote=workflow_dir_remote,
-            which_type=which_type,
-        )
-    except Exception as e:
-        tb = "".join(traceback.format_tb(e.__traceback__))
-        raise RuntimeError(
-            f"{type(e)} error in {submit_setup_call=}\n"
-            f"Original traceback:\n{tb}"
-        )
-    return options
+    result: dict[str, Any] | None = None,
+    exception: BaseException | None = None,
+) -> SubmissionOutcome:
+    if exception is not None:
+        task_output = None
+    else:
+        if result is None:
+            task_output = InitTaskOutput()
+        else:
+            try:
+                task_output = _cast_and_validate_InitTaskOutput(result)
+            except TaskOutputValidationError as e:
+                task_output = None
+                exception = e
+    return InitSubmissionOutcome(
+        task_output=task_output,
+        exception=exception,
+    )
 
 
 def _check_parallelization_list_size(my_list):
@@ -113,51 +125,123 @@ def run_v2_task_non_parallel(
     task: TaskV2,
     wftask: WorkflowTaskV2,
     workflow_dir_local: Path,
-    workflow_dir_remote: Optional[Path] = None,
-    executor: Executor,
-    submit_setup_call: Callable = no_op_submit_setup_call,
-) -> tuple[TaskOutput, int]:
+    workflow_dir_remote: Path,
+    runner: BaseRunner,
+    get_runner_config: Callable[
+        [
+            WorkflowTaskV2,
+            Literal["non_parallel", "parallel"],
+            Optional[Path],
+            int,
+        ],
+        Any,
+    ],
+    dataset_id: int,
+    history_run_id: int,
+    task_type: Literal["non_parallel", "converter_non_parallel"],
+    user_id: int,
+) -> tuple[dict[int, SubmissionOutcome], int]:
     """
     This runs server-side (see `executor` argument)
     """
 
-    if workflow_dir_remote is None:
-        workflow_dir_remote = workflow_dir_local
-        logging.warning(
-            "In `run_single_task`, workflow_dir_remote=None. Is this right?"
+    if task_type not in ["non_parallel", "converter_non_parallel"]:
+        raise ValueError(
+            f"Invalid {task_type=} for `run_v2_task_non_parallel`."
         )
-        workflow_dir_remote = workflow_dir_local
 
-    executor_options = _get_executor_options(
+    # Get TaskFiles object
+    task_files = TaskFiles(
+        root_dir_local=workflow_dir_local,
+        root_dir_remote=workflow_dir_remote,
+        task_order=wftask.order,
+        task_name=wftask.task.name,
+        component="",
+        prefix=SUBMIT_PREFIX,
+    )
+
+    runner_config = get_runner_config(
         wftask=wftask,
-        workflow_dir_local=workflow_dir_local,
-        workflow_dir_remote=workflow_dir_remote,
-        submit_setup_call=submit_setup_call,
         which_type="non_parallel",
     )
 
-    function_kwargs = dict(
-        zarr_urls=[image["zarr_url"] for image in images],
-        zarr_dir=zarr_dir,
+    function_kwargs = {
+        "zarr_dir": zarr_dir,
         **(wftask.args_non_parallel or {}),
-    )
-    future = executor.submit(
+    }
+    if task_type == "non_parallel":
+        function_kwargs["zarr_urls"] = [img["zarr_url"] for img in images]
+
+    # Database History operations
+    with next(get_sync_db()) as db:
+        if task_type == "non_parallel":
+            zarr_urls = function_kwargs["zarr_urls"]
+        elif task_type == "converter_non_parallel":
+            zarr_urls = []
+
+        history_unit = HistoryUnit(
+            history_run_id=history_run_id,
+            status=HistoryUnitStatus.SUBMITTED,
+            logfile=task_files.log_file_local,
+            zarr_urls=zarr_urls,
+        )
+        db.add(history_unit)
+        db.commit()
+        db.refresh(history_unit)
+        logger.debug(
+            "[run_v2_task_non_parallel] Created `HistoryUnit` with "
+            f"{history_run_id=}."
+        )
+        history_unit_id = history_unit.id
+        bulk_upsert_image_cache_fast(
+            db=db,
+            list_upsert_objects=[
+                dict(
+                    workflowtask_id=wftask.id,
+                    dataset_id=dataset_id,
+                    zarr_url=zarr_url,
+                    latest_history_unit_id=history_unit_id,
+                )
+                for zarr_url in history_unit.zarr_urls
+            ],
+        )
+
+    result, exception = runner.submit(
         functools.partial(
             run_single_task,
-            wftask=wftask,
             command=task.command_non_parallel,
-            workflow_dir_local=workflow_dir_local,
-            workflow_dir_remote=workflow_dir_remote,
+            workflow_task_order=wftask.order,
+            workflow_task_id=wftask.task_id,
+            task_name=wftask.task.name,
         ),
-        function_kwargs,
-        **executor_options,
+        parameters=function_kwargs,
+        task_type=task_type,
+        task_files=task_files,
+        history_unit_id=history_unit_id,
+        config=runner_config,
+        user_id=user_id,
     )
-    output = future.result()
+
+    positional_index = 0
     num_tasks = 1
-    if output is None:
-        return (TaskOutput(), num_tasks)
-    else:
-        return (_cast_and_validate_TaskOutput(output), num_tasks)
+
+    outcome = {
+        positional_index: _process_task_output(
+            result=result,
+            exception=exception,
+        )
+    }
+    # NOTE: Here we don't have to handle the
+    # `outcome[0].exception is not None` branch, since for non_parallel
+    # tasks it was already handled within submit
+    if outcome[0].invalid_output:
+        with next(get_sync_db()) as db:
+            update_status_of_history_unit(
+                history_unit_id=history_unit_id,
+                status=HistoryUnitStatus.FAILED,
+                db_sync=db,
+            )
+    return outcome, num_tasks
 
 
 def run_v2_task_parallel(
@@ -165,59 +249,132 @@ def run_v2_task_parallel(
     images: list[dict[str, Any]],
     task: TaskV2,
     wftask: WorkflowTaskV2,
-    executor: Executor,
+    runner: BaseRunner,
     workflow_dir_local: Path,
-    workflow_dir_remote: Optional[Path] = None,
-    submit_setup_call: Callable = no_op_submit_setup_call,
-) -> tuple[TaskOutput, int]:
-
+    workflow_dir_remote: Path,
+    get_runner_config: Callable[
+        [
+            WorkflowTaskV2,
+            Literal["non_parallel", "parallel"],
+            Optional[Path],
+            int,
+        ],
+        Any,
+    ],
+    dataset_id: int,
+    history_run_id: int,
+    user_id: int,
+) -> tuple[dict[int, SubmissionOutcome], int]:
     if len(images) == 0:
-        return (TaskOutput(), 0)
+        return {}, 0
 
     _check_parallelization_list_size(images)
 
-    executor_options = _get_executor_options(
+    # Get TaskFiles object
+    task_files = TaskFiles(
+        root_dir_local=workflow_dir_local,
+        root_dir_remote=workflow_dir_remote,
+        task_order=wftask.order,
+        task_name=wftask.task.name,
+    )
+
+    runner_config = get_runner_config(
         wftask=wftask,
-        workflow_dir_local=workflow_dir_local,
-        workflow_dir_remote=workflow_dir_remote,
-        submit_setup_call=submit_setup_call,
         which_type="parallel",
+        tot_tasks=len(images),
    )
 
-    list_function_kwargs = []
-    for ind, image in enumerate(images):
-        list_function_kwargs.append(
+    list_function_kwargs = [
+        {
+            "zarr_url": image["zarr_url"],
+            **(wftask.args_parallel or {}),
+        }
+        for image in images
+    ]
+
+    list_task_files = enrich_task_files_multisubmit(
+        base_task_files=task_files,
+        tot_tasks=len(images),
+        batch_size=runner_config.batch_size,
+    )
+
+    history_units = [
+        HistoryUnit(
+            history_run_id=history_run_id,
+            status=HistoryUnitStatus.SUBMITTED,
+            logfile=list_task_files[ind].log_file_local,
+            zarr_urls=[image["zarr_url"]],
+        )
+        for ind, image in enumerate(images)
+    ]
+
+    with next(get_sync_db()) as db:
+        db.add_all(history_units)
+        db.commit()
+        logger.debug(
+            f"[run_v2_task_non_parallel] Created {len(history_units)} "
+            "`HistoryUnit`s."
+        )
+
+        for history_unit in history_units:
+            db.refresh(history_unit)
+        history_unit_ids = [history_unit.id for history_unit in history_units]
+
+        history_image_caches = [
             dict(
-                zarr_url=image["zarr_url"],
-                **(wftask.args_parallel or {}),
-            ),
+                workflowtask_id=wftask.id,
+                dataset_id=dataset_id,
+                zarr_url=history_unit.zarr_urls[0],
+                latest_history_unit_id=history_unit.id,
+            )
+            for history_unit in history_units
+        ]
+
+        bulk_upsert_image_cache_fast(
+            db=db, list_upsert_objects=history_image_caches
         )
-        list_function_kwargs[-1][_COMPONENT_KEY_] = _index_to_component(ind)
 
-    results_iterator = executor.map(
+    results, exceptions = runner.multisubmit(
         functools.partial(
             run_single_task,
-            wftask=wftask,
             command=task.command_parallel,
-            workflow_dir_local=workflow_dir_local,
-            workflow_dir_remote=workflow_dir_remote,
+            workflow_task_order=wftask.order,
+            workflow_task_id=wftask.task_id,
+            task_name=wftask.task.name,
        ),
-        list_function_kwargs,
-        **executor_options,
+        list_parameters=list_function_kwargs,
+        task_type="parallel",
+        list_task_files=list_task_files,
+        history_unit_ids=history_unit_ids,
+        config=runner_config,
+        user_id=user_id,
     )
-    # Explicitly iterate over the whole list, so that all futures are waited
-    outputs = list(results_iterator)
-
-    # Validate all non-None outputs
-    for ind, output in enumerate(outputs):
-        if output is None:
-            outputs[ind] = TaskOutput()
-        else:
-            outputs[ind] = _cast_and_validate_TaskOutput(output)
 
+    outcome = {}
+    for ind in range(len(list_function_kwargs)):
+        if ind not in results.keys() and ind not in exceptions.keys():
+            error_msg = (
+                f"Invalid branch: {ind=} is not in `results.keys()` "
+                "nor in `exceptions.keys()`."
+            )
+            logger.error(error_msg)
+            raise RuntimeError(error_msg)
+        outcome[ind] = _process_task_output(
+            result=results.get(ind, None),
+            exception=exceptions.get(ind, None),
+        )
+        # NOTE: Here we don't have to handle the
+        # `outcome[ind].exception is not None` branch, since for parallel
+        # tasks it was already handled within multisubmit
+        if outcome[ind].invalid_output:
+            with next(get_sync_db()) as db:
+                update_status_of_history_unit(
+                    history_unit_id=history_unit_ids[ind],
+                    status=HistoryUnitStatus.FAILED,
+                    db_sync=db,
+                )
     num_tasks = len(images)
-    merged_output = merge_outputs(outputs)
-    return (merged_output, num_tasks)
+    return outcome, num_tasks
 
 
 def run_v2_task_compound(
@@ -226,92 +383,236 @@ def run_v2_task_compound(
     zarr_dir: str,
     task: TaskV2,
     wftask: WorkflowTaskV2,
-    executor: Executor,
+    runner: BaseRunner,
     workflow_dir_local: Path,
-    workflow_dir_remote: Optional[Path] = None,
-    submit_setup_call: Callable = no_op_submit_setup_call,
-) -> TaskOutput:
+    workflow_dir_remote: Path,
+    get_runner_config: Callable[
+        [
+            WorkflowTaskV2,
+            Literal["non_parallel", "parallel"],
+            Optional[Path],
+            int,
+        ],
+        Any,
+    ],
+    dataset_id: int,
+    history_run_id: int,
+    task_type: Literal["compound", "converter_compound"],
+    user_id: int,
+) -> tuple[dict[int, SubmissionOutcome], int]:
+    # Get TaskFiles object
+    task_files_init = TaskFiles(
+        root_dir_local=workflow_dir_local,
+        root_dir_remote=workflow_dir_remote,
+        task_order=wftask.order,
+        task_name=wftask.task.name,
+        component="",
+        prefix=SUBMIT_PREFIX,
+    )
 
-    executor_options_init = _get_executor_options(
+    runner_config_init = get_runner_config(
         wftask=wftask,
-        workflow_dir_local=workflow_dir_local,
-        workflow_dir_remote=workflow_dir_remote,
-        submit_setup_call=submit_setup_call,
         which_type="non_parallel",
     )
-    executor_options_compute = _get_executor_options(
-        wftask=wftask,
-        workflow_dir_local=workflow_dir_local,
-        workflow_dir_remote=workflow_dir_remote,
-        submit_setup_call=submit_setup_call,
-        which_type="parallel",
-    )
-
     # 3/A: non-parallel init task
-    function_kwargs = dict(
-        zarr_urls=[image["zarr_url"] for image in images],
-        zarr_dir=zarr_dir,
+    function_kwargs = {
+        "zarr_dir": zarr_dir,
         **(wftask.args_non_parallel or {}),
-    )
-    future = executor.submit(
+    }
+    if task_type == "compound":
+        function_kwargs["zarr_urls"] = [img["zarr_url"] for img in images]
+        input_image_zarr_urls = function_kwargs["zarr_urls"]
+    elif task_type == "converter_compound":
+        input_image_zarr_urls = []
+
+    # Create database History entries
+    with next(get_sync_db()) as db:
+        # Create a single `HistoryUnit` for the whole compound task
+        history_unit = HistoryUnit(
+            history_run_id=history_run_id,
+            status=HistoryUnitStatus.SUBMITTED,
+            logfile=task_files_init.log_file_local,
+            zarr_urls=input_image_zarr_urls,
+        )
+        db.add(history_unit)
+        db.commit()
+        db.refresh(history_unit)
+        init_history_unit_id = history_unit.id
+        logger.debug(
+            "[run_v2_task_compound] Created `HistoryUnit` with "
+            f"{init_history_unit_id=}."
+        )
+        # Create one `HistoryImageCache` for each input image
+        bulk_upsert_image_cache_fast(
+            db=db,
+            list_upsert_objects=[
+                dict(
+                    workflowtask_id=wftask.id,
+                    dataset_id=dataset_id,
+                    zarr_url=zarr_url,
+                    latest_history_unit_id=init_history_unit_id,
+                )
+                for zarr_url in input_image_zarr_urls
+            ],
+        )
+    result, exception = runner.submit(
         functools.partial(
             run_single_task,
-            wftask=wftask,
             command=task.command_non_parallel,
-            workflow_dir_local=workflow_dir_local,
-            workflow_dir_remote=workflow_dir_remote,
+            workflow_task_order=wftask.order,
+            workflow_task_id=wftask.task_id,
+            task_name=wftask.task.name,
         ),
-        function_kwargs,
-        **executor_options_init,
+        parameters=function_kwargs,
+        task_type=task_type,
+        task_files=task_files_init,
+        history_unit_id=init_history_unit_id,
+        config=runner_config_init,
+        user_id=user_id,
     )
-    output = future.result()
-    if output is None:
-        init_task_output = InitTaskOutput()
-    else:
-        init_task_output = _cast_and_validate_InitTaskOutput(output)
-    parallelization_list = init_task_output.parallelization_list
+
+    init_outcome = _process_init_task_output(
+        result=result,
+        exception=exception,
+    )
+    num_tasks = 1
+    if init_outcome.exception is not None:
+        positional_index = 0
+        return (
+            {
+                positional_index: SubmissionOutcome(
+                    exception=init_outcome.exception
+                )
+            },
+            num_tasks,
+        )
+
+    parallelization_list = init_outcome.task_output.parallelization_list
     parallelization_list = deduplicate_list(parallelization_list)
 
-    num_task = 1 + len(parallelization_list)
+    num_tasks = 1 + len(parallelization_list)
 
     # 3/B: parallel part of a compound task
     _check_parallelization_list_size(parallelization_list)
 
     if len(parallelization_list) == 0:
-        return (TaskOutput(), 0)
+        with next(get_sync_db()) as db:
+            update_status_of_history_unit(
+                history_unit_id=init_history_unit_id,
+                status=HistoryUnitStatus.DONE,
+                db_sync=db,
+            )
+        positional_index = 0
+        init_outcome = {
+            positional_index: _process_task_output(
+                result=None,
+                exception=None,
+            )
+        }
+        return init_outcome, num_tasks
+
+    runner_config_compute = get_runner_config(
+        wftask=wftask,
+        which_type="parallel",
+        tot_tasks=len(parallelization_list),
+    )
 
-    list_function_kwargs = []
-    for ind, parallelization_item in enumerate(parallelization_list):
-        list_function_kwargs.append(
-            dict(
-                zarr_url=parallelization_item.zarr_url,
-                init_args=parallelization_item.init_args,
-                **(wftask.args_parallel or {}),
-            ),
+    list_task_files = enrich_task_files_multisubmit(
+        base_task_files=TaskFiles(
+            root_dir_local=workflow_dir_local,
+            root_dir_remote=workflow_dir_remote,
+            task_order=wftask.order,
+            task_name=wftask.task.name,
+        ),
+        tot_tasks=len(parallelization_list),
+        batch_size=runner_config_compute.batch_size,
+    )
+
+    list_function_kwargs = [
+        {
+            "zarr_url": parallelization_item.zarr_url,
+            "init_args": parallelization_item.init_args,
+            **(wftask.args_parallel or {}),
+        }
+        for parallelization_item in parallelization_list
+    ]
+
+    # Create one `HistoryUnit` per parallelization item
+    history_units = [
+        HistoryUnit(
+            history_run_id=history_run_id,
+            status=HistoryUnitStatus.SUBMITTED,
+            logfile=list_task_files[ind].log_file_local,
+            zarr_urls=[parallelization_item.zarr_url],
         )
-        list_function_kwargs[-1][_COMPONENT_KEY_] = _index_to_component(ind)
+        for ind, parallelization_item in enumerate(parallelization_list)
+    ]
+    with next(get_sync_db()) as db:
+        db.add_all(history_units)
+        db.commit()
+        for history_unit in history_units:
+            db.refresh(history_unit)
+        logger.debug(
+            f"[run_v2_task_compound] Created {len(history_units)} "
+            "`HistoryUnit`s."
+        )
+        history_unit_ids = [history_unit.id for history_unit in history_units]
 
-    results_iterator = executor.map(
+    results, exceptions = runner.multisubmit(
         functools.partial(
             run_single_task,
-            wftask=wftask,
             command=task.command_parallel,
-            workflow_dir_local=workflow_dir_local,
-            workflow_dir_remote=workflow_dir_remote,
+            workflow_task_order=wftask.order,
+            workflow_task_id=wftask.task_id,
+            task_name=wftask.task.name,
         ),
-        list_function_kwargs,
-        **executor_options_compute,
+        list_parameters=list_function_kwargs,
+        task_type=task_type,
+        list_task_files=list_task_files,
+        history_unit_ids=history_unit_ids,
+        config=runner_config_compute,
+        user_id=user_id,
     )
-    # Explicitly iterate over the whole list, so that all futures are waited
-    outputs = list(results_iterator)
 
-    # Validate all non-None outputs
-    for ind, output in enumerate(outputs):
-        if output is None:
-            outputs[ind] = TaskOutput()
+    compute_outcomes: dict[int, SubmissionOutcome] = {}
+    failure = False
+    for ind in range(len(list_function_kwargs)):
+        if ind not in results.keys() and ind not in exceptions.keys():
+            # NOTE: see issue 2484
+            error_msg = (
+                f"Invalid branch: {ind=} is not in `results.keys()` "
+                "nor in `exceptions.keys()`."
+            )
+            logger.error(error_msg)
+            raise RuntimeError(error_msg)
+        compute_outcomes[ind] = _process_task_output(
+            result=results.get(ind, None),
+            exception=exceptions.get(ind, None),
+        )
+        # NOTE: For compound task, `multisubmit` did not handle the
+        # `exception is not None` branch, therefore we have to include it here.
+        if (
+            compute_outcomes[ind].exception is not None
+            or compute_outcomes[ind].invalid_output
+        ):
+            failure = True
+
+    # NOTE: For compound tasks, we update `HistoryUnit.status` from here,
+    # rather than within the submit/multisubmit runner methods. This is
+    # to enforce the fact that either all units succeed or they all fail -
+    # at a difference with the parallel-task case.
+    with next(get_sync_db()) as db:
+        if failure:
+            bulk_update_status_of_history_unit(
+                history_unit_ids=history_unit_ids + [init_history_unit_id],
+                status=HistoryUnitStatus.FAILED,
+                db_sync=db,
+            )
         else:
-            validated_output = _cast_and_validate_TaskOutput(output)
-            outputs[ind] = validated_output
+            bulk_update_status_of_history_unit(
+                history_unit_ids=history_unit_ids + [init_history_unit_id],
+                status=HistoryUnitStatus.DONE,
+                db_sync=db,
+            )
 
-    merged_output = merge_outputs(outputs)
-    return (merged_output, num_task)
+    return compute_outcomes, num_tasks
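
Note on the refactor shown above: `run_v2_task_non_parallel`, `run_v2_task_parallel`, and `run_v2_task_compound` no longer return a merged `TaskOutput`. Each now returns a `dict[int, SubmissionOutcome]` keyed by positional index, plus a task count, and execution goes through a `BaseRunner` whose `submit` call returns a `(result, exception)` pair and whose `multisubmit` call returns `(results, exceptions)` dicts keyed by the same indices. The sketch below only illustrates that call/return contract with a hypothetical in-process runner; it is not the actual `BaseRunner` from `fractal_server/app/runner/executors/base_runner.py`, and it omits the `task_files`, `history_unit_id(s)`, `config`, and `user_id` arguments that the real methods accept.

# Toy illustration of the submit/multisubmit contract inferred from the
# diff above (hypothetical ToyRunner, not fractal-server's BaseRunner).
from typing import Any, Callable


class ToyRunner:
    def submit(
        self, func: Callable, *, parameters: dict[str, Any]
    ) -> tuple[Any, BaseException | None]:
        # Single task: exactly one of (result, exception) is meaningful.
        try:
            return func(**parameters), None
        except Exception as exc:
            return None, exc

    def multisubmit(
        self, func: Callable, *, list_parameters: list[dict[str, Any]]
    ) -> tuple[dict[int, Any], dict[int, BaseException]]:
        # Many tasks: results and exceptions are keyed by positional index,
        # and every index ends up in exactly one of the two dicts.
        results: dict[int, Any] = {}
        exceptions: dict[int, BaseException] = {}
        for ind, params in enumerate(list_parameters):
            try:
                results[ind] = func(**params)
            except Exception as exc:
                exceptions[ind] = exc
        return results, exceptions


if __name__ == "__main__":
    runner = ToyRunner()
    results, exceptions = runner.multisubmit(
        lambda zarr_url: {"processed": zarr_url},
        list_parameters=[{"zarr_url": "/a.zarr"}, {"zarr_url": "/b.zarr"}],
    )
    # Mirrors the outcome loop in run_v2_task_parallel: each index is looked
    # up in `results` or `exceptions`.
    for ind in range(2):
        print(ind, results.get(ind), exceptions.get(ind))

In the new helpers, each `(result, exception)` pair is then wrapped by `_process_task_output` (or `_process_init_task_output`), which is what produces the `SubmissionOutcome` objects returned to the caller and drives the `HistoryUnit` status updates.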