ddeutil-workflow 0.0.6__py3-none-any.whl → 0.0.8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ddeutil/workflow/__about__.py +1 -1
- ddeutil/workflow/__init__.py +26 -4
- ddeutil/workflow/__types.py +11 -1
- ddeutil/workflow/api.py +120 -0
- ddeutil/workflow/app.py +45 -0
- ddeutil/workflow/exceptions.py +3 -3
- ddeutil/workflow/log.py +79 -0
- ddeutil/workflow/pipeline.py +516 -120
- ddeutil/workflow/repeat.py +134 -0
- ddeutil/workflow/route.py +78 -0
- ddeutil/workflow/stage.py +209 -86
- ddeutil/workflow/utils.py +368 -66
- {ddeutil_workflow-0.0.6.dist-info → ddeutil_workflow-0.0.8.dist-info}/METADATA +48 -76
- ddeutil_workflow-0.0.8.dist-info/RECORD +20 -0
- {ddeutil_workflow-0.0.6.dist-info → ddeutil_workflow-0.0.8.dist-info}/WHEEL +1 -1
- ddeutil_workflow-0.0.6.dist-info/RECORD +0 -15
- {ddeutil_workflow-0.0.6.dist-info → ddeutil_workflow-0.0.8.dist-info}/LICENSE +0 -0
- {ddeutil_workflow-0.0.6.dist-info → ddeutil_workflow-0.0.8.dist-info}/top_level.txt +0 -0
ddeutil/workflow/pipeline.py
CHANGED
@@ -7,20 +7,47 @@ from __future__ import annotations
 
 import copy
 import logging
+import os
 import time
+from concurrent.futures import (
+    FIRST_EXCEPTION,
+    Future,
+    ProcessPoolExecutor,
+    ThreadPoolExecutor,
+    as_completed,
+    wait,
+)
+from datetime import datetime
+from multiprocessing import Event, Manager
+from pickle import PickleError
 from queue import Queue
 from typing import Optional
+from zoneinfo import ZoneInfo
 
 from pydantic import BaseModel, Field
 from pydantic.functional_validators import model_validator
 from typing_extensions import Self
 
 from .__types import DictData, DictStr, Matrix, MatrixExclude, MatrixInclude
-from .exceptions import
+from .exceptions import (
+    JobException,
+    PipelineException,
+    StageException,
+    UtilException,
+)
 from .loader import Loader
 from .on import On
+from .scheduler import CronRunner
 from .stage import Stage
-from .utils import
+from .utils import (
+    Param,
+    Result,
+    cross_product,
+    dash2underscore,
+    filter_func,
+    gen_id,
+    get_diff_sec,
+)
 
 
 class Strategy(BaseModel):
@@ -29,9 +56,11 @@ class Strategy(BaseModel):
 
     Data Validate:
         >>> strategy = {
+        ...     'max-parallel': 1,
+        ...     'fail-fast': False,
         ...     'matrix': {
         ...         'first': [1, 2, 3],
-        ...         'second': ['foo', 'bar']
+        ...         'second': ['foo', 'bar'],
         ...     },
         ...     'include': [{'first': 4, 'second': 'foo'}],
         ...     'exclude': [{'first': 1, 'second': 'bar'}],
@@ -39,7 +68,7 @@ class Strategy(BaseModel):
     """
 
     fail_fast: bool = Field(default=False)
-    max_parallel: int = Field(default
+    max_parallel: int = Field(default=1, gt=0)
     matrix: Matrix = Field(default_factory=dict)
     include: MatrixInclude = Field(
         default_factory=list,
@@ -59,6 +88,10 @@ class Strategy(BaseModel):
         dash2underscore("fail-fast", values)
         return values
 
+    def is_set(self) -> bool:
+        """Return True if this strategy was set from yaml template."""
+        return len(self.matrix) > 0
+
     def make(self) -> list[DictStr]:
         """Return List of product of matrix values that already filter with
         exclude and add include.
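The new `is_set()` helper and `make()` together drive the matrix expansion: a cross product over every matrix key, with `exclude` combinations dropped and `include` rows appended. A minimal stand-alone sketch of that expansion follows; the `make_matrix` helper is illustrative only, not the package's `cross_product` or `Strategy.make`.

from itertools import product


def make_matrix(matrix: dict, include=(), exclude=()) -> list[dict]:
    # Cross product of every matrix key, e.g. {'first': [1, 2], 'second': ['a']}
    # becomes [{'first': 1, 'second': 'a'}, {'first': 2, 'second': 'a'}].
    keys = list(matrix)
    combos = [dict(zip(keys, values)) for values in product(*matrix.values())]
    # Drop exact matches listed in ``exclude``.
    combos = [c for c in combos if c not in list(exclude)]
    # Append extra rows from ``include`` that are not already present.
    combos.extend(i for i in include if i not in combos)
    return combos


print(make_matrix(
    {"first": [1, 2, 3], "second": ["foo", "bar"]},
    include=[{"first": 4, "second": "foo"}],
    exclude=[{"first": 1, "second": "bar"}],
))

Fed the docstring example above, it returns six rows: the 3x2 cross product minus the excluded pair, plus the included one.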
@@ -115,18 +148,25 @@ class Job(BaseModel):
     Data Validate:
         >>> job = {
         ...     "runs-on": None,
-        ...     "strategy": {
+        ...     "strategy": {
+        ...         "max-parallel": 1,
+        ...         "matrix": {
+        ...             "first": [1, 2, 3],
+        ...             "second": ['foo', 'bar'],
+        ...         },
+        ...     },
         ...     "needs": [],
         ...     "stages": [
         ...         {
         ...             "name": "Some stage",
         ...             "run": "print('Hello World')",
         ...         },
+        ...         ...
         ...     ],
         ... }
     """
 
-
+    id: Optional[str] = Field(default=None)
     desc: Optional[str] = Field(default=None)
     runs_on: Optional[str] = Field(default=None)
     stages: list[Stage] = Field(
@@ -141,6 +181,9 @@ class Job(BaseModel):
         default_factory=Strategy,
         description="A strategy matrix that want to generate.",
     )
+    run_id: Optional[str] = Field(
+        default=None, description="A running job ID.", repr=False
+    )
 
     @model_validator(mode="before")
     def __prepare_keys(cls, values: DictData) -> DictData:
@@ -150,6 +193,12 @@ class Job(BaseModel):
         dash2underscore("runs-on", values)
         return values
 
+    @model_validator(mode="after")
+    def __prepare_running_id(self):
+        if self.run_id is None:
+            self.run_id = gen_id(self.id or "", unique=True)
+        return self
+
     def stage(self, stage_id: str) -> Stage:
         """Return stage model that match with an input stage ID."""
         for stage in self.stages:
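Both `Job` here and `Pipeline` further down gain an optional `run_id` that an `@model_validator(mode="after")` fills in when the caller does not supply one. A minimal pydantic v2 sketch of that pattern; `_gen_id` is a hypothetical stand-in for the package's `gen_id(..., unique=True)`.

from typing import Optional
from uuid import uuid4

from pydantic import BaseModel, Field, model_validator


def _gen_id(name: str) -> str:
    # Hypothetical stand-in for ddeutil.workflow's gen_id(..., unique=True).
    return f"{name or 'job'}-{uuid4().hex[:8]}"


class JobSketch(BaseModel):
    id: Optional[str] = Field(default=None)
    run_id: Optional[str] = Field(default=None, repr=False)

    @model_validator(mode="after")
    def __prepare_running_id(self):
        # Same shape as the validator added in this diff: default the
        # running ID only when it was not supplied by the caller.
        if self.run_id is None:
            self.run_id = _gen_id(self.id or "")
        return self


print(JobSketch(id="extract").run_id)  # e.g. 'extract-1a2b3c4d'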
@@ -157,40 +206,133 @@ class Job(BaseModel):
                 return stage
         raise ValueError(f"Stage ID {stage_id} does not exists")
 
-
-
-        if len(output) > 1:
+    def set_outputs(self, output: DictData) -> DictData:
+        if len(output) > 1 and self.strategy.is_set():
             return {"strategies": output}
 
         return output[next(iter(output))]
 
-    def strategy_execute(
-
-
+    def strategy_execute(
+        self,
+        strategy: DictData,
+        params: DictData,
+        *,
+        event: Event | None = None,
+    ) -> Result:
+        """Job Strategy execution with passing dynamic parameters from the
+        pipeline execution to strategy matrix.
+
+        This execution is the minimum level execution of job model.
+
+        :param strategy: A metrix strategy value.
+        :param params: A dynamic parameters.
+        :param event: An manger event that pass to the PoolThreadExecutor.
+        :rtype: Result
+
+        :raise JobException: If it has any error from StageException or
+            UtilException.
+        """
+        if event and event.is_set():
+            return Result(
+                status=1,
+                context={
+                    gen_id(strategy): {
+                        "matrix": strategy,
+                        "stages": {},
+                        "error": {
+                            "message": "Process Event stopped before execution"
+                        },
+                    },
+                },
+            )
+
+        # NOTE: Create strategy execution context and update a matrix and copied
+        #   of params. So, the context value will have structure like;
+        #   ---
+        #   {
+        #       "params": { ... },      <== Current input params
+        #       "jobs": { ... },        <== Current input params
+        #       "matrix": { ... }       <== Current strategy value
+        #   }
+        #
+        context: DictData = params
         context.update({"matrix": strategy})
 
+        # IMPORTANT: The stage execution only run sequentially one-by-one.
         for stage in self.stages:
+
+            # IMPORTANT: Change any stage running IDs to this job running ID.
+            stage.run_id = self.run_id
+
             _st_name: str = stage.id or stage.name
 
-            if stage.
-                logging.info(
+            if stage.is_skipped(params=context):
+                logging.info(
+                    f"({self.run_id}) [JOB]: Skip the stage: {_st_name!r}"
+                )
                 continue
-            logging.info(f"[JOB]: Start execute the stage: {_st_name!r}")
 
-
-
+            logging.info(
+                f"({self.run_id}) [JOB]: Start execute the stage: {_st_name!r}"
+            )
+
+            # NOTE: Logging a matrix that pass on this stage execution.
+            if strategy:
+                logging.info(f"({self.run_id}) [JOB]: Matrix: {strategy}")
+
+            # NOTE:
+            #       I do not use below syntax because `params` dict be the
+            #   reference memory pointer and it was changed when I action
+            #   anything like update or re-construct this.
+            #
+            #       ... params |= stage.execute(params=params)
+            #
+            #   This step will add the stage result to ``stages`` key in
+            #   that stage id. It will have structure like;
+            #   ---
+            #   {
+            #       "params": { ... },
+            #       "jobs": { ... },
+            #       "matrix": { ... },
+            #       "stages": { { "stage-id-1": ... }, ... }
+            #   }
+            #
+            if event and event.is_set():
+                return Result(
+                    status=1,
+                    context={
+                        gen_id(strategy): {
+                            "matrix": strategy,
+                            "stages": filter_func(context.pop("stages", {})),
+                            "error": {
+                                "message": (
+                                    "Process Event stopped before execution"
+                                ),
+                            },
+                        },
+                    },
+                )
+            try:
+                rs: Result = stage.execute(params=context)
                 stage.set_outputs(rs.context, params=context)
-
-
-                    f"
-                    f"{stage.name}."
+            except (StageException, UtilException) as err:
+                logging.error(
+                    f"({self.run_id}) [JOB]: {err.__class__.__name__}: {err}"
                 )
+                raise JobException(
+                    f"Get stage execution error: {err.__class__.__name__}: "
+                    f"{err}"
+                ) from None
         return Result(
             status=0,
             context={
                 gen_id(strategy): {
                     "matrix": strategy,
-
+                    # NOTE: (WF001) filter own created function from stages
+                    #   value, because it does not dump with pickle when you
+                    #   execute with multiprocess.
+                    #
                     "stages": filter_func(context.pop("stages", {})),
                 },
             },
         )
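The new `set_outputs()` keeps per-strategy results grouped under a `strategies` key only when a matrix actually produced more than one entry; otherwise it unwraps the single strategy context. A tiny sketch of that branching; the example key is made up, the real keys come from `gen_id(strategy)`.

def set_outputs_sketch(output: dict, matrix_is_set: bool) -> dict:
    # Several strategy contexts from a matrix: keep them grouped.
    if len(output) > 1 and matrix_is_set:
        return {"strategies": output}
    # Single strategy: return its inner context directly.
    return output[next(iter(output))]


single = {"9bf2f03": {"matrix": {}, "stages": {"hello": {"outputs": {}}}}}
print(set_outputs_sketch(single, matrix_is_set=False))
# -> {'matrix': {}, 'stages': {'hello': {'outputs': {}}}}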
@@ -204,71 +346,132 @@ class Job(BaseModel):
         :rtype: Result
         """
         strategy_context: DictData = {}
-        for strategy in self.strategy.make():
-
-            # NOTE: Create strategy context and update matrix and params to this
-            #   context. So, the context will have structure like;
-            #   ---
-            #   {
-            #       "params": { ... },      <== Current input params
-            #       "jobs": { ... },
-            #       "matrix": { ... }       <== Current strategy value
-            #   }
-            #
-            context: DictData = {}
-            context.update(params)
-            context.update({"matrix": strategy})
 
-
-
-
-
-
-
-
-
+        # NOTE: Normal Job execution.
+        if (not self.strategy.is_set()) or self.strategy.max_parallel == 1:
+            for strategy in self.strategy.make():
+                rs: Result = self.strategy_execute(
+                    strategy, params=copy.deepcopy(params)
+                )
+                strategy_context.update(rs.context)
+            return Result(
+                status=0,
+                context=strategy_context,
+            )
 
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-            #       "jobs": { ... },
-            #       "matrix": { ... },
-            #       "stages": { { "stage-id-1": ... }, ... }
-            #   }
-            #
-            rs: Result = stage.execute(params=context)
-            if rs.status == 0:
-                stage.set_outputs(rs.context, params=context)
-            else:
-                raise JobException(
-                    f"Getting status does not equal zero on stage: "
-                    f"{stage.name}."
+        # WARNING: (WF001) I got error that raise when use
+        #   ``ProcessPoolExecutor``;
+        #   ---
+        #   _pickle.PicklingError: Can't pickle
+        #       <function ??? at 0x000001F0BE80F160>: attribute lookup ???
+        #       on ddeutil.workflow.stage failed
+        #
+        with Manager() as manager:
+            event: Event = manager.Event()
+
+            # NOTE: Start process pool executor for running strategy executor in
+            #   parallel mode.
+            with ProcessPoolExecutor(
+                max_workers=self.strategy.max_parallel
+            ) as executor:
+                features: list[Future] = [
+                    executor.submit(
+                        self.strategy_execute,
+                        strategy,
+                        params=copy.deepcopy(params),
+                        event=event,
                     )
+                    for strategy in self.strategy.make()
+                ]
+                if self.strategy.fail_fast:
+                    rs = self.__catch_fail_fast(event, features)
+                else:
+                    rs = self.__catch_all_completed(features)
+        return Result(
+            status=0,
+            context=rs.context,
+        )
 
-
-
-
-
+    def __catch_fail_fast(self, event: Event, features: list[Future]) -> Result:
+        """Job parallel pool features catching with fail-fast mode. That will
+        stop all not done features if it receive the first exception from all
+        running features.
+
+        :param event:
+        :param features: A list of features.
+        :rtype: Result
+        """
+        strategy_context: DictData = {}
+        # NOTE: Get results from a collection of tasks with a
+        #   timeout that has the first exception.
+        done, not_done = wait(
+            features, timeout=1800, return_when=FIRST_EXCEPTION
+        )
+        nd: str = (
+            f", the strategies do not run is {not_done}" if not_done else ""
+        )
+        logging.debug(f"[JOB]: Strategy is set Fail Fast{nd}")
+
+        # NOTE: Stop all running tasks
+        event.set()
+
+        # NOTE: Cancel any scheduled tasks
+        for future in features:
+            future.cancel()
+
+        status: int = 0
+        for f in done:
+            if f.exception():
+                status = 1
+                logging.error(
+                    f"({self.run_id}) [JOB]: One stage failed with: "
+                    f"{f.exception()}, shutting down this feature."
+                )
+            elif f.cancelled():
+                continue
+            else:
+                rs: Result = f.result(timeout=60)
+                strategy_context.update(rs.context)
+        return Result(
+            status=status,
+            context=strategy_context,
+        )
 
-
+    def __catch_all_completed(self, features: list[Future]) -> Result:
+        """Job parallel pool features catching with all-completed mode.
+
+        :param features: A list of features.
+        """
+        strategy_context: DictData = {}
+        status: int = 0
+        for feature in as_completed(features):
+            try:
+                rs: Result = feature.result(timeout=60)
+                strategy_context.update(rs.context)
+            except PickleError as err:
+                # NOTE: (WF001) I do not want to fix this issue because
+                #   it does not make sense and over-engineering with
+                #   this bug fix process.
+                raise JobException(
+                    f"PyStage that create object on locals does use "
+                    f"parallel in strategy execution;\n\t{err}"
+                ) from None
+            except TimeoutError:
+                status = 1
+                logging.warning("Task is hanging. Attempting to kill.")
+                feature.cancel()
+                if not feature.cancelled():
+                    logging.warning("Failed to cancel the task.")
+                else:
+                    logging.warning("Task canceled successfully.")
+            except JobException as err:
+                status = 1
+                logging.error(
+                    f"({self.run_id}) [JOB]: Get stage exception with "
+                    f"fail-fast does not set;\n{err.__class__.__name__}:\n\t"
+                    f"{err}"
+                )
+        return Result(status=status, context=strategy_context)
 
 
 class Pipeline(BaseModel):
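The fail-fast path above is built on `concurrent.futures.wait(..., return_when=FIRST_EXCEPTION)` plus a shared `Manager().Event()` that still-running strategies poll so they can stop early. A self-contained sketch of the same pattern follows; it uses threads and `threading.Event` so it runs anywhere, unlike the `ProcessPoolExecutor` in the diff, and the worker function is invented for the demo.

import time
from concurrent.futures import FIRST_EXCEPTION, ThreadPoolExecutor, wait
from threading import Event


def run_strategy(idx: int, event: Event) -> str:
    # Cooperative cancellation: each worker checks the shared event first.
    if event.is_set():
        return f"strategy-{idx}: skipped (event already set)"
    if idx == 2:
        raise RuntimeError("boom")  # first failure triggers fail-fast
    time.sleep(0.2)
    return f"strategy-{idx}: done"


event = Event()
with ThreadPoolExecutor(max_workers=4) as pool:
    futures = [pool.submit(run_strategy, i, event) for i in range(6)]
    done, not_done = wait(futures, timeout=30, return_when=FIRST_EXCEPTION)

    # Same shape as __catch_fail_fast: signal the event, cancel the rest,
    # then harvest whatever finished before the failure.
    event.set()
    for f in not_done:
        f.cancel()
    for f in done:
        print("error:" if f.exception() else "ok:", f.exception() or f.result())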
@@ -297,6 +500,9 @@ class Pipeline(BaseModel):
         default_factory=dict,
         description="A mapping of job ID and job model that already loaded.",
     )
+    run_id: Optional[str] = Field(
+        default=None, description="A running job ID.", repr=False
+    )
 
     @classmethod
     def from_loader(
@@ -356,6 +562,25 @@ class Pipeline(BaseModel):
         }
         return values
 
+    @model_validator(mode="after")
+    def __validate_jobs_need_and_prepare_running_id(self):
+        for job in self.jobs:
+            if not_exist := [
+                need for need in self.jobs[job].needs if need not in self.jobs
+            ]:
+                raise PipelineException(
+                    f"This needed jobs: {not_exist} do not exist in this "
+                    f"pipeline."
+                )
+
+            # NOTE: update a job id with its job id from pipeline template
+            self.jobs[job].id = job
+
+        if self.run_id is None:
+            self.run_id = gen_id(self.name, unique=True)
+
+        return self
+
     def job(self, name: str) -> Job:
         """Return Job model that exists on this pipeline.
 
@@ -375,6 +600,7 @@ class Pipeline(BaseModel):
         job execution.
 
         :param params: A parameter mapping that receive from pipeline execution.
+        :rtype: DictData
         """
         # VALIDATE: Incoming params should have keys that set on this pipeline.
         if check_key := tuple(
@@ -382,7 +608,7 @@ class Pipeline(BaseModel):
             for k in self.params
             if (k not in params and self.params[k].required)
         ):
-            raise
+            raise PipelineException(
                 f"Required Param on this pipeline setting does not set: "
                 f"{', '.join(check_key)}."
             )
@@ -400,6 +626,103 @@ class Pipeline(BaseModel):
             "jobs": {},
         }
 
+    def release(
+        self,
+        on: On,
+        params: DictData | None = None,
+        *,
+        waiting_sec: int = 600,
+        sleep_interval: int = 10,
+    ) -> str:
+        """Start running pipeline with the on schedule in period of 30 minutes.
+        That mean it will still running at background 30 minutes until the
+        schedule matching with its time.
+        """
+        params: DictData = params or {}
+        logging.info(f"[CORE] Start release: {self.name!r} : {on.cronjob}")
+
+        gen: CronRunner = on.generate(datetime.now())
+        tz: ZoneInfo = gen.tz
+        next_running_time: datetime = gen.next
+
+        if get_diff_sec(next_running_time, tz=tz) < waiting_sec:
+            logging.debug(
+                f"[CORE]: {self.name} closely to run >> "
+                f"{next_running_time:%Y-%m-%d %H:%M:%S}"
+            )
+
+            # NOTE: Release when the time is nearly to schedule time.
+            while (duration := get_diff_sec(next_running_time, tz=tz)) > 15:
+                time.sleep(sleep_interval)
+                logging.debug(
+                    f"[CORE]: {self.name!r} : Sleep until: {duration}"
+                )
+
+            time.sleep(1)
+            rs: Result = self.execute(params=params)
+            logging.debug(f"{rs.context}")
+
+            return f"[CORE]: Start Execute: {self.name}"
+        return f"[CORE]: {self.name} does not closely to run yet."
+
+    def poke(self, params: DictData | None = None):
+        """Poke pipeline threading task for executing with its schedules that
+        was set on the `on`.
+        """
+        params: DictData = params or {}
+        logging.info(
+            f"[CORE]: Start Poking: {self.name!r} :"
+            f"{gen_id(self.name, unique=True)}"
+        )
+        results = []
+        with ThreadPoolExecutor(
+            max_workers=int(
+                os.getenv("WORKFLOW_CORE_MAX_PIPELINE_POKING", "4")
+            ),
+        ) as executor:
+            futures: list[Future] = [
+                executor.submit(
+                    self.release,
+                    on,
+                    params=params,
+                )
+                for on in self.on
+            ]
+            for future in as_completed(futures):
+                rs = future.result()
+                logging.info(rs)
+                results.append(rs)
+        return results
+
+    def job_execute(
+        self,
+        job: str,
+        params: DictData,
+    ) -> Result:
+        """Job Executor that use on pipeline executor.
+        :param job: A job ID that want to execute.
+        :param params: A params that was parameterized from pipeline execution.
+        """
+        # VALIDATE: check a job ID that exists in this pipeline or not.
+        if job not in self.jobs:
+            raise PipelineException(
+                f"The job ID: {job} does not exists on {self.name!r} pipeline."
+            )
+
+        try:
+            logging.info(f"({self.run_id}) [PIPELINE]: Start execute: {job!r}")
+            job_obj: Job = self.jobs[job]
+            j_rs: Result = job_obj.execute(params=params)
+        except JobException as err:
+            raise PipelineException(
+                f"The job ID: {job} get raise error: {err.__class__.__name__}:"
+                f"\n{err}"
+            ) from None
+        return Result(
+            status=j_rs.status,
+            context={job: job_obj.set_outputs(j_rs.context)},
+        )
+
     def execute(
         self,
         params: DictData | None = None,
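`poke()` fans out one `release()` call per `on` schedule through a `ThreadPoolExecutor` sized by `WORKFLOW_CORE_MAX_PIPELINE_POKING` (default 4) and collects results as they complete. A trimmed sketch of that fan-out, with a dummy `release_sketch` and made-up cron strings standing in for the real schedules:

import os
from concurrent.futures import ThreadPoolExecutor, as_completed


def release_sketch(cron: str) -> str:
    # Stand-in for Pipeline.release: wait for the schedule, then execute.
    return f"[CORE]: released schedule {cron!r}"


schedules = ["*/5 * * * *", "0 2 * * *"]  # illustrative cron strings
max_poking = int(os.getenv("WORKFLOW_CORE_MAX_PIPELINE_POKING", "4"))

results = []
with ThreadPoolExecutor(max_workers=max_poking) as executor:
    futures = [executor.submit(release_sketch, cron) for cron in schedules]
    for future in as_completed(futures):
        results.append(future.result())

print(results)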
@@ -430,7 +753,7 @@ class Pipeline(BaseModel):
 
         """
         logging.info(
-            f"[CORE]: Start
+            f"[CORE]: Start Execute: {self.name}:"
             f"{gen_id(self.name, unique=True)}"
         )
         params: DictData = params or {}
@@ -440,58 +763,131 @@ class Pipeline(BaseModel):
             logging.warning("[PIPELINE]: This pipeline does not have any jobs")
             return Result(status=0, context=params)
 
-        # NOTE:
+        # NOTE: Create a job queue that keep the job that want to running after
         #   it dependency condition.
         jq: Queue = Queue()
         for job_id in self.jobs:
             jq.put(job_id)
 
+        # NOTE: Create start timestamp
         ts: float = time.monotonic()
-        not_time_out_flag: bool = True
 
         # NOTE: Create result context that will pass this context to any
         #   execution dependency.
         rs: Result = Result(context=self.parameterize(params))
+        try:
+            rs.receive(
+                self.__exec_non_threading(rs, jq, ts, timeout=timeout)
+                if (
+                    worker := int(
+                        os.getenv("WORKFLOW_CORE_MAX_JOB_PARALLEL", "1")
+                    )
+                )
+                == 1
+                else self.__exec_threading(
+                    rs, jq, ts, worker=worker, timeout=timeout
+                )
+            )
+            return rs
+        except PipelineException as err:
+            rs.context.update({"error": {"message": str(err)}})
+            rs.status = 1
+            return rs
 
-
-
+    def __exec_threading(
+        self,
+        rs: Result,
+        job_queue: Queue,
+        ts: float,
+        *,
+        worker: int = 1,
+        timeout: int = 600,
+    ) -> Result:
+        """Pipeline threading execution."""
+        not_time_out_flag: bool = True
+
+        # IMPORTANT: The job execution can run parallel and waiting by
+        #   needed.
+        with ThreadPoolExecutor(max_workers=worker) as executor:
+            futures: list[Future] = []
+            while not job_queue.empty() and (
+                not_time_out_flag := ((time.monotonic() - ts) < timeout)
+            ):
+                job_id: str = job_queue.get()
+                job: Job = self.jobs[job_id]
+
+                # IMPORTANT:
+                #   Change any job running IDs to this pipeline running ID.
+                job.run_id = self.run_id
+
+                if any(need not in rs.context["jobs"] for need in job.needs):
+                    job_queue.put(job_id)
+                    time.sleep(0.5)
+                    continue
+
+                futures.append(
+                    executor.submit(
+                        self.job_execute,
+                        job_id,
+                        params=copy.deepcopy(rs.context),
+                    ),
+                )
+
+            for future in as_completed(futures):
+                if err := future.exception():
+                    logging.error(f"{err}")
+                    raise PipelineException(f"{err}")
+
+                # NOTE: Update job result to pipeline result.
+                rs.receive_jobs(future.result(timeout=20))
+
+        if not not_time_out_flag:
+            logging.warning(
+                f"({self.run_id}) [PIPELINE]: Execution of pipeline was timeout"
+            )
+            raise PipelineException(
+                f"Execution of pipeline: {self.name} was timeout"
+            )
+        rs.status = 0
+        return rs
+
+    def __exec_non_threading(
+        self,
+        rs: Result,
+        job_queue: Queue,
+        ts: float,
+        *,
+        timeout: int = 600,
+    ) -> Result:
+        """Pipeline non-threading execution."""
+        not_time_out_flag: bool = True
+        logging.info(f"[CORE]: Run {self.name} with non-threading job executor")
+        while not job_queue.empty() and (
             not_time_out_flag := ((time.monotonic() - ts) < timeout)
         ):
-            job_id: str =
-            logging.info(f"[PIPELINE]: Start execute the job: {job_id!r}")
+            job_id: str = job_queue.get()
             job: Job = self.jobs[job_id]
 
-            #
-            #
-
-
-            #
-
-
-
-
-
-            #
-
-
-            if any(rs.context["jobs"].get(need) for need in job.needs):
-                jq.put(job_id)
-
-            # NOTE: copy current the result context for reference other job
-            #   context.
-            job_context: DictData = copy.deepcopy(rs.context)
-            job_rs: Result = job.execute(params=job_context)
-            if job_rs.status == 0:
-                # NOTE: Receive output of job execution.
-                rs.context["jobs"][job_id] = job.set_outputs(job_rs.context)
-            else:
-                raise PipelineException(
-                    f"Getting status does not equal zero on job: {job_id}."
-                )
+            # IMPORTANT:
+            #   Change any job running IDs to this pipeline running ID.
+            job.run_id = self.run_id
+
+            # NOTE:
+            if any(need not in rs.context["jobs"] for need in job.needs):
+                job_queue.put(job_id)
+                time.sleep(0.5)
+                continue
+
+            # NOTE: Start job execution.
+            job_rs = self.job_execute(job_id, params=copy.deepcopy(rs.context))
+            rs.context["jobs"].update(job_rs.context)
 
         if not not_time_out_flag:
-            logging.warning(
-
-
+            logging.warning(
+                f"({self.run_id}) [PIPELINE]: Execution of pipeline was timeout"
+            )
+            raise PipelineException(
+                f"Execution of pipeline: {self.name} was timeout"
+            )
         rs.status = 0
         return rs
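Both executors added in this last hunk walk a `Queue` of job IDs and requeue any job whose `needs` are not yet present in the result context, so dependencies settle in order without building an explicit DAG. A compact, dependency-only sketch of that loop with a hypothetical three-job pipeline:

import time
from queue import Queue

# Hypothetical jobs with "needs" edges, mirroring the pipeline's job map.
jobs = {"extract": [], "transform": ["extract"], "load": ["transform"]}

job_queue: Queue = Queue()
for job_id in jobs:
    job_queue.put(job_id)

finished: dict[str, dict] = {}
deadline = time.monotonic() + 600  # crude stand-in for the timeout guard

while not job_queue.empty() and time.monotonic() < deadline:
    job_id = job_queue.get()
    # Requeue until every needed job has already produced its context.
    if any(need not in finished for need in jobs[job_id]):
        job_queue.put(job_id)
        continue
    finished[job_id] = {"status": 0}  # the real loop calls job_execute here

print(list(finished))  # -> ['extract', 'transform', 'load']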