runnable 0.12.3__py3-none-any.whl → 0.14.0__py3-none-any.whl
- runnable/__init__.py +0 -11
- runnable/catalog.py +27 -5
- runnable/cli.py +122 -26
- runnable/datastore.py +71 -35
- runnable/defaults.py +0 -1
- runnable/entrypoints.py +107 -32
- runnable/exceptions.py +6 -2
- runnable/executor.py +28 -9
- runnable/graph.py +37 -12
- runnable/integration.py +7 -2
- runnable/nodes.py +15 -17
- runnable/parameters.py +27 -8
- runnable/pickler.py +1 -1
- runnable/sdk.py +101 -33
- runnable/secrets.py +3 -1
- runnable/tasks.py +246 -34
- runnable/utils.py +41 -13
- {runnable-0.12.3.dist-info → runnable-0.14.0.dist-info}/METADATA +25 -31
- runnable-0.14.0.dist-info/RECORD +24 -0
- {runnable-0.12.3.dist-info → runnable-0.14.0.dist-info}/WHEEL +1 -1
- runnable-0.14.0.dist-info/entry_points.txt +40 -0
- runnable/extensions/__init__.py +0 -0
- runnable/extensions/catalog/__init__.py +0 -21
- runnable/extensions/catalog/file_system/__init__.py +0 -0
- runnable/extensions/catalog/file_system/implementation.py +0 -234
- runnable/extensions/catalog/k8s_pvc/__init__.py +0 -0
- runnable/extensions/catalog/k8s_pvc/implementation.py +0 -16
- runnable/extensions/catalog/k8s_pvc/integration.py +0 -59
- runnable/extensions/executor/__init__.py +0 -649
- runnable/extensions/executor/argo/__init__.py +0 -0
- runnable/extensions/executor/argo/implementation.py +0 -1194
- runnable/extensions/executor/argo/specification.yaml +0 -51
- runnable/extensions/executor/k8s_job/__init__.py +0 -0
- runnable/extensions/executor/k8s_job/implementation_FF.py +0 -259
- runnable/extensions/executor/k8s_job/integration_FF.py +0 -69
- runnable/extensions/executor/local/__init__.py +0 -0
- runnable/extensions/executor/local/implementation.py +0 -71
- runnable/extensions/executor/local_container/__init__.py +0 -0
- runnable/extensions/executor/local_container/implementation.py +0 -446
- runnable/extensions/executor/mocked/__init__.py +0 -0
- runnable/extensions/executor/mocked/implementation.py +0 -154
- runnable/extensions/executor/retry/__init__.py +0 -0
- runnable/extensions/executor/retry/implementation.py +0 -168
- runnable/extensions/nodes.py +0 -855
- runnable/extensions/run_log_store/__init__.py +0 -0
- runnable/extensions/run_log_store/chunked_file_system/__init__.py +0 -0
- runnable/extensions/run_log_store/chunked_file_system/implementation.py +0 -111
- runnable/extensions/run_log_store/chunked_k8s_pvc/__init__.py +0 -0
- runnable/extensions/run_log_store/chunked_k8s_pvc/implementation.py +0 -21
- runnable/extensions/run_log_store/chunked_k8s_pvc/integration.py +0 -61
- runnable/extensions/run_log_store/db/implementation_FF.py +0 -157
- runnable/extensions/run_log_store/db/integration_FF.py +0 -0
- runnable/extensions/run_log_store/file_system/__init__.py +0 -0
- runnable/extensions/run_log_store/file_system/implementation.py +0 -140
- runnable/extensions/run_log_store/generic_chunked.py +0 -557
- runnable/extensions/run_log_store/k8s_pvc/__init__.py +0 -0
- runnable/extensions/run_log_store/k8s_pvc/implementation.py +0 -21
- runnable/extensions/run_log_store/k8s_pvc/integration.py +0 -56
- runnable/extensions/secrets/__init__.py +0 -0
- runnable/extensions/secrets/dotenv/__init__.py +0 -0
- runnable/extensions/secrets/dotenv/implementation.py +0 -100
- runnable-0.12.3.dist-info/RECORD +0 -64
- runnable-0.12.3.dist-info/entry_points.txt +0 -41
- {runnable-0.12.3.dist-info → runnable-0.14.0.dist-info/licenses}/LICENSE +0 -0
runnable/parameters.py
CHANGED
```diff
@@ -15,6 +15,8 @@ from runnable.utils import remove_prefix
 
 logger = logging.getLogger(defaults.LOGGER_NAME)
 
+# TODO: Revisit this, it might be a bit too complicated than required
+
 
 def get_user_set_parameters(remove: bool = False) -> Dict[str, JsonParameter]:
     """
@@ -34,9 +36,13 @@ def get_user_set_parameters(remove: bool = False) -> Dict[str, JsonParameter]:
         if env_var.startswith(defaults.PARAMETER_PREFIX):
             key = remove_prefix(env_var, defaults.PARAMETER_PREFIX)
             try:
-                parameters[key.lower()] = JsonParameter(kind="json", value=json.loads(value))
+                parameters[key.lower()] = JsonParameter(
+                    kind="json", value=json.loads(value)
+                )
             except json.decoder.JSONDecodeError:
-                logger.warning(f"Parameter {key} could not be JSON decoded, adding the literal value")
+                logger.warning(
+                    f"Parameter {key} could not be JSON decoded, adding the literal value"
+                )
                 parameters[key.lower()] = JsonParameter(kind="json", value=value)
 
     if remove:
@@ -52,7 +58,9 @@ def serialize_parameter_as_str(value: Any) -> str:
 
 
 def filter_arguments_for_func(
-    func: Callable[..., Any], params: Dict[str, Any], map_variable: TypeMapVariable = None
+    func: Callable[..., Any],
+    params: Dict[str, Any],
+    map_variable: TypeMapVariable = None,
 ) -> Dict[str, Any]:
     """
     Inspects the function to be called as part of the pipeline to find the arguments of the function.
@@ -96,11 +104,16 @@ def filter_arguments_for_func(
             # No parameter of this name was provided
             if value.default == inspect.Parameter.empty:
                 # No default value is given in the function signature. error as parameter is required.
-                raise ValueError(f"Parameter {name} is required for {func.__name__} but not provided")
+                raise ValueError(
+                    f"Parameter {name} is required for {func.__name__} but not provided"
+                )
             # default value is given in the function signature, nothing further to do.
             continue
 
-        if type(value.annotation) in [BaseModel, pydantic._internal._model_construction.ModelMetaclass]:
+        if type(value.annotation) in [
+            BaseModel,
+            pydantic._internal._model_construction.ModelMetaclass,
+        ]:
             # We try to cast it as a pydantic model if asked
             named_param = params[name].get_value()
 
@@ -110,7 +123,9 @@ def filter_arguments_for_func(
 
             bound_model = bind_args_for_pydantic_model(named_param, value.annotation)
             bound_args[name] = bound_model
-            unassigned_params = unassigned_params.difference(bound_model.model_fields.keys())
+            unassigned_params = unassigned_params.difference(
+                bound_model.model_fields.keys()
+            )
 
         elif value.annotation in [str, int, float, bool]:
             # Cast it if its a primitive type. Ensure the type matches the annotation.
@@ -120,12 +135,16 @@ def filter_arguments_for_func(
 
             unassigned_params.remove(name)
 
-    params = {key: params[key] for key in unassigned_params}  # remove keys from params if they are assigned
+    params = {
+        key: params[key] for key in unassigned_params
+    }  # remove keys from params if they are assigned
 
     return bound_args
 
 
-def bind_args_for_pydantic_model(params: Dict[str, Any], model: Type[BaseModel]) -> BaseModel:
+def bind_args_for_pydantic_model(
+    params: Dict[str, Any], model: Type[BaseModel]
+) -> BaseModel:
     class EasyModel(model):  # type: ignore
         model_config = ConfigDict(extra="ignore")
 
```
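The hunks above are wrap-only reformats; the behaviour is unchanged: parameters are picked up from prefixed environment variables and JSON-decoded, with a fallback to the literal string when decoding fails. A minimal standalone sketch of that pickup logic, assuming the prefix is `RUNNABLE_PRM_` (the real value lives in `runnable.defaults.PARAMETER_PREFIX`):

```python
import json
import os

# Assumption: mirrors runnable.defaults.PARAMETER_PREFIX
PARAMETER_PREFIX = "RUNNABLE_PRM_"


def get_user_set_parameters() -> dict:
    """Collect parameters from prefixed environment variables, as in the diff above."""
    parameters = {}
    for env_var, value in os.environ.items():
        if not env_var.startswith(PARAMETER_PREFIX):
            continue
        key = env_var[len(PARAMETER_PREFIX):]
        try:
            # JSON first: RUNNABLE_PRM_RETRIES='3' becomes the int 3.
            parameters[key.lower()] = json.loads(value)
        except json.decoder.JSONDecodeError:
            # Bare strings are not valid JSON; keep the literal value.
            parameters[key.lower()] = value
    return parameters


os.environ["RUNNABLE_PRM_retries"] = "3"
os.environ["RUNNABLE_PRM_model"] = "baseline"
print(get_user_set_parameters())  # {'retries': 3, 'model': 'baseline'}
```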
runnable/pickler.py
CHANGED
```diff
@@ -9,7 +9,7 @@ import runnable.context as context
 
 class BasePickler(ABC, BaseModel):
     """
-    The base class for all
+    The base class for all pickler.
 
     We are still in the process of hardening the design of this class.
     For now, we are just going to use pickle.
```
runnable/sdk.py
CHANGED
```diff
@@ -26,8 +26,7 @@ from rich.progress import (
 from rich.table import Column
 from typing_extensions import Self
 
-from runnable import console, defaults, entrypoints, exceptions, graph, utils
-from runnable.extensions.nodes import (
+from extensions.nodes.nodes import (
     FailNode,
     MapNode,
     ParallelNode,
@@ -35,9 +34,12 @@ from runnable.extensions.nodes import (
     SuccessNode,
     TaskNode,
 )
+from runnable import console, defaults, entrypoints, exceptions, graph, utils
 from runnable.nodes import TraversalNode
 from runnable.tasks import TaskReturns
 
+# TODO: This might have to be an extension
+
 logger = logging.getLogger(defaults.LOGGER_NAME)
 
 StepType = Union["Stub", "PythonTask", "NotebookTask", "ShellTask", "Parallel", "Map"]
@@ -66,7 +68,9 @@ class Catalog(BaseModel):
 
     """
 
-    model_config = ConfigDict(extra="forbid")  # Need to be for command, would be validated later
+    model_config = ConfigDict(
+        extra="forbid"
+    )  # Need to be for command, would be validated later
     # Note: compute_data_folder was confusing to explain, might be introduced later.
     # compute_data_folder: str = Field(default="", alias="compute_data_folder")
     get: List[str] = Field(default_factory=list, alias="get")
```
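The only change to `Catalog` is the re-wrapped `ConfigDict` call; `extra="forbid"` still turns unknown keys into validation errors. A self-contained illustration of that pydantic behaviour (only the `get`/`put` fields are taken from the SDK; the rest is simplified):

```python
from typing import List

from pydantic import BaseModel, ConfigDict, Field, ValidationError


class Catalog(BaseModel):
    # extra="forbid" rejects any key that is not a declared field.
    model_config = ConfigDict(extra="forbid")
    get: List[str] = Field(default_factory=list)
    put: List[str] = Field(default_factory=list)


Catalog(get=["data/raw.csv"], put=["data/clean.csv"])  # accepted

try:
    Catalog(gets=["typo"])  # misspelled key
except ValidationError as e:
    print(e.errors()[0]["type"])  # extra_forbidden
```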
```diff
@@ -95,14 +99,18 @@ class BaseTraversal(ABC, BaseModel):
 
     def __rshift__(self, other: StepType) -> StepType:
         if self.next_node:
-            raise Exception(f"The node {self} already has a next node: {self.next_node}")
+            raise Exception(
+                f"The node {self} already has a next node: {self.next_node}"
+            )
         self.next_node = other.name
 
         return other
 
     def __lshift__(self, other: TraversalNode) -> TraversalNode:
         if other.next_node:
-            raise Exception(f"The {other} node already has a next node: {other.next_node}")
+            raise Exception(
+                f"The {other} node already has a next node: {other.next_node}"
+            )
         other.next_node = self.name
 
         return other
```
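Functionally `__rshift__`/`__lshift__` are untouched: `>>` wires `next_node` to the right-hand step and refuses to overwrite an existing edge. A toy sketch of the same pattern, independent of the SDK classes:

```python
from typing import Optional


class Step:
    """Toy version of the >> wiring shown above."""

    def __init__(self, name: str) -> None:
        self.name = name
        self.next_node: Optional[str] = None

    def __rshift__(self, other: "Step") -> "Step":
        if self.next_node:
            raise Exception(f"The node {self.name} already has a next node: {self.next_node}")
        self.next_node = other.name
        # Returning the right operand is what makes chains like a >> b >> c work.
        return other


extract, transform, load = Step("extract"), Step("transform"), Step("load")
extract >> transform >> load
print(extract.next_node, transform.next_node)  # transform load
```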
```diff
@@ -112,7 +120,9 @@ class BaseTraversal(ABC, BaseModel):
         assert not isinstance(node, Fail)
 
         if node.next_node:
-            raise Exception(f"The {node} node already has a next node: {node.next_node}")
+            raise Exception(
+                f"The {node} node already has a next node: {node.next_node}"
+            )
 
         node.next_node = self.name
         return self
@@ -124,7 +134,9 @@ class BaseTraversal(ABC, BaseModel):
 
         if self.terminate_with_failure or self.terminate_with_success:
             if self.next_node and self.next_node not in ["success", "fail"]:
-                raise AssertionError("A node being terminated cannot have a user defined next node")
+                raise AssertionError(
+                    "A node being terminated cannot have a user defined next node"
+                )
 
             if self.terminate_with_failure:
                 self.next_node = "fail"
@@ -135,8 +147,7 @@ class BaseTraversal(ABC, BaseModel):
         return self
 
     @abstractmethod
-    def create_node(self) -> TraversalNode:
-        ...
+    def create_node(self) -> TraversalNode: ...
 
 
 class BaseTask(BaseTraversal):
```
```diff
@@ -146,12 +157,16 @@ class BaseTask(BaseTraversal):
 
     catalog: Optional[Catalog] = Field(default=None, alias="catalog")
     overrides: Dict[str, Any] = Field(default_factory=dict, alias="overrides")
-    returns: List[Union[str, TaskReturns]] = Field(default_factory=list, alias="returns")
+    returns: List[Union[str, TaskReturns]] = Field(
+        default_factory=list, alias="returns"
+    )
     secrets: List[str] = Field(default_factory=list)
 
     @field_validator("returns", mode="before")
     @classmethod
-    def serialize_returns(cls, returns: List[Union[str, TaskReturns]]) -> List[TaskReturns]:
+    def serialize_returns(
+        cls, returns: List[Union[str, TaskReturns]]
+    ) -> List[TaskReturns]:
         task_returns = []
 
         for x in returns:
@@ -167,9 +182,13 @@ class BaseTask(BaseTraversal):
     def create_node(self) -> TaskNode:
         if not self.next_node:
            if not (self.terminate_with_failure or self.terminate_with_success):
-                raise AssertionError(
-                    "A node not being terminated must have a user defined next node"
-                )
+                raise AssertionError(
+                    "A node not being terminated must have a user defined next node"
+                )
 
-        return TaskNode.parse_from_config(self.model_dump(exclude_none=True, by_alias=True))
+        return TaskNode.parse_from_config(
+            self.model_dump(exclude_none=True, by_alias=True)
+        )
 
 
 class PythonTask(BaseTask):
```
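`serialize_returns` still runs in `mode="before"`, so plain strings can be coerced before field validation. A self-contained sketch of the pattern; the `TaskReturns` stand-in here is an assumption, reduced to a single `name` field:

```python
from typing import List, Union

from pydantic import BaseModel, field_validator


class TaskReturns(BaseModel):
    name: str  # assumption: reduced stand-in for runnable.tasks.TaskReturns


class Task(BaseModel):
    returns: List[Union[str, TaskReturns]] = []

    @field_validator("returns", mode="before")
    @classmethod
    def serialize_returns(cls, returns):
        # "before" validators see the raw input, so bare strings can be
        # upgraded to TaskReturns objects before field validation runs.
        return [TaskReturns(name=x) if isinstance(x, str) else x for x in returns]


task = Task(returns=["df", TaskReturns(name="score")])
print([r.name for r in task.returns])  # ['df', 'score']
```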
```diff
@@ -326,7 +345,9 @@ class NotebookTask(BaseTask):
     """
 
     notebook: str = Field(serialization_alias="command")
-    optional_ploomber_args: Optional[Dict[str, Any]] = Field(default=None, alias="optional_ploomber_args")
+    optional_ploomber_args: Optional[Dict[str, Any]] = Field(
+        default=None, alias="optional_ploomber_args"
+    )
 
     @computed_field
     def command_type(self) -> str:
```
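Only the `optional_ploomber_args` declaration was re-wrapped; the notebook path still serializes to the node's `command`. A hedged construction example, assuming `NotebookTask` is re-exported at the package root and that `log_output` is a valid ploomber-engine option:

```python
from runnable import NotebookTask  # assumption: exported from runnable/__init__.py

# notebook= serializes to "command"; optional_ploomber_args is forwarded
# to the notebook execution engine.
train = NotebookTask(
    name="train",
    notebook="notebooks/train.ipynb",
    optional_ploomber_args={"log_output": True},  # assumption: ploomber-engine option
    terminate_with_success=True,
)
```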
```diff
@@ -416,7 +437,9 @@ class Stub(BaseTraversal):
     def create_node(self) -> StubNode:
         if not self.next_node:
             if not (self.terminate_with_failure or self.terminate_with_success):
-                raise AssertionError("A node not being terminated must have a user defined next node")
+                raise AssertionError(
+                    "A node not being terminated must have a user defined next node"
+                )
 
         return StubNode.parse_from_config(self.model_dump(exclude_none=True))
 
```
```diff
@@ -439,14 +462,23 @@ class Parallel(BaseTraversal):
     @computed_field  # type: ignore
     @property
     def graph_branches(self) -> Dict[str, graph.Graph]:
-        return {name: pipeline._dag.model_copy() for name, pipeline in self.branches.items()}
+        return {
+            name: pipeline._dag.model_copy() for name, pipeline in self.branches.items()
+        }
 
     def create_node(self) -> ParallelNode:
         if not self.next_node:
             if not (self.terminate_with_failure or self.terminate_with_success):
-                raise AssertionError("A node not being terminated must have a user defined next node")
+                raise AssertionError(
+                    "A node not being terminated must have a user defined next node"
+                )
 
-        node = ParallelNode(name=self.name, branches=self.graph_branches, internal_name="", next_node=self.next_node)
+        node = ParallelNode(
+            name=self.name,
+            branches=self.graph_branches,
+            internal_name="",
+            next_node=self.next_node,
+        )
         return node
 
 
@@ -483,7 +515,9 @@ class Map(BaseTraversal):
     def create_node(self) -> MapNode:
         if not self.next_node:
             if not (self.terminate_with_failure or self.terminate_with_success):
-                raise AssertionError("A node not being terminated must have a user defined next node")
+                raise AssertionError(
+                    "A node not being terminated must have a user defined next node"
+                )
 
         node = MapNode(
             name=self.name,
```
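`graph_branches` still snapshots each branch pipeline's DAG with `model_copy()`; the `ParallelNode` construction is merely expanded to one argument per line. A sketch of how a `Parallel` step is typically declared (class exports and field names are assumptions based on this file):

```python
from runnable import Parallel, Pipeline, Stub  # assumption: exported at package root

# Each branch is itself a Pipeline; graph_branches copies each branch's DAG.
branch_a = Pipeline(steps=[Stub(name="a", terminate_with_success=True)])
branch_b = Pipeline(steps=[Stub(name="b", terminate_with_success=True)])

fan_out = Parallel(
    name="fan_out",
    branches={"a": branch_a, "b": branch_b},
    terminate_with_success=True,
)
```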
```diff
@@ -596,16 +630,22 @@ class Pipeline(BaseModel):
         for step in path:
             if step.terminate_with_success:
                 if reached_success:
-                    raise Exception("A pipeline cannot have more than one step that terminates with success")
+                    raise Exception(
+                        "A pipeline cannot have more than one step that terminates with success"
+                    )
                 reached_success = True
                 continue
             if step.terminate_with_failure:
                 if reached_failure:
-                    raise Exception("A pipeline cannot have more than one step that terminates with failure")
+                    raise Exception(
+                        "A pipeline cannot have more than one step that terminates with failure"
+                    )
                 reached_failure = True
 
         if not reached_success and not reached_failure:
-            raise Exception("A pipeline must have at least one step that terminates with success")
+            raise Exception(
+                "A pipeline must have at least one step that terminates with success"
+            )
 
     def _construct_path(self, path: List[StepType]) -> None:
         prev_step = path[0]
@@ -615,7 +655,9 @@ class Pipeline(BaseModel):
                 continue
 
             if prev_step.terminate_with_success or prev_step.terminate_with_failure:
-                raise Exception(f"A step that terminates with success/failure cannot have a next step: {prev_step}")
+                raise Exception(
+                    f"A step that terminates with success/failure cannot have a next step: {prev_step}"
+                )
 
             if prev_step.next_node and prev_step.next_node not in ["success", "fail"]:
                 raise Exception(f"Step already has a next node: {prev_step} ")
@@ -646,7 +688,9 @@ class Pipeline(BaseModel):
         on_failure_paths: List[List[StepType]] = []
 
         for step in self.steps:
-            if isinstance(step, (Stub, PythonTask, NotebookTask, ShellTask, Parallel, Map)):
+            if isinstance(
+                step, (Stub, PythonTask, NotebookTask, ShellTask, Parallel, Map)
+            ):
                 success_path.append(step)
                 continue
             # on_failure_paths.append(step)
```
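The validation rules themselves are unchanged: at most one success-terminating step, at most one failure-terminating step, and at least one terminating step overall. Under those rules the smallest valid pipeline is a single step flagged `terminate_with_success`; a hedged sketch (assuming `Pipeline` and `PythonTask` are re-exported at the package root):

```python
from runnable import Pipeline, PythonTask  # assumption: exported at package root


def say_hello():
    print("hello")


# One success-terminating step satisfies the checks above; adding a second
# terminate_with_success step would raise at definition time.
pipeline = Pipeline(
    steps=[PythonTask(name="hello", function=say_hello, terminate_with_success=True)]
)
```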
```diff
@@ -731,7 +775,9 @@ class Pipeline(BaseModel):
         logger.setLevel(log_level)
 
         run_id = utils.generate_run_id(run_id=run_id)
-        configuration_file = os.environ.get("RUNNABLE_CONFIGURATION_FILE", configuration_file)
+        configuration_file = os.environ.get(
+            "RUNNABLE_CONFIGURATION_FILE", configuration_file
+        )
         run_context = entrypoints.prepare_configurations(
             configuration_file=configuration_file,
             run_id=run_id,
@@ -740,7 +786,9 @@ class Pipeline(BaseModel):
         )
 
         run_context.execution_plan = defaults.EXECUTION_PLAN.CHAINED.value
-        utils.set_runnable_environment_variables(run_id=run_id, configuration_file=configuration_file, tag=tag)
+        utils.set_runnable_environment_variables(
+            run_id=run_id, configuration_file=configuration_file, tag=tag
+        )
 
         dag_definition = self._dag.model_dump(by_alias=True, exclude_none=True)
 
@@ -767,7 +815,9 @@ class Pipeline(BaseModel):
 
         with Progress(
             SpinnerColumn(spinner_name="runner"),
-            TextColumn("[progress.description]{task.description}", table_column=Column(ratio=2)),
+            TextColumn(
+                "[progress.description]{task.description}", table_column=Column(ratio=2)
+            ),
             BarColumn(table_column=Column(ratio=1), style="dark_orange"),
             TimeElapsedColumn(table_column=Column(ratio=1)),
             console=console,
@@ -775,23 +825,41 @@ class Pipeline(BaseModel):
         ) as progress:
             try:
                 run_context.progress = progress
-                pipeline_execution_task = progress.add_task("[dark_orange] Starting execution .. ", total=1)
+                pipeline_execution_task = progress.add_task(
+                    "[dark_orange] Starting execution .. ", total=1
+                )
                 run_context.executor.execute_graph(dag=run_context.dag)
 
                 if not run_context.executor._local:
                     return {}
 
-                run_log = run_context.run_log_store.get_run_log_by_id(run_id=run_context.run_id, full=False)
+                run_log = run_context.run_log_store.get_run_log_by_id(
+                    run_id=run_context.run_id, full=False
+                )
 
                 if run_log.status == defaults.SUCCESS:
-                    progress.update(pipeline_execution_task, description="[green] Success", completed=True)
+                    progress.update(
+                        pipeline_execution_task,
+                        description="[green] Success",
+                        completed=True,
+                    )
                 else:
-                    progress.update(pipeline_execution_task, description="[red] Failed", completed=True)
+                    progress.update(
+                        pipeline_execution_task,
+                        description="[red] Failed",
+                        completed=True,
+                    )
                     raise exceptions.ExecutionFailedError(run_context.run_id)
             except Exception as e:  # noqa: E722
                 console.print(e, style=defaults.error_style)
-                progress.update(pipeline_execution_task, description="[red] Errored execution", completed=True)
+                progress.update(
+                    pipeline_execution_task,
+                    description="[red] Errored execution",
+                    completed=True,
+                )
                 raise
 
         if run_context.executor._local:
-            return run_context.run_log_store.get_run_log_by_id(run_id=run_context.run_id)
+            return run_context.run_log_store.get_run_log_by_id(
+                run_id=run_context.run_id
+            )
```
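One behavioural detail worth noting in the `execute` hunks: `RUNNABLE_CONFIGURATION_FILE` in the environment takes precedence over the `configuration_file` argument. The `os.environ.get` pattern, checked standalone:

```python
import os


def resolve_configuration_file(configuration_file: str = "") -> str:
    # The environment variable wins when set, mirroring Pipeline.execute above.
    return os.environ.get("RUNNABLE_CONFIGURATION_FILE", configuration_file)


print(resolve_configuration_file("local.yaml"))  # local.yaml
os.environ["RUNNABLE_CONFIGURATION_FILE"] = "prod.yaml"
print(resolve_configuration_file("local.yaml"))  # prod.yaml
```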
runnable/secrets.py
CHANGED
```diff
@@ -92,4 +92,6 @@ class EnvSecretsManager(BaseSecrets):
         try:
             return os.environ[name]
         except KeyError:
-            raise exceptions.SecretNotFoundError(secret_name=name, secret_setting="environment variables")
+            raise exceptions.SecretNotFoundError(
+                secret_name=name, secret_setting="environment variables"
+            )
```
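`EnvSecretsManager` still resolves a secret with a plain environment lookup; only the exception call is wrapped. The lookup-or-raise shape, standalone (the exception class below is a stand-in for `runnable.exceptions.SecretNotFoundError`):

```python
import os


class SecretNotFoundError(Exception):
    """Stand-in for runnable.exceptions.SecretNotFoundError."""

    def __init__(self, secret_name: str, secret_setting: str) -> None:
        super().__init__(f"No secret found by name {secret_name} in {secret_setting}")


def get_secret(name: str) -> str:
    try:
        return os.environ[name]
    except KeyError:
        raise SecretNotFoundError(
            secret_name=name, secret_setting="environment variables"
        )


os.environ["API_TOKEN"] = "s3cr3t"
print(get_secret("API_TOKEN"))  # s3cr3t
```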