PyPI - ocean-runner - Versions diffs - 0.2.7__py3-none-any.whl → 0.2.18__py3-none-any.whl - Mend

ocean-runner 0.2.7__py3-none-any.whl → 0.2.18__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

ocean_runner/config.py +7 -15
ocean_runner/runner.py +107 -74
{ocean_runner-0.2.7.dist-info → ocean_runner-0.2.18.dist-info}/METADATA +82 -57
ocean_runner-0.2.18.dist-info/RECORD +7 -0
{ocean_runner-0.2.7.dist-info → ocean_runner-0.2.18.dist-info}/WHEEL +1 -1
ocean_runner/runtime_mode.py +0 -6
ocean_runner-0.2.7.dist-info/RECORD +0 -8
{ocean_runner-0.2.7.dist-info → ocean_runner-0.2.18.dist-info}/licenses/LICENSE +0 -0

ocean_runner/config.py CHANGED Viewed

@@ -2,10 +2,12 @@ import os
 from dataclasses import asdict, dataclass, field
 from logging import Logger
 from pathlib import Path
-from typing import Callable, Iterable, Literal, TypeVar
+from typing import Iterable, TypeVar
 T = TypeVar("T")
+DEFAULT = "DEFAULT"
 @dataclass
 class Environment:
@@ -17,25 +19,20 @@ class Environment:
     """Base data directory, defaults to '/data'"""
     dids: str = field(
-        default_factory=lambda: os.environ.get("DIDS"),
+        default_factory=lambda: os.environ.get("DIDS", None),
     )
     """Datasets DID's, format: '["XXXX"]'"""
     transformation_did: str = field(
-        default_factory=lambda: os.environ.get("TRANSFORMATION_DID"),
+        default_factory=lambda: os.environ.get("TRANSFORMATION_DID", DEFAULT),
     )
     """Transformation (algorithm) DID"""
     secret: str = field(
-        default_factory=lambda: os.environ.get("SECRET"),
+        default_factory=lambda: os.environ.get("SECRET", DEFAULT),
     )
     """Super secret secret"""
-    runtime: Literal["dev", "test"] = field(
-        default_factory=lambda: os.environ.get("RUNTIME", "dev").lower()
-    )
-    """Select runtime mode"""
     dict = asdict
@@ -46,9 +43,6 @@ class Config:
     custom_input: T | None = None
     """Algorithm's custom input types, must be a dataclass_json"""
-    error_callback: Callable[[Exception], None] = None
-    """Callback to execute upon exceptions"""
     logger: Logger | None = None
     """Logger to use in the algorithm"""
@@ -57,7 +51,5 @@ class Config:
     )
     """Paths that should be included so the code executes correctly"""
-    environment: Environment = field(
-        default_factory=lambda: Environment(),
-    )
+    environment: Environment = field(default_factory=lambda: Environment())
     """Mock of environment data"""

ocean_runner/runner.py CHANGED Viewed

@@ -3,70 +3,75 @@ from __future__ import annotations
 from dataclasses import InitVar, asdict, dataclass, field
 from logging import Logger
 from pathlib import Path
-from typing import Callable, Generic, Self, TypeVar
+from typing import Callable, Generic, TypeVar
 from oceanprotocol_job_details import JobDetails
 from ocean_runner.config import Config
-from ocean_runner.runtime_mode import RuntimeMode
-JobDetailsT = TypeVar(
-    "JobDetailsT",
-)
+JobDetailsT = TypeVar("JobDetailsT")
 ResultT = TypeVar("ResultT")
-def default_error_callback(_: Algorithm, e: Exception) -> None:
+def default_error_callback(algorithm: Algorithm, e: Exception) -> None:
+    algorithm.logger.exception("Error during algorithm execution")
     raise e
 def default_validation(algorithm: Algorithm) -> None:
     algorithm.logger.info("Validating input using default validation")
     assert algorithm.job_details.ddos, "DDOs missing"
     assert algorithm.job_details.files, "Files missing"
 def default_save(*, result: ResultT, base: Path, algorithm: Algorithm) -> None:
     algorithm.logger.info("Saving results using default save")
     with open(base / "result.txt", "w+") as f:
         f.write(str(result))
-def default_test_run(algorithm: Algorithm) -> int:
-    import pytest
-    result = pytest.main()
-    if result == 0:
-        algorithm.logger.info("Passed all tests")
-    else:
-        algorithm.logger.error("Some tests failed")
-    return result
 @dataclass
 class Algorithm(Generic[JobDetailsT, ResultT]):
+    """
+    A configurable algorithm runner that behaves like a FastAPI app:
+      - You register `validate`, `run`, and `save_results` via decorators.
+      - You execute the full pipeline by calling `app()`.
+    """
     config: InitVar[Config | None] = None
-    # Load from config
     logger: Logger = field(init=False)
     _job_details: JobDetails[JobDetailsT] = field(init=False)
     _result: ResultT | None = field(default=None, init=False)
-    _runtime: RuntimeMode = field(default=RuntimeMode.DEV, init=False)
-    error_callback = default_error_callback
+    # Decorator-registered callbacks
+    _validate_fn: Callable[[Algorithm], None] | None = field(
+        default=None,
+        init=False,
+        repr=False,
+    )
+    _run_fn: Callable[[Algorithm], ResultT] | None = field(
+        default=None,
+        init=False,
+        repr=False,
+    )
+    _save_fn: Callable[[ResultT, Path, Algorithm], None] | None = field(
+        default=None,
+        init=False,
+        repr=False,
+    )
+    _error_callback: Callable[[Algorithm, Exception], None] | None = field(
+        default=None,
+        init=False,
+        repr=False,
+    )
     def __post_init__(self, config: Config | None) -> None:
         config: Config = config or Config()
-        if config.error_callback:
-            self.error_callback = config.error_callback
+        # Configure logger
         if config.logger:
             self.logger = config.logger
         else:
@@ -77,30 +82,20 @@ class Algorithm(Generic[JobDetailsT, ResultT]):
                 format="%(asctime)s | %(levelname)-8s | %(name)s | %(message)s",
                 datefmt="%Y-%m-%d %H:%M:%S",
             )
             self.logger = logging.getLogger("ocean_runner")
+        # Normalize base_dir
         if isinstance(config.environment.base_dir, str):
             config.environment.base_dir = Path(config.environment.base_dir)
+        # Extend sys.path for custom imports
         if config.source_paths:
             import sys
             sys.path.extend([str(path.absolute()) for path in config.source_paths])
             self.logger.debug(f"Added [{len(config.source_paths)}] entries to PATH")
-        self._runtime = RuntimeMode(config.environment.runtime) or self._runtime
-        self._job_details = JobDetails.load(
-            _type=config.custom_input,
-            base_dir=config.environment.base_dir,
-            dids=config.environment.dids,
-            transformation_did=config.environment.transformation_did,
-            secret=config.environment.secret,
-        )
-        self.logger.info("Loaded JobDetails")
-        self.logger.debug(asdict(self.job_details))
+        self.config = config
     class Error(RuntimeError): ...
@@ -112,46 +107,84 @@ class Algorithm(Generic[JobDetailsT, ResultT]):
     @property
     def result(self) -> ResultT:
-        if not self._result:
+        if self._result is None:
             raise Algorithm.Error("Result missing, run the algorithm first")
         return self._result
-    def validate(self, callback: Callable[[Self], None] = default_validation) -> Self:
-        self.logger.info("Validating instance...")
-        try:
-            callback(self)
-        except Exception as e:
-            self.error_callback(e)
+    # ---------------------------
+    # Decorators (FastAPI-style)
+    # ---------------------------
-        return self
+    def validate(self, fn: Callable[[], None]) -> Callable[[], None]:
+        self._validate_fn = fn
+        return fn
-    def run(self, callable: Callable[[Self], ResultT]) -> Self:
-        self.logger.info("Running algorithm...")
-        try:
-            if self._runtime == RuntimeMode.TEST:
-                callable = default_test_run
+    def run(self, fn: Callable[[], ResultT]) -> Callable[[], ResultT]:
+        self._run_fn = fn
+        return fn
-            self._result = callable(self)
-        except Exception as e:
-            self.error_callback(e)
+    def save_results(self, fn: Callable[[ResultT, Path], None]) -> Callable:
+        self._save_fn = fn
+        return fn
+    def on_error(self, fn: Callable[[Exception], None]) -> Callable:
+        self._error_callback = fn
+        return fn
+    # ---------------------------
+    # Execution Pipeline
+    # ---------------------------
+    def __call__(self) -> ResultT | None:
+        """Executes the algorithm pipeline: validate → run → save_results."""
+        # Load job details
+        self._job_details = JobDetails.load(
+            _type=self.config.custom_input,
+            base_dir=self.config.environment.base_dir,
+            dids=self.config.environment.dids,
+            transformation_did=self.config.environment.transformation_did,
+            secret=self.config.environment.secret,
+        )
-        return self
+        self.logger.info("Loaded JobDetails")
+        self.logger.debug(asdict(self.job_details))
-    def save_results(
-        self,
-        callable: Callable[[ResultT, Path, Algorithm], None] = default_save,
-        *,
-        override_path: Path | None = None,
-    ) -> None:
-        self.logger.info("Saving results...")
         try:
-            callable(
-                results=self.result,
-                base_path=override_path or self.job_details.paths.outputs,
-                algorithm=self,
-            )
-        except Exception as e:
-            self.error_callback(e)
+            # Validation step
+            if self._validate_fn:
+                self.logger.info("Running custom validation...")
+                self._validate_fn()
+            else:
+                self.logger.info("Running default validation...")
+                default_validation(self)
+            # Run step
+            if self._run_fn:
+                self.logger.info("Running algorithm...")
+                self._result = self._run_fn()
+            else:
+                self.logger.warning("No run() function defined. Skipping execution.")
+                self._result = None
+            # Save step
+            if self._save_fn:
+                self.logger.info("Saving results...")
+                self._save_fn(
+                    self._result,
+                    self.job_details.paths.outputs,
+                )
+            else:
+                self.logger.info("No save_results() defined. Using default.")
+                default_save(
+                    result=self._result,
+                    base=self.job_details.paths.outputs,
+                    algorithm=self,
+                )
+        except Exception as e:
+            if self._error_callback:
+                self._error_callback(e)
+            else:
+                default_error_callback(self, e)
-__all__ = [Algorithm]
+        return self._result

{ocean_runner-0.2.7.dist-info → ocean_runner-0.2.18.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: ocean-runner
-Version: 0.2.7
+Version: 0.2.18
 Summary: A fluent API for OceanProtocol algorithms
 Project-URL: Homepage, https://github.com/AgrospAI/ocean-runner
 Project-URL: Issues, https://github.com/AgrospAI/ocean-runner/issues
@@ -17,13 +17,13 @@ Classifier: License :: OSI Approved :: MIT License
 Classifier: Operating System :: OS Independent
 Classifier: Programming Language :: Python :: 3
 Requires-Python: >=3.10
-Requires-Dist: oceanprotocol-job-details==0.2.6
+Requires-Dist: oceanprotocol-job-details>=0.2.8
 Requires-Dist: pytest>=8.4.2
 Description-Content-Type: text/markdown
 # ocean-runner
-Ocean Runner is a package that brings a fluent API for APP creation and running in the scope of OceanProtocol.
+Ocean Runner is a package that eases algorithm creation in the scope of OceanProtocol.
 ## Installation
@@ -40,33 +40,40 @@ uv add ocean-runner
 ```python
 import random
-from ocean_runner import Algorithm, Config
+from ocean_runner import Algorithm
+algorithm = Algorithm()
+@algorithm.run
+def run():
+    return random.randint()
-Algorithm().run(lambda _: random.randint()).save_results()
+if __name__ == "__main__":
+    algorithm()
 ```
-To use minimally the API, you can just provide a callback to the run method, defaulting for the rest of behaviours. This code snippet will:
+This code snippet will:
-- Read the OceanProtocol JobDetails from the environment variables and use default file paths.
-- Generate a random integer.
-- Store the result in a "result.txt" file within the default outputs path.
+- Read the OceanProtocol JobDetails from the environment variables and use default configuration file paths.
+- Execute the run function.
+- Execute the default saving function, storing the result in a "result.txt" file within the default outputs path.
 ### Tuning
 #### Application Config
-The application configuration can be tweaked by passing a Config instance to its' constructor.
+The application configuration can be tweaked by passing a Config instance to its constructor.
 ```python
-Algorithm(
+from ocean_runner import Algorithm, Config
+algorithm = Algorithm(
     Config(
         custom_input: ... # dataclass
         # Custom algorithm parameters dataclass.
-        error_callback: ... # Callable[[Exception], None]
-        # Callback to run on exceptions.
         logger: ... # type: logging.Logger
         # Custom logger to use.
@@ -82,6 +89,8 @@ Algorithm(
 ```python
 import logging
+from ocean_runner import Algorithm, Config
 @dataclass
 class CustomInput:
@@ -91,19 +100,13 @@ class CustomInput:
 logger = logging.getLogger(__name__)
-Algorithm(
+algorithm = Algorithm(
     Config(
         custom_input: CustomInput,
         """
         Load the Algorithm's Custom Input into a CustomInput dataclass instance.
         """
-        error_callback: lambda ex: logger.exception(ex),
-        """
-        Run this callback when an exception is caught
-        NOTE: it's not recommended to catch exceptions this way. Should re-raise and halt the execution.
-        """
         source_paths: [Path("/algorithm/src")],
         """
         Source paths to include in the PATH. '/algorithm/src' is the default since our templates place the algorithm source files there.
@@ -134,11 +137,6 @@ Algorithm(
             """
             Random secret to use while testing.
             """
-            runtime: "dev",
-            """
-            Runtime mode. "dev" to run normally, "test" to run pytest
-            """
         )
         """
         Should not be needed in production algorithms, used to mock environment variables, defaults to using env.
@@ -148,44 +146,72 @@ Algorithm(
 ```
-## Default behaviours
+#### Behaviour Config
-### Default implementations
-As seen in the minimal example, all methods implemented in `Algorithm` have a default implementation which will be commented here.
+To fully configure the behaviour of the algorithm as in the [Minimal Example](#minimal-example), you can do it decorating your defined function as in the following example, which features all the possible algorithm customization.
 ```python
+from pathlib import Path
-(
-    Algorithm()
-        """
-        Default constructor, will use default values of Config.
-        """
-    .validate()
-        """
-        Will validate the algorithm's job detail instance, checking for the existence of:
-        - `job_details.ddos`
-        - `job_details.files`
-        """
+import pandas as pd
+from ocean_runner import Algorithm
-    .run()
+algorithm = Algorithm()
-        """
-        Has NO default implementation, must pass a callback that returns a result of any type.
-        """
-    .save_results()
+@algorithm.on_error
+def error_callback(ex: Exception):
+    algorithm.logger.exception(ex)
+    raise algorithm.Error() from ex
-        """
-        Stores the result of running the algorithm in "outputs/results.txt"
-        """
-)
+@algorithm.validate
+def val():
+    assert algorithm.job_details.files, "Empty input dir"
+@algorithm.run
+def run() -> pd.DataFrame:
+    _, filename = next(algorithm.job_details.next_path())
+    return pd.read_csv(filename).describe(include="all")
+@algorithm.save_results
+def save(results: pd.DataFrame, path: Path):
+    algorithm.logger.info(f"Descriptive statistics: {results}")
+    results.to_csv(path / "results.csv")
+if __name__ == "__main__":
+    algorithm()
+```
+### Default implementations
+As seen in the minimal example, all methods implemented in `Algorithm` have a default implementation which will be commented here.
+```python
+.validate()
+    """
+    Will validate the algorithm's job detail instance, checking for the existence of:
+    - `job_details.ddos`
+    - `job_details.files`
+    """
+.run()
+    """
+    Has NO default implementation, must pass a callback that returns a result of any type.
+    """
+.save_results()
+    """
+    Stores the result of running the algorithm in "outputs/results.txt"
+    """
 ```
 ### Job Details
@@ -193,8 +219,7 @@ As seen in the minimal example, all methods implemented in `Algorithm` have a de
 To load the OceanProtocol JobDetails instance, the program will read some environment variables, they can be mocked passing an instance of `Environment` through the configuration of the algorithm.
 Environment variables:
-- `DIDS` Input dataset(s) DID's, must have format: `["abc..90"]`
-- `TRANSFORMATION_DID` Algorithm DID, must have format: `abc..90`
-- `SECRET` Algorithm secret.
+- `DIDS` (optional) Input dataset(s) DID's, must have format: `["abc..90"]`. Defaults to reading them automatically from the `DDO` data directory.
+- `TRANSFORMATION_DID` (optional, default="DEFAULT"): Algorithm DID, must have format: `abc..90`.
+- `SECRET` (optional, default="DEFAULT"): Algorithm secret.
 - `BASE_DIR` (optional, default="/data"): Base path to the OceanProtocol data directories.
-- `RUNTIME` (optional, default="dev"): Runtime mode

ocean_runner-0.2.18.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,7 @@
+ocean_runner/__init__.py,sha256=awAmE6kZhuwcrD3gT7qFZArdhiuzW-EFTA6tGKhw06k,138
+ocean_runner/config.py,sha256=gyyUotPJ7n8wPPdsJZIBUT4zBlkoNbhV876JDTdPNsY,1398
+ocean_runner/runner.py,sha256=2j0XNk06gIlPoer_kVRtSf-noYZzhORi_7-UnPQBJxA,6005
+ocean_runner-0.2.18.dist-info/METADATA,sha256=NsZ4U_FM2scbLrsgP9BrxczPoBzItV1xs2VlttEGTAI,6562
+ocean_runner-0.2.18.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
+ocean_runner-0.2.18.dist-info/licenses/LICENSE,sha256=_B25KqK4amoADWkMN150tnZFm_Fy7VvZpvIC8ZydWdI,1053
+ocean_runner-0.2.18.dist-info/RECORD,,

{ocean_runner-0.2.7.dist-info → ocean_runner-0.2.18.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: hatchling 1.27.0
+Generator: hatchling 1.28.0
 Root-Is-Purelib: true
 Tag: py3-none-any

ocean_runner/runtime_mode.py DELETED Viewed

@@ -1,6 +0,0 @@
-from enum import Enum
-class RuntimeMode(Enum):
-    DEV = "dev"
-    TEST = "test"

ocean_runner-0.2.7.dist-info/RECORD DELETED Viewed

@@ -1,8 +0,0 @@
-ocean_runner/__init__.py,sha256=awAmE6kZhuwcrD3gT7qFZArdhiuzW-EFTA6tGKhw06k,138
-ocean_runner/config.py,sha256=zzpGxotGhGnNdHKFJqQ7fuXK5zW2IGOpzftHilcySD4,1644
-ocean_runner/runner.py,sha256=j0BOuxO9PgI2wV7812VN9FghgwZz4cLjV0bu_mHP3YA,4574
-ocean_runner/runtime_mode.py,sha256=WbGTaoL3hxBWbxM8luwyOwwtQonqyIhbus0_Jd-F-3k,83
-ocean_runner-0.2.7.dist-info/METADATA,sha256=d0KyDgAwzqadDcnelkgENnmCUWU_fXFh7CMKndatRYE,6101
-ocean_runner-0.2.7.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-ocean_runner-0.2.7.dist-info/licenses/LICENSE,sha256=_B25KqK4amoADWkMN150tnZFm_Fy7VvZpvIC8ZydWdI,1053
-ocean_runner-0.2.7.dist-info/RECORD,,

{ocean_runner-0.2.7.dist-info → ocean_runner-0.2.18.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

ocean-runner 0.2.7__py3-none-any.whl → 0.2.18__py3-none-any.whl

ocean-runner 0.2.7__py3-none-any.whl → 0.2.18__py3-none-any.whl