indexify-0.3.17-py3-none-any.whl → indexify-0.3.19-py3-none-any.whl
This diff shows the changes between two publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
- indexify/cli/cli.py +21 -18
- indexify/executor/api_objects.py +12 -0
- indexify/executor/downloader.py +4 -1
- indexify/executor/executor.py +65 -28
- indexify/executor/executor_flavor.py +7 -0
- indexify/executor/function_executor/function_executor.py +24 -11
- indexify/executor/function_executor/function_executor_state.py +9 -1
- indexify/executor/function_executor/function_executor_states_container.py +3 -1
- indexify/executor/function_executor/function_executor_status.py +2 -0
- indexify/executor/function_executor/health_checker.py +20 -2
- indexify/executor/function_executor/server/subprocess_function_executor_server_factory.py +6 -0
- indexify/executor/function_executor/single_task_runner.py +15 -11
- indexify/executor/function_executor/task_output.py +35 -2
- indexify/executor/grpc/channel_manager.py +160 -0
- indexify/executor/grpc/completed_tasks_container.py +26 -0
- indexify/executor/grpc/function_executor_controller.py +421 -0
- indexify/executor/grpc/state_reconciler.py +33 -38
- indexify/executor/grpc/state_reporter.py +100 -39
- indexify/executor/grpc/task_controller.py +449 -0
- indexify/executor/metrics/task_reporter.py +14 -0
- indexify/executor/task_fetcher.py +8 -3
- indexify/executor/task_reporter.py +112 -4
- indexify/executor/task_runner.py +1 -0
- indexify/proto/{task_scheduler.proto → executor_api.proto} +86 -11
- indexify/proto/executor_api_pb2.py +80 -0
- indexify/proto/{task_scheduler_pb2.pyi → executor_api_pb2.pyi} +162 -7
- indexify/proto/executor_api_pb2_grpc.py +227 -0
- {indexify-0.3.17.dist-info → indexify-0.3.19.dist-info}/METADATA +1 -1
- {indexify-0.3.17.dist-info → indexify-0.3.19.dist-info}/RECORD +32 -28
- indexify/executor/grpc/channel_creator.py +0 -53
- indexify/proto/task_scheduler_pb2.py +0 -64
- indexify/proto/task_scheduler_pb2_grpc.py +0 -170
- /indexify/executor/grpc/metrics/{channel_creator.py → channel_manager.py} +0 -0
- {indexify-0.3.17.dist-info → indexify-0.3.19.dist-info}/WHEEL +0 -0
- {indexify-0.3.17.dist-info → indexify-0.3.19.dist-info}/entry_points.txt +0 -0
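The file-level summary above comes straight from the registry's diff viewer. As a rough local equivalent, the standard-library sketch below (the wheel file names are assumed to be already downloaded into the working directory) lists added, removed, and changed files between the two wheels; it is illustrative only, not how this page was produced.

```python
import zipfile

OLD_WHEEL = "indexify-0.3.17-py3-none-any.whl"  # assumed local paths
NEW_WHEEL = "indexify-0.3.19-py3-none-any.whl"

with zipfile.ZipFile(OLD_WHEEL) as old_whl, zipfile.ZipFile(NEW_WHEEL) as new_whl:
    old_files = set(old_whl.namelist())
    new_files = set(new_whl.namelist())
    for name in sorted(new_files - old_files):
        print("added  ", name)
    for name in sorted(old_files - new_files):
        print("removed", name)
    # Compare the bytes of files present in both wheels.
    for name in sorted(old_files & new_files):
        if old_whl.read(name) != new_whl.read(name):
            print("changed", name)
```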
indexify/cli/cli.py
CHANGED
@@ -13,7 +13,7 @@ import sys
 from importlib.metadata import version
 from pathlib import Path
 from socket import gethostname
-from typing import Annotated, List, Optional, Tuple
+from typing import Annotated, Dict, List, Optional, Tuple
 
 import nanoid
 import prometheus_client
@@ -26,6 +26,7 @@ from tensorlake.functions_sdk.image import Image
 
 from indexify.executor.api_objects import FunctionURI
 from indexify.executor.executor import Executor
+from indexify.executor.executor_flavor import ExecutorFlavor
 from indexify.executor.function_executor.server.subprocess_function_executor_server_factory import (
     SubprocessFunctionExecutorServerFactory,
 )
@@ -77,6 +78,7 @@ def build_image(
 )
 def executor(
     server_addr: str = "localhost:8900",
+    grpc_server_addr: str = "localhost:8901",
     dev: Annotated[
         bool, typer.Option("--dev", "-d", help="Run the executor in development mode")
     ] = False,
@@ -119,17 +121,6 @@ def executor(
             help="Port where to run Executor Monitoring server",
         ),
     ] = 7000,
-    # TODO: Figure out mTLS for gRPC.
-    grpc_server_addr: Annotated[
-        Optional[str],
-        typer.Option(
-            "--grpc-server-addr",
-            help=(
-                "(exprimental) Address of server gRPC API to connect to, e.g. 'localhost:8901'.\n"
-                "Enables gRPC state reporter that will periodically report the state of the Function Executors to Server\n"
-            ),
-        ),
-    ] = None,
     enable_grpc_state_reconciler: Annotated[
         bool,
         typer.Option(
@@ -140,6 +131,15 @@ def executor(
             ),
         ),
     ] = False,
+    labels: Annotated[
+        List[str],
+        typer.Option(
+            "--label",
+            "-l",
+            help="Executor key-value label to be sent to the Server. "
+            "Specified as <key>=<value>",
+        ),
+    ] = [],
 ):
     if dev:
         configure_development_mode_logging()
@@ -157,10 +157,10 @@ def executor(
             "--executor-id should be at least 10 characters long and only include characters _-[0-9][a-z][A-Z]"
         )
 
-
-
-
-
+    kv_labels: Dict[str, str] = {}
+    for label in labels:
+        key, value = label.split("=")
+        kv_labels[key] = value
 
     executor_version = version("indexify")
     logger = structlog.get_logger(module=__name__, executor_id=executor_id)
@@ -169,15 +169,16 @@
         "starting executor",
         hostname=gethostname(),
         server_addr=server_addr,
+        grpc_server_addr=grpc_server_addr,
         config_path=config_path,
         executor_version=executor_version,
+        labels=kv_labels,
         executor_cache=executor_cache,
         ports=ports,
         functions=function_uris,
         dev_mode=dev,
         monitoring_server_host=monitoring_server_host,
         monitoring_server_port=monitoring_server_port,
-        grpc_server_addr=grpc_server_addr,
         enable_grpc_state_reconciler=enable_grpc_state_reconciler,
     )
 
@@ -205,7 +206,9 @@ def executor(
     Executor(
         id=executor_id,
         development_mode=dev,
+        flavor=ExecutorFlavor.OSS,
         version=executor_version,
+        labels=kv_labels,
         health_checker=GenericHealthChecker(),
         code_path=executor_cache,
         function_allowlist=_parse_function_uris(function_uris),
@@ -214,10 +217,10 @@
             server_ports=range(ports[0], ports[1]),
         ),
         server_addr=server_addr,
+        grpc_server_addr=grpc_server_addr,
        config_path=config_path,
        monitoring_server_host=monitoring_server_host,
        monitoring_server_port=monitoring_server_port,
-        grpc_server_addr=grpc_server_addr,
        enable_grpc_state_reconciler=enable_grpc_state_reconciler,
    ).run()
 
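To illustrate the new `--label`/`-l` option introduced above, here is a minimal, hypothetical typer command (not the actual indexify CLI) that folds repeated `<key>=<value>` labels into a dict the same way the new `kv_labels` loop does. The shipped code uses a plain `label.split("=")`; this sketch splits once so `=` can appear inside values.

```python
from typing import Annotated, Dict, List

import typer

app = typer.Typer()


@app.command()
def executor(
    labels: Annotated[
        List[str],
        typer.Option("--label", "-l", help="Executor key-value label as <key>=<value>"),
    ] = [],
):
    kv_labels: Dict[str, str] = {}
    for label in labels:
        key, value = label.split("=", 1)  # the shipped CLI uses label.split("=")
        kv_labels[key] = value
    typer.echo(kv_labels)


if __name__ == "__main__":
    app()  # e.g. python sketch.py -l region=us-east-1 -l tier=gpu
```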
indexify/executor/api_objects.py
CHANGED
@@ -49,5 +49,17 @@ class TaskResult(BaseModel):
     reducer: bool = False
 
 
+class DataPayload(BaseModel):
+    path: str
+    size: int
+    sha256_hash: str
+
+
+class IngestFnOutputsResponse(BaseModel):
+    data_payloads: List[DataPayload]
+    stdout: Optional[DataPayload] = None
+    stderr: Optional[DataPayload] = None
+
+
 TASK_OUTCOME_SUCCESS = "success"
 TASK_OUTCOME_FAILURE = "failure"
indexify/executor/downloader.py
CHANGED
@@ -241,7 +241,10 @@ class Downloader:
 def serialized_object_from_http_response(response: httpx.Response) -> SerializedObject:
     # We're hardcoding the content type currently used by Python SDK. It might change in the future.
     # There's no other way for now to determine if the response is a bytes or string.
-    if response.headers["content-type"]
+    if response.headers["content-type"] in [
+        "application/octet-stream",
+        "application/pickle",
+    ]:
         return SerializedObject(
             bytes=response.content, content_type=response.headers["content-type"]
         )
indexify/executor/executor.py
CHANGED
@@ -9,17 +9,18 @@ import structlog
 from tensorlake.function_executor.proto.function_executor_pb2 import SerializedObject
 from tensorlake.utils.logging import suppress as suppress_logging
 
-from indexify.proto.
+from indexify.proto.executor_api_pb2 import ExecutorStatus
 
 from .api_objects import FunctionURI, Task
 from .downloader import Downloader
+from .executor_flavor import ExecutorFlavor
 from .function_executor.function_executor_states_container import (
     FunctionExecutorStatesContainer,
 )
 from .function_executor.server.function_executor_server_factory import (
     FunctionExecutorServerFactory,
 )
-from .grpc.
+from .grpc.channel_manager import ChannelManager
 from .grpc.state_reconciler import ExecutorStateReconciler
 from .grpc.state_reporter import ExecutorStateReporter
 from .metrics.executor import (
@@ -55,16 +56,18 @@ class Executor:
         self,
         id: str,
         development_mode: bool,
+        flavor: ExecutorFlavor,
         version: str,
+        labels: Dict[str, str],
         code_path: Path,
         health_checker: HealthChecker,
         function_allowlist: Optional[List[FunctionURI]],
         function_executor_server_factory: FunctionExecutorServerFactory,
         server_addr: str,
+        grpc_server_addr: str,
         config_path: Optional[str],
         monitoring_server_host: str,
         monitoring_server_port: int,
-        grpc_server_addr: Optional[str],
         enable_grpc_state_reconciler: bool,
     ):
         self._logger = structlog.get_logger(module=__name__)
@@ -94,36 +97,40 @@ class Executor:
         self._downloader = Downloader(
             code_path=code_path, base_url=self._base_url, config_path=config_path
         )
+        self._function_allowlist: Optional[List[FunctionURI]] = function_allowlist
+        self._function_executor_server_factory = function_executor_server_factory
+        self._channel_manager = ChannelManager(
+            server_address=grpc_server_addr,
+            config_path=config_path,
+            logger=self._logger,
+        )
+        self._state_reporter = ExecutorStateReporter(
+            executor_id=id,
+            flavor=flavor,
+            version=version,
+            labels=labels,
+            development_mode=development_mode,
+            function_allowlist=self._function_allowlist,
+            function_executor_states=self._function_executor_states,
+            channel_manager=self._channel_manager,
+            logger=self._logger,
+        )
+        self._state_reporter.update_executor_status(
+            ExecutorStatus.EXECUTOR_STATUS_STARTING_UP
+        )
         self._task_reporter = TaskReporter(
             base_url=self._base_url,
             executor_id=id,
             config_path=config_path,
+            channel_manager=self._channel_manager,
         )
-        self._function_allowlist: Optional[List[FunctionURI]] = function_allowlist
-        self._function_executor_server_factory = function_executor_server_factory
 
-        # HTTP mode
+        # HTTP mode task runner
         self._task_runner: Optional[TaskRunner] = None
         self._task_fetcher: Optional[TaskFetcher] = None
-        # gRPC mode
-        self._channel_creator: Optional[ChannelCreator] = None
-        self._state_reporter: Optional[ExecutorStateReporter] = None
+        # gRPC mode state reconciler that runs tasks
         self._state_reconciler: Optional[ExecutorStateReconciler] = None
 
-        if grpc_server_addr is not None:
-            self._channel_creator = ChannelCreator(grpc_server_addr, self._logger)
-            self._state_reporter = ExecutorStateReporter(
-                executor_id=id,
-                development_mode=development_mode,
-                function_allowlist=self._function_allowlist,
-                function_executor_states=self._function_executor_states,
-                channel_creator=self._channel_creator,
-                logger=self._logger,
-            )
-            self._state_reporter.update_executor_status(
-                ExecutorStatus.EXECUTOR_STATUS_STARTING_UP
-            )
-
         if enable_grpc_state_reconciler:
             self._state_reconciler = ExecutorStateReconciler(
                 executor_id=id,
@@ -133,7 +140,8 @@ class Executor:
                 config_path=config_path,
                 downloader=self._downloader,
                 task_reporter=self._task_reporter,
-
+                channel_manager=self._channel_manager,
+                state_reporter=self._state_reporter,
                 logger=self._logger,
             )
         else:
@@ -147,6 +155,7 @@ class Executor:
             self._task_fetcher = TaskFetcher(
                 executor_id=id,
                 executor_version=version,
+                labels=labels,
                 function_allowlist=function_allowlist,
                 protocol=protocol,
                 indexify_server_addr=self._server_addr,
@@ -159,8 +168,8 @@ class Executor:
             "version": version,
             "code_path": str(code_path),
             "server_addr": server_addr,
-            "config_path": str(config_path),
             "grpc_server_addr": str(grpc_server_addr),
+            "config_path": str(config_path),
             "enable_grpc_state_reconciler": str(enable_grpc_state_reconciler),
             "hostname": gethostname(),
         }
@@ -244,6 +253,9 @@ class Executor:
             )
             logger.error("task execution failed", exc_info=e)
 
+        if output.metrics is not None:
+            self.log_function_metrics(output)
+
         with (
             metric_tasks_reporting_outcome.track_inprogress(),
             metric_task_outcome_report_latency.time(),
@@ -253,6 +265,28 @@ class Executor:
 
         metric_task_completion_latency.observe(time.monotonic() - start_time)
 
+    def log_function_metrics(self, output: TaskOutput):
+        for counter_name, counter_value in output.metrics.counters.items():
+            self._logger.info(
+                f"function_metric",
+                counter_name=counter_name,
+                counter_value=counter_value,
+                invocation_id=output.graph_invocation_id,
+                function_name=output.function_name,
+                graph_name=output.graph_name,
+                namespace=output.namespace,
+            )
+        for timer_name, timer_value in output.metrics.timers.items():
+            self._logger.info(
+                f"function_metric",
+                timer_name=timer_name,
+                timer_value=timer_value,
+                invocation_id=output.graph_invocation_id,
+                function_name=output.function_name,
+                graph_name=output.graph_name,
+                namespace=output.namespace,
+            )
+
     async def _run_task_and_get_output(self, task: Task, logger: Any) -> TaskOutput:
         graph: SerializedObject = await self._downloader.download_graph(
             namespace=task.namespace,
@@ -326,7 +360,9 @@ class Executor:
         ).inc()
 
     async def _shutdown(self, loop):
-        self._logger.info(
+        self._logger.info(
+            "shutting down, all Executor logs are suppressed, no task outcomes will be reported to Server from this point"
+        )
         if self._state_reporter is not None:
             self._state_reporter.update_executor_status(
                 ExecutorStatus.EXECUTOR_STATUS_STOPPING
@@ -339,12 +375,13 @@ class Executor:
 
         self._is_shutdown = True
         await self._monitoring_server.shutdown()
+        await self._task_reporter.shutdown()
 
         if self._task_runner is not None:
            await self._task_runner.shutdown()
 
-        if self.
-            await self.
+        if self._channel_manager is not None:
+            await self._channel_manager.shutdown()
        if self._state_reporter is not None:
            await self._state_reporter.shutdown()
        if self._state_reconciler is not None:
indexify/executor/function_executor/function_executor.py
CHANGED
@@ -88,6 +88,7 @@ class FunctionExecutor:
         initialize_request: InitializeRequest,
         base_url: str,
         config_path: Optional[str],
+        customer_code_timeout_sec: Optional[float] = None,
     ):
         """Creates and initializes a FunctionExecutorServer and all resources associated with it.
 
@@ -103,7 +104,9 @@ class FunctionExecutor:
         await self._establish_channel()
         stub: FunctionExecutorStub = FunctionExecutorStub(self._channel)
         await _collect_server_info(stub)
-        await _initialize_server(
+        await _initialize_server(
+            stub, initialize_request, customer_code_timeout_sec
+        )
         await self._create_invocation_state_client(
             stub=stub,
             base_url=base_url,
@@ -293,18 +296,28 @@ async def _collect_server_info(stub: FunctionExecutorStub) -> None:
 
 
 async def _initialize_server(
-    stub: FunctionExecutorStub,
+    stub: FunctionExecutorStub,
+    initialize_request: InitializeRequest,
+    customer_code_timeout_sec: Optional[float],
 ) -> None:
     with (
         metric_initialize_rpc_errors.count_exceptions(),
         metric_initialize_rpc_latency.time(),
     ):
-
-
-
-
-
-
-
-
-
+        try:
+            initialize_response: InitializeResponse = await stub.initialize(
+                initialize_request,
+                timeout=customer_code_timeout_sec,
+            )
+            if initialize_response.success:
+                return
+            if initialize_response.HasField("customer_error"):
+                raise CustomerError(initialize_response.customer_error)
+            else:
+                raise Exception("initialize RPC failed at function executor server")
+        except grpc.aio.AioRpcError as e:
+            if e.code() == grpc.StatusCode.DEADLINE_EXCEEDED:
+                raise CustomerError(
+                    f"Customer code timeout {customer_code_timeout_sec} sec expired"
+                ) from e
+            raise
indexify/executor/function_executor/function_executor_state.py
CHANGED
@@ -25,6 +25,7 @@ class FunctionExecutorState:
         graph_version: str,
         function_name: str,
         image_uri: Optional[str],
+        secret_names: List[str],
         logger: Any,
     ):
         # Read only fields.
@@ -33,6 +34,7 @@ class FunctionExecutorState:
         self.graph_name: str = graph_name
         self.function_name: str = function_name
         self.image_uri: Optional[str] = image_uri
+        self.secret_names: List[str] = secret_names
         self._logger: Any = logger.bind(
             module=__name__,
             function_executor_id=id,
@@ -47,6 +49,7 @@ class FunctionExecutorState:
         # TODO: Move graph_version to immutable fields once we migrate to gRPC State Reconciler.
         self.graph_version: str = graph_version
         self.status: FunctionExecutorStatus = FunctionExecutorStatus.DESTROYED
+        self.status_message: str = ""
         self.status_change_notifier: asyncio.Condition = asyncio.Condition(
             lock=self.lock
         )
@@ -62,7 +65,9 @@ class FunctionExecutorState:
         while self.status not in allowlist:
             await self.status_change_notifier.wait()
 
-    async def set_status(
+    async def set_status(
+        self, new_status: FunctionExecutorStatus, status_message: str = ""
+    ) -> None:
         """Sets the status of the Function Executor.
 
         The caller must hold the lock.
@@ -70,6 +75,7 @@ class FunctionExecutorState:
         """
         self.check_locked()
         if is_status_change_allowed(self.status, new_status):
+            # If status didn't change then still log it for visibility.
            self._logger.info(
                "function executor status changed",
                old_status=self.status.name,
@@ -78,12 +84,14 @@ class FunctionExecutorState:
            metric_function_executors_with_status.labels(status=self.status.name).dec()
            metric_function_executors_with_status.labels(status=new_status.name).inc()
            self.status = new_status
+            self.status_message = status_message
            self.status_change_notifier.notify_all()
        else:
            raise ValueError(
                f"Invalid status change from {self.status} to {new_status}"
            )
 
+    # TODO: Delete this method once HTTP protocol is removed as it's used only there.
     async def destroy_function_executor(self) -> None:
         """Destroys the Function Executor if it exists.
 
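`FunctionExecutorState` (above) pairs its status and the new `status_message` with an `asyncio.Condition` so other coroutines can block until the executor reaches an expected status. The following self-contained sketch shows just that wait/notify pattern, with a reduced status enum and no indexify code:

```python
import asyncio
from enum import Enum
from typing import List


class Status(Enum):
    DESTROYED = "Destroyed"
    IDLE = "Idle"


class StateSketch:
    def __init__(self) -> None:
        self.lock = asyncio.Lock()
        self.status = Status.DESTROYED
        self.status_message = ""
        # Sharing the lock lets Condition.wait() release it while a waiter is blocked.
        self.status_change_notifier = asyncio.Condition(lock=self.lock)

    async def wait_for_status(self, allowlist: List[Status]) -> None:
        # Caller must hold self.lock.
        while self.status not in allowlist:
            await self.status_change_notifier.wait()

    async def set_status(self, new_status: Status, status_message: str = "") -> None:
        # Caller must hold self.lock.
        self.status = new_status
        self.status_message = status_message
        self.status_change_notifier.notify_all()


async def main() -> None:
    state = StateSketch()

    async def make_idle() -> None:
        async with state.lock:
            await state.set_status(Status.IDLE, "startup finished")

    async with state.lock:
        task = asyncio.create_task(make_idle())
        await state.wait_for_status([Status.IDLE])
        print(state.status, state.status_message)
    await task


asyncio.run(main())
```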
indexify/executor/function_executor/function_executor_states_container.py
CHANGED
@@ -1,5 +1,5 @@
 import asyncio
-from typing import Any, AsyncGenerator, Dict, Optional
+from typing import Any, AsyncGenerator, Dict, List, Optional
 
 from .function_executor_state import FunctionExecutorState
 from .function_executor_status import FunctionExecutorStatus
@@ -26,6 +26,7 @@ class FunctionExecutorStatesContainer:
         graph_version: str,
         function_name: str,
         image_uri: Optional[str],
+        secret_names: List[str],
     ) -> FunctionExecutorState:
         """Get or create a function executor state with the given ID.
 
@@ -45,6 +46,7 @@ class FunctionExecutorStatesContainer:
                 graph_version=graph_version,
                 function_name=function_name,
                 image_uri=image_uri,
+                secret_names=secret_names,
                 logger=self._logger,
             )
             self._states[id] = state
indexify/executor/function_executor/function_executor_status.py
CHANGED
@@ -23,6 +23,7 @@ class FunctionExecutorStatus(Enum):
     UNHEALTHY = "Unhealthy"
     # STARTUP_FAILED_CUSTOMER_ERROR -> DESTROYING
     # STARTUP_FAILED_PLATFORM_ERROR -> DESTROYING
+    # RUNNING_TASK -> DESTROYING
     # UNHEALTHY -> DESTROYING
     # IDLE -> DESTROYING
     DESTROYING = "Destroying"
@@ -69,6 +70,7 @@ def is_status_change_allowed(
     ],
     FunctionExecutorStatus.RUNNING_TASK: [
         FunctionExecutorStatus.RUNNING_TASK,
+        FunctionExecutorStatus.DESTROYING,
         FunctionExecutorStatus.IDLE,
         FunctionExecutorStatus.UNHEALTHY,
         FunctionExecutorStatus.SHUTDOWN,
indexify/executor/function_executor/health_checker.py
CHANGED
@@ -70,8 +70,10 @@ class HealthChecker:
         # code is not involved when TCP connections are established to FE. Problems reestablishing
         # the TCP connection are usually due to the FE process crashing and its gRPC server socket
         # not being available anymore or due to prolonged local networking failures on Executor.
-
-
+        if (
+            _channel_state(self._channel, self._logger)
+            == grpc.ChannelConnectivity.TRANSIENT_FAILURE
+        ):
             return HealthCheckResult(
                 is_healthy=False,
                 reason="Channel is in TRANSIENT_FAILURE state, assuming Function Executor crashed.",
@@ -126,3 +128,19 @@ class HealthChecker:
 
         asyncio.create_task(self._health_check_failed_callback(result))
         self._health_check_loop_task = None
+
+
+def _channel_state(channel: grpc.aio.Channel, logger: Any) -> grpc.ChannelConnectivity:
+    """Get channel connectivity state and suppresses all exceptions.
+
+    Suppressing the exceptions is important because the channel connectivity state is an experimental
+    feature. On error fallse back to READY state which assumes that the channel is okay.
+    """
+    try:
+        return channel.get_state()
+    except Exception as e:
+        logger.error(
+            "Failed getting channel state, falling back to default READY state",
+            exc_info=e,
+        )
+        return grpc.ChannelConnectivity.READY
indexify/executor/function_executor/server/subprocess_function_executor_server_factory.py
CHANGED
@@ -25,6 +25,12 @@ class SubprocessFunctionExecutorServerFactory(FunctionExecutorServerFactory):
         logger = logger.bind(module=__name__)
         port: Optional[int] = None
 
+        if len(config.secret_names) > 0:
+            logger.warning(
+                "Subprocess Function Executor does not support secrets. Please supply secrets as environment variables.",
+                secret_names=config.secret_names,
+            )
+
         try:
             port = self._allocate_port()
             args = [
indexify/executor/function_executor/single_task_runner.py
CHANGED
@@ -10,6 +10,7 @@ from tensorlake.function_executor.proto.function_executor_pb2 import (
 from tensorlake.function_executor.proto.function_executor_pb2_grpc import (
     FunctionExecutorStub,
 )
+from tensorlake.function_executor.proto.message_validator import MessageValidator
 
 from ..api_objects import Task
 from .function_executor import CustomerError, FunctionExecutor
@@ -26,7 +27,7 @@ from .server.function_executor_server_factory import (
     FunctionExecutorServerFactory,
 )
 from .task_input import TaskInput
-from .task_output import TaskOutput
+from .task_output import TaskMetrics, TaskOutput
 
 
 class SingleTaskRunner:
@@ -286,16 +287,17 @@ class _RunningTaskContextManager:
 
 
 def _task_output(task: Task, response: RunTaskResponse) -> TaskOutput:
-
-
-
-
-
-
-
-
-    if
-
+    response_validator = MessageValidator(response)
+    response_validator.required_field("stdout")
+    response_validator.required_field("stderr")
+    response_validator.required_field("is_reducer")
+    response_validator.required_field("success")
+
+    metrics = TaskMetrics(counters={}, timers={})
+    if response.HasField("metrics"):
+        # Can be None if e.g. function failed.
+        metrics.counters = dict(response.metrics.counters)
+        metrics.timers = dict(response.metrics.timers)
 
     output = TaskOutput(
         task_id=task.id,
@@ -308,10 +310,12 @@ def _task_output(task: Task, response: RunTaskResponse) -> TaskOutput:
         stderr=response.stderr,
         reducer=response.is_reducer,
         success=response.success,
+        metrics=metrics,
     )
 
     if response.HasField("function_output"):
         output.function_output = response.function_output
+        output.output_encoding = response.function_output.output_encoding
     if response.HasField("router_output"):
         output.router_output = response.router_output
 
indexify/executor/function_executor/task_output.py
CHANGED
@@ -1,11 +1,17 @@
-from typing import Optional
+from typing import Dict, Optional
 
 from tensorlake.function_executor.proto.function_executor_pb2 import (
     FunctionOutput,
     RouterOutput,
 )
 
-
+
+class TaskMetrics:
+    """Metrics for a task."""
+
+    def __init__(self, counters: Dict[str, int], timers: Dict[str, float]):
+        self.counters = counters
+        self.timers = timers
 
 
 class TaskOutput:
@@ -19,6 +25,7 @@ class TaskOutput:
         function_name: str,
         graph_version: str,
         graph_invocation_id: str,
+        output_encoding: Optional[str] = None,
         function_output: Optional[FunctionOutput] = None,
         router_output: Optional[RouterOutput] = None,
         stdout: Optional[str] = None,
@@ -26,6 +33,7 @@ class TaskOutput:
         reducer: bool = False,
         success: bool = False,
         is_internal_error: bool = False,
+        metrics: Optional[TaskMetrics] = None,
     ):
         self.task_id = task_id
         self.namespace = namespace
@@ -40,6 +48,8 @@ class TaskOutput:
         self.reducer = reducer
         self.success = success
         self.is_internal_error = is_internal_error
+        self.metrics = metrics
+        self.output_encoding = output_encoding
 
     @classmethod
     def internal_error(
@@ -63,3 +73,26 @@ class TaskOutput:
             stderr="Platform failed to execute the function.",
             is_internal_error=True,
         )
+
+    @classmethod
+    def function_timeout(
+        cls,
+        task_id: str,
+        namespace: str,
+        graph_name: str,
+        function_name: str,
+        graph_version: str,
+        graph_invocation_id: str,
+    ) -> "TaskOutput":
+        """Creates a TaskOutput for an function timeout error."""
+        # Task stdout, stderr is not available.
+        return TaskOutput(
+            task_id=task_id,
+            namespace=namespace,
+            graph_name=graph_name,
+            function_name=function_name,
+            graph_version=graph_version,
+            graph_invocation_id=graph_invocation_id,
+            stderr="Function execution timed out.",
+            is_internal_error=False,
+        )